From c0dad2ef161eebb8db1fca975affe104ff71b844 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 7 Jul 2023 14:37:08 +0200
Subject: [PATCH 001/429] add nushell dependency analysis script

---
 util/deps.nu | 155 +++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 155 insertions(+)
 create mode 100644 util/deps.nu
diff --git a/util/deps.nu b/util/deps.nu
new file mode 100644
index 00000000000..a5bd94c8f51
--- /dev/null
+++ b/util/deps.nu
@@ -0,0 +1,155 @@
+# This is a script to analyze the dependencies of this project.
+# It is a replacement of / complement to
+#
+#  - cargo tree (used by this script)
+#  - cargo deps
+#  - cargo deny
+#
+# The idea is that by calling all_dep_info, you get a table of all dependencies
+# in Cargo.lock, with a few additional columns based on some other tools.
+# Currently, these tools are
+#
+#  - cargo tree
+#  - the crates.io API
+#
+# The most useful columns in the table are:
+#
+#  - `name`: the name of the crate.
+#  - `version`: the version of the crate.
+#  - `num_versions`: the number of versions in Cargo.lock.
+#  - `normal_dep`: whether the crate is a normal dependency.
+#  - `build_dep`: whether the crate is a build dependency.
+#  - `dev_dep`: whether the crate is a dev dependency.
+#  - `organisation`: the GitHub/GitLab organisation or user of the repository of the crate.
+#  - `repository_name`: the name of the repository the crate is in. The format is "{owner}/{repo}".
+#  - `dependencies`: direct dependencies of the crate (in the format of Cargo.lock).
+#
+# To use this script, start nushell (tested only on version 0.82.0), import the library and
+# call `all_dep_info`:
+#
+# ```
+# > nu
+# > use util/deps.nu
+# > let dep = (deps all_dep_info)
+# ```
+#
+# Then you can perform analysis. For example, to group the dependencies by organisation:
+#
+# ```
+# > $dep | group-by organisation   
+# ```
+#
+# Or to find all crates with multiple versions (like cargo deny):
+# ```
+# > $dep | where versions > 1   
+# ```
+#
+# Ideas to expand this:
+# 
+#  - Figure out the whole dependency graph
+#  - Figure out which platforms and which features enable which crates
+#  - Figure out which utils require which crates
+#  - Count the number of crates on different platforms
+#  - Add license information
+#  - Add functions to perform common analyses
+#  - Add info from cargo bloat
+#  - Add MSRV info
+#  - Add up-to-date info (the necessary info is there, it just needs to be derived)
+#  - Check the number of owners/contributors
+#  - Make a webpage to more easily explore the data
+
+# Read the packages a Cargo.lock file
+def read_lockfile [name: path] {
+    open $name | from toml | get package
+}
+
+# Read the names output by cargo tree
+export def read_tree_names [edges: string, features: string] {
+    cargo tree -e $edges --features $features
+    | rg "[a-zA-Z0-9_-]+ v[0-9.]+" -o
+    | lines
+    | each {|x| parse_name_and_version $x }
+}
+
+def parse_name_and_version [s: string] {
+    let s = ($s | split row " ")
+
+    let name = $s.0
+    let version = if ($s | length) > 1 {
+        $s.1 | str substring 1..
+    } else {
+        ""
+    }
+
+    {name: $name, version: $version}
+}
+
+# Read the crates.io info for a list of crates names
+def read_crates_io [names: list<string>] {
+    let total = ($names | length)
+    $names | enumerate | par-each {|el|
+        let key = $el.index
+        let name = $el.item
+        print $"($key)/($total): ($name)"
+        http get $"https://crates.io/api/v1/crates/($name)" | get crate
+    }
+}
+
+def in_table [col_name, table] {
+    insert $col_name {|el|
+        $table
+        | any {|table_el|
+            $table_el.name == $el.name and $table_el.version == $el.version }
+        }
+}
+
+# Add column for a dependency type
+def add_dep_type [dep_type: string, features: string] {
+    in_table $"($dep_type)_dep" (read_tree_names $dep_type $features)
+}
+
+export def all_dep_info [] {
+    let features = unix,feat_selinux
+
+    let lock = (read_lockfile Cargo.lock)
+
+    $lock
+    # Add number of versions
+    | join ($lock | group-by name | transpose | update column1 { length } | rename name num_versions) name
+    # Add dependency types
+    | add_dep_type normal $features
+    | add_dep_type build $features
+    | add_dep_type dev $features
+    | insert used {|x| $x.normal_dep or $x.build_dep or $x.dev_dep}
+    # Add crates.io info
+    | join (read_crates_io ($lock.name | uniq)) name
+    # Add GH org or user info
+    # The organisation is an indicator that crates should be treated as one dependency.
+    # However, there are also unrelated projects by a single organisation, so it's not
+    # clear.
+    | insert organisation {|x|
+        let repository = $x.repository?
+        if ($repository == null) { "" } else {
+            $repository | url parse | get path | path split | get 1
+        }
+    }
+    # Add repository (truncate everything after repo name)
+    # If we get a url like
+    #  https://github.com/uutils/coreutils/tree/src/uu/ls
+    # we only keep
+    #  uutils/coreutils
+    # The idea is that crates in the same repo definitely belong to the same project and should
+    # be treated as one dependency.
+    | insert repository_name {|x|
+        let repository = $x.repository?
+        if ($repository == null) { '' } else {
+            $repository
+            | url parse
+            | get path
+            | path split
+            | select 1 2
+            | path join
+        }
+    }
+}
+

From 948836fb8ff099af1fb78fbf38f315ac52001142 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Sun, 9 Jul 2023 16:43:48 +0200
Subject: [PATCH 002/429] Update util/deps.nu

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 util/deps.nu | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/util/deps.nu b/util/deps.nu
index a5bd94c8f51..a35e2d98c96 100644
--- a/util/deps.nu
+++ b/util/deps.nu
@@ -41,7 +41,7 @@
 #
 # Or to find all crates with multiple versions (like cargo deny):
 # ```
-# > $dep | where versions > 1   
+# > $dep | where num_versions > 1   
 # ```
 #
 # Ideas to expand this:

From a3e68d5bbd3d063cac01f77e9870121791e24012 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Wed, 2 Aug 2023 23:57:26 +0200
Subject: [PATCH 003/429] uucore: start work on a completely new printf
 implementation

---
 src/uucore/Cargo.toml                         |   2 +-
 src/uucore/src/lib/features.rs                |   6 +-
 src/uucore/src/lib/features/format/mod.rs     | 144 +++++
 src/uucore/src/lib/features/format/spec.rs    | 523 ++++++++++++++++++
 src/uucore/src/lib/features/memo.rs           | 175 ------
 src/uucore/src/lib/features/tokenize/mod.rs   |   5 -
 .../tokenize/num_format/format_field.rs       |  43 --
 .../features/tokenize/num_format/formatter.rs |  59 --
 .../num_format/formatters/base_conv/mod.rs    | 270 ---------
 .../num_format/formatters/base_conv/tests.rs  |  56 --
 .../formatters/cninetyninehexfloatf.rs        | 115 ----
 .../tokenize/num_format/formatters/decf.rs    | 185 -------
 .../num_format/formatters/float_common.rs     | 377 -------------
 .../tokenize/num_format/formatters/floatf.rs  |  43 --
 .../tokenize/num_format/formatters/intf.rs    | 282 ----------
 .../tokenize/num_format/formatters/mod.rs     |   9 -
 .../tokenize/num_format/formatters/scif.rs    |  43 --
 .../lib/features/tokenize/num_format/mod.rs   |   4 -
 .../tokenize/num_format/num_format.rs         | 271 ---------
 src/uucore/src/lib/features/tokenize/sub.rs   | 452 ---------------
 src/uucore/src/lib/features/tokenize/token.rs |  39 --
 .../lib/features/tokenize/unescaped_text.rs   | 279 ----------
 src/uucore/src/lib/lib.rs                     |   4 +-
 23 files changed, 672 insertions(+), 2714 deletions(-)
 create mode 100644 src/uucore/src/lib/features/format/mod.rs
 create mode 100644 src/uucore/src/lib/features/format/spec.rs
 delete mode 100644 src/uucore/src/lib/features/memo.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/mod.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/format_field.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/formatter.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/formatters/base_conv/mod.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/formatters/base_conv/tests.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/formatters/cninetyninehexfloatf.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/formatters/decf.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/formatters/float_common.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/formatters/floatf.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/formatters/intf.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/formatters/mod.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/formatters/scif.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/mod.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/num_format/num_format.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/sub.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/token.rs
 delete mode 100644 src/uucore/src/lib/features/tokenize/unescaped_text.rs

diff --git a/src/uucore/Cargo.toml b/src/uucore/Cargo.toml
index d376e807a20..1c1d4c75443 100644
--- a/src/uucore/Cargo.toml
+++ b/src/uucore/Cargo.toml
@@ -76,7 +76,7 @@ entries = ["libc"]
 fs = ["libc", "winapi-util", "windows-sys"]
 fsext = ["libc", "time", "windows-sys"]
 lines = []
-memo = ["itertools"]
+format = ["itertools"]
 mode = ["libc"]
 perms = ["libc", "walkdir"]
 process = ["libc"]
diff --git a/src/uucore/src/lib/features.rs b/src/uucore/src/lib/features.rs
index f8a8d2d10df..fe48399877b 100644
--- a/src/uucore/src/lib/features.rs
+++ b/src/uucore/src/lib/features.rs
@@ -8,14 +8,12 @@ pub mod fs;
 pub mod fsext;
 #[cfg(feature = "lines")]
 pub mod lines;
-#[cfg(feature = "memo")]
-pub mod memo;
+#[cfg(feature = "format")]
+pub mod format;
 #[cfg(feature = "ringbuffer")]
 pub mod ringbuffer;
 #[cfg(feature = "sum")]
 pub mod sum;
-#[cfg(feature = "memo")]
-mod tokenize;
 
 // * (platform-specific) feature-gated modules
 // ** non-windows (i.e. Unix + Fuchsia)
diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
new file mode 100644
index 00000000000..abd92011cc4
--- /dev/null
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -0,0 +1,144 @@
+//! Main entry point for our implementation of printf.
+//!
+//! The [`printf`] and [`sprintf`] closely match the behavior of the
+//! corresponding C functions: the former renders a formatted string
+//! to stdout, the latter renders to a new [`String`] object.
+//! 
+//! In addition to the [`printf`] and [`sprintf`] functions, we expose the
+//! [`Format`] struct, which represents a parsed format string. This reduces
+//! the need for parsing a format string multiple times and assures that no
+//! parsing errors occur during writing.
+// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
+
+// mod num_format;
+mod spec;
+
+use spec::Spec;
+use std::io::{stdout, Write};
+
+pub enum FormatError {
+    SpecError,
+    IoError(std::io::Error),
+    NoMoreArguments,
+    InvalidArgument(FormatArgument),
+}
+
+/// A single item to format
+enum FormatItem {
+    /// A format specifier
+    Spec(Spec),
+    /// Some plain text
+    Text(Vec<u8>),
+    /// A single character
+    /// 
+    /// Added in addition to `Text` as an optimization.
+    Char(u8),
+}
+
+pub enum FormatArgument {
+    Char(char),
+    String(String),
+    UnsignedInt(u64),
+    SignedInt(i64),
+    Float(f64),
+}
+
+impl FormatItem {
+    fn write<'a>(&self, mut writer: impl Write, args: &mut impl Iterator<Item = FormatArgument>) -> Result<(), FormatError> {
+        match self {
+            FormatItem::Spec(spec) => spec.write(writer, args),
+            FormatItem::Text(bytes) => writer.write_all(bytes).map_err(FormatError::IoError),
+            FormatItem::Char(char) => writer.write_all(&[*char]).map_err(FormatError::IoError),
+        }
+    }
+}
+
+fn parse_iter(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem, FormatError>> + '_ {
+    let mut rest = fmt;
+    std::iter::from_fn(move || {
+        if rest.is_empty() {
+            return None;
+        }
+
+        match rest.iter().position(|c| *c == b'%') {
+            None => {
+                let final_text = rest;
+                rest = &[];
+                Some(Ok(FormatItem::Text(final_text.into())))
+            }
+            Some(0) => {
+                // Handle the spec
+                rest = &rest[1..];
+                match rest.get(0) {
+                    None => Some(Ok(FormatItem::Char(b'%'))),
+                    Some(b'%') => {
+                        rest = &rest[1..];
+                        Some(Ok(FormatItem::Char(b'%')))
+                    }
+                    Some(_) => {
+                        let spec = match Spec::parse(&mut rest) {
+                            Some(spec) => spec,
+                            None => return Some(Err(FormatError::SpecError)),
+                        };
+                        Some(Ok(FormatItem::Spec(spec)))
+                    }
+                }
+            }
+            Some(i) => {
+                // The `after` slice includes the % so it will be handled correctly
+                // in the next iteration.
+                let (before, after) = rest.split_at(i);
+                rest = after;
+                return Some(Ok(FormatItem::Text(before.into())));
+            }
+        }
+    })
+}
+
+/// Write a formatted string to stdout.
+///
+/// `format_string` contains the template and `args` contains the
+/// arguments to render into the template.
+///
+/// See also [`sprintf`], which creates a new formatted [`String`].
+///
+/// # Examples
+///
+/// ```rust
+/// use uucore::format::printf;
+///
+/// printf("hello %s", &["world".to_string()]).unwrap();
+/// // prints "hello world"
+/// ```
+pub fn printf(format_string: &[u8], arguments: impl IntoIterator<Item = FormatArgument>) -> Result<(), FormatError> {
+    printf_writer(stdout(), format_string, arguments)
+}
+
+fn printf_writer(mut writer: impl Write, format_string: &[u8], args: impl IntoIterator<Item = FormatArgument>) -> Result<(), FormatError> {
+    let mut args = args.into_iter();
+    for item in parse_iter(format_string) {
+        item?.write(&mut writer, &mut args)?;
+    }
+    Ok(())
+}
+
+/// Create a new formatted string.
+///
+/// `format_string` contains the template and `args` contains the
+/// arguments to render into the template.
+///
+/// See also [`printf`], which prints to stdout.
+///
+/// # Examples
+///
+/// ```rust
+/// use uucore::format::sprintf;
+///
+/// let s = sprintf("hello %s", &["world".to_string()]).unwrap();
+/// assert_eq!(s, "hello world".to_string());
+/// ```
+pub fn sprintf(format_string: &[u8], arguments: impl IntoIterator<Item = FormatArgument>) -> Result<Vec<u8>, FormatError> {
+    let mut writer = Vec::new();
+    printf_writer(&mut writer, format_string, arguments)?;
+    Ok(writer)
+}
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
new file mode 100644
index 00000000000..4319e44d93f
--- /dev/null
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -0,0 +1,523 @@
+// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
+
+use super::{FormatArgument, FormatError};
+use std::{fmt::Display, io::Write};
+
+pub enum Spec {
+    Char {
+        width: Option<CanAsterisk<usize>>,
+        align_left: bool,
+    },
+    String {
+        width: Option<CanAsterisk<usize>>,
+        align_left: bool,
+    },
+    SignedInt {
+        width: Option<CanAsterisk<usize>>,
+        positive_sign: PositiveSign,
+        alignment: NumberAlignment,
+    },
+    UnsignedInt {
+        variant: UnsignedIntVariant,
+        width: Option<CanAsterisk<usize>>,
+        alignment: NumberAlignment,
+    },
+    Float {
+        variant: FloatVariant,
+        case: Case,
+        force_decimal: ForceDecimal,
+        width: Option<CanAsterisk<usize>>,
+        positive_sign: PositiveSign,
+        alignment: NumberAlignment,
+        precision: Option<CanAsterisk<usize>>,
+    },
+}
+
+#[derive(Clone, Copy)]
+pub enum UnsignedIntVariant {
+    Decimal,
+    Octal(Prefix),
+    Hexadecimal(Case, Prefix),
+}
+
+#[derive(Clone, Copy)]
+
+pub enum FloatVariant {
+    Decimal,
+    Scientific,
+    Shortest,
+    Hexadecimal,
+}
+
+#[derive(Clone, Copy, PartialEq, Eq)]
+pub enum Case {
+    Lowercase,
+    Uppercase,
+}
+
+#[derive(Clone, Copy, PartialEq, Eq)]
+pub enum Prefix {
+    No,
+    Yes,
+}
+
+#[derive(Clone, Copy, PartialEq, Eq)]
+pub enum ForceDecimal {
+    No,
+    Yes,
+}
+
+#[derive(Clone, Copy)]
+pub enum PositiveSign {
+    None,
+    Plus,
+    Space,
+}
+
+#[derive(Clone, Copy)]
+pub enum NumberAlignment {
+    Left,
+    RightSpace,
+    RightZero,
+}
+
+/// Precision and width specified might use an asterisk to indicate that they are
+/// determined by an argument.
+#[derive(Clone, Copy)]
+pub enum CanAsterisk<T> {
+    Fixed(T),
+    Asterisk,
+}
+
+/// Size of the expected type (ignored)
+///
+/// We ignore this parameter entirely, but we do parse it.
+/// It could be used in the future if the need arises.
+enum Length {
+    /// signed/unsigned char ("hh")
+    Char,
+    /// signed/unsigned short int ("h")
+    Short,
+    /// signed/unsigned long int ("l")
+    Long,
+    /// signed/unsigned long long int ("ll")
+    LongLong,
+    /// intmax_t ("j")
+    IntMaxT,
+    /// size_t ("z")
+    SizeT,
+    /// ptrdiff_t ("t")
+    PtfDiffT,
+    /// long double ("L")
+    LongDouble,
+}
+
+impl Spec {
+    pub fn parse(rest: &mut &[u8]) -> Option<Self> {
+        // Based on the C++ reference, the spec format looks like:
+        //
+        //   %[flags][width][.precision][length]specifier
+        //
+        // However, we have already parsed the '%'.
+
+        let mut minus = false;
+        let mut plus = false;
+        let mut space = false;
+        let mut hash = false;
+        let mut zero = false;
+
+        while let Some(x @ (b'-' | b'+' | b' ' | b'#' | b'0')) = rest.get(0) {
+            match x {
+                b'-' => minus = true,
+                b'+' => plus = true,
+                b' ' => space = true,
+                b'#' => hash = true,
+                b'0' => zero = true,
+                _ => unreachable!(),
+            }
+            *rest = &rest[1..]
+        }
+
+        let width = eat_asterisk_or_number(rest);
+
+        let precision = if let Some(b'.') = rest.get(0) {
+            Some(eat_asterisk_or_number(rest).unwrap_or(CanAsterisk::Fixed(0)))
+        } else {
+            None
+        };
+
+        let length = rest.get(0).and_then(|c| {
+            Some(match c {
+                b'h' => {
+                    if let Some(b'h') = rest.get(1) {
+                        *rest = &rest[1..];
+                        Length::Char
+                    } else {
+                        Length::Short
+                    }
+                }
+                b'l' => {
+                    if let Some(b'l') = rest.get(1) {
+                        *rest = &rest[1..];
+                        Length::Long
+                    } else {
+                        Length::LongLong
+                    }
+                }
+                b'j' => Length::IntMaxT,
+                b'z' => Length::SizeT,
+                b't' => Length::PtfDiffT,
+                b'L' => Length::LongDouble,
+                _ => return None,
+            })
+        });
+
+        if length.is_some() {
+            *rest = &rest[1..];
+        }
+
+        Some(match rest.get(0)? {
+            b'c' => Spec::Char {
+                width,
+                align_left: minus,
+            },
+            b's' => Spec::String {
+                width,
+                align_left: minus,
+            },
+            b'd' | b'i' => Spec::SignedInt {
+                width,
+                alignment: match (minus, zero) {
+                    (true, _) => NumberAlignment::Left,
+                    (false, true) => NumberAlignment::RightZero,
+                    (false, false) => NumberAlignment::RightSpace,
+                },
+                positive_sign: match (plus, space) {
+                    (true, _) => PositiveSign::Plus,
+                    (false, true) => PositiveSign::Space,
+                    (false, false) => PositiveSign::None,
+                },
+            },
+            c @ (b'u' | b'o' | b'x' | b'X') => {
+                let prefix = match hash {
+                    false => Prefix::No,
+                    true => Prefix::Yes,
+                };
+                let alignment = match (minus, zero) {
+                    (true, _) => NumberAlignment::Left,
+                    (false, true) => NumberAlignment::RightZero,
+                    (false, false) => NumberAlignment::RightSpace,
+                };
+                let variant = match c {
+                    b'u' => UnsignedIntVariant::Decimal,
+                    b'o' => UnsignedIntVariant::Octal(prefix),
+                    b'x' => UnsignedIntVariant::Hexadecimal(Case::Lowercase, prefix),
+                    b'X' => UnsignedIntVariant::Hexadecimal(Case::Uppercase, prefix),
+                    _ => unreachable!(),
+                };
+                Spec::UnsignedInt {
+                    variant,
+                    width,
+                    alignment,
+                }
+            }
+            c @ (b'f' | b'F' | b'e' | b'E' | b'g' | b'G' | b'a' | b'A') => Spec::Float {
+                width,
+                precision,
+                variant: match c {
+                    b'f' | b'F' => FloatVariant::Decimal,
+                    b'e' | b'E' => FloatVariant::Scientific,
+                    b'g' | b'G' => FloatVariant::Shortest,
+                    b'a' | b'A' => FloatVariant::Hexadecimal,
+                    _ => unreachable!(),
+                },
+                force_decimal: match hash {
+                    false => ForceDecimal::No,
+                    true => ForceDecimal::Yes,
+                },
+                case: match c.is_ascii_uppercase() {
+                    false => Case::Lowercase,
+                    true => Case::Uppercase,
+                },
+                alignment: match (minus, zero) {
+                    (true, _) => NumberAlignment::Left,
+                    (false, true) => NumberAlignment::RightZero,
+                    (false, false) => NumberAlignment::RightSpace,
+                },
+                positive_sign: match (plus, space) {
+                    (true, _) => PositiveSign::Plus,
+                    (false, true) => PositiveSign::Space,
+                    (false, false) => PositiveSign::None,
+                },
+            },
+            _ => return None,
+        })
+    }
+
+    pub fn write<'a>(
+        &self,
+        mut writer: impl Write,
+        mut args: impl Iterator<Item = FormatArgument>,
+    ) -> Result<(), FormatError> {
+        match self {
+            &Spec::Char { width, align_left } => {
+                let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
+                let arg = next_arg(&mut args)?;
+                match arg {
+                    FormatArgument::Char(c) => write_padded(writer, c, width, false, align_left),
+                    _ => Err(FormatError::InvalidArgument(arg)),
+                }
+            }
+            &Spec::String { width, align_left } => {
+                let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
+                let arg = next_arg(&mut args)?;
+                match arg {
+                    FormatArgument::String(s) => write_padded(writer, s, width, false, align_left),
+                    _ => Err(FormatError::InvalidArgument(arg)),
+                }
+            }
+            &Spec::SignedInt {
+                width,
+                positive_sign,
+                alignment,
+            } => {
+                let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
+
+                let arg = next_arg(&mut args)?;
+                let FormatArgument::SignedInt(i) = arg else {
+                    return Err(FormatError::InvalidArgument(arg));
+                };
+
+                if i >= 0 {
+                    match positive_sign {
+                        PositiveSign::None => Ok(()),
+                        PositiveSign::Plus => write!(writer, "+"),
+                        PositiveSign::Space => write!(writer, " "),
+                    }
+                    .map_err(FormatError::IoError)?;
+                }
+
+                match alignment {
+                    NumberAlignment::Left => write!(writer, "{i:<width$}"),
+                    NumberAlignment::RightSpace => write!(writer, "{i:>width$}"),
+                    NumberAlignment::RightZero => write!(writer, "{i:0>width$}"),
+                }
+                .map_err(FormatError::IoError)
+            }
+            &Spec::UnsignedInt {
+                variant,
+                width,
+                alignment,
+            } => {
+                let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
+
+                let arg = next_arg(args)?;
+                let FormatArgument::SignedInt(i) = arg else {
+                    return Err(FormatError::InvalidArgument(arg));
+                };
+
+                let s = match variant {
+                    UnsignedIntVariant::Decimal => format!("{i}"),
+                    UnsignedIntVariant::Octal(Prefix::No) => format!("{i:o}"),
+                    UnsignedIntVariant::Octal(Prefix::Yes) => format!("{i:#o}"),
+                    UnsignedIntVariant::Hexadecimal(Case::Lowercase, Prefix::No) => {
+                        format!("{i:x}")
+                    }
+                    UnsignedIntVariant::Hexadecimal(Case::Lowercase, Prefix::Yes) => {
+                        format!("{i:#x}")
+                    }
+                    UnsignedIntVariant::Hexadecimal(Case::Uppercase, Prefix::No) => {
+                        format!("{i:X}")
+                    }
+                    UnsignedIntVariant::Hexadecimal(Case::Uppercase, Prefix::Yes) => {
+                        format!("{i:#X}")
+                    }
+                };
+
+                match alignment {
+                    NumberAlignment::Left => write!(writer, "{s:<width$}"),
+                    NumberAlignment::RightSpace => write!(writer, "{s:>width$}"),
+                    NumberAlignment::RightZero => write!(writer, "{s:0>width$}"),
+                }
+                .map_err(FormatError::IoError)
+            }
+            &Spec::Float {
+                variant,
+                case,
+                force_decimal,
+                width,
+                positive_sign,
+                alignment,
+                precision,
+            } => {
+                let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
+                let precision = resolve_asterisk(precision, &mut args)?.unwrap_or(6);
+
+                let arg = next_arg(args)?;
+                let FormatArgument::Float(f) = arg else {
+                    return Err(FormatError::InvalidArgument(arg));
+                };
+
+                match positive_sign {
+                    PositiveSign::None => Ok(()),
+                    PositiveSign::Plus => write!(writer, "+"),
+                    PositiveSign::Space => write!(writer, " "),
+                }
+                .map_err(FormatError::IoError)?;
+
+                let s = match variant {
+                    FloatVariant::Decimal => format_float_decimal(f, precision, case, force_decimal),
+                    FloatVariant::Scientific => {
+                        format_float_scientific(f, precision, case, force_decimal)
+                    }
+                    FloatVariant::Shortest => format_float_shortest(f, precision, case, force_decimal),
+                    FloatVariant::Hexadecimal => todo!(),
+                };
+
+                match alignment {
+                    NumberAlignment::Left => write!(writer, "{s:<width$}"),
+                    NumberAlignment::RightSpace => write!(writer, "{s:>width$}"),
+                    NumberAlignment::RightZero => write!(writer, "{s:0>width$}"),
+                }
+                .map_err(FormatError::IoError)
+            }
+        }
+    }
+}
+
+fn format_float_decimal(
+    f: f64,
+    precision: usize,
+    case: Case,
+    force_decimal: ForceDecimal,
+) -> String {
+    if !f.is_finite() {
+        let mut s = format!("{f}");
+        if case == Case::Lowercase {
+            s.make_ascii_uppercase();
+        }
+        return s;
+    }
+
+    if precision == 0 && force_decimal == ForceDecimal::Yes {
+        format!("{f:.0}.")
+    } else {
+        format!("{f:.*}", precision)
+    }
+}
+
+fn format_float_scientific(
+    f: f64,
+    precision: usize,
+    case: Case,
+    force_decimal: ForceDecimal,
+) -> String {
+    // If the float is NaN, -Nan, Inf or -Inf, format like any other float
+    if !f.is_finite() {
+        let mut s = format!("{f}");
+        if case == Case::Lowercase {
+            s.make_ascii_uppercase();
+        }
+        return s;
+    }
+
+    let exponent: i32 = f.log10().floor() as i32;
+    let normalized = f / 10.0_f64.powi(exponent);
+
+    let additional_dot = if precision == 0 && ForceDecimal::Yes == force_decimal {
+        "."
+    } else {
+        ""
+    };
+
+    let exp_char = match case {
+        Case::Lowercase => 'e',
+        Case::Uppercase => 'E',
+    };
+
+    format!(
+        "{normalized:.*}{additional_dot}{exp_char}{exponent:+03}",
+        precision
+    )
+}
+
+// TODO: This could be optimized. It's not terribly important though.
+fn format_float_shortest(
+    f: f64,
+    precision: usize,
+    case: Case,
+    force_decimal: ForceDecimal,
+) -> String {
+    let a = format_float_decimal(f, precision, case, force_decimal);
+    let b = format_float_scientific(f, precision, case, force_decimal);
+
+    if a.len() > b.len() {
+        b
+    } else {
+        a
+    }
+}
+
+fn resolve_asterisk(
+    option: Option<CanAsterisk<usize>>,
+    args: impl Iterator<Item = FormatArgument>,
+) -> Result<Option<usize>, FormatError> {
+    Ok(match option {
+        None => None,
+        Some(CanAsterisk::Asterisk) => {
+            let arg = next_arg(args)?;
+            match arg {
+                FormatArgument::UnsignedInt(u) => match usize::try_from(u) {
+                    Ok(u) => Some(u),
+                    Err(_) => return Err(FormatError::InvalidArgument(arg)),
+                },
+                _ => return Err(FormatError::InvalidArgument(arg)),
+            }
+        }
+        Some(CanAsterisk::Fixed(w)) => Some(w),
+    })
+}
+
+fn next_arg(
+    mut arguments: impl Iterator<Item = FormatArgument>,
+) -> Result<FormatArgument, FormatError> {
+    arguments.next().ok_or(FormatError::NoMoreArguments)
+}
+
+fn write_padded(
+    mut writer: impl Write,
+    text: impl Display,
+    width: usize,
+    pad_zero: bool,
+    left: bool,
+) -> Result<(), FormatError> {
+    match (left, pad_zero) {
+        (false, false) => write!(writer, "{text: >width$}"),
+        (false, true) => write!(writer, "{text:0>width$}"),
+        // 0 is ignored if we pad left.
+        (true, _) => write!(writer, "{text: <width$}"),
+    }
+    .map_err(FormatError::IoError)
+}
+
+fn eat_asterisk_or_number(rest: &mut &[u8]) -> Option<CanAsterisk<usize>> {
+    if let Some(b'*') = rest.get(0) {
+        *rest = &rest[1..];
+        Some(CanAsterisk::Asterisk)
+    } else {
+        eat_number(rest).map(CanAsterisk::Fixed)
+    }
+}
+
+fn eat_number(rest: &mut &[u8]) -> Option<usize> {
+    match rest.iter().position(|b| !b.is_ascii_digit()) {
+        None | Some(0) => None,
+        Some(i) => {
+            // TODO: This might need to handle errors better
+            // For example in case of overflow.
+            let parsed = std::str::from_utf8(&rest[..i]).unwrap().parse().unwrap();
+            *rest = &rest[i..];
+            Some(parsed)
+        }
+    }
+}
diff --git a/src/uucore/src/lib/features/memo.rs b/src/uucore/src/lib/features/memo.rs
deleted file mode 100644
index 47d04f5b861..00000000000
--- a/src/uucore/src/lib/features/memo.rs
+++ /dev/null
@@ -1,175 +0,0 @@
-//! Main entry point for our implementation of printf.
-//!
-//! The [`printf`] and [`sprintf`] closely match the behavior of the
-//! corresponding C functions: the former renders a formatted string
-//! to stdout, the latter renders to a new [`String`] object.
-use crate::display::Quotable;
-use crate::error::{UResult, USimpleError};
-use crate::features::tokenize::sub::SubParser;
-use crate::features::tokenize::token::Token;
-use crate::features::tokenize::unescaped_text::UnescapedText;
-use crate::show_warning;
-use itertools::put_back_n;
-use std::io::{stdout, Cursor, Write};
-use std::iter::Peekable;
-use std::slice::Iter;
-
-/// Memo runner of printf
-/// Takes a format string and arguments
-/// 1. tokenize format string into tokens, consuming
-/// any subst. arguments along the way.
-/// 2. feeds remaining arguments into function
-/// that prints tokens.
-struct Memo {
-    tokens: Vec<Token>,
-}
-
-fn warn_excess_args(first_arg: &str) {
-    show_warning!(
-        "ignoring excess arguments, starting with {}",
-        first_arg.quote()
-    );
-}
-
-impl Memo {
-    fn new<W>(
-        writer: &mut W,
-        pf_string: &str,
-        pf_args_it: &mut Peekable<Iter<String>>,
-    ) -> UResult<Self>
-    where
-        W: Write,
-    {
-        let mut pm = Self { tokens: Vec::new() };
-        let mut it = put_back_n(pf_string.chars());
-        let mut has_sub = false;
-        loop {
-            if let Some(x) = UnescapedText::from_it_core(writer, &mut it, false) {
-                pm.tokens.push(x);
-            }
-            if let Some(x) = SubParser::from_it(writer, &mut it, pf_args_it)? {
-                if !has_sub {
-                    has_sub = true;
-                }
-                pm.tokens.push(x);
-            }
-            if let Some(x) = it.next() {
-                it.put_back(x);
-            } else {
-                break;
-            }
-        }
-        if !has_sub {
-            let mut drain = false;
-            if let Some(first_arg) = pf_args_it.peek() {
-                warn_excess_args(first_arg);
-                drain = true;
-            }
-            if drain {
-                loop {
-                    // drain remaining args;
-                    if pf_args_it.next().is_none() {
-                        break;
-                    }
-                }
-            }
-        }
-        Ok(pm)
-    }
-    fn apply<W>(&self, writer: &mut W, pf_args_it: &mut Peekable<Iter<String>>)
-    where
-        W: Write,
-    {
-        for tkn in &self.tokens {
-            tkn.write(writer, pf_args_it);
-        }
-    }
-    fn run_all<W>(writer: &mut W, pf_string: &str, pf_args: &[String]) -> UResult<()>
-    where
-        W: Write,
-    {
-        let mut arg_it = pf_args.iter().peekable();
-        let pm = Self::new(writer, pf_string, &mut arg_it)?;
-        loop {
-            if arg_it.peek().is_none() {
-                return Ok(());
-            }
-            pm.apply(writer, &mut arg_it);
-        }
-    }
-}
-
-/// Write a formatted string to stdout.
-///
-/// `format_string` contains the template and `args` contains the
-/// arguments to render into the template.
-///
-/// See also [`sprintf`], which creates a new formatted [`String`].
-///
-/// # Examples
-///
-/// ```rust
-/// use uucore::memo::printf;
-///
-/// printf("hello %s", &["world".to_string()]).unwrap();
-/// // prints "hello world"
-/// ```
-pub fn printf(format_string: &str, args: &[String]) -> UResult<()> {
-    let mut writer = stdout();
-    Memo::run_all(&mut writer, format_string, args)
-}
-
-/// Create a new formatted string.
-///
-/// `format_string` contains the template and `args` contains the
-/// arguments to render into the template.
-///
-/// See also [`printf`], which prints to stdout.
-///
-/// # Examples
-///
-/// ```rust
-/// use uucore::memo::sprintf;
-///
-/// let s = sprintf("hello %s", &["world".to_string()]).unwrap();
-/// assert_eq!(s, "hello world".to_string());
-/// ```
-pub fn sprintf(format_string: &str, args: &[String]) -> UResult<String> {
-    let mut writer = Cursor::new(vec![]);
-    Memo::run_all(&mut writer, format_string, args)?;
-    let buf = writer.into_inner();
-    match String::from_utf8(buf) {
-        Ok(s) => Ok(s),
-        Err(e) => Err(USimpleError::new(
-            1,
-            format!("failed to parse formatted string as UTF-8: {e}"),
-        )),
-    }
-}
-
-#[cfg(test)]
-mod tests {
-
-    use crate::memo::sprintf;
-
-    #[test]
-    fn test_sprintf_smoke() {
-        assert_eq!(sprintf("", &[]).unwrap(), "".to_string());
-    }
-
-    #[test]
-    fn test_sprintf_no_args() {
-        assert_eq!(
-            sprintf("hello world", &[]).unwrap(),
-            "hello world".to_string()
-        );
-    }
-
-    #[test]
-    fn test_sprintf_string() {
-        assert_eq!(
-            sprintf("hello %s", &["world".to_string()]).unwrap(),
-            "hello world".to_string()
-        );
-    }
-}
diff --git a/src/uucore/src/lib/features/tokenize/mod.rs b/src/uucore/src/lib/features/tokenize/mod.rs
deleted file mode 100644
index dfe44a0e56b..00000000000
--- a/src/uucore/src/lib/features/tokenize/mod.rs
+++ /dev/null
@@ -1,5 +0,0 @@
-#[allow(clippy::module_inception)]
-mod num_format;
-pub mod sub;
-pub mod token;
-pub mod unescaped_text;
diff --git a/src/uucore/src/lib/features/tokenize/num_format/format_field.rs b/src/uucore/src/lib/features/tokenize/num_format/format_field.rs
deleted file mode 100644
index 02998cde540..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/format_field.rs
+++ /dev/null
@@ -1,43 +0,0 @@
-// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
-
-//! Primitives used by Sub Tokenizer
-//! and num_format modules
-#[derive(Clone)]
-pub enum FieldType {
-    Strf,
-    Floatf,
-    CninetyNineHexFloatf,
-    Scif,
-    Decf,
-    Intf,
-    Charf,
-}
-
-// #[allow(non_camel_case_types)]
-// pub enum FChar {
-// d,
-// e,
-// E,
-// i,
-// f,
-// F,
-// g,
-// G,
-// u,
-// x,
-// X,
-// o
-// }
-//
-
-// a Sub Tokens' fields are stored
-// as a single object so they can be more simply
-// passed by ref to num_format in a Sub method
-#[derive(Clone)]
-pub struct FormatField<'a> {
-    pub min_width: Option<isize>,
-    pub second_field: Option<u32>,
-    pub field_char: &'a char,
-    pub field_type: &'a FieldType,
-    pub orig: &'a String,
-}
diff --git a/src/uucore/src/lib/features/tokenize/num_format/formatter.rs b/src/uucore/src/lib/features/tokenize/num_format/formatter.rs
deleted file mode 100644
index ed7d5a0f609..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/formatter.rs
+++ /dev/null
@@ -1,59 +0,0 @@
-//! Primitives used by num_format and sub_modules.
-//! never dealt with above (e.g. Sub Tokenizer never uses these)
-
-use crate::{display::Quotable, show_error};
-use itertools::{put_back_n, PutBackN};
-use std::str::Chars;
-
-use super::format_field::FormatField;
-
-// contains the rough ingredients to final
-// output for a number, organized together
-// to allow for easy generalization of output manipulation
-// (e.g. max number of digits after decimal)
-#[derive(Default)]
-pub struct FormatPrimitive {
-    pub prefix: Option<String>,
-    pub pre_decimal: Option<String>,
-    pub post_decimal: Option<String>,
-    pub suffix: Option<String>,
-}
-
-#[derive(Clone, PartialEq, Eq)]
-pub enum Base {
-    Ten = 10,
-    Hex = 16,
-    Octal = 8,
-}
-
-// information from the beginning of a numeric argument
-// the precedes the beginning of a numeric value
-pub struct InitialPrefix {
-    pub radix_in: Base,
-    pub sign: i8,
-    pub offset: usize,
-}
-
-pub trait Formatter {
-    //  return a FormatPrimitive for
-    // particular field char(s), given the argument
-    // string and prefix information (sign, radix)
-    fn get_primitive(
-        &self,
-        field: &FormatField,
-        in_prefix: &InitialPrefix,
-        str_in: &str,
-    ) -> Option<FormatPrimitive>;
-    // return a string from a FormatPrimitive,
-    // given information about the field
-    fn primitive_to_str(&self, prim: &FormatPrimitive, field: FormatField) -> String;
-}
-pub fn get_it_at(offset: usize, str_in: &str) -> PutBackN<Chars> {
-    put_back_n(str_in[offset..].chars())
-}
-
-// TODO: put this somewhere better
-pub fn warn_incomplete_conv(pf_arg: &str) {
-    // important: keep println here not print
-    show_error!("{}: value not completely converted", pf_arg.maybe_quote());
-}
diff --git a/src/uucore/src/lib/features/tokenize/num_format/formatters/base_conv/mod.rs b/src/uucore/src/lib/features/tokenize/num_format/formatters/base_conv/mod.rs
deleted file mode 100644
index 3df9f7129bc..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/formatters/base_conv/mod.rs
+++ /dev/null
@@ -1,270 +0,0 @@
-// spell-checker:ignore (ToDO) arrnum arr_num mult basenum bufferval refd vals arrfloat conv intermed addl
-
-pub fn arrnum_int_mult(arr_num: &[u8], basenum: u8, base_ten_int_fact: u8) -> Vec<u8> {
-    let mut carry: u16 = 0;
-    let mut rem: u16;
-    let mut new_amount: u16;
-    let fact: u16 = u16::from(base_ten_int_fact);
-    let base: u16 = u16::from(basenum);
-
-    let mut ret_rev: Vec<u8> = Vec::new();
-    let mut it = arr_num.iter().rev();
-    loop {
-        let i = it.next();
-        match i {
-            Some(u) => {
-                new_amount = (u16::from(*u) * fact) + carry;
-                rem = new_amount % base;
-                carry = (new_amount - rem) / base;
-                ret_rev.push(rem as u8);
-            }
-            None => {
-                while carry != 0 {
-                    rem = carry % base;
-                    carry = (carry - rem) / base;
-                    ret_rev.push(rem as u8);
-                }
-                break;
-            }
-        }
-    }
-    let ret: Vec<u8> = ret_rev.into_iter().rev().collect();
-    ret
-}
-
-#[allow(dead_code)]
-pub struct Remainder<'a> {
-    pub position: usize,
-    pub replace: Vec<u8>,
-    pub arr_num: &'a Vec<u8>,
-}
-
-#[allow(dead_code)]
-pub struct DivOut<'a> {
-    pub quotient: u8,
-    pub remainder: Remainder<'a>,
-}
-
-#[allow(dead_code)]
-pub fn arrnum_int_div_step<'a>(
-    rem_in: &'a Remainder,
-    radix_in: u8,
-    base_ten_int_divisor: u8,
-    after_decimal: bool,
-) -> DivOut<'a> {
-    let mut rem_out = Remainder {
-        position: rem_in.position,
-        replace: Vec::new(),
-        arr_num: rem_in.arr_num,
-    };
-
-    let mut bufferval: u16 = 0;
-    let base: u16 = u16::from(radix_in);
-    let divisor: u16 = u16::from(base_ten_int_divisor);
-    let mut traversed = 0;
-
-    let mut quotient = 0;
-    let refd_vals = &rem_in.arr_num[rem_in.position + rem_in.replace.len()..];
-    let mut it_replace = rem_in.replace.iter();
-    let mut it_f = refd_vals.iter();
-    loop {
-        let u = match it_replace.next() {
-            Some(u_rep) => u16::from(*u_rep),
-            None => match it_f.next() {
-                Some(u_orig) => u16::from(*u_orig),
-                None => {
-                    if !after_decimal {
-                        break;
-                    }
-                    0
-                }
-            },
-        };
-        traversed += 1;
-        bufferval += u;
-        if bufferval > divisor {
-            while bufferval >= divisor {
-                quotient += 1;
-                bufferval -= divisor;
-            }
-            rem_out.replace = if bufferval == 0 {
-                Vec::new()
-            } else {
-                let remainder_as_arrnum = unsigned_to_arrnum(bufferval);
-                base_conv_vec(&remainder_as_arrnum, 10, radix_in)
-            };
-            rem_out.position += 1 + (traversed - rem_out.replace.len());
-            break;
-        } else {
-            bufferval *= base;
-        }
-    }
-    DivOut {
-        quotient,
-        remainder: rem_out,
-    }
-}
-pub fn arrnum_int_add(arrnum: &[u8], basenum: u8, base_ten_int_term: u8) -> Vec<u8> {
-    let mut carry: u16 = u16::from(base_ten_int_term);
-    let mut rem: u16;
-    let mut new_amount: u16;
-    let base: u16 = u16::from(basenum);
-
-    let mut ret_rev: Vec<u8> = Vec::new();
-    let mut it = arrnum.iter().rev();
-    loop {
-        let i = it.next();
-        match i {
-            Some(u) => {
-                new_amount = u16::from(*u) + carry;
-                rem = new_amount % base;
-                carry = (new_amount - rem) / base;
-                ret_rev.push(rem as u8);
-            }
-            None => {
-                while carry != 0 {
-                    rem = carry % base;
-                    carry = (carry - rem) / base;
-                    ret_rev.push(rem as u8);
-                }
-                break;
-            }
-        }
-    }
-    let ret: Vec<u8> = ret_rev.into_iter().rev().collect();
-    ret
-}
-
-pub fn base_conv_vec(src: &[u8], radix_src: u8, radix_dest: u8) -> Vec<u8> {
-    let mut result = vec![0];
-    for i in src {
-        result = arrnum_int_mult(&result, radix_dest, radix_src);
-        result = arrnum_int_add(&result, radix_dest, *i);
-    }
-    result
-}
-
-#[allow(dead_code)]
-pub fn unsigned_to_arrnum(src: u16) -> Vec<u8> {
-    let mut result: Vec<u8> = Vec::new();
-    let mut src_tmp: u16 = src;
-    while src_tmp > 0 {
-        result.push((src_tmp % 10) as u8);
-        src_tmp /= 10;
-    }
-    result.reverse();
-    result
-}
-
-// temporary needs-improvement-function
-pub fn base_conv_float(src: &[u8], radix_src: u8, _radix_dest: u8) -> f64 {
-    // it would require a lot of addl code
-    // to implement this for arbitrary string input.
-    // until then, the below operates as an outline
-    // of how it would work.
-    let mut factor: f64 = 1_f64;
-    let radix_src_float: f64 = f64::from(radix_src);
-    let mut r: f64 = 0_f64;
-    for (i, u) in src.iter().enumerate() {
-        if i > 15 {
-            break;
-        }
-        factor /= radix_src_float;
-        r += factor * f64::from(*u);
-    }
-    r
-}
-
-pub fn str_to_arrnum(src: &str, radix_def_src: &dyn RadixDef) -> Vec<u8> {
-    let mut intermed_in: Vec<u8> = Vec::new();
-    for c in src.chars() {
-        #[allow(clippy::single_match)]
-        match radix_def_src.parse_char(c) {
-            Some(u) => {
-                intermed_in.push(u);
-            }
-            None => {} //todo err msg on incorrect
-        }
-    }
-    intermed_in
-}
-
-pub fn arrnum_to_str(src: &[u8], radix_def_dest: &dyn RadixDef) -> String {
-    let mut str_out = String::new();
-    for u in src.iter() {
-        #[allow(clippy::single_match)]
-        match radix_def_dest.format_u8(*u) {
-            Some(c) => {
-                str_out.push(c);
-            }
-            None => {} //todo
-        }
-    }
-    str_out
-}
-
-pub fn base_conv_str(
-    src: &str,
-    radix_def_src: &dyn RadixDef,
-    radix_def_dest: &dyn RadixDef,
-) -> String {
-    let intermed_in: Vec<u8> = str_to_arrnum(src, radix_def_src);
-    let intermed_out = base_conv_vec(
-        &intermed_in,
-        radix_def_src.get_max(),
-        radix_def_dest.get_max(),
-    );
-    arrnum_to_str(&intermed_out, radix_def_dest)
-}
-
-pub trait RadixDef {
-    fn get_max(&self) -> u8;
-    fn parse_char(&self, x: char) -> Option<u8>;
-    fn format_u8(&self, x: u8) -> Option<char>;
-}
-pub struct RadixTen;
-
-const ZERO_ASC: u8 = b'0';
-const UPPER_A_ASC: u8 = b'A';
-const LOWER_A_ASC: u8 = b'a';
-
-impl RadixDef for RadixTen {
-    fn get_max(&self) -> u8 {
-        10
-    }
-    fn parse_char(&self, c: char) -> Option<u8> {
-        match c {
-            '0'..='9' => Some(c as u8 - ZERO_ASC),
-            _ => None,
-        }
-    }
-    fn format_u8(&self, u: u8) -> Option<char> {
-        match u {
-            0..=9 => Some((ZERO_ASC + u) as char),
-            _ => None,
-        }
-    }
-}
-pub struct RadixHex;
-impl RadixDef for RadixHex {
-    fn get_max(&self) -> u8 {
-        16
-    }
-    fn parse_char(&self, c: char) -> Option<u8> {
-        match c {
-            '0'..='9' => Some(c as u8 - ZERO_ASC),
-            'A'..='F' => Some(c as u8 + 10 - UPPER_A_ASC),
-            'a'..='f' => Some(c as u8 + 10 - LOWER_A_ASC),
-            _ => None,
-        }
-    }
-    fn format_u8(&self, u: u8) -> Option<char> {
-        match u {
-            0..=9 => Some((ZERO_ASC + u) as char),
-            10..=15 => Some((UPPER_A_ASC + (u - 10)) as char),
-            _ => None,
-        }
-    }
-}
-
-mod tests;
diff --git a/src/uucore/src/lib/features/tokenize/num_format/formatters/base_conv/tests.rs b/src/uucore/src/lib/features/tokenize/num_format/formatters/base_conv/tests.rs
deleted file mode 100644
index 903a3faf142..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/formatters/base_conv/tests.rs
+++ /dev/null
@@ -1,56 +0,0 @@
-// spell-checker:ignore (ToDO) arrnum mult
-
-#[cfg(test)]
-use super::*;
-
-#[test]
-fn test_arrnum_int_mult() {
-    // (in base 10) 12 * 4 = 48
-    let factor: Vec<u8> = vec![1, 2];
-    let base_num = 10;
-    let base_ten_int_fact: u8 = 4;
-    let should_output: Vec<u8> = vec![4, 8];
-
-    let product = arrnum_int_mult(&factor, base_num, base_ten_int_fact);
-    assert!(product == should_output);
-}
-
-#[test]
-fn test_arrnum_int_non_base_10() {
-    // (in base 3)
-    // 5 * 4 = 20
-    let factor: Vec<u8> = vec![1, 2];
-    let base_num = 3;
-    let base_ten_int_fact: u8 = 4;
-    let should_output: Vec<u8> = vec![2, 0, 2];
-
-    let product = arrnum_int_mult(&factor, base_num, base_ten_int_fact);
-    assert!(product == should_output);
-}
-
-#[test]
-fn test_arrnum_int_div_short_circuit() {
-    // (
-    let arrnum: Vec<u8> = vec![5, 5, 5, 5, 0];
-    let base_num = 10;
-    let base_ten_int_divisor: u8 = 41;
-    let remainder_passed_in = Remainder {
-        position: 1,
-        replace: vec![1, 3],
-        arr_num: &arrnum,
-    };
-
-    // the "replace" should mean the number being divided
-    // is 1350, the first time you can get 41 to go into
-    // 1350, its at 135, where you can get a quotient of
-    // 3 and a remainder of 12;
-
-    let quotient_should_be: u8 = 3;
-    let remainder_position_should_be: usize = 3;
-    let remainder_replace_should_be = vec![1, 2];
-
-    let result = arrnum_int_div_step(&remainder_passed_in, base_num, base_ten_int_divisor, false);
-    assert!(quotient_should_be == result.quotient);
-    assert!(remainder_position_should_be == result.remainder.position);
-    assert!(remainder_replace_should_be == result.remainder.replace);
-}
diff --git a/src/uucore/src/lib/features/tokenize/num_format/formatters/cninetyninehexfloatf.rs b/src/uucore/src/lib/features/tokenize/num_format/formatters/cninetyninehexfloatf.rs
deleted file mode 100644
index a5c51153efd..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/formatters/cninetyninehexfloatf.rs
+++ /dev/null
@@ -1,115 +0,0 @@
-// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
-// spell-checker:ignore (ToDO) arrnum
-
-//! formatter for %a %F C99 Hex-floating-point subs
-use super::super::format_field::FormatField;
-use super::super::formatter::{FormatPrimitive, Formatter, InitialPrefix};
-use super::base_conv;
-use super::base_conv::RadixDef;
-use super::float_common::{primitive_to_str_common, FloatAnalysis};
-
-#[derive(Default)]
-pub struct CninetyNineHexFloatf {
-    #[allow(dead_code)]
-    as_num: f64,
-}
-impl CninetyNineHexFloatf {
-    pub fn new() -> Self {
-        Self::default()
-    }
-}
-
-impl Formatter for CninetyNineHexFloatf {
-    fn get_primitive(
-        &self,
-        field: &FormatField,
-        initial_prefix: &InitialPrefix,
-        str_in: &str,
-    ) -> Option<FormatPrimitive> {
-        let second_field = field.second_field.unwrap_or(6) + 1;
-        let analysis = FloatAnalysis::analyze(
-            str_in,
-            initial_prefix,
-            Some(second_field as usize),
-            None,
-            true,
-        );
-        let f = get_primitive_hex(
-            initial_prefix,
-            &str_in[initial_prefix.offset..],
-            &analysis,
-            second_field as usize,
-            *field.field_char == 'A',
-        );
-        Some(f)
-    }
-    fn primitive_to_str(&self, prim: &FormatPrimitive, field: FormatField) -> String {
-        primitive_to_str_common(prim, &field)
-    }
-}
-
-// c99 hex has unique requirements of all floating point subs in pretty much every part of building a primitive, from prefix and suffix to need for base conversion (in all other cases if you don't have decimal you must have decimal, here it's the other way around)
-
-// on the todo list is to have a trait for get_primitive that is implemented by each float formatter and can override a default. when that happens we can take the parts of get_primitive_dec specific to dec and spin them out to their own functions that can be overridden.
-fn get_primitive_hex(
-    initial_prefix: &InitialPrefix,
-    _str_in: &str,
-    _analysis: &FloatAnalysis,
-    _last_dec_place: usize,
-    capitalized: bool,
-) -> FormatPrimitive {
-    let prefix = Some(String::from(if initial_prefix.sign == -1 {
-        "-0x"
-    } else {
-        "0x"
-    }));
-
-    // TODO actual conversion, make sure to get back mantissa.
-    // for hex to hex, it's really just a matter of moving the
-    // decimal point and calculating the mantissa by its initial
-    // position and its moves, with every position counting for
-    // the addition or subtraction of 4 (2**4, because 4 bits in a hex digit)
-    // to the exponent.
-    // decimal's going to be a little more complicated. correct simulation
-    // of glibc will require after-decimal division to a specified precision.
-    // the difficult part of this (arrnum_int_div_step) is already implemented.
-
-    // the hex float name may be a bit misleading in terms of how to go about the
-    // conversion. The best way to do it is to just convert the float number
-    // directly to base 2 and then at the end translate back to hex.
-    let mantissa = 0;
-    let suffix = Some({
-        let ind = if capitalized { "P" } else { "p" };
-        if mantissa >= 0 {
-            format!("{ind}+{mantissa}")
-        } else {
-            format!("{ind}{mantissa}")
-        }
-    });
-    FormatPrimitive {
-        prefix,
-        suffix,
-        ..Default::default()
-    }
-}
-
-#[allow(dead_code)]
-fn to_hex(src: &str, before_decimal: bool) -> String {
-    let radix_ten = base_conv::RadixTen;
-    let radix_hex = base_conv::RadixHex;
-    if before_decimal {
-        base_conv::base_conv_str(src, &radix_ten, &radix_hex)
-    } else {
-        let as_arrnum_ten = base_conv::str_to_arrnum(src, &radix_ten);
-        let s = format!(
-            "{}",
-            base_conv::base_conv_float(&as_arrnum_ten, radix_ten.get_max(), radix_hex.get_max())
-        );
-        if s.len() > 2 {
-            String::from(&s[2..])
-        } else {
-            // zero
-            s
-        }
-    }
-}
diff --git a/src/uucore/src/lib/features/tokenize/num_format/formatters/decf.rs b/src/uucore/src/lib/features/tokenize/num_format/formatters/decf.rs
deleted file mode 100644
index 2ee53882e5d..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/formatters/decf.rs
+++ /dev/null
@@ -1,185 +0,0 @@
-// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
-
-//! formatter for %g %G decimal subs
-use super::super::format_field::FormatField;
-use super::super::formatter::{FormatPrimitive, Formatter, InitialPrefix};
-use super::float_common::{get_primitive_dec, primitive_to_str_common, FloatAnalysis};
-
-const SIGNIFICANT_FIGURES: usize = 6;
-
-// Parse a numeric string as the nearest integer with a given significance.
-// This is a helper function for round().
-// Examples:
-//  round_to_significance("456", 1) == 500
-//  round_to_significance("456", 2) == 460
-//  round_to_significance("456", 9) == 456
-fn round_to_significance(input: &str, significant_figures: usize) -> u32 {
-    if significant_figures < input.len() {
-        // If the input has too many digits, use a float intermediary
-        // to round it before converting to an integer. Otherwise,
-        // converting straight to integer will truncate.
-        // There might be a cleaner way to do this...
-        let digits = &input[..significant_figures + 1];
-        let float_representation = digits.parse::<f32>().unwrap();
-        (float_representation / 10.0).round() as u32
-    } else {
-        input.parse::<u32>().unwrap_or(0)
-    }
-}
-
-// Removing trailing zeroes, expressing the result as an integer where
-// possible. This is a helper function for round().
-fn truncate(mut format: FormatPrimitive) -> FormatPrimitive {
-    if let Some(ref post_dec) = format.post_decimal {
-        let trimmed = post_dec.trim_end_matches('0');
-
-        if trimmed.is_empty() {
-            // If there are no nonzero digits after the decimal point,
-            // use integer formatting by clearing post_decimal and suffix.
-            format.post_decimal = Some(String::new());
-            if format.suffix == Some("e+00".into()) {
-                format.suffix = Some(String::new());
-            }
-        } else if trimmed.len() != post_dec.len() {
-            // Otherwise, update the format to remove only the trailing
-            // zeroes (e.g. "4.50" becomes "4.5", not "4"). If there were
-            // no trailing zeroes, do nothing.
-            format.post_decimal = Some(trimmed.to_owned());
-        }
-    }
-    format
-}
-
-// Round a format to six significant figures and remove trailing zeroes.
-fn round(mut format: FormatPrimitive) -> FormatPrimitive {
-    let mut significant_digits_remaining = SIGNIFICANT_FIGURES;
-
-    // First, take as many significant digits as possible from pre_decimal,
-    if format.pre_decimal.is_some() {
-        let input = format.pre_decimal.as_ref().unwrap();
-        let rounded = round_to_significance(input, significant_digits_remaining);
-        let mut rounded_str = rounded.to_string();
-        significant_digits_remaining -= rounded_str.len();
-
-        // If the pre_decimal has exactly enough significant digits,
-        // round the input to the nearest integer. If the first
-        // post_decimal digit is 5 or higher, round up by incrementing
-        // the pre_decimal number. Otherwise, use the pre_decimal as-is.
-        if significant_digits_remaining == 0 {
-            if let Some(digits) = &format.post_decimal {
-                if digits.chars().next().unwrap_or('0') >= '5' {
-                    let rounded = rounded + 1;
-                    rounded_str = rounded.to_string();
-                }
-            }
-        }
-        format.pre_decimal = Some(rounded_str);
-    }
-
-    // If no significant digits remain, or there's no post_decimal to
-    // round, return the rounded pre_decimal value with no post_decimal.
-    // Otherwise, round the post_decimal to the remaining significance.
-    if significant_digits_remaining == 0 {
-        format.post_decimal = Some(String::new());
-    } else if let Some(input) = format.post_decimal {
-        let leading_zeroes = input.len() - input.trim_start_matches('0').len();
-        let digits = &input[leading_zeroes..];
-
-        // In the post_decimal, leading zeroes are significant. "01.0010"
-        // has one significant digit in pre_decimal, and 3 from post_decimal.
-        let mut post_decimal_str = String::with_capacity(significant_digits_remaining);
-        for _ in 0..leading_zeroes {
-            post_decimal_str.push('0');
-        }
-
-        if leading_zeroes < significant_digits_remaining {
-            // After significant leading zeroes, round the remaining digits
-            // to any remaining significance.
-            let rounded = round_to_significance(digits, significant_digits_remaining);
-            post_decimal_str.push_str(&rounded.to_string());
-        } else if leading_zeroes == significant_digits_remaining
-            && digits.chars().next().unwrap_or('0') >= '5'
-        {
-            // If necessary, round up the post_decimal ("1.000009" should
-            // round to 1.00001, instead of truncating after the last
-            // significant leading zero).
-            post_decimal_str.pop();
-            post_decimal_str.push('1');
-        } else {
-            // If the rounded post_decimal is entirely zeroes, discard
-            // it and use integer formatting instead.
-            post_decimal_str = String::new();
-        }
-
-        format.post_decimal = Some(post_decimal_str);
-    }
-    truncate(format)
-}
-
-// Given an exponent used in scientific notation, return whether the
-// number is small enough to be expressed as a decimal instead. "Small
-// enough" is based only on the number's magnitude, not the length of
-// any string representation.
-fn should_represent_as_decimal(suffix: &Option<String>) -> bool {
-    match suffix {
-        Some(exponent) => {
-            if exponent.chars().nth(1) == Some('-') {
-                exponent < &"e-05".into()
-            } else {
-                exponent < &"e+06".into()
-            }
-        }
-        None => true,
-    }
-}
-
-pub struct Decf;
-
-impl Decf {
-    pub fn new() -> Self {
-        Self
-    }
-}
-impl Formatter for Decf {
-    fn get_primitive(
-        &self,
-        field: &FormatField,
-        initial_prefix: &InitialPrefix,
-        str_in: &str,
-    ) -> Option<FormatPrimitive> {
-        let second_field = field.second_field.unwrap_or(6) + 1;
-        // default to scif interpretation so as to not truncate input vals
-        // (that would be displayed in scif) based on relation to decimal place
-        let analysis = FloatAnalysis::analyze(
-            str_in,
-            initial_prefix,
-            Some(second_field as usize + 1),
-            None,
-            false,
-        );
-        let mut f_dec = get_primitive_dec(
-            initial_prefix,
-            &str_in[initial_prefix.offset..],
-            &analysis,
-            second_field as usize,
-            Some(*field.field_char == 'G'),
-        );
-
-        if should_represent_as_decimal(&f_dec.suffix) {
-            // Use decimal formatting instead of scientific notation
-            // if the input's magnitude is small.
-            f_dec = get_primitive_dec(
-                initial_prefix,
-                &str_in[initial_prefix.offset..],
-                &analysis,
-                second_field as usize,
-                None,
-            );
-        }
-
-        Some(round(f_dec))
-    }
-    fn primitive_to_str(&self, prim: &FormatPrimitive, field: FormatField) -> String {
-        primitive_to_str_common(prim, &field)
-    }
-}
diff --git a/src/uucore/src/lib/features/tokenize/num_format/formatters/float_common.rs b/src/uucore/src/lib/features/tokenize/num_format/formatters/float_common.rs
deleted file mode 100644
index e0a29217c4a..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/formatters/float_common.rs
+++ /dev/null
@@ -1,377 +0,0 @@
-// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
-// spell-checker:ignore (ToDO) arrnum
-
-use super::super::format_field::FormatField;
-use super::super::formatter::{
-    get_it_at, warn_incomplete_conv, Base, FormatPrimitive, InitialPrefix,
-};
-use super::base_conv;
-use super::base_conv::RadixDef;
-
-// if the memory, copy, and comparison cost of chars
-//  becomes an issue, we can always operate in vec<u8> here
-//  rather than just at de_hex
-
-pub struct FloatAnalysis {
-    pub len_important: usize,
-    // none means no decimal point.
-    pub decimal_pos: Option<usize>,
-    pub follow: Option<char>,
-}
-fn has_enough_digits(
-    hex_input: bool,
-    hex_output: bool,
-    string_position: usize,
-    starting_position: usize,
-    limit: usize,
-) -> bool {
-    // -1s are for rounding
-    if hex_output {
-        if hex_input {
-            (string_position - 1) - starting_position >= limit
-        } else {
-            false //undecidable without converting
-        }
-    } else if hex_input {
-        (((string_position - 1) - starting_position) * 9) / 8 >= limit
-    } else {
-        (string_position - 1) - starting_position >= limit
-    }
-}
-
-impl FloatAnalysis {
-    #[allow(clippy::cognitive_complexity)]
-    pub fn analyze(
-        str_in: &str,
-        initial_prefix: &InitialPrefix,
-        max_sd_opt: Option<usize>,
-        max_after_dec_opt: Option<usize>,
-        hex_output: bool,
-    ) -> Self {
-        // this fn assumes
-        // the input string
-        // has no leading spaces or 0s
-        let str_it = get_it_at(initial_prefix.offset, str_in);
-        let mut ret = Self {
-            len_important: 0,
-            decimal_pos: None,
-            follow: None,
-        };
-        let hex_input = match initial_prefix.radix_in {
-            Base::Hex => true,
-            Base::Ten => false,
-            Base::Octal => {
-                panic!("this should never happen: floats should never receive octal input");
-            }
-        };
-        let mut i = 0;
-        let mut pos_before_first_nonzero_after_decimal: Option<usize> = None;
-        for c in str_it {
-            match c {
-                e @ ('0'..='9' | 'A'..='F' | 'a'..='f') => {
-                    if !hex_input {
-                        match e {
-                            '0'..='9' => {}
-                            _ => {
-                                warn_incomplete_conv(str_in);
-                                break;
-                            }
-                        }
-                    }
-                    if ret.decimal_pos.is_some()
-                        && pos_before_first_nonzero_after_decimal.is_none()
-                        && e != '0'
-                    {
-                        pos_before_first_nonzero_after_decimal = Some(i - 1);
-                    }
-                    if let Some(max_sd) = max_sd_opt {
-                        if i == max_sd {
-                            // follow is used in cases of %g
-                            // where the character right after the last
-                            // sd is considered is rounded affecting
-                            // the previous digit in 1/2 of instances
-                            ret.follow = Some(e);
-                        } else if ret.decimal_pos.is_some() && i > max_sd {
-                            break;
-                        }
-                    }
-                    if let Some(max_after_dec) = max_after_dec_opt {
-                        if let Some(p) = ret.decimal_pos {
-                            if has_enough_digits(hex_input, hex_output, i, p, max_after_dec) {
-                                break;
-                            }
-                        }
-                    } else if let Some(max_sd) = max_sd_opt {
-                        if let Some(p) = pos_before_first_nonzero_after_decimal {
-                            if has_enough_digits(hex_input, hex_output, i, p, max_sd) {
-                                break;
-                            }
-                        }
-                    }
-                }
-                '.' => {
-                    if ret.decimal_pos.is_none() {
-                        ret.decimal_pos = Some(i);
-                    } else {
-                        warn_incomplete_conv(str_in);
-                        break;
-                    }
-                }
-                _ => {
-                    warn_incomplete_conv(str_in);
-                    break;
-                }
-            };
-            i += 1;
-        }
-        ret.len_important = i;
-        ret
-    }
-}
-
-fn de_hex(src: &str, before_decimal: bool) -> String {
-    let radix_ten = base_conv::RadixTen;
-    let radix_hex = base_conv::RadixHex;
-    if before_decimal {
-        base_conv::base_conv_str(src, &radix_hex, &radix_ten)
-    } else {
-        let as_arrnum_hex = base_conv::str_to_arrnum(src, &radix_hex);
-        let s = format!(
-            "{}",
-            base_conv::base_conv_float(&as_arrnum_hex, radix_hex.get_max(), radix_ten.get_max())
-        );
-        if s.len() > 2 {
-            String::from(&s[2..])
-        } else {
-            // zero
-            s
-        }
-    }
-}
-
-// takes a string in,
-// truncates to a position,
-// bumps the last digit up one,
-// and if the digit was nine
-// propagate to the next, etc.
-// If before the decimal and the most
-// significant digit is a 9, it becomes a 1
-fn _round_str_from(in_str: &str, position: usize, before_dec: bool) -> (String, bool) {
-    let mut it = in_str[0..position].chars();
-    let mut rev = String::new();
-    let mut i = position;
-    let mut finished_in_dec = false;
-    while let Some(c) = it.next_back() {
-        i -= 1;
-        match c {
-            '9' => {
-                // If we're before the decimal
-                // and on the most significant digit,
-                // round 9 to 1, else to 0.
-                if before_dec && i == 0 {
-                    rev.push('1');
-                } else {
-                    rev.push('0');
-                }
-            }
-            e => {
-                rev.push(((e as u8) + 1) as char);
-                finished_in_dec = true;
-                break;
-            }
-        }
-    }
-    let mut fwd = String::from(&in_str[0..i]);
-    for ch in rev.chars().rev() {
-        fwd.push(ch);
-    }
-    (fwd, finished_in_dec)
-}
-
-fn round_terminal_digit(
-    before_dec: String,
-    after_dec: String,
-    position: usize,
-) -> (String, String, bool) {
-    if position < after_dec.len() {
-        let digit_at_pos: char;
-        {
-            digit_at_pos = after_dec[position..=position].chars().next().expect("");
-        }
-        if let '5'..='9' = digit_at_pos {
-            let (new_after_dec, finished_in_dec) = _round_str_from(&after_dec, position, false);
-            if finished_in_dec {
-                return (before_dec, new_after_dec, false);
-            } else {
-                let (new_before_dec, _) = _round_str_from(&before_dec, before_dec.len(), true);
-                let mut dec_place_chg = false;
-                let mut before_dec_chars = new_before_dec.chars();
-                if before_dec_chars.next() == Some('1') && before_dec_chars.all(|c| c == '0') {
-                    // If the first digit is a one and remaining are zeros, we have
-                    // rounded to a new decimal place, so the decimal place must be updated.
-                    // Only update decimal place if the before decimal != 0
-                    dec_place_chg = before_dec != "0";
-                }
-                return (new_before_dec, new_after_dec, dec_place_chg);
-            }
-            // TODO
-        }
-    }
-    (before_dec, after_dec, false)
-}
-
-#[allow(clippy::cognitive_complexity)]
-pub fn get_primitive_dec(
-    initial_prefix: &InitialPrefix,
-    str_in: &str,
-    analysis: &FloatAnalysis,
-    last_dec_place: usize,
-    sci_mode: Option<bool>,
-) -> FormatPrimitive {
-    let mut f = FormatPrimitive::default();
-
-    // add negative sign section
-    if initial_prefix.sign == -1 {
-        f.prefix = Some(String::from("-"));
-    }
-
-    // assign the digits before and after the decimal points
-    // to separate slices. If no digits after decimal point,
-    // assign 0
-    let (mut first_segment_raw, second_segment_raw) = match analysis.decimal_pos {
-        Some(pos) => (&str_in[..pos], &str_in[pos + 1..]),
-        None => (str_in, "0"),
-    };
-    if first_segment_raw.is_empty() {
-        first_segment_raw = "0";
-    }
-    // convert to string, de_hexifying if input is in hex   // spell-checker:disable-line
-    let (first_segment, second_segment) = match initial_prefix.radix_in {
-        Base::Hex => (
-            de_hex(first_segment_raw, true),
-            de_hex(second_segment_raw, false),
-        ),
-        _ => (
-            String::from(first_segment_raw),
-            String::from(second_segment_raw),
-        ),
-    };
-    let (pre_dec_unrounded, post_dec_unrounded, mut mantissa) = if sci_mode.is_some() {
-        if first_segment.len() > 1 {
-            let mut post_dec = String::from(&first_segment[1..]);
-            post_dec.push_str(&second_segment);
-            (
-                String::from(&first_segment[0..1]),
-                post_dec,
-                first_segment.len() as isize - 1,
-            )
-        } else {
-            match first_segment
-                .chars()
-                .next()
-                .expect("float_common: no chars in first segment.")
-            {
-                '0' => {
-                    let it = second_segment.chars().enumerate();
-                    let mut m: isize = 0;
-                    let mut pre = String::from("0");
-                    let mut post = String::from("0");
-                    for (i, c) in it {
-                        match c {
-                            '0' => {}
-                            _ => {
-                                m = -((i as isize) + 1);
-                                pre = String::from(&second_segment[i..=i]);
-                                post = String::from(&second_segment[i + 1..]);
-                                break;
-                            }
-                        }
-                    }
-                    (pre, post, m)
-                }
-                _ => (first_segment, second_segment, 0),
-            }
-        }
-    } else {
-        (first_segment, second_segment, 0)
-    };
-
-    let (pre_dec_draft, post_dec_draft, dec_place_chg) =
-        round_terminal_digit(pre_dec_unrounded, post_dec_unrounded, last_dec_place - 1);
-    f.post_decimal = Some(post_dec_draft);
-    if let Some(capitalized) = sci_mode {
-        let si_ind = if capitalized { 'E' } else { 'e' };
-        // Increase the mantissa if we're adding a decimal place
-        if dec_place_chg {
-            mantissa += 1;
-        }
-        f.suffix = Some(if mantissa >= 0 {
-            format!("{si_ind}+{mantissa:02}")
-        } else {
-            // negative sign is considered in format!s
-            // leading zeroes
-            format!("{si_ind}{mantissa:03}")
-        });
-        f.pre_decimal = Some(pre_dec_draft);
-    } else if dec_place_chg {
-        // We've rounded up to a new decimal place so append 0
-        f.pre_decimal = Some(pre_dec_draft + "0");
-    } else {
-        f.pre_decimal = Some(pre_dec_draft);
-    }
-
-    f
-}
-
-pub fn primitive_to_str_common(prim: &FormatPrimitive, field: &FormatField) -> String {
-    let mut final_str = String::new();
-    if let Some(ref prefix) = prim.prefix {
-        final_str.push_str(prefix);
-    }
-    match prim.pre_decimal {
-        Some(ref pre_decimal) => {
-            final_str.push_str(pre_decimal);
-        }
-        None => {
-            panic!(
-                "error, format primitives provided to int, will, incidentally under correct \
-                 behavior, always have a pre_dec value."
-            );
-        }
-    }
-    let decimal_places = field.second_field.unwrap_or(6);
-    match prim.post_decimal {
-        Some(ref post_decimal) => {
-            if !post_decimal.is_empty() && decimal_places > 0 {
-                final_str.push('.');
-                let len_avail = post_decimal.len() as u32;
-
-                if decimal_places >= len_avail {
-                    // println!("dec {}, len avail {}", decimal_places, len_avail);
-                    final_str.push_str(post_decimal);
-
-                    if *field.field_char != 'g' && *field.field_char != 'G' {
-                        let diff = decimal_places - len_avail;
-                        for _ in 0..diff {
-                            final_str.push('0');
-                        }
-                    }
-                } else {
-                    // println!("printing to only {}", decimal_places);
-                    final_str.push_str(&post_decimal[0..decimal_places as usize]);
-                }
-            }
-        }
-        None => {
-            panic!(
-                "error, format primitives provided to int, will, incidentally under correct \
-                 behavior, always have a pre_dec value."
-            );
-        }
-    }
-    if let Some(ref suffix) = prim.suffix {
-        final_str.push_str(suffix);
-    }
-
-    final_str
-}
diff --git a/src/uucore/src/lib/features/tokenize/num_format/formatters/floatf.rs b/src/uucore/src/lib/features/tokenize/num_format/formatters/floatf.rs
deleted file mode 100644
index cca2750dc55..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/formatters/floatf.rs
+++ /dev/null
@@ -1,43 +0,0 @@
-// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
-// spell-checker:ignore (ToDO) arrnum
-
-//! formatter for %f %F common-notation floating-point subs
-use super::super::format_field::FormatField;
-use super::super::formatter::{FormatPrimitive, Formatter, InitialPrefix};
-use super::float_common::{get_primitive_dec, primitive_to_str_common, FloatAnalysis};
-
-#[derive(Default)]
-pub struct Floatf;
-impl Floatf {
-    pub fn new() -> Self {
-        Self
-    }
-}
-impl Formatter for Floatf {
-    fn get_primitive(
-        &self,
-        field: &FormatField,
-        initial_prefix: &InitialPrefix,
-        str_in: &str,
-    ) -> Option<FormatPrimitive> {
-        let second_field = field.second_field.unwrap_or(6) + 1;
-        let analysis = FloatAnalysis::analyze(
-            str_in,
-            initial_prefix,
-            None,
-            Some(second_field as usize),
-            false,
-        );
-        let f = get_primitive_dec(
-            initial_prefix,
-            &str_in[initial_prefix.offset..],
-            &analysis,
-            second_field as usize,
-            None,
-        );
-        Some(f)
-    }
-    fn primitive_to_str(&self, prim: &FormatPrimitive, field: FormatField) -> String {
-        primitive_to_str_common(prim, &field)
-    }
-}
diff --git a/src/uucore/src/lib/features/tokenize/num_format/formatters/intf.rs b/src/uucore/src/lib/features/tokenize/num_format/formatters/intf.rs
deleted file mode 100644
index 0f6e78de6f6..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/formatters/intf.rs
+++ /dev/null
@@ -1,282 +0,0 @@
-// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
-// spell-checker:ignore (ToDO) arrnum
-
-//! formatter for unsigned and signed int subs
-//! unsigned int: %X %x (hex u64) %o (octal u64) %u (base ten u64)
-//! signed int: %i %d (both base ten i64)
-use super::super::format_field::FormatField;
-use super::super::formatter::{
-    get_it_at, warn_incomplete_conv, Base, FormatPrimitive, Formatter, InitialPrefix,
-};
-use std::i64;
-use std::u64;
-
-#[derive(Default)]
-pub struct Intf {
-    _a: u32,
-}
-
-// see the Intf::analyze() function below
-struct IntAnalysis {
-    check_past_max: bool,
-    past_max: bool,
-    is_zero: bool,
-    len_digits: u8,
-}
-
-impl Intf {
-    pub fn new() -> Self {
-        Self::default()
-    }
-    // take a ref to argument string, and basic information
-    // about prefix (offset, radix, sign), and analyze string
-    // to gain the IntAnalysis information above
-    // check_past_max: true if the number *may* be above max,
-    //   but we don't know either way. One of several reasons
-    //   we may have to parse as int.
-    // past_max: true if the object is past max, false if not
-    //  in the future we should probably combine these into an
-    //  Option<bool>
-    // is_zero: true if number is zero, false otherwise
-    // len_digits: length of digits used to create the int
-    //   important, for example, if we run into a non-valid character
-    #[allow(clippy::cognitive_complexity)]
-    fn analyze(str_in: &str, signed_out: bool, initial_prefix: &InitialPrefix) -> IntAnalysis {
-        // the maximum number of digits we could conceivably
-        // have before the decimal point without exceeding the
-        // max
-        let mut str_it = get_it_at(initial_prefix.offset, str_in);
-        let max_sd_in = if signed_out {
-            match initial_prefix.radix_in {
-                Base::Ten => 19,
-                Base::Octal => 21,
-                Base::Hex => 16,
-            }
-        } else {
-            match initial_prefix.radix_in {
-                Base::Ten => 20,
-                Base::Octal => 22,
-                Base::Hex => 16,
-            }
-        };
-        let mut ret = IntAnalysis {
-            check_past_max: false,
-            past_max: false,
-            is_zero: false,
-            len_digits: 0,
-        };
-
-        // todo turn this to a while let now that we know
-        // no special behavior on EOI break
-        loop {
-            let c_opt = str_it.next();
-            if let Some(c) = c_opt {
-                match c {
-                    '0'..='9' | 'a'..='f' | 'A'..='F' => {
-                        if ret.len_digits == 0 && c == '0' {
-                            ret.is_zero = true;
-                        } else if ret.is_zero {
-                            ret.is_zero = false;
-                        }
-                        ret.len_digits += 1;
-                        if ret.len_digits == max_sd_in {
-                            if let Some(next_ch) = str_it.next() {
-                                match next_ch {
-                                    '0'..='9' => {
-                                        ret.past_max = true;
-                                    }
-                                    _ => {
-                                        // force conversion
-                                        // to check if its above max.
-                                        // todo: spin out convert
-                                        // into fn, call it here to try
-                                        // read val, on Ok()
-                                        // save val for reuse later
-                                        // that way on same-base in and out
-                                        // we don't needlessly convert int
-                                        // to str, we can just copy it over.
-                                        ret.check_past_max = true;
-                                        str_it.put_back(next_ch);
-                                    }
-                                }
-                                if ret.past_max {
-                                    break;
-                                }
-                            } else {
-                                ret.check_past_max = true;
-                            }
-                        }
-                    }
-                    _ => {
-                        warn_incomplete_conv(str_in);
-                        break;
-                    }
-                }
-            } else {
-                // breaks on EOL
-                break;
-            }
-        }
-        ret
-    }
-    // get a FormatPrimitive of the maximum value for the field char
-    //  and given sign
-    fn get_max(field_char: char, sign: i8) -> FormatPrimitive {
-        let mut fmt_primitive = FormatPrimitive::default();
-        fmt_primitive.pre_decimal = Some(String::from(match field_char {
-            'd' | 'i' => match sign {
-                1 => "9223372036854775807",
-                _ => {
-                    fmt_primitive.prefix = Some(String::from("-"));
-                    "9223372036854775808"
-                }
-            },
-            'x' | 'X' => "ffffffffffffffff",
-            'o' => "1777777777777777777777",
-            /* 'u' | */ _ => "18446744073709551615",
-        }));
-        fmt_primitive
-    }
-    // conv_from_segment contract:
-    // 1. takes
-    // - a string that begins with a non-zero digit, and proceeds
-    //  with zero or more following digits until the end of the string
-    // - a radix to interpret those digits as
-    // - a char that communicates:
-    //     whether to interpret+output the string as an i64 or u64
-    //     what radix to write the parsed number as.
-    // 2. parses it as a rust integral type
-    // 3. outputs FormatPrimitive with:
-    // - if the string falls within bounds:
-    //   number parsed and written in the correct radix
-    // - if the string falls outside bounds:
-    //   for i64 output, the int minimum or int max (depending on sign)
-    //   for u64 output, the u64 max in the output radix
-    fn conv_from_segment(
-        segment: &str,
-        radix_in: Base,
-        field_char: char,
-        sign: i8,
-    ) -> FormatPrimitive {
-        match field_char {
-            'i' | 'd' => match i64::from_str_radix(segment, radix_in as u32) {
-                Ok(i) => {
-                    let mut fmt_prim = FormatPrimitive::default();
-                    if sign == -1 {
-                        fmt_prim.prefix = Some(String::from("-"));
-                    }
-                    fmt_prim.pre_decimal = Some(format!("{i}"));
-                    fmt_prim
-                }
-                Err(_) => Self::get_max(field_char, sign),
-            },
-            _ => match u64::from_str_radix(segment, radix_in as u32) {
-                Ok(u) => {
-                    let mut fmt_prim = FormatPrimitive::default();
-                    let u_f = if sign == -1 { u64::MAX - (u - 1) } else { u };
-                    fmt_prim.pre_decimal = Some(match field_char {
-                        'X' => format!("{u_f:X}"),
-                        'x' => format!("{u_f:x}"),
-                        'o' => format!("{u_f:o}"),
-                        _ => format!("{u_f}"),
-                    });
-                    fmt_prim
-                }
-                Err(_) => Self::get_max(field_char, sign),
-            },
-        }
-    }
-}
-impl Formatter for Intf {
-    fn get_primitive(
-        &self,
-        field: &FormatField,
-        initial_prefix: &InitialPrefix,
-        str_in: &str,
-    ) -> Option<FormatPrimitive> {
-        let begin = initial_prefix.offset;
-
-        // get information about the string. see Intf::Analyze
-        // def above.
-        let convert_hints = Self::analyze(
-            str_in,
-            *field.field_char == 'i' || *field.field_char == 'd',
-            initial_prefix,
-        );
-        // We always will have a format primitive to return
-        Some(if convert_hints.len_digits == 0 || convert_hints.is_zero {
-            // if non-digit or end is reached before a non-zero digit
-            FormatPrimitive {
-                pre_decimal: Some(String::from("0")),
-                ..Default::default()
-            }
-        } else if !convert_hints.past_max {
-            // if the number is or may be below the bounds limit
-            let radix_out = match *field.field_char {
-                'd' | 'i' | 'u' => Base::Ten,
-                'x' | 'X' => Base::Hex,
-                /* 'o' | */ _ => Base::Octal,
-            };
-            let radix_mismatch = !radix_out.eq(&initial_prefix.radix_in);
-            let decrease_from_max: bool = initial_prefix.sign == -1 && *field.field_char != 'i';
-            let end = begin + convert_hints.len_digits as usize;
-
-            // convert to int if any one of these is true:
-            // - number of digits in int indicates it may be past max
-            // - we're subtracting from the max
-            // - we're converting the base
-            if convert_hints.check_past_max || decrease_from_max || radix_mismatch {
-                // radix of in and out is the same.
-                let segment = String::from(&str_in[begin..end]);
-                Self::conv_from_segment(
-                    &segment,
-                    initial_prefix.radix_in.clone(),
-                    *field.field_char,
-                    initial_prefix.sign,
-                )
-            } else {
-                // otherwise just do a straight string copy.
-                let mut fmt_prim = FormatPrimitive::default();
-
-                // this is here and not earlier because
-                // zero doesn't get a sign, and conv_from_segment
-                // creates its format primitive separately
-                if initial_prefix.sign == -1 && *field.field_char == 'i' {
-                    fmt_prim.prefix = Some(String::from("-"));
-                }
-                fmt_prim.pre_decimal = Some(String::from(&str_in[begin..end]));
-                fmt_prim
-            }
-        } else {
-            Self::get_max(*field.field_char, initial_prefix.sign)
-        })
-    }
-    fn primitive_to_str(&self, prim: &FormatPrimitive, field: FormatField) -> String {
-        let mut final_str: String = String::new();
-        if let Some(ref prefix) = prim.prefix {
-            final_str.push_str(prefix);
-        }
-        // integral second fields is zero-padded minimum-width
-        // which gets handled before general minimum-width
-        match prim.pre_decimal {
-            Some(ref pre_decimal) => {
-                if let Some(min) = field.second_field {
-                    let mut i = min;
-                    let len = pre_decimal.len() as u32;
-                    while i > len {
-                        final_str.push('0');
-                        i -= 1;
-                    }
-                }
-                final_str.push_str(pre_decimal);
-            }
-            None => {
-                panic!(
-                    "error, format primitives provided to int, will, incidentally under \
-                     correct behavior, always have a pre_dec value."
-                );
-            }
-        }
-        final_str
-    }
-}
diff --git a/src/uucore/src/lib/features/tokenize/num_format/formatters/mod.rs b/src/uucore/src/lib/features/tokenize/num_format/formatters/mod.rs
deleted file mode 100644
index e232300718b..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/formatters/mod.rs
+++ /dev/null
@@ -1,9 +0,0 @@
-// spell-checker:ignore (vars) charf cninetyninehexfloatf decf floatf intf scif strf Cninety
-
-mod base_conv;
-pub mod cninetyninehexfloatf;
-pub mod decf;
-mod float_common;
-pub mod floatf;
-pub mod intf;
-pub mod scif;
diff --git a/src/uucore/src/lib/features/tokenize/num_format/formatters/scif.rs b/src/uucore/src/lib/features/tokenize/num_format/formatters/scif.rs
deleted file mode 100644
index c871dc4e552..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/formatters/scif.rs
+++ /dev/null
@@ -1,43 +0,0 @@
-// spell-checker:ignore (vars) charf cninetyninehexfloatf decf floatf intf scif strf Cninety
-
-//! formatter for %e %E scientific notation subs
-use super::super::format_field::FormatField;
-use super::super::formatter::{FormatPrimitive, Formatter, InitialPrefix};
-use super::float_common::{get_primitive_dec, primitive_to_str_common, FloatAnalysis};
-
-#[derive(Default)]
-pub struct Scif;
-
-impl Scif {
-    pub fn new() -> Self {
-        Self
-    }
-}
-impl Formatter for Scif {
-    fn get_primitive(
-        &self,
-        field: &FormatField,
-        initial_prefix: &InitialPrefix,
-        str_in: &str,
-    ) -> Option<FormatPrimitive> {
-        let second_field = field.second_field.unwrap_or(6) + 1;
-        let analysis = FloatAnalysis::analyze(
-            str_in,
-            initial_prefix,
-            Some(second_field as usize + 1),
-            None,
-            false,
-        );
-        let f = get_primitive_dec(
-            initial_prefix,
-            &str_in[initial_prefix.offset..],
-            &analysis,
-            second_field as usize,
-            Some(*field.field_char == 'E'),
-        );
-        Some(f)
-    }
-    fn primitive_to_str(&self, prim: &FormatPrimitive, field: FormatField) -> String {
-        primitive_to_str_common(prim, &field)
-    }
-}
diff --git a/src/uucore/src/lib/features/tokenize/num_format/mod.rs b/src/uucore/src/lib/features/tokenize/num_format/mod.rs
deleted file mode 100644
index d40cf92deff..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/mod.rs
+++ /dev/null
@@ -1,4 +0,0 @@
-pub mod format_field;
-mod formatter;
-mod formatters;
-pub mod num_format;
diff --git a/src/uucore/src/lib/features/tokenize/num_format/num_format.rs b/src/uucore/src/lib/features/tokenize/num_format/num_format.rs
deleted file mode 100644
index c9b1178b6ac..00000000000
--- a/src/uucore/src/lib/features/tokenize/num_format/num_format.rs
+++ /dev/null
@@ -1,271 +0,0 @@
-// spell-checker:ignore (vars) charf cninetyninehexfloatf decf floatf intf scif strf Cninety
-
-//! handles creating printed output for numeric substitutions
-
-// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
-
-use std::env;
-use std::vec::Vec;
-
-use crate::display::Quotable;
-use crate::{show_error, show_warning};
-
-use super::format_field::{FieldType, FormatField};
-use super::formatter::{Base, FormatPrimitive, Formatter, InitialPrefix};
-use super::formatters::cninetyninehexfloatf::CninetyNineHexFloatf;
-use super::formatters::decf::Decf;
-use super::formatters::floatf::Floatf;
-use super::formatters::intf::Intf;
-use super::formatters::scif::Scif;
-
-pub fn warn_expected_numeric(pf_arg: &str) {
-    // important: keep println here not print
-    show_error!("{}: expected a numeric value", pf_arg.maybe_quote());
-}
-
-// when character constant arguments have excess characters
-// issue a warning when POSIXLY_CORRECT is not set
-fn warn_char_constant_ign(remaining_bytes: &[u8]) {
-    match env::var("POSIXLY_CORRECT") {
-        Ok(_) => {}
-        Err(e) => {
-            if let env::VarError::NotPresent = e {
-                show_warning!(
-                    "{:?}: character(s) following character \
-                     constant have been ignored",
-                    remaining_bytes
-                );
-            }
-        }
-    }
-}
-
-// this function looks at the first few
-// characters of an argument and returns a value if we can learn
-// a value from that (e.g. no argument? return 0, char constant? ret value)
-fn get_provided(str_in_opt: Option<&String>) -> Option<u8> {
-    const C_S_QUOTE: u8 = 39;
-    const C_D_QUOTE: u8 = 34;
-    match str_in_opt {
-        Some(str_in) => {
-            let mut byte_it = str_in.bytes();
-            if let Some(ch) = byte_it.next() {
-                match ch {
-                    C_S_QUOTE | C_D_QUOTE => {
-                        Some(match byte_it.next() {
-                            Some(second_byte) => {
-                                let mut ignored: Vec<u8> = Vec::new();
-                                for cont in byte_it {
-                                    ignored.push(cont);
-                                }
-                                if !ignored.is_empty() {
-                                    warn_char_constant_ign(&ignored);
-                                }
-                                second_byte
-                            }
-                            // no byte after quote
-                            None => {
-                                let so_far = (ch as char).to_string();
-                                warn_expected_numeric(&so_far);
-                                0_u8
-                            }
-                        })
-                    }
-                    // first byte is not quote
-                    _ => None, // no first byte
-                }
-            } else {
-                Some(0_u8)
-            }
-        }
-        None => Some(0),
-    }
-}
-
-// takes a string and returns
-// a sign,
-// a base,
-// and an offset for index after all
-//  initial spacing, sign, base prefix, and leading zeroes
-#[allow(clippy::cognitive_complexity)]
-fn get_initial_prefix(str_in: &str, field_type: &FieldType) -> InitialPrefix {
-    let mut str_it = str_in.chars();
-    let mut ret = InitialPrefix {
-        radix_in: Base::Ten,
-        sign: 1,
-        offset: 0,
-    };
-    let mut top_char = str_it.next();
-    // skip spaces and ensure top_char is the first non-space char
-    // (or None if none exists)
-    while let Some(' ') = top_char {
-        ret.offset += 1;
-        top_char = str_it.next();
-    }
-    // parse sign
-    match top_char {
-        Some('+') => {
-            ret.offset += 1;
-            top_char = str_it.next();
-        }
-        Some('-') => {
-            ret.sign = -1;
-            ret.offset += 1;
-            top_char = str_it.next();
-        }
-        _ => {}
-    }
-    // we want to exit with offset being
-    // the index of the first non-zero
-    // digit before the decimal point or
-    // if there is none, the zero before the
-    // decimal point, or, if there is none,
-    // the decimal point.
-
-    // while we are determining the offset
-    // we will ensure as a convention
-    // the offset is always on the first character
-    // that we are yet unsure if it is the
-    // final offset. If the zero could be before
-    // a decimal point we don't move past the zero.
-    let mut is_hex = false;
-    if Some('0') == top_char {
-        if let Some(base) = str_it.next() {
-            // lead zeroes can only exist in
-            // octal and hex base
-            let mut do_clean_lead_zeroes = false;
-            match base {
-                'x' | 'X' => {
-                    is_hex = true;
-                    ret.offset += 2;
-                    ret.radix_in = Base::Hex;
-                    do_clean_lead_zeroes = true;
-                }
-                e @ '0'..='9' => {
-                    ret.offset += 1;
-                    if let FieldType::Intf = *field_type {
-                        ret.radix_in = Base::Octal;
-                    }
-                    if e == '0' {
-                        do_clean_lead_zeroes = true;
-                    }
-                }
-                _ => {}
-            }
-            if do_clean_lead_zeroes {
-                let mut first = true;
-                for ch_zero in str_it {
-                    // see notes on offset above:
-                    // this is why the offset for octal and decimal numbers
-                    // that reach this branch is 1 even though
-                    // they have already eaten the characters '00'
-                    // this is also why when hex encounters its
-                    // first zero it does not move its offset
-                    // forward because it does not know for sure
-                    // that it's current offset (of that zero)
-                    // is not the final offset,
-                    // whereas at that point octal knows its
-                    // current offset is not the final offset.
-                    match ch_zero {
-                        '0' => {
-                            if !(is_hex && first) {
-                                ret.offset += 1;
-                            }
-                        }
-                        // if decimal, keep last zero if one exists
-                        // (it's possible for last zero to
-                        // not exist at this branch if we're in hex input)
-                        '.' => break,
-                        // other digit, etc.
-                        _ => {
-                            if !(is_hex && first) {
-                                ret.offset += 1;
-                            }
-                            break;
-                        }
-                    }
-                    if first {
-                        first = false;
-                    }
-                }
-            }
-        }
-    }
-    ret
-}
-
-// this is the function a Sub's print will delegate to
-// if it is a numeric field, passing the field details
-// and an iterator to the argument
-pub fn num_format(field: &FormatField, in_str_opt: Option<&String>) -> Option<String> {
-    let field_char = field.field_char;
-
-    // num format mainly operates by further delegating to one of
-    // several Formatter structs depending on the field
-    // see formatter.rs for more details
-
-    // to do switch to static dispatch
-    let formatter: Box<dyn Formatter> = match *field.field_type {
-        FieldType::Intf => Box::new(Intf::new()),
-        FieldType::Floatf => Box::new(Floatf::new()),
-        FieldType::CninetyNineHexFloatf => Box::new(CninetyNineHexFloatf::new()),
-        FieldType::Scif => Box::new(Scif::new()),
-        FieldType::Decf => Box::new(Decf::new()),
-        _ => {
-            panic!("asked to do num format with non-num field type");
-        }
-    };
-    let prim_opt=
-        // if we can get an assumed value from looking at the first
-        // few characters, use that value to create the FormatPrimitive
-        if let Some(provided_num) = get_provided(in_str_opt) {
-            let mut tmp = FormatPrimitive::default();
-            match field_char {
-                'u' | 'i' | 'd' => {
-                    tmp.pre_decimal = Some(
-                        format!("{provided_num}"));
-                },
-                'x' | 'X' => {
-                    tmp.pre_decimal = Some(
-                        format!("{provided_num:x}"));
-                },
-                'o' => {
-                    tmp.pre_decimal = Some(
-                        format!("{provided_num:o}"));
-                },
-                'e' | 'E' | 'g' | 'G' => {
-                    let as_str = format!("{provided_num}");
-                    let initial_prefix = get_initial_prefix(
-                        &as_str,
-                        field.field_type
-                    );
-                    tmp=formatter.get_primitive(field, &initial_prefix, &as_str)
-                        .expect("err during default provided num");
-                },
-                _ => {
-                    tmp.pre_decimal = Some(
-                        format!("{provided_num}"));
-                    tmp.post_decimal = Some(String::from("0"));
-                }
-            }
-            Some(tmp)
-        } else {
-            // otherwise we'll interpret the argument as a number
-            // using the appropriate Formatter
-            let in_str = in_str_opt.expect(
-                "please send the devs this message:
-                \n get_provided is failing to ret as Some(0) on no str ");
-            // first get information about the beginning of the
-            // numeric argument that would be useful for
-            // any formatter (int or float)
-            let initial_prefix = get_initial_prefix(
-                in_str,
-                field.field_type
-            );
-            // then get the FormatPrimitive from the Formatter
-            formatter.get_primitive(field, &initial_prefix, in_str)
-        };
-    // if we have a formatPrimitive, print its results
-    // according to the field-char appropriate Formatter
-    prim_opt.map(|prim| formatter.primitive_to_str(&prim, field.clone()))
-}
diff --git a/src/uucore/src/lib/features/tokenize/sub.rs b/src/uucore/src/lib/features/tokenize/sub.rs
deleted file mode 100644
index 5bdb24dc633..00000000000
--- a/src/uucore/src/lib/features/tokenize/sub.rs
+++ /dev/null
@@ -1,452 +0,0 @@
-// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
-
-//! Sub is a token that represents a
-//! segment of the format string that is a substitution
-//! it is created by Sub's implementation of the Tokenizer trait
-//! Subs which have numeric field chars make use of the num_format
-//! submodule
-use crate::error::{UError, UResult};
-use itertools::{put_back_n, PutBackN};
-use std::error::Error;
-use std::fmt::Display;
-use std::io::Write;
-use std::iter::Peekable;
-use std::process::exit;
-use std::slice::Iter;
-use std::str::Chars;
-// use std::collections::HashSet;
-
-use super::num_format::format_field::{FieldType, FormatField};
-use super::num_format::num_format;
-use super::token;
-use super::unescaped_text::UnescapedText;
-
-const EXIT_ERR: i32 = 1;
-
-#[derive(Debug)]
-pub enum SubError {
-    InvalidSpec(String),
-}
-
-impl Display for SubError {
-    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> Result<(), std::fmt::Error> {
-        match self {
-            Self::InvalidSpec(s) => write!(f, "%{s}: invalid conversion specification"),
-        }
-    }
-}
-
-impl Error for SubError {}
-
-impl UError for SubError {}
-
-fn convert_asterisk_arg_int(asterisk_arg: &str) -> isize {
-    // this is a costly way to parse the
-    // args used for asterisk values into integers
-    // from various bases. Actually doing it correctly
-    // (going through the pipeline to intf, but returning
-    // the integer instead of writing it to string and then
-    // back) is on the refactoring TODO
-    let field_type = FieldType::Intf;
-    let field_char = 'i';
-    let field_info = FormatField {
-        min_width: Some(0),
-        second_field: Some(0),
-        orig: &asterisk_arg.to_string(),
-        field_type: &field_type,
-        field_char: &field_char,
-    };
-    num_format::num_format(&field_info, Some(&asterisk_arg.to_string()))
-        .unwrap()
-        .parse::<isize>()
-        .unwrap()
-}
-
-pub enum CanAsterisk<T> {
-    Fixed(T),
-    Asterisk,
-}
-
-// Sub is a tokenizer which creates tokens
-// for substitution segments of a format string
-pub struct Sub {
-    min_width: CanAsterisk<Option<isize>>,
-    second_field: CanAsterisk<Option<u32>>,
-    field_char: char,
-    field_type: FieldType,
-    orig: String,
-    prefix_char: char,
-}
-impl Sub {
-    pub fn new(
-        min_width: CanAsterisk<Option<isize>>,
-        second_field: CanAsterisk<Option<u32>>,
-        field_char: char,
-        orig: String,
-        prefix_char: char,
-    ) -> Self {
-        // for more dry printing, field characters are grouped
-        // in initialization of token.
-        let field_type = match field_char {
-            's' | 'b' => FieldType::Strf,
-            'd' | 'i' | 'u' | 'o' | 'x' | 'X' => FieldType::Intf,
-            'f' | 'F' => FieldType::Floatf,
-            'a' | 'A' => FieldType::CninetyNineHexFloatf,
-            'e' | 'E' => FieldType::Scif,
-            'g' | 'G' => FieldType::Decf,
-            'c' => FieldType::Charf,
-            _ => {
-                // should be unreachable.
-                println!("Invalid field type");
-                exit(EXIT_ERR);
-            }
-        };
-        Self {
-            min_width,
-            second_field,
-            field_char,
-            field_type,
-            orig,
-            prefix_char,
-        }
-    }
-}
-
-#[derive(Default)]
-pub(crate) struct SubParser {
-    min_width_tmp: Option<String>,
-    min_width_is_asterisk: bool,
-    past_decimal: bool,
-    second_field_tmp: Option<String>,
-    second_field_is_asterisk: bool,
-    specifiers_found: bool,
-    field_char: Option<char>,
-    text_so_far: String,
-}
-
-impl SubParser {
-    fn new() -> Self {
-        Self::default()
-    }
-    pub(crate) fn from_it<W>(
-        writer: &mut W,
-        it: &mut PutBackN<Chars>,
-        args: &mut Peekable<Iter<String>>,
-    ) -> UResult<Option<token::Token>>
-    where
-        W: Write,
-    {
-        let mut parser = Self::new();
-        if parser.sub_vals_retrieved(it)? {
-            let t = Self::build_token(parser);
-            t.write(writer, args);
-            Ok(Some(t))
-        } else {
-            Ok(None)
-        }
-    }
-    fn build_token(parser: Self) -> token::Token {
-        // not a self method so as to allow move of sub-parser vals.
-        // return new Sub struct as token
-        let prefix_char = match &parser.min_width_tmp {
-            Some(width) if width.starts_with('0') => '0',
-            _ => ' ',
-        };
-
-        token::Token::Sub(Sub::new(
-            if parser.min_width_is_asterisk {
-                CanAsterisk::Asterisk
-            } else {
-                CanAsterisk::Fixed(
-                    parser
-                        .min_width_tmp
-                        .map(|x| x.parse::<isize>().unwrap_or(1)),
-                )
-            },
-            if parser.second_field_is_asterisk {
-                CanAsterisk::Asterisk
-            } else {
-                CanAsterisk::Fixed(parser.second_field_tmp.map(|x| x.parse::<u32>().unwrap()))
-            },
-            parser.field_char.unwrap(),
-            parser.text_so_far,
-            prefix_char,
-        ))
-    }
-    #[allow(clippy::cognitive_complexity)]
-    fn sub_vals_retrieved(&mut self, it: &mut PutBackN<Chars>) -> UResult<bool> {
-        if !Self::successfully_eat_prefix(it, &mut self.text_so_far)? {
-            return Ok(false);
-        }
-        // this fn in particular is much longer than it needs to be
-        // .could get a lot
-        // of code savings just by cleaning it up. shouldn't use a regex
-        // though, as we want to mimic the original behavior of printing
-        // the field as interpreted up until the error in the field.
-
-        let mut legal_fields = vec![
-            // 'a', 'A', //c99 hex float implementation not yet complete
-            'b', 'c', 'd', 'e', 'E', 'f', 'F', 'g', 'G', 'i', 'o', 's', 'u', 'x', 'X',
-        ];
-        let mut specifiers = vec!['h', 'j', 'l', 'L', 't', 'z'];
-        legal_fields.sort_unstable();
-        specifiers.sort_unstable();
-
-        // divide substitution from %([0-9]+)?(.[0-9+])?([a-zA-Z])
-        // into min_width, second_field, field_char
-        for ch in it {
-            self.text_so_far.push(ch);
-            match ch {
-                '-' | '*' | '0'..='9' => {
-                    if self.past_decimal {
-                        // second field should never have a
-                        // negative value
-                        if self.second_field_is_asterisk || ch == '-' || self.specifiers_found {
-                            return Err(SubError::InvalidSpec(self.text_so_far.clone()).into());
-                        }
-                        if self.second_field_tmp.is_none() {
-                            self.second_field_tmp = Some(String::new());
-                        }
-                        match self.second_field_tmp.as_mut() {
-                            Some(x) => {
-                                if ch == '*' && !x.is_empty() {
-                                    return Err(
-                                        SubError::InvalidSpec(self.text_so_far.clone()).into()
-                                    );
-                                }
-                                if ch == '*' {
-                                    self.second_field_is_asterisk = true;
-                                }
-                                x.push(ch);
-                            }
-                            None => {
-                                panic!("should be unreachable");
-                            }
-                        }
-                    } else {
-                        if self.min_width_is_asterisk || self.specifiers_found {
-                            return Err(SubError::InvalidSpec(self.text_so_far.clone()).into());
-                        }
-                        if self.min_width_tmp.is_none() {
-                            self.min_width_tmp = Some(String::new());
-                        }
-                        match self.min_width_tmp.as_mut() {
-                            Some(x) => {
-                                if (ch == '-' || ch == '*') && !x.is_empty() {
-                                    return Err(
-                                        SubError::InvalidSpec(self.text_so_far.clone()).into()
-                                    );
-                                }
-                                if ch == '*' {
-                                    self.min_width_is_asterisk = true;
-                                }
-                                x.push(ch);
-                            }
-                            None => {
-                                panic!("should be unreachable");
-                            }
-                        }
-                    }
-                }
-                '.' => {
-                    if self.past_decimal {
-                        return Err(SubError::InvalidSpec(self.text_so_far.clone()).into());
-                    } else {
-                        self.past_decimal = true;
-                    }
-                }
-                x if legal_fields.binary_search(&x).is_ok() => {
-                    self.field_char = Some(ch);
-                    self.text_so_far.push(ch);
-                    break;
-                }
-                x if specifiers.binary_search(&x).is_ok() => {
-                    if !self.past_decimal {
-                        self.past_decimal = true;
-                    }
-                    if !self.specifiers_found {
-                        self.specifiers_found = true;
-                    }
-                }
-                _ => {
-                    return Err(SubError::InvalidSpec(self.text_so_far.clone()).into());
-                }
-            }
-        }
-        if self.field_char.is_none() {
-            return Err(SubError::InvalidSpec(self.text_so_far.clone()).into());
-        }
-        let field_char_retrieved = self.field_char.unwrap();
-        if self.past_decimal && self.second_field_tmp.is_none() {
-            self.second_field_tmp = Some(String::from("0"));
-        }
-        self.validate_field_params(field_char_retrieved)?;
-        // if the dot is provided without a second field
-        // printf interprets it as 0.
-        if let Some(x) = self.second_field_tmp.as_mut() {
-            if x.is_empty() {
-                self.min_width_tmp = Some(String::from("0"));
-            }
-        }
-
-        Ok(true)
-    }
-    fn successfully_eat_prefix(
-        it: &mut PutBackN<Chars>,
-        text_so_far: &mut String,
-    ) -> UResult<bool> {
-        // get next two chars,
-        // if they're '%%' we're not tokenizing it
-        // else put chars back
-        let preface = it.next();
-        let n_ch = it.next();
-        if preface == Some('%') && n_ch != Some('%') {
-            match n_ch {
-                Some(x) => {
-                    it.put_back(x);
-                    Ok(true)
-                }
-                None => {
-                    text_so_far.push('%');
-                    Err(SubError::InvalidSpec(text_so_far.clone()).into())
-                }
-            }
-        } else {
-            if let Some(x) = n_ch {
-                it.put_back(x);
-            };
-            if let Some(x) = preface {
-                it.put_back(x);
-            };
-            Ok(false)
-        }
-    }
-    fn validate_field_params(&self, field_char: char) -> UResult<()> {
-        // check for illegal combinations here when possible vs
-        // on each application so we check less per application
-        // to do: move these checks to Sub::new
-        if (field_char == 's' && self.min_width_tmp == Some(String::from("0")))
-            || (field_char == 'c'
-                && (self.min_width_tmp == Some(String::from("0")) || self.past_decimal))
-            || (field_char == 'b'
-                && (self.min_width_tmp.is_some()
-                    || self.past_decimal
-                    || self.second_field_tmp.is_some()))
-        {
-            // invalid string substitution
-            // to do: include information about an invalid
-            // string substitution
-            return Err(SubError::InvalidSpec(self.text_so_far.clone()).into());
-        }
-        Ok(())
-    }
-}
-
-impl Sub {
-    #[allow(clippy::cognitive_complexity)]
-    pub(crate) fn write<W>(&self, writer: &mut W, pf_args_it: &mut Peekable<Iter<String>>)
-    where
-        W: Write,
-    {
-        let field = FormatField {
-            min_width: match self.min_width {
-                CanAsterisk::Fixed(x) => x,
-                CanAsterisk::Asterisk => {
-                    match pf_args_it.next() {
-                        // temporary, use intf.rs instead
-                        Some(x) => Some(convert_asterisk_arg_int(x)),
-                        None => Some(0),
-                    }
-                }
-            },
-            second_field: match self.second_field {
-                CanAsterisk::Fixed(x) => x,
-                CanAsterisk::Asterisk => {
-                    match pf_args_it.next() {
-                        // temporary, use intf.rs instead
-                        Some(x) => {
-                            let result = convert_asterisk_arg_int(x);
-                            if result < 0 {
-                                None
-                            } else {
-                                Some(result as u32)
-                            }
-                        }
-                        None => Some(0),
-                    }
-                }
-            },
-            field_char: &self.field_char,
-            field_type: &self.field_type,
-            orig: &self.orig,
-        };
-        let pf_arg = pf_args_it.next();
-
-        // minimum width is handled independently of actual
-        // field char
-        let pre_min_width_opt: Option<String> = match *field.field_type {
-            // if %s just return arg
-            // if %b use UnescapedText module's unescape-fn
-            // if %c return first char of arg
-            FieldType::Strf | FieldType::Charf => {
-                match pf_arg {
-                    Some(arg_string) => {
-                        match *field.field_char {
-                            's' => Some(match field.second_field {
-                                Some(max) => String::from(&arg_string[..max as usize]),
-                                None => arg_string.clone(),
-                            }),
-                            'b' => {
-                                let mut a_it = put_back_n(arg_string.chars());
-                                UnescapedText::from_it_core(writer, &mut a_it, true);
-                                None
-                            }
-                            // for 'c': get iter of string vals,
-                            // get opt<char> of first val
-                            // and map it to opt<String>
-                            /* 'c' | */
-                            _ => arg_string.chars().next().map(|x| x.to_string()),
-                        }
-                    }
-                    None => None,
-                }
-            }
-            _ => {
-                // non string/char fields are delegated to num_format
-                num_format::num_format(&field, pf_arg)
-            }
-        };
-        if let Some(pre_min_width) = pre_min_width_opt {
-            // if have a string, print it, ensuring minimum width is met.
-            write!(
-                writer,
-                "{}",
-                match field.min_width {
-                    Some(min_width) => {
-                        let diff: isize = min_width.abs() - pre_min_width.len() as isize;
-                        if diff > 0 {
-                            let mut final_str = String::new();
-                            // definitely more efficient ways
-                            //  to do this.
-                            let pad_before = min_width > 0;
-                            if !pad_before {
-                                final_str.push_str(&pre_min_width);
-                            }
-                            for _ in 0..diff {
-                                final_str.push(self.prefix_char);
-                            }
-                            if pad_before {
-                                final_str.push_str(&pre_min_width);
-                            }
-                            final_str
-                        } else {
-                            pre_min_width
-                        }
-                    }
-                    None => pre_min_width,
-                }
-            )
-            .ok();
-        }
-    }
-}
diff --git a/src/uucore/src/lib/features/tokenize/token.rs b/src/uucore/src/lib/features/tokenize/token.rs
deleted file mode 100644
index b522c99a4e0..00000000000
--- a/src/uucore/src/lib/features/tokenize/token.rs
+++ /dev/null
@@ -1,39 +0,0 @@
-//! Traits and enums dealing with Tokenization of printf Format String
-use std::io::Write;
-use std::iter::Peekable;
-use std::slice::Iter;
-
-use crate::features::tokenize::sub::Sub;
-use crate::features::tokenize::unescaped_text::UnescapedText;
-
-// A token object is an object that can print the expected output
-// of a contiguous segment of the format string, and
-// requires at most 1 argument
-pub enum Token {
-    Sub(Sub),
-    UnescapedText(UnescapedText),
-}
-
-impl Token {
-    pub(crate) fn write<W>(&self, writer: &mut W, args: &mut Peekable<Iter<String>>)
-    where
-        W: Write,
-    {
-        match self {
-            Self::Sub(sub) => sub.write(writer, args),
-            Self::UnescapedText(unescaped_text) => unescaped_text.write(writer),
-        }
-    }
-}
-
-// A tokenizer object is an object that takes an iterator
-// at a position in a format string, and sees whether
-// it can return a token of a type it knows how to produce
-// if so, return the token, move the iterator past the
-// format string text the token represents, and if an
-// argument is used move the argument iter forward one
-
-// creating token of a format string segment should also cause
-// printing of that token's value. Essentially tokenizing
-// a whole format string will print the format string and consume
-// a number of arguments equal to the number of argument-using tokens
diff --git a/src/uucore/src/lib/features/tokenize/unescaped_text.rs b/src/uucore/src/lib/features/tokenize/unescaped_text.rs
deleted file mode 100644
index 29c657ed863..00000000000
--- a/src/uucore/src/lib/features/tokenize/unescaped_text.rs
+++ /dev/null
@@ -1,279 +0,0 @@
-//! UnescapedText is a tokenizer impl
-//! for tokenizing character literals,
-//! and escaped character literals (of allowed escapes),
-//! into an unescaped text byte array
-
-// spell-checker:ignore (ToDO) retval hexchars octals printf's bvec vals coreutil addchar eval bytecode bslice
-
-use itertools::PutBackN;
-use std::char::from_u32;
-use std::io::Write;
-use std::process::exit;
-use std::str::Chars;
-
-use super::token;
-
-const EXIT_OK: i32 = 0;
-const EXIT_ERR: i32 = 1;
-
-// by default stdout only flushes
-// to console when a newline is passed.
-macro_rules! write_and_flush {
-    ($writer:expr, $($args:tt)+) => ({
-        write!($writer, "{}", $($args)+).ok();
-        $writer.flush().ok();
-    })
-}
-
-fn flush_bytes<W>(writer: &mut W, bslice: &[u8])
-where
-    W: Write,
-{
-    writer.write_all(bslice).ok();
-    writer.flush().ok();
-}
-
-#[derive(Default)]
-pub struct UnescapedText(Vec<u8>);
-impl UnescapedText {
-    fn new() -> Self {
-        Self::default()
-    }
-    // take an iterator to the format string
-    // consume between min and max chars
-    // and return it as a base-X number
-    fn base_to_u32(min_chars: u8, max_chars: u8, base: u32, it: &mut PutBackN<Chars>) -> u32 {
-        let mut retval: u32 = 0;
-        let mut found = 0;
-        while found < max_chars {
-            // if end of input break
-            let nc = it.next();
-            match nc {
-                Some(digit) => {
-                    // if end of hexchars break
-                    match digit.to_digit(base) {
-                        Some(d) => {
-                            found += 1;
-                            retval *= base;
-                            retval += d;
-                        }
-                        None => {
-                            it.put_back(digit);
-                            break;
-                        }
-                    }
-                }
-                None => {
-                    break;
-                }
-            }
-        }
-        if found < min_chars {
-            // only ever expected for hex
-            println!("missing hexadecimal number in escape"); //todo stderr
-            exit(EXIT_ERR);
-        }
-        retval
-    }
-    // validates against valid
-    // IEC 10646 vals - these values
-    // are pinned against the more popular
-    // printf so as to not disrupt when
-    // dropped-in as a replacement.
-    fn validate_iec(val: u32, eight_word: bool) {
-        let mut preface = 'u';
-        let leading_zeros = if eight_word {
-            preface = 'U';
-            8
-        } else {
-            4
-        };
-        let err_msg = format!("invalid universal character name {preface}{val:0leading_zeros$x}");
-        if (val < 159 && (val != 36 && val != 64 && val != 96)) || (val > 55296 && val < 57343) {
-            println!("{err_msg}"); //todo stderr
-            exit(EXIT_ERR);
-        }
-    }
-    // pass an iterator that succeeds an '/',
-    // and process the remaining character
-    // adding the unescaped bytes
-    // to the passed byte_vec
-    // in subs_mode change octal behavior
-    fn handle_escaped<W>(
-        writer: &mut W,
-        byte_vec: &mut Vec<u8>,
-        it: &mut PutBackN<Chars>,
-        subs_mode: bool,
-    ) where
-        W: Write,
-    {
-        let ch = it.next().unwrap_or('\\');
-        match ch {
-            '0'..='9' | 'x' => {
-                let min_len = 1;
-                let mut max_len = 2;
-                let mut base = 16;
-                let ignore = false;
-                match ch {
-                    'x' => {}
-                    e @ '0'..='9' => {
-                        max_len = 3;
-                        base = 8;
-                        // in practice, gnu coreutils printf
-                        // interprets octals without a
-                        // leading zero in %b
-                        // but it only skips leading zeros
-                        // in %b mode.
-                        // if we ever want to match gnu coreutil
-                        // printf's docs instead of its behavior
-                        // we'd set this to true.
-                        // if subs_mode && e != '0'
-                        //  { ignore = true; }
-                        if !subs_mode || e != '0' {
-                            it.put_back(ch);
-                        }
-                    }
-                    _ => {}
-                }
-                if ignore {
-                    byte_vec.push(ch as u8);
-                } else {
-                    let val = (Self::base_to_u32(min_len, max_len, base, it) % 256) as u8;
-                    byte_vec.push(val);
-                    let bvec = [val];
-                    flush_bytes(writer, &bvec);
-                }
-            }
-            e => {
-                // only for hex and octal
-                // is byte encoding specified.
-                // otherwise, why not leave the door open
-                // for other encodings unless it turns out
-                // a bottleneck.
-                let mut s = String::new();
-                let ch = match e {
-                    '\\' => '\\',
-                    '"' => '"',
-                    'n' => '\n',
-                    'r' => '\r',
-                    't' => '\t',
-                    // bell
-                    'a' => '\x07',
-                    // backspace
-                    'b' => '\x08',
-                    // vertical tab
-                    'v' => '\x0B',
-                    // form feed
-                    'f' => '\x0C',
-                    // escape character
-                    'e' => '\x1B',
-                    'c' => exit(EXIT_OK),
-                    'u' | 'U' => {
-                        let len = match e {
-                            'u' => 4,
-                            /* 'U' | */ _ => 8,
-                        };
-                        let val = Self::base_to_u32(len, len, 16, it);
-                        Self::validate_iec(val, false);
-                        if let Some(c) = from_u32(val) {
-                            c
-                        } else {
-                            '-'
-                        }
-                    }
-                    _ => {
-                        s.push('\\');
-                        ch
-                    }
-                };
-                s.push(ch);
-                write_and_flush!(writer, &s);
-                byte_vec.extend(s.bytes());
-            }
-        };
-    }
-
-    // take an iterator to a string,
-    // and return a wrapper around a Vec<u8> of unescaped bytes
-    // break on encounter of sub symbol ('%[^%]') unless called
-    // through %b subst.
-    #[allow(clippy::cognitive_complexity)]
-    pub fn from_it_core<W>(
-        writer: &mut W,
-        it: &mut PutBackN<Chars>,
-        subs_mode: bool,
-    ) -> Option<token::Token>
-    where
-        W: Write,
-    {
-        let mut addchar = false;
-        let mut new_text = Self::new();
-        let mut tmp_str = String::new();
-        {
-            let new_vec: &mut Vec<u8> = &mut (new_text.0);
-            while let Some(ch) = it.next() {
-                if !addchar {
-                    addchar = true;
-                }
-                match ch {
-                    x if x != '\\' && x != '%' => {
-                        // lazy branch eval
-                        // remember this fn could be called
-                        // many times in a single exec through %b
-                        write_and_flush!(writer, ch);
-                        tmp_str.push(ch);
-                    }
-                    '\\' => {
-                        // the literal may be a literal bytecode
-                        // and not valid utf-8. Str only supports
-                        // valid utf-8.
-                        // if we find the unnecessary drain
-                        // on non hex or octal escapes is costly
-                        // then we can make it faster/more complex
-                        // with as-necessary draining.
-                        if !tmp_str.is_empty() {
-                            new_vec.extend(tmp_str.bytes());
-                            tmp_str = String::new();
-                        }
-                        Self::handle_escaped(writer, new_vec, it, subs_mode);
-                    }
-                    x if x == '%' && !subs_mode => {
-                        if let Some(follow) = it.next() {
-                            if follow == '%' {
-                                write_and_flush!(writer, ch);
-                                tmp_str.push(ch);
-                            } else {
-                                it.put_back(follow);
-                                it.put_back(ch);
-                                break;
-                            }
-                        } else {
-                            it.put_back(ch);
-                            break;
-                        }
-                    }
-                    _ => {
-                        write_and_flush!(writer, ch);
-                        tmp_str.push(ch);
-                    }
-                }
-            }
-            if !tmp_str.is_empty() {
-                new_vec.extend(tmp_str.bytes());
-            }
-        }
-        if addchar {
-            Some(token::Token::UnescapedText(new_text))
-        } else {
-            None
-        }
-    }
-}
-impl UnescapedText {
-    pub(crate) fn write<W>(&self, writer: &mut W)
-    where
-        W: Write,
-    {
-        flush_bytes(writer, &self.0[..]);
-    }
-}
diff --git a/src/uucore/src/lib/lib.rs b/src/uucore/src/lib/lib.rs
index ca9a48d258a..7f5cc99db34 100644
--- a/src/uucore/src/lib/lib.rs
+++ b/src/uucore/src/lib/lib.rs
@@ -44,8 +44,8 @@ pub use crate::features::fs;
 pub use crate::features::fsext;
 #[cfg(feature = "lines")]
 pub use crate::features::lines;
-#[cfg(feature = "memo")]
-pub use crate::features::memo;
+#[cfg(feature = "format")]
+pub use crate::features::format;
 #[cfg(feature = "ringbuffer")]
 pub use crate::features::ringbuffer;
 #[cfg(feature = "sum")]

From 66eb64e41f1da4c32d692da957847c09eb478e17 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Wed, 2 Aug 2023 23:57:53 +0200
Subject: [PATCH 004/429] dd, printf, seq: update to new printf

---
 src/uu/dd/Cargo.toml        |  2 +-
 src/uu/dd/src/progress.rs   |  2 +-
 src/uu/printf/Cargo.toml    |  2 +-
 src/uu/printf/src/printf.rs |  2 +-
 src/uu/seq/Cargo.toml       |  2 +-
 src/uu/seq/src/seq.rs       | 19 +++++--------------
 6 files changed, 10 insertions(+), 19 deletions(-)

diff --git a/src/uu/dd/Cargo.toml b/src/uu/dd/Cargo.toml
index 0a69ae37435..aa19dc760e1 100644
--- a/src/uu/dd/Cargo.toml
+++ b/src/uu/dd/Cargo.toml
@@ -18,7 +18,7 @@ path = "src/dd.rs"
 clap = { workspace = true }
 gcd = { workspace = true }
 libc = { workspace = true }
-uucore = { workspace = true, features = ["memo"] }
+uucore = { workspace = true, features = ["format"] }
 
 [target.'cfg(any(target_os = "linux"))'.dependencies]
 nix = { workspace = true, features = ["fs"] }
diff --git a/src/uu/dd/src/progress.rs b/src/uu/dd/src/progress.rs
index a9d29ff6325..674d90984ca 100644
--- a/src/uu/dd/src/progress.rs
+++ b/src/uu/dd/src/progress.rs
@@ -14,7 +14,7 @@ use std::sync::mpsc;
 use std::time::Duration;
 
 use uucore::error::UResult;
-use uucore::memo::sprintf;
+use uucore::format::sprintf;
 
 use crate::numbers::{to_magnitude_and_suffix, SuffixType};
 
diff --git a/src/uu/printf/Cargo.toml b/src/uu/printf/Cargo.toml
index eefcf33c07e..9acd2c78c9d 100644
--- a/src/uu/printf/Cargo.toml
+++ b/src/uu/printf/Cargo.toml
@@ -16,7 +16,7 @@ path = "src/printf.rs"
 
 [dependencies]
 clap = { workspace = true }
-uucore = { workspace = true, features = ["memo"] }
+uucore = { workspace = true, features = ["format"] }
 
 [[bin]]
 name = "printf"
diff --git a/src/uu/printf/src/printf.rs b/src/uu/printf/src/printf.rs
index bf79369ccab..042e0932eaf 100644
--- a/src/uu/printf/src/printf.rs
+++ b/src/uu/printf/src/printf.rs
@@ -4,7 +4,7 @@
 
 use clap::{crate_version, Arg, ArgAction, Command};
 use uucore::error::{UResult, UUsageError};
-use uucore::memo::printf;
+use uucore::format::printf;
 use uucore::{format_usage, help_about, help_section, help_usage};
 
 const VERSION: &str = "version";
diff --git a/src/uu/seq/Cargo.toml b/src/uu/seq/Cargo.toml
index 2646d36095d..41b42ef83a4 100644
--- a/src/uu/seq/Cargo.toml
+++ b/src/uu/seq/Cargo.toml
@@ -20,7 +20,7 @@ bigdecimal = { workspace = true }
 clap = { workspace = true }
 num-bigint = { workspace = true }
 num-traits = { workspace = true }
-uucore = { workspace = true, features = ["memo"] }
+uucore = { workspace = true, features = ["format"] }
 
 [[bin]]
 name = "seq"
diff --git a/src/uu/seq/src/seq.rs b/src/uu/seq/src/seq.rs
index 2e55efa4ada..0dd65fc3f24 100644
--- a/src/uu/seq/src/seq.rs
+++ b/src/uu/seq/src/seq.rs
@@ -4,15 +4,12 @@
 //  * file that was distributed with this source code.
 // spell-checker:ignore (ToDO) istr chiter argptr ilen extendedbigdecimal extendedbigint numberparse
 use std::io::{stdout, ErrorKind, Write};
-use std::process::exit;
 
 use clap::{crate_version, Arg, ArgAction, Command};
 use num_traits::Zero;
 
-use uucore::error::FromIo;
 use uucore::error::UResult;
-use uucore::memo::printf;
-use uucore::show;
+use uucore::format::printf;
 use uucore::{format_usage, help_about, help_usage};
 
 mod error;
@@ -251,7 +248,7 @@ fn print_seq(
     pad: bool,
     padding: usize,
     format: Option<&str>,
-) -> std::io::Result<()> {
+) -> UResult<()> {
     let stdout = stdout();
     let mut stdout = stdout.lock();
     let (first, increment, last) = range;
@@ -277,10 +274,7 @@ fn print_seq(
         match format {
             Some(f) => {
                 let s = format!("{value}");
-                if let Err(x) = printf(f, &[s]) {
-                    show!(x);
-                    exit(1);
-                }
+                printf(f, &[s])?;
             }
             None => write_value_float(
                 &mut stdout,
@@ -322,7 +316,7 @@ fn print_seq_integers(
     pad: bool,
     padding: usize,
     format: Option<&str>,
-) -> std::io::Result<()> {
+) -> UResult<()> {
     let stdout = stdout();
     let mut stdout = stdout.lock();
     let (first, increment, last) = range;
@@ -342,10 +336,7 @@ fn print_seq_integers(
         match format {
             Some(f) => {
                 let s = format!("{value}");
-                if let Err(x) = printf(f, &[s]) {
-                    show!(x);
-                    exit(1);
-                }
+                printf(f, &[s])?;
             }
             None => write_value_int(&mut stdout, &value, padding, pad, is_first_iteration)?,
         }

From 407bccc54f48dc54ab28fdc10da0c4ecd9c5c805 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Thu, 10 Aug 2023 23:20:20 +0200
Subject: [PATCH 005/429] some more work on printf spec

---
 src/uucore/src/lib/features/format/spec.rs | 78 +++++++++++++++++-----
 1 file changed, 60 insertions(+), 18 deletions(-)

diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index 4319e44d93f..d1786c3d36f 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -358,20 +358,28 @@ impl Spec {
                     return Err(FormatError::InvalidArgument(arg));
                 };
 
-                match positive_sign {
-                    PositiveSign::None => Ok(()),
-                    PositiveSign::Plus => write!(writer, "+"),
-                    PositiveSign::Space => write!(writer, " "),
+                if f.is_sign_positive() {
+                    match positive_sign {
+                        PositiveSign::None => Ok(()),
+                        PositiveSign::Plus => write!(writer, "+"),
+                        PositiveSign::Space => write!(writer, " "),
+                    }
+                    .map_err(FormatError::IoError)?;
                 }
-                .map_err(FormatError::IoError)?;
 
                 let s = match variant {
-                    FloatVariant::Decimal => format_float_decimal(f, precision, case, force_decimal),
+                    FloatVariant::Decimal => {
+                        format_float_decimal(f, precision, case, force_decimal)
+                    }
                     FloatVariant::Scientific => {
                         format_float_scientific(f, precision, case, force_decimal)
                     }
-                    FloatVariant::Shortest => format_float_shortest(f, precision, case, force_decimal),
-                    FloatVariant::Hexadecimal => todo!(),
+                    FloatVariant::Shortest => {
+                        format_float_shortest(f, precision, case, force_decimal)
+                    }
+                    FloatVariant::Hexadecimal => {
+                        format_float_hexadecimal(f, precision, case, force_decimal)
+                    }
                 };
 
                 match alignment {
@@ -385,6 +393,15 @@ impl Spec {
     }
 }
 
+fn format_float_nonfinite(f: f64, case: Case) -> String {
+    debug_assert!(!f.is_finite());
+    let mut s = format!("{f}");
+    if case == Case::Uppercase {
+        s.make_ascii_uppercase();
+    }
+    return s;
+}
+
 fn format_float_decimal(
     f: f64,
     precision: usize,
@@ -392,11 +409,7 @@ fn format_float_decimal(
     force_decimal: ForceDecimal,
 ) -> String {
     if !f.is_finite() {
-        let mut s = format!("{f}");
-        if case == Case::Lowercase {
-            s.make_ascii_uppercase();
-        }
-        return s;
+        return format_float_nonfinite(f, case);
     }
 
     if precision == 0 && force_decimal == ForceDecimal::Yes {
@@ -414,11 +427,7 @@ fn format_float_scientific(
 ) -> String {
     // If the float is NaN, -Nan, Inf or -Inf, format like any other float
     if !f.is_finite() {
-        let mut s = format!("{f}");
-        if case == Case::Lowercase {
-            s.make_ascii_uppercase();
-        }
-        return s;
+        return format_float_nonfinite(f, case);
     }
 
     let exponent: i32 = f.log10().floor() as i32;
@@ -458,6 +467,39 @@ fn format_float_shortest(
     }
 }
 
+fn format_float_hexadecimal(
+    f: f64,
+    precision: usize,
+    case: Case,
+    force_decimal: ForceDecimal,
+) -> String {
+    if !f.is_finite() {
+        return format_float_nonfinite(f, case);
+    }
+
+    let (first_digit, mantissa, exponent) = if f == 0.0 {
+        (0, 0, 0)
+    } else {
+        let bits = f.to_bits();
+        let exponent_bits = ((bits >> 52) & 0x7fff) as i64;
+        let exponent = exponent_bits - 1023;
+        let mantissa = bits & 0xf_ffff_ffff_ffff;
+        (1, mantissa, exponent)
+    };
+
+    let mut s = match (precision, force_decimal) {
+        (0, ForceDecimal::No) => format!("0x{first_digit}p{exponent:+x}"),
+        (0, ForceDecimal::Yes) => format!("0x{first_digit}.p{exponent:+x}"),
+        _ => format!("0x{first_digit}.{mantissa:0>13x}p{exponent:+x}")
+    };
+
+    if case == Case::Uppercase {
+        s.make_ascii_uppercase();
+    }
+
+    return s;
+}
+
 fn resolve_asterisk(
     option: Option<CanAsterisk<usize>>,
     args: impl Iterator<Item = FormatArgument>,

From df6193f84c62666d9ba79ec9bf3bb3adb3f1bc36 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Sun, 24 Sep 2023 15:40:35 +0200
Subject: [PATCH 006/429] clean up deps.nu

---
 util/deps.nu | 81 ++++++++++++++++++----------------------------------
 1 file changed, 28 insertions(+), 53 deletions(-)

diff --git a/util/deps.nu b/util/deps.nu
index a35e2d98c96..368048fff45 100644
--- a/util/deps.nu
+++ b/util/deps.nu
@@ -20,11 +20,11 @@
 #  - `normal_dep`: whether the crate is a normal dependency.
 #  - `build_dep`: whether the crate is a build dependency.
 #  - `dev_dep`: whether the crate is a dev dependency.
-#  - `organisation`: the GitHub/GitLab organisation or user of the repository of the crate.
+#  - `organization`: the GitHub/GitLab organization or user of the repository of the crate.
 #  - `repository_name`: the name of the repository the crate is in. The format is "{owner}/{repo}".
 #  - `dependencies`: direct dependencies of the crate (in the format of Cargo.lock).
 #
-# To use this script, start nushell (tested only on version 0.82.0), import the library and
+# To use this script, start Nushell (tested only on version 0.82.0), import the library and
 # call `all_dep_info`:
 #
 # ```
@@ -33,19 +33,19 @@
 # > let dep = (deps all_dep_info)
 # ```
 #
-# Then you can perform analysis. For example, to group the dependencies by organisation:
+# Then you can perform analysis. For example, to group the dependencies by organization:
 #
 # ```
-# > $dep | group-by organisation   
+# > $dep | group-by organization
 # ```
 #
 # Or to find all crates with multiple versions (like cargo deny):
 # ```
-# > $dep | where num_versions > 1   
+# > $dep | where num_versions > 1
 # ```
 #
 # Ideas to expand this:
-# 
+#
 #  - Figure out the whole dependency graph
 #  - Figure out which platforms and which features enable which crates
 #  - Figure out which utils require which crates
@@ -58,61 +58,37 @@
 #  - Check the number of owners/contributors
 #  - Make a webpage to more easily explore the data
 
-# Read the packages a Cargo.lock file
-def read_lockfile [name: path] {
-    open $name | from toml | get package
-}
-
 # Read the names output by cargo tree
-export def read_tree_names [edges: string, features: string] {
-    cargo tree -e $edges --features $features
-    | rg "[a-zA-Z0-9_-]+ v[0-9.]+" -o
-    | lines
-    | each {|x| parse_name_and_version $x }
-}
-
-def parse_name_and_version [s: string] {
-    let s = ($s | split row " ")
-
-    let name = $s.0
-    let version = if ($s | length) > 1 {
-        $s.1 | str substring 1..
-    } else {
-        ""
-    }
-
-    {name: $name, version: $version}
+export def read_tree_names [edge_kind: string, features: list<string>]: any -> table<> {
+    cargo tree --edges $edge_kind --features ($features | str join ",")
+        | parse -r "(?P<name>[a-zA-Z0-9_-]+) v(?P<version>[0-9.]+)"
 }
 
 # Read the crates.io info for a list of crates names
-def read_crates_io [names: list<string>] {
-    let total = ($names | length)
-    $names | enumerate | par-each {|el|
-        let key = $el.index
-        let name = $el.item
-        print $"($key)/($total): ($name)"
-        http get $"https://crates.io/api/v1/crates/($name)" | get crate
+def read_crates_io [names: list<string>] -> any -> table<> {
+    let total = $names | length
+    $names | enumerate | par-each {|name|
+        print $"($name.index)/($total): ($name.item)"
+        http get $"https://crates.io/api/v1/crates/($name.item)" | get crate
     }
 }
 
-def in_table [col_name, table] {
-    insert $col_name {|el|
-        $table
-        | any {|table_el|
-            $table_el.name == $el.name and $table_el.version == $el.version }
-        }
-}
-
 # Add column for a dependency type
-def add_dep_type [dep_type: string, features: string] {
-    in_table $"($dep_type)_dep" (read_tree_names $dep_type $features)
+def add_dep_type [dep_type: string, features: list<string>]: table<> -> table<> {
+    let input_table = $in
+    let table = read_tree_names $dep_type $features
+    $input_table | insert $"($dep_type)_dep" {|outer|
+        $table | any {|inner|
+            $inner.name == $outer.name and $inner.version == $outer.version
+        }
+    }
 }
 
 export def all_dep_info [] {
-    let features = unix,feat_selinux
-
-    let lock = (read_lockfile Cargo.lock)
+    let features = [unix, feat_selinux]
 
+    let lock = open Cargo.lock | from toml | get package
+    
     $lock
     # Add number of versions
     | join ($lock | group-by name | transpose | update column1 { length } | rename name num_versions) name
@@ -124,10 +100,10 @@ export def all_dep_info [] {
     # Add crates.io info
     | join (read_crates_io ($lock.name | uniq)) name
     # Add GH org or user info
-    # The organisation is an indicator that crates should be treated as one dependency.
-    # However, there are also unrelated projects by a single organisation, so it's not
+    # The organization is an indicator that crates should be treated as one dependency.
+    # However, there are also unrelated projects by a single organization, so it's not
     # clear.
-    | insert organisation {|x|
+    | insert organization {|x|
         let repository = $x.repository?
         if ($repository == null) { "" } else {
             $repository | url parse | get path | path split | get 1
@@ -152,4 +128,3 @@ export def all_dep_info [] {
         }
     }
 }
-

From 94492c98a52bbb9b406ebe9599319796553d5300 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 20 Oct 2023 09:40:09 +0200
Subject: [PATCH 007/429] cp: --rem don't fail if dest is hardlink to source

---
 src/uu/cp/src/cp.rs      | 13 +++++++++++--
 tests/by-util/test_cp.rs | 18 ++++++++++++++++++
 2 files changed, 29 insertions(+), 2 deletions(-)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index da9918365ff..5441e88ed39 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -33,8 +33,8 @@ use platform::copy_on_write;
 use uucore::display::Quotable;
 use uucore::error::{set_exit_code, UClapError, UError, UResult, UUsageError};
 use uucore::fs::{
-    canonicalize, is_symlink_loop, paths_refer_to_same_file, FileInformation, MissingHandling,
-    ResolveMode,
+    are_hardlinks_to_same_file, canonicalize, is_symlink_loop, paths_refer_to_same_file,
+    FileInformation, MissingHandling, ResolveMode,
 };
 use uucore::{backup_control, update_control};
 // These are exposed for projects (e.g. nushell) that want to create an `Options` value, which
@@ -1657,6 +1657,15 @@ fn copy_file(
         }
     }
 
+    if are_hardlinks_to_same_file(source, dest)
+        && matches!(
+            options.overwrite,
+            OverwriteMode::Clobber(ClobberMode::RemoveDestination)
+        )
+    {
+        fs::remove_file(dest)?;
+    }
+
     if file_or_link_exists(dest) {
         handle_existing_dest(source, dest, options, source_in_command_line)?;
     }
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index b3cc3e0c12c..7d3ebfa709c 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -2827,6 +2827,24 @@ fn test_cp_mode_hardlink_no_dereference() {
     assert_eq!(at.read_symlink("z"), "slink");
 }
 
+#[cfg(not(any(windows, target_os = "android")))]
+#[test]
+fn test_remove_destination_with_destination_being_a_hardlink_to_source() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    let file = "file";
+    let hardlink = "hardlink";
+
+    at.touch(file);
+    at.hard_link(file, hardlink);
+
+    ucmd.args(&["--remove-destination", file, hardlink])
+        .succeeds();
+
+    assert_eq!("", at.resolve_link(hardlink));
+    assert!(at.file_exists(file));
+    assert!(at.file_exists(hardlink));
+}
+
 #[test]
 fn test_remove_destination_with_destination_being_a_symlink_to_source() {
     let (at, mut ucmd) = at_and_ucmd!();

From 69b7095eac172846ba62a511b096735ecb6b391e Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Sat, 28 Oct 2023 17:34:04 +0200
Subject: [PATCH 008/429] printf rewrite: fix compilation

---
 src/uu/dd/src/progress.rs                  |  6 ++-
 src/uu/printf/src/printf.rs                |  8 ++--
 src/uu/seq/src/seq.rs                      | 11 +++--
 src/uucore/src/lib/features/format/mod.rs  | 55 ++++++++++++++++++----
 src/uucore/src/lib/features/format/spec.rs | 38 +++++++--------
 5 files changed, 80 insertions(+), 38 deletions(-)

diff --git a/src/uu/dd/src/progress.rs b/src/uu/dd/src/progress.rs
index f2472600927..1d9b7247d20 100644
--- a/src/uu/dd/src/progress.rs
+++ b/src/uu/dd/src/progress.rs
@@ -13,8 +13,8 @@ use std::io::Write;
 use std::sync::mpsc;
 use std::time::Duration;
 
-use uucore::error::UResult;
 use uucore::format::sprintf;
+use uucore::{error::UResult, format::FormatArgument};
 
 use crate::numbers::{to_magnitude_and_suffix, SuffixType};
 
@@ -152,7 +152,9 @@ impl ProgUpdate {
         let (carriage_return, newline) = if rewrite { ("\r", "") } else { ("", "\n") };
 
         // The duration should be formatted as in `printf %g`.
-        let duration_str = sprintf("%g", &[duration.to_string()])?;
+        // TODO: remove unwrap and make FormatError implement UError
+        let duration_str = sprintf("%g", &[FormatArgument::Float(duration)])?;
+        let duration_str = std::str::from_utf8(&duration_str).unwrap();
 
         // If the number of bytes written is sufficiently large, then
         // print a more concise representation of the number, like
diff --git a/src/uu/printf/src/printf.rs b/src/uu/printf/src/printf.rs
index 36b4c34535b..6e270ec2645 100644
--- a/src/uu/printf/src/printf.rs
+++ b/src/uu/printf/src/printf.rs
@@ -8,7 +8,7 @@
 
 use clap::{crate_version, Arg, ArgAction, Command};
 use uucore::error::{UResult, UUsageError};
-use uucore::format::printf;
+use uucore::format::{printf, FormatArgument};
 use uucore::{format_usage, help_about, help_section, help_usage};
 
 const VERSION: &str = "version";
@@ -30,12 +30,12 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let format_string = matches
         .get_one::<String>(options::FORMATSTRING)
         .ok_or_else(|| UUsageError::new(1, "missing operand"))?;
-    let values: Vec<String> = match matches.get_many::<String>(options::ARGUMENT) {
-        Some(s) => s.map(|s| s.to_string()).collect(),
+    let values: Vec<_> = match matches.get_many::<String>(options::ARGUMENT) {
+        Some(s) => s.map(|s| FormatArgument::Unparsed(s.to_string())).collect(),
         None => vec![],
     };
 
-    printf(format_string, &values[..])?;
+    printf(format_string, &values)?;
     Ok(())
 }
 
diff --git a/src/uu/seq/src/seq.rs b/src/uu/seq/src/seq.rs
index f93ced9264d..217e9042833 100644
--- a/src/uu/seq/src/seq.rs
+++ b/src/uu/seq/src/seq.rs
@@ -9,7 +9,7 @@ use clap::{crate_version, Arg, ArgAction, Command};
 use num_traits::Zero;
 
 use uucore::error::UResult;
-use uucore::format::printf;
+use uucore::format::{printf, FormatArgument};
 use uucore::{format_usage, help_about, help_usage};
 
 mod error;
@@ -144,8 +144,9 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     };
     match result {
         Ok(_) => Ok(()),
-        Err(err) if err.kind() == ErrorKind::BrokenPipe => Ok(()),
-        Err(e) => Err(e.map_err_context(|| "write error".into())),
+        _ => todo!(),
+        // Err(err) if err.kind() == ErrorKind::BrokenPipe => Ok(()),
+        // Err(e) => Err(e.map_err_context(|| "write error".into())),
     }
 }
 
@@ -270,7 +271,7 @@ fn print_seq(
         match format {
             Some(f) => {
                 let s = format!("{value}");
-                printf(f, &[s])?;
+                printf(f, &[FormatArgument::String(s)])?;
             }
             None => write_value_float(&mut stdout, &value, padding, largest_dec)?,
         }
@@ -326,7 +327,7 @@ fn print_seq_integers(
         match format {
             Some(f) => {
                 let s = format!("{value}");
-                printf(f, &[s])?;
+                printf(f, &[FormatArgument::String(s)])?;
             }
             None => write_value_int(&mut stdout, &value, padding, pad)?,
         }
diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index abd92011cc4..ebb1cc360eb 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -3,7 +3,7 @@
 //! The [`printf`] and [`sprintf`] closely match the behavior of the
 //! corresponding C functions: the former renders a formatted string
 //! to stdout, the latter renders to a new [`String`] object.
-//! 
+//!
 //! In addition to the [`printf`] and [`sprintf`] functions, we expose the
 //! [`Format`] struct, which represents a parsed format string. This reduces
 //! the need for parsing a format string multiple times and assures that no
@@ -14,8 +14,15 @@
 mod spec;
 
 use spec::Spec;
-use std::io::{stdout, Write};
+use std::{
+    error::Error,
+    fmt::Display,
+    io::{stdout, Write},
+};
+
+use crate::error::UError;
 
+#[derive(Debug)]
 pub enum FormatError {
     SpecError,
     IoError(std::io::Error),
@@ -23,6 +30,21 @@ pub enum FormatError {
     InvalidArgument(FormatArgument),
 }
 
+impl Error for FormatError {}
+impl UError for FormatError {}
+
+impl Display for FormatError {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        // TODO: Be more precise about these
+        match self {
+            FormatError::SpecError => write!(f, "invalid spec"),
+            FormatError::IoError(_) => write!(f, "io error"),
+            FormatError::NoMoreArguments => write!(f, "no more arguments"),
+            FormatError::InvalidArgument(_) => write!(f, "invalid argument"),
+        }
+    }
+}
+
 /// A single item to format
 enum FormatItem {
     /// A format specifier
@@ -30,21 +52,28 @@ enum FormatItem {
     /// Some plain text
     Text(Vec<u8>),
     /// A single character
-    /// 
+    ///
     /// Added in addition to `Text` as an optimization.
     Char(u8),
 }
 
+#[derive(Clone, Debug)]
 pub enum FormatArgument {
     Char(char),
     String(String),
     UnsignedInt(u64),
     SignedInt(i64),
     Float(f64),
+    // Special argument that gets coerced into the other variants
+    Unparsed(String),
 }
 
 impl FormatItem {
-    fn write<'a>(&self, mut writer: impl Write, args: &mut impl Iterator<Item = FormatArgument>) -> Result<(), FormatError> {
+    fn write<'a>(
+        &self,
+        mut writer: impl Write,
+        args: &mut impl Iterator<Item = &'a FormatArgument>,
+    ) -> Result<(), FormatError> {
         match self {
             FormatItem::Spec(spec) => spec.write(writer, args),
             FormatItem::Text(bytes) => writer.write_all(bytes).map_err(FormatError::IoError),
@@ -110,13 +139,20 @@ fn parse_iter(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem, FormatError
 /// printf("hello %s", &["world".to_string()]).unwrap();
 /// // prints "hello world"
 /// ```
-pub fn printf(format_string: &[u8], arguments: impl IntoIterator<Item = FormatArgument>) -> Result<(), FormatError> {
+pub fn printf<'a>(
+    format_string: impl AsRef<[u8]>,
+    arguments: impl IntoIterator<Item = &'a FormatArgument>,
+) -> Result<(), FormatError> {
     printf_writer(stdout(), format_string, arguments)
 }
 
-fn printf_writer(mut writer: impl Write, format_string: &[u8], args: impl IntoIterator<Item = FormatArgument>) -> Result<(), FormatError> {
+fn printf_writer<'a>(
+    mut writer: impl Write,
+    format_string: impl AsRef<[u8]>,
+    args: impl IntoIterator<Item = &'a FormatArgument>,
+) -> Result<(), FormatError> {
     let mut args = args.into_iter();
-    for item in parse_iter(format_string) {
+    for item in parse_iter(format_string.as_ref()) {
         item?.write(&mut writer, &mut args)?;
     }
     Ok(())
@@ -137,7 +173,10 @@ fn printf_writer(mut writer: impl Write, format_string: &[u8], args: impl IntoIt
 /// let s = sprintf("hello %s", &["world".to_string()]).unwrap();
 /// assert_eq!(s, "hello world".to_string());
 /// ```
-pub fn sprintf(format_string: &[u8], arguments: impl IntoIterator<Item = FormatArgument>) -> Result<Vec<u8>, FormatError> {
+pub fn sprintf<'a>(
+    format_string: impl AsRef<[u8]>,
+    arguments: impl IntoIterator<Item = &'a FormatArgument>,
+) -> Result<Vec<u8>, FormatError> {
     let mut writer = Vec::new();
     printf_writer(&mut writer, format_string, arguments)?;
     Ok(writer)
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index d1786c3d36f..c1eb7856db1 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -257,7 +257,7 @@ impl Spec {
     pub fn write<'a>(
         &self,
         mut writer: impl Write,
-        mut args: impl Iterator<Item = FormatArgument>,
+        mut args: impl Iterator<Item = &'a FormatArgument>,
     ) -> Result<(), FormatError> {
         match self {
             &Spec::Char { width, align_left } => {
@@ -265,7 +265,7 @@ impl Spec {
                 let arg = next_arg(&mut args)?;
                 match arg {
                     FormatArgument::Char(c) => write_padded(writer, c, width, false, align_left),
-                    _ => Err(FormatError::InvalidArgument(arg)),
+                    _ => Err(FormatError::InvalidArgument(arg.clone())),
                 }
             }
             &Spec::String { width, align_left } => {
@@ -273,7 +273,7 @@ impl Spec {
                 let arg = next_arg(&mut args)?;
                 match arg {
                     FormatArgument::String(s) => write_padded(writer, s, width, false, align_left),
-                    _ => Err(FormatError::InvalidArgument(arg)),
+                    _ => Err(FormatError::InvalidArgument(arg.clone())),
                 }
             }
             &Spec::SignedInt {
@@ -285,10 +285,10 @@ impl Spec {
 
                 let arg = next_arg(&mut args)?;
                 let FormatArgument::SignedInt(i) = arg else {
-                    return Err(FormatError::InvalidArgument(arg));
+                    return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
-                if i >= 0 {
+                if *i >= 0 {
                     match positive_sign {
                         PositiveSign::None => Ok(()),
                         PositiveSign::Plus => write!(writer, "+"),
@@ -313,7 +313,7 @@ impl Spec {
 
                 let arg = next_arg(args)?;
                 let FormatArgument::SignedInt(i) = arg else {
-                    return Err(FormatError::InvalidArgument(arg));
+                    return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
                 let s = match variant {
@@ -355,7 +355,7 @@ impl Spec {
 
                 let arg = next_arg(args)?;
                 let FormatArgument::Float(f) = arg else {
-                    return Err(FormatError::InvalidArgument(arg));
+                    return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
                 if f.is_sign_positive() {
@@ -369,16 +369,16 @@ impl Spec {
 
                 let s = match variant {
                     FloatVariant::Decimal => {
-                        format_float_decimal(f, precision, case, force_decimal)
+                        format_float_decimal(*f, precision, case, force_decimal)
                     }
                     FloatVariant::Scientific => {
-                        format_float_scientific(f, precision, case, force_decimal)
+                        format_float_scientific(*f, precision, case, force_decimal)
                     }
                     FloatVariant::Shortest => {
-                        format_float_shortest(f, precision, case, force_decimal)
+                        format_float_shortest(*f, precision, case, force_decimal)
                     }
                     FloatVariant::Hexadecimal => {
-                        format_float_hexadecimal(f, precision, case, force_decimal)
+                        format_float_hexadecimal(*f, precision, case, force_decimal)
                     }
                 };
 
@@ -500,29 +500,29 @@ fn format_float_hexadecimal(
     return s;
 }
 
-fn resolve_asterisk(
+fn resolve_asterisk<'a>(
     option: Option<CanAsterisk<usize>>,
-    args: impl Iterator<Item = FormatArgument>,
+    args: impl Iterator<Item = &'a FormatArgument>,
 ) -> Result<Option<usize>, FormatError> {
     Ok(match option {
         None => None,
         Some(CanAsterisk::Asterisk) => {
             let arg = next_arg(args)?;
             match arg {
-                FormatArgument::UnsignedInt(u) => match usize::try_from(u) {
+                FormatArgument::UnsignedInt(u) => match usize::try_from(*u) {
                     Ok(u) => Some(u),
-                    Err(_) => return Err(FormatError::InvalidArgument(arg)),
+                    Err(_) => return Err(FormatError::InvalidArgument(arg.clone())),
                 },
-                _ => return Err(FormatError::InvalidArgument(arg)),
+                _ => return Err(FormatError::InvalidArgument(arg.clone())),
             }
         }
         Some(CanAsterisk::Fixed(w)) => Some(w),
     })
 }
 
-fn next_arg(
-    mut arguments: impl Iterator<Item = FormatArgument>,
-) -> Result<FormatArgument, FormatError> {
+fn next_arg<'a>(
+    mut arguments: impl Iterator<Item = &'a FormatArgument>,
+) -> Result<&'a FormatArgument, FormatError> {
     arguments.next().ok_or(FormatError::NoMoreArguments)
 }
 

From f117fc1bab8aaab4c26d41bad40c111904f5f9b6 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Sat, 28 Oct 2023 17:34:04 +0200
Subject: [PATCH 009/429] printf rewrite: fix compilation

---
 src/uu/dd/src/progress.rs                  |  6 ++-
 src/uu/printf/src/printf.rs                |  8 ++--
 src/uu/seq/src/seq.rs                      | 11 +++--
 src/uucore/src/lib/features.rs             |  8 +---
 src/uucore/src/lib/features/format/mod.rs  | 55 ++++++++++++++++++----
 src/uucore/src/lib/features/format/spec.rs | 40 ++++++++--------
 src/uucore/src/lib/lib.rs                  |  6 +--
 7 files changed, 85 insertions(+), 49 deletions(-)

diff --git a/src/uu/dd/src/progress.rs b/src/uu/dd/src/progress.rs
index f2472600927..1d9b7247d20 100644
--- a/src/uu/dd/src/progress.rs
+++ b/src/uu/dd/src/progress.rs
@@ -13,8 +13,8 @@ use std::io::Write;
 use std::sync::mpsc;
 use std::time::Duration;
 
-use uucore::error::UResult;
 use uucore::format::sprintf;
+use uucore::{error::UResult, format::FormatArgument};
 
 use crate::numbers::{to_magnitude_and_suffix, SuffixType};
 
@@ -152,7 +152,9 @@ impl ProgUpdate {
         let (carriage_return, newline) = if rewrite { ("\r", "") } else { ("", "\n") };
 
         // The duration should be formatted as in `printf %g`.
-        let duration_str = sprintf("%g", &[duration.to_string()])?;
+        // TODO: remove unwrap and make FormatError implement UError
+        let duration_str = sprintf("%g", &[FormatArgument::Float(duration)])?;
+        let duration_str = std::str::from_utf8(&duration_str).unwrap();
 
         // If the number of bytes written is sufficiently large, then
         // print a more concise representation of the number, like
diff --git a/src/uu/printf/src/printf.rs b/src/uu/printf/src/printf.rs
index 36b4c34535b..6e270ec2645 100644
--- a/src/uu/printf/src/printf.rs
+++ b/src/uu/printf/src/printf.rs
@@ -8,7 +8,7 @@
 
 use clap::{crate_version, Arg, ArgAction, Command};
 use uucore::error::{UResult, UUsageError};
-use uucore::format::printf;
+use uucore::format::{printf, FormatArgument};
 use uucore::{format_usage, help_about, help_section, help_usage};
 
 const VERSION: &str = "version";
@@ -30,12 +30,12 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let format_string = matches
         .get_one::<String>(options::FORMATSTRING)
         .ok_or_else(|| UUsageError::new(1, "missing operand"))?;
-    let values: Vec<String> = match matches.get_many::<String>(options::ARGUMENT) {
-        Some(s) => s.map(|s| s.to_string()).collect(),
+    let values: Vec<_> = match matches.get_many::<String>(options::ARGUMENT) {
+        Some(s) => s.map(|s| FormatArgument::Unparsed(s.to_string())).collect(),
         None => vec![],
     };
 
-    printf(format_string, &values[..])?;
+    printf(format_string, &values)?;
     Ok(())
 }
 
diff --git a/src/uu/seq/src/seq.rs b/src/uu/seq/src/seq.rs
index f93ced9264d..217e9042833 100644
--- a/src/uu/seq/src/seq.rs
+++ b/src/uu/seq/src/seq.rs
@@ -9,7 +9,7 @@ use clap::{crate_version, Arg, ArgAction, Command};
 use num_traits::Zero;
 
 use uucore::error::UResult;
-use uucore::format::printf;
+use uucore::format::{printf, FormatArgument};
 use uucore::{format_usage, help_about, help_usage};
 
 mod error;
@@ -144,8 +144,9 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     };
     match result {
         Ok(_) => Ok(()),
-        Err(err) if err.kind() == ErrorKind::BrokenPipe => Ok(()),
-        Err(e) => Err(e.map_err_context(|| "write error".into())),
+        _ => todo!(),
+        // Err(err) if err.kind() == ErrorKind::BrokenPipe => Ok(()),
+        // Err(e) => Err(e.map_err_context(|| "write error".into())),
     }
 }
 
@@ -270,7 +271,7 @@ fn print_seq(
         match format {
             Some(f) => {
                 let s = format!("{value}");
-                printf(f, &[s])?;
+                printf(f, &[FormatArgument::String(s)])?;
             }
             None => write_value_float(&mut stdout, &value, padding, largest_dec)?,
         }
@@ -326,7 +327,7 @@ fn print_seq_integers(
         match format {
             Some(f) => {
                 let s = format!("{value}");
-                printf(f, &[s])?;
+                printf(f, &[FormatArgument::String(s)])?;
             }
             None => write_value_int(&mut stdout, &value, padding, pad)?,
         }
diff --git a/src/uucore/src/lib/features.rs b/src/uucore/src/lib/features.rs
index 133050954dd..1d0d437824d 100644
--- a/src/uucore/src/lib/features.rs
+++ b/src/uucore/src/lib/features.rs
@@ -8,16 +8,14 @@
 pub mod backup_control;
 #[cfg(feature = "encoding")]
 pub mod encoding;
+#[cfg(feature = "format")]
+pub mod format;
 #[cfg(feature = "fs")]
 pub mod fs;
 #[cfg(feature = "fsext")]
 pub mod fsext;
 #[cfg(feature = "lines")]
 pub mod lines;
-#[cfg(feature = "format")]
-pub mod format;
-#[cfg(feature = "memo")]
-pub mod memo;
 #[cfg(feature = "quoting-style")]
 pub mod quoting_style;
 #[cfg(feature = "ranges")]
@@ -26,8 +24,6 @@ pub mod ranges;
 pub mod ringbuffer;
 #[cfg(feature = "sum")]
 pub mod sum;
-#[cfg(feature = "memo")]
-mod tokenize;
 #[cfg(feature = "update-control")]
 pub mod update_control;
 #[cfg(feature = "version-cmp")]
diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index abd92011cc4..ebb1cc360eb 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -3,7 +3,7 @@
 //! The [`printf`] and [`sprintf`] closely match the behavior of the
 //! corresponding C functions: the former renders a formatted string
 //! to stdout, the latter renders to a new [`String`] object.
-//! 
+//!
 //! In addition to the [`printf`] and [`sprintf`] functions, we expose the
 //! [`Format`] struct, which represents a parsed format string. This reduces
 //! the need for parsing a format string multiple times and assures that no
@@ -14,8 +14,15 @@
 mod spec;
 
 use spec::Spec;
-use std::io::{stdout, Write};
+use std::{
+    error::Error,
+    fmt::Display,
+    io::{stdout, Write},
+};
+
+use crate::error::UError;
 
+#[derive(Debug)]
 pub enum FormatError {
     SpecError,
     IoError(std::io::Error),
@@ -23,6 +30,21 @@ pub enum FormatError {
     InvalidArgument(FormatArgument),
 }
 
+impl Error for FormatError {}
+impl UError for FormatError {}
+
+impl Display for FormatError {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        // TODO: Be more precise about these
+        match self {
+            FormatError::SpecError => write!(f, "invalid spec"),
+            FormatError::IoError(_) => write!(f, "io error"),
+            FormatError::NoMoreArguments => write!(f, "no more arguments"),
+            FormatError::InvalidArgument(_) => write!(f, "invalid argument"),
+        }
+    }
+}
+
 /// A single item to format
 enum FormatItem {
     /// A format specifier
@@ -30,21 +52,28 @@ enum FormatItem {
     /// Some plain text
     Text(Vec<u8>),
     /// A single character
-    /// 
+    ///
     /// Added in addition to `Text` as an optimization.
     Char(u8),
 }
 
+#[derive(Clone, Debug)]
 pub enum FormatArgument {
     Char(char),
     String(String),
     UnsignedInt(u64),
     SignedInt(i64),
     Float(f64),
+    // Special argument that gets coerced into the other variants
+    Unparsed(String),
 }
 
 impl FormatItem {
-    fn write<'a>(&self, mut writer: impl Write, args: &mut impl Iterator<Item = FormatArgument>) -> Result<(), FormatError> {
+    fn write<'a>(
+        &self,
+        mut writer: impl Write,
+        args: &mut impl Iterator<Item = &'a FormatArgument>,
+    ) -> Result<(), FormatError> {
         match self {
             FormatItem::Spec(spec) => spec.write(writer, args),
             FormatItem::Text(bytes) => writer.write_all(bytes).map_err(FormatError::IoError),
@@ -110,13 +139,20 @@ fn parse_iter(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem, FormatError
 /// printf("hello %s", &["world".to_string()]).unwrap();
 /// // prints "hello world"
 /// ```
-pub fn printf(format_string: &[u8], arguments: impl IntoIterator<Item = FormatArgument>) -> Result<(), FormatError> {
+pub fn printf<'a>(
+    format_string: impl AsRef<[u8]>,
+    arguments: impl IntoIterator<Item = &'a FormatArgument>,
+) -> Result<(), FormatError> {
     printf_writer(stdout(), format_string, arguments)
 }
 
-fn printf_writer(mut writer: impl Write, format_string: &[u8], args: impl IntoIterator<Item = FormatArgument>) -> Result<(), FormatError> {
+fn printf_writer<'a>(
+    mut writer: impl Write,
+    format_string: impl AsRef<[u8]>,
+    args: impl IntoIterator<Item = &'a FormatArgument>,
+) -> Result<(), FormatError> {
     let mut args = args.into_iter();
-    for item in parse_iter(format_string) {
+    for item in parse_iter(format_string.as_ref()) {
         item?.write(&mut writer, &mut args)?;
     }
     Ok(())
@@ -137,7 +173,10 @@ fn printf_writer(mut writer: impl Write, format_string: &[u8], args: impl IntoIt
 /// let s = sprintf("hello %s", &["world".to_string()]).unwrap();
 /// assert_eq!(s, "hello world".to_string());
 /// ```
-pub fn sprintf(format_string: &[u8], arguments: impl IntoIterator<Item = FormatArgument>) -> Result<Vec<u8>, FormatError> {
+pub fn sprintf<'a>(
+    format_string: impl AsRef<[u8]>,
+    arguments: impl IntoIterator<Item = &'a FormatArgument>,
+) -> Result<Vec<u8>, FormatError> {
     let mut writer = Vec::new();
     printf_writer(&mut writer, format_string, arguments)?;
     Ok(writer)
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index d1786c3d36f..e66cad32d65 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -257,7 +257,7 @@ impl Spec {
     pub fn write<'a>(
         &self,
         mut writer: impl Write,
-        mut args: impl Iterator<Item = FormatArgument>,
+        mut args: impl Iterator<Item = &'a FormatArgument>,
     ) -> Result<(), FormatError> {
         match self {
             &Spec::Char { width, align_left } => {
@@ -265,7 +265,7 @@ impl Spec {
                 let arg = next_arg(&mut args)?;
                 match arg {
                     FormatArgument::Char(c) => write_padded(writer, c, width, false, align_left),
-                    _ => Err(FormatError::InvalidArgument(arg)),
+                    _ => Err(FormatError::InvalidArgument(arg.clone())),
                 }
             }
             &Spec::String { width, align_left } => {
@@ -273,7 +273,7 @@ impl Spec {
                 let arg = next_arg(&mut args)?;
                 match arg {
                     FormatArgument::String(s) => write_padded(writer, s, width, false, align_left),
-                    _ => Err(FormatError::InvalidArgument(arg)),
+                    _ => Err(FormatError::InvalidArgument(arg.clone())),
                 }
             }
             &Spec::SignedInt {
@@ -285,10 +285,10 @@ impl Spec {
 
                 let arg = next_arg(&mut args)?;
                 let FormatArgument::SignedInt(i) = arg else {
-                    return Err(FormatError::InvalidArgument(arg));
+                    return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
-                if i >= 0 {
+                if *i >= 0 {
                     match positive_sign {
                         PositiveSign::None => Ok(()),
                         PositiveSign::Plus => write!(writer, "+"),
@@ -313,7 +313,7 @@ impl Spec {
 
                 let arg = next_arg(args)?;
                 let FormatArgument::SignedInt(i) = arg else {
-                    return Err(FormatError::InvalidArgument(arg));
+                    return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
                 let s = match variant {
@@ -355,7 +355,7 @@ impl Spec {
 
                 let arg = next_arg(args)?;
                 let FormatArgument::Float(f) = arg else {
-                    return Err(FormatError::InvalidArgument(arg));
+                    return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
                 if f.is_sign_positive() {
@@ -369,16 +369,16 @@ impl Spec {
 
                 let s = match variant {
                     FloatVariant::Decimal => {
-                        format_float_decimal(f, precision, case, force_decimal)
+                        format_float_decimal(*f, precision, case, force_decimal)
                     }
                     FloatVariant::Scientific => {
-                        format_float_scientific(f, precision, case, force_decimal)
+                        format_float_scientific(*f, precision, case, force_decimal)
                     }
                     FloatVariant::Shortest => {
-                        format_float_shortest(f, precision, case, force_decimal)
+                        format_float_shortest(*f, precision, case, force_decimal)
                     }
                     FloatVariant::Hexadecimal => {
-                        format_float_hexadecimal(f, precision, case, force_decimal)
+                        format_float_hexadecimal(*f, precision, case, force_decimal)
                     }
                 };
 
@@ -490,7 +490,7 @@ fn format_float_hexadecimal(
     let mut s = match (precision, force_decimal) {
         (0, ForceDecimal::No) => format!("0x{first_digit}p{exponent:+x}"),
         (0, ForceDecimal::Yes) => format!("0x{first_digit}.p{exponent:+x}"),
-        _ => format!("0x{first_digit}.{mantissa:0>13x}p{exponent:+x}")
+        _ => format!("0x{first_digit}.{mantissa:0>13x}p{exponent:+x}"),
     };
 
     if case == Case::Uppercase {
@@ -500,29 +500,29 @@ fn format_float_hexadecimal(
     return s;
 }
 
-fn resolve_asterisk(
+fn resolve_asterisk<'a>(
     option: Option<CanAsterisk<usize>>,
-    args: impl Iterator<Item = FormatArgument>,
+    args: impl Iterator<Item = &'a FormatArgument>,
 ) -> Result<Option<usize>, FormatError> {
     Ok(match option {
         None => None,
         Some(CanAsterisk::Asterisk) => {
             let arg = next_arg(args)?;
             match arg {
-                FormatArgument::UnsignedInt(u) => match usize::try_from(u) {
+                FormatArgument::UnsignedInt(u) => match usize::try_from(*u) {
                     Ok(u) => Some(u),
-                    Err(_) => return Err(FormatError::InvalidArgument(arg)),
+                    Err(_) => return Err(FormatError::InvalidArgument(arg.clone())),
                 },
-                _ => return Err(FormatError::InvalidArgument(arg)),
+                _ => return Err(FormatError::InvalidArgument(arg.clone())),
             }
         }
         Some(CanAsterisk::Fixed(w)) => Some(w),
     })
 }
 
-fn next_arg(
-    mut arguments: impl Iterator<Item = FormatArgument>,
-) -> Result<FormatArgument, FormatError> {
+fn next_arg<'a>(
+    mut arguments: impl Iterator<Item = &'a FormatArgument>,
+) -> Result<&'a FormatArgument, FormatError> {
     arguments.next().ok_or(FormatError::NoMoreArguments)
 }
 
diff --git a/src/uucore/src/lib/lib.rs b/src/uucore/src/lib/lib.rs
index 0540275eee4..af8668ef02f 100644
--- a/src/uucore/src/lib/lib.rs
+++ b/src/uucore/src/lib/lib.rs
@@ -37,16 +37,14 @@ pub use crate::parser::shortcut_value_parser;
 pub use crate::features::backup_control;
 #[cfg(feature = "encoding")]
 pub use crate::features::encoding;
+#[cfg(feature = "format")]
+pub use crate::features::format;
 #[cfg(feature = "fs")]
 pub use crate::features::fs;
 #[cfg(feature = "fsext")]
 pub use crate::features::fsext;
 #[cfg(feature = "lines")]
 pub use crate::features::lines;
-#[cfg(feature = "format")]
-pub use crate::features::format;
-#[cfg(feature = "memo")]
-pub use crate::features::memo;
 #[cfg(feature = "quoting-style")]
 pub use crate::features::quoting_style;
 #[cfg(feature = "ranges")]

From 198f7c7f26c6aa5a374d8f4def4ad324bee38535 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Thu, 9 Nov 2023 15:45:44 +0100
Subject: [PATCH 010/429] printf: move number formatting to separate module

---
 src/uucore/src/lib/features/format/mod.rs     |   2 +-
 .../src/lib/features/format/num_format.rs     | 232 ++++++++++++++++++
 src/uucore/src/lib/features/format/spec.rs    | 202 ++-------------
 3 files changed, 258 insertions(+), 178 deletions(-)
 create mode 100644 src/uucore/src/lib/features/format/num_format.rs

diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index ebb1cc360eb..0849ada15f8 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -10,8 +10,8 @@
 //! parsing errors occur during writing.
 // spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
 
-// mod num_format;
 mod spec;
+mod num_format;
 
 use spec::Spec;
 use std::{
diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
new file mode 100644
index 00000000000..75c18438cc8
--- /dev/null
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -0,0 +1,232 @@
+use std::io::Write;
+
+use super::{
+    spec::{
+        Case, FloatVariant, ForceDecimal, NumberAlignment, PositiveSign, Prefix, UnsignedIntVariant,
+    },
+    FormatError,
+};
+
+pub trait Formatter {
+    type Input;
+    fn fmt(&self, writer: impl Write, x: Self::Input) -> Result<(), FormatError>;
+}
+
+pub struct SignedInt {
+    pub width: usize,
+    pub positive_sign: PositiveSign,
+    pub alignment: NumberAlignment,
+}
+
+impl Formatter for SignedInt {
+    type Input = i64;
+
+    fn fmt(&self, mut writer: impl Write, x: Self::Input) -> Result<(), FormatError> {
+        if x >= 0 {
+            match self.positive_sign {
+                PositiveSign::None => Ok(()),
+                PositiveSign::Plus => write!(writer, "+"),
+                PositiveSign::Space => write!(writer, " "),
+            }
+            .map_err(FormatError::IoError)?;
+        }
+
+        match self.alignment {
+            NumberAlignment::Left => write!(writer, "{x:<width$}", width = self.width),
+            NumberAlignment::RightSpace => write!(writer, "{x:>width$}", width = self.width),
+            NumberAlignment::RightZero => write!(writer, "{x:0>width$}", width = self.width),
+        }
+        .map_err(FormatError::IoError)
+    }
+}
+
+pub struct UnsignedInt {
+    pub variant: UnsignedIntVariant,
+    pub width: usize,
+    pub alignment: NumberAlignment,
+}
+
+impl Formatter for UnsignedInt {
+    type Input = u64;
+
+    fn fmt(&self, mut writer: impl Write, x: Self::Input) -> Result<(), FormatError> {
+        let s = match self.variant {
+            UnsignedIntVariant::Decimal => format!("{x}"),
+            UnsignedIntVariant::Octal(Prefix::No) => format!("{x:o}"),
+            UnsignedIntVariant::Octal(Prefix::Yes) => format!("{x:#o}"),
+            UnsignedIntVariant::Hexadecimal(Case::Lowercase, Prefix::No) => {
+                format!("{x:x}")
+            }
+            UnsignedIntVariant::Hexadecimal(Case::Lowercase, Prefix::Yes) => {
+                format!("{x:#x}")
+            }
+            UnsignedIntVariant::Hexadecimal(Case::Uppercase, Prefix::No) => {
+                format!("{x:X}")
+            }
+            UnsignedIntVariant::Hexadecimal(Case::Uppercase, Prefix::Yes) => {
+                format!("{x:#X}")
+            }
+        };
+
+        match self.alignment {
+            NumberAlignment::Left => write!(writer, "{s:<width$}", width = self.width),
+            NumberAlignment::RightSpace => write!(writer, "{s:>width$}", width = self.width),
+            NumberAlignment::RightZero => write!(writer, "{s:0>width$}", width = self.width),
+        }
+        .map_err(FormatError::IoError)
+    }
+}
+
+pub struct Float {
+    pub variant: FloatVariant,
+    pub case: Case,
+    pub force_decimal: ForceDecimal,
+    pub width: usize,
+    pub positive_sign: PositiveSign,
+    pub alignment: NumberAlignment,
+    pub precision: usize,
+}
+
+impl Formatter for Float {
+    type Input = f64;
+
+    fn fmt(&self, mut writer: impl Write, x: Self::Input) -> Result<(), FormatError> {
+        if x.is_sign_positive() {
+            match self.positive_sign {
+                PositiveSign::None => Ok(()),
+                PositiveSign::Plus => write!(writer, "+"),
+                PositiveSign::Space => write!(writer, " "),
+            }
+            .map_err(FormatError::IoError)?;
+        }
+
+        let s = match self.variant {
+            FloatVariant::Decimal => {
+                format_float_decimal(x, self.precision, self.case, self.force_decimal)
+            }
+            FloatVariant::Scientific => {
+                format_float_scientific(x, self.precision, self.case, self.force_decimal)
+            }
+            FloatVariant::Shortest => {
+                format_float_shortest(x, self.precision, self.case, self.force_decimal)
+            }
+            FloatVariant::Hexadecimal => {
+                format_float_hexadecimal(x, self.precision, self.case, self.force_decimal)
+            }
+        };
+
+        match self.alignment {
+            NumberAlignment::Left => write!(writer, "{s:<width$}", width = self.width),
+            NumberAlignment::RightSpace => write!(writer, "{s:>width$}", width = self.width),
+            NumberAlignment::RightZero => write!(writer, "{s:0>width$}", width = self.width),
+        }
+        .map_err(FormatError::IoError)
+    }
+}
+
+fn format_float_nonfinite(f: f64, case: Case) -> String {
+    debug_assert!(!f.is_finite());
+    let mut s = format!("{f}");
+    if case == Case::Uppercase {
+        s.make_ascii_uppercase();
+    }
+    return s;
+}
+
+fn format_float_decimal(
+    f: f64,
+    precision: usize,
+    case: Case,
+    force_decimal: ForceDecimal,
+) -> String {
+    if !f.is_finite() {
+        return format_float_nonfinite(f, case);
+    }
+
+    if precision == 0 && force_decimal == ForceDecimal::Yes {
+        format!("{f:.0}.")
+    } else {
+        format!("{f:.*}", precision)
+    }
+}
+
+fn format_float_scientific(
+    f: f64,
+    precision: usize,
+    case: Case,
+    force_decimal: ForceDecimal,
+) -> String {
+    // If the float is NaN, -Nan, Inf or -Inf, format like any other float
+    if !f.is_finite() {
+        return format_float_nonfinite(f, case);
+    }
+
+    let exponent: i32 = f.log10().floor() as i32;
+    let normalized = f / 10.0_f64.powi(exponent);
+
+    let additional_dot = if precision == 0 && ForceDecimal::Yes == force_decimal {
+        "."
+    } else {
+        ""
+    };
+
+    let exp_char = match case {
+        Case::Lowercase => 'e',
+        Case::Uppercase => 'E',
+    };
+
+    format!(
+        "{normalized:.*}{additional_dot}{exp_char}{exponent:+03}",
+        precision
+    )
+}
+
+// TODO: This could be optimized. It's not terribly important though.
+fn format_float_shortest(
+    f: f64,
+    precision: usize,
+    case: Case,
+    force_decimal: ForceDecimal,
+) -> String {
+    let a = format_float_decimal(f, precision, case, force_decimal);
+    let b = format_float_scientific(f, precision, case, force_decimal);
+
+    if a.len() > b.len() {
+        b
+    } else {
+        a
+    }
+}
+
+fn format_float_hexadecimal(
+    f: f64,
+    precision: usize,
+    case: Case,
+    force_decimal: ForceDecimal,
+) -> String {
+    if !f.is_finite() {
+        return format_float_nonfinite(f, case);
+    }
+
+    let (first_digit, mantissa, exponent) = if f == 0.0 {
+        (0, 0, 0)
+    } else {
+        let bits = f.to_bits();
+        let exponent_bits = ((bits >> 52) & 0x7fff) as i64;
+        let exponent = exponent_bits - 1023;
+        let mantissa = bits & 0xf_ffff_ffff_ffff;
+        (1, mantissa, exponent)
+    };
+
+    let mut s = match (precision, force_decimal) {
+        (0, ForceDecimal::No) => format!("0x{first_digit}p{exponent:+x}"),
+        (0, ForceDecimal::Yes) => format!("0x{first_digit}.p{exponent:+x}"),
+        _ => format!("0x{first_digit}.{mantissa:0>13x}p{exponent:+x}"),
+    };
+
+    if case == Case::Uppercase {
+        s.make_ascii_uppercase();
+    }
+
+    return s;
+}
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index e66cad32d65..4a533d1e10f 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -1,6 +1,9 @@
 // spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
 
-use super::{FormatArgument, FormatError};
+use super::{
+    num_format::{self, Formatter},
+    FormatArgument, FormatError,
+};
 use std::{fmt::Display, io::Write};
 
 pub enum Spec {
@@ -256,7 +259,7 @@ impl Spec {
 
     pub fn write<'a>(
         &self,
-        mut writer: impl Write,
+        writer: impl Write,
         mut args: impl Iterator<Item = &'a FormatArgument>,
     ) -> Result<(), FormatError> {
         match self {
@@ -288,21 +291,11 @@ impl Spec {
                     return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
-                if *i >= 0 {
-                    match positive_sign {
-                        PositiveSign::None => Ok(()),
-                        PositiveSign::Plus => write!(writer, "+"),
-                        PositiveSign::Space => write!(writer, " "),
-                    }
-                    .map_err(FormatError::IoError)?;
-                }
-
-                match alignment {
-                    NumberAlignment::Left => write!(writer, "{i:<width$}"),
-                    NumberAlignment::RightSpace => write!(writer, "{i:>width$}"),
-                    NumberAlignment::RightZero => write!(writer, "{i:0>width$}"),
-                }
-                .map_err(FormatError::IoError)
+                num_format::SignedInt {
+                    width,
+                    positive_sign,
+                    alignment,
+                }.fmt(writer, *i)
             }
             &Spec::UnsignedInt {
                 variant,
@@ -312,34 +305,16 @@ impl Spec {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
 
                 let arg = next_arg(args)?;
-                let FormatArgument::SignedInt(i) = arg else {
+                let FormatArgument::UnsignedInt(i) = arg else {
                     return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
-                let s = match variant {
-                    UnsignedIntVariant::Decimal => format!("{i}"),
-                    UnsignedIntVariant::Octal(Prefix::No) => format!("{i:o}"),
-                    UnsignedIntVariant::Octal(Prefix::Yes) => format!("{i:#o}"),
-                    UnsignedIntVariant::Hexadecimal(Case::Lowercase, Prefix::No) => {
-                        format!("{i:x}")
-                    }
-                    UnsignedIntVariant::Hexadecimal(Case::Lowercase, Prefix::Yes) => {
-                        format!("{i:#x}")
-                    }
-                    UnsignedIntVariant::Hexadecimal(Case::Uppercase, Prefix::No) => {
-                        format!("{i:X}")
-                    }
-                    UnsignedIntVariant::Hexadecimal(Case::Uppercase, Prefix::Yes) => {
-                        format!("{i:#X}")
-                    }
-                };
-
-                match alignment {
-                    NumberAlignment::Left => write!(writer, "{s:<width$}"),
-                    NumberAlignment::RightSpace => write!(writer, "{s:>width$}"),
-                    NumberAlignment::RightZero => write!(writer, "{s:0>width$}"),
+                num_format::UnsignedInt {
+                    variant,
+                    width,
+                    alignment,
                 }
-                .map_err(FormatError::IoError)
+                .fmt(writer, *i)
             }
             &Spec::Float {
                 variant,
@@ -358,148 +333,21 @@ impl Spec {
                     return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
-                if f.is_sign_positive() {
-                    match positive_sign {
-                        PositiveSign::None => Ok(()),
-                        PositiveSign::Plus => write!(writer, "+"),
-                        PositiveSign::Space => write!(writer, " "),
-                    }
-                    .map_err(FormatError::IoError)?;
-                }
-
-                let s = match variant {
-                    FloatVariant::Decimal => {
-                        format_float_decimal(*f, precision, case, force_decimal)
-                    }
-                    FloatVariant::Scientific => {
-                        format_float_scientific(*f, precision, case, force_decimal)
-                    }
-                    FloatVariant::Shortest => {
-                        format_float_shortest(*f, precision, case, force_decimal)
-                    }
-                    FloatVariant::Hexadecimal => {
-                        format_float_hexadecimal(*f, precision, case, force_decimal)
-                    }
-                };
-
-                match alignment {
-                    NumberAlignment::Left => write!(writer, "{s:<width$}"),
-                    NumberAlignment::RightSpace => write!(writer, "{s:>width$}"),
-                    NumberAlignment::RightZero => write!(writer, "{s:0>width$}"),
+                num_format::Float {
+                    variant,
+                    case,
+                    force_decimal,
+                    width,
+                    positive_sign,
+                    alignment,
+                    precision,
                 }
-                .map_err(FormatError::IoError)
+                .fmt(writer, *f)
             }
         }
     }
 }
 
-fn format_float_nonfinite(f: f64, case: Case) -> String {
-    debug_assert!(!f.is_finite());
-    let mut s = format!("{f}");
-    if case == Case::Uppercase {
-        s.make_ascii_uppercase();
-    }
-    return s;
-}
-
-fn format_float_decimal(
-    f: f64,
-    precision: usize,
-    case: Case,
-    force_decimal: ForceDecimal,
-) -> String {
-    if !f.is_finite() {
-        return format_float_nonfinite(f, case);
-    }
-
-    if precision == 0 && force_decimal == ForceDecimal::Yes {
-        format!("{f:.0}.")
-    } else {
-        format!("{f:.*}", precision)
-    }
-}
-
-fn format_float_scientific(
-    f: f64,
-    precision: usize,
-    case: Case,
-    force_decimal: ForceDecimal,
-) -> String {
-    // If the float is NaN, -Nan, Inf or -Inf, format like any other float
-    if !f.is_finite() {
-        return format_float_nonfinite(f, case);
-    }
-
-    let exponent: i32 = f.log10().floor() as i32;
-    let normalized = f / 10.0_f64.powi(exponent);
-
-    let additional_dot = if precision == 0 && ForceDecimal::Yes == force_decimal {
-        "."
-    } else {
-        ""
-    };
-
-    let exp_char = match case {
-        Case::Lowercase => 'e',
-        Case::Uppercase => 'E',
-    };
-
-    format!(
-        "{normalized:.*}{additional_dot}{exp_char}{exponent:+03}",
-        precision
-    )
-}
-
-// TODO: This could be optimized. It's not terribly important though.
-fn format_float_shortest(
-    f: f64,
-    precision: usize,
-    case: Case,
-    force_decimal: ForceDecimal,
-) -> String {
-    let a = format_float_decimal(f, precision, case, force_decimal);
-    let b = format_float_scientific(f, precision, case, force_decimal);
-
-    if a.len() > b.len() {
-        b
-    } else {
-        a
-    }
-}
-
-fn format_float_hexadecimal(
-    f: f64,
-    precision: usize,
-    case: Case,
-    force_decimal: ForceDecimal,
-) -> String {
-    if !f.is_finite() {
-        return format_float_nonfinite(f, case);
-    }
-
-    let (first_digit, mantissa, exponent) = if f == 0.0 {
-        (0, 0, 0)
-    } else {
-        let bits = f.to_bits();
-        let exponent_bits = ((bits >> 52) & 0x7fff) as i64;
-        let exponent = exponent_bits - 1023;
-        let mantissa = bits & 0xf_ffff_ffff_ffff;
-        (1, mantissa, exponent)
-    };
-
-    let mut s = match (precision, force_decimal) {
-        (0, ForceDecimal::No) => format!("0x{first_digit}p{exponent:+x}"),
-        (0, ForceDecimal::Yes) => format!("0x{first_digit}.p{exponent:+x}"),
-        _ => format!("0x{first_digit}.{mantissa:0>13x}p{exponent:+x}"),
-    };
-
-    if case == Case::Uppercase {
-        s.make_ascii_uppercase();
-    }
-
-    return s;
-}
-
 fn resolve_asterisk<'a>(
     option: Option<CanAsterisk<usize>>,
     args: impl Iterator<Item = &'a FormatArgument>,

From 39c675847545b5653e04f9338815d882fdc7d01a Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Thu, 9 Nov 2023 16:05:11 +0100
Subject: [PATCH 011/429] uucore/format: move types for num_format

---
 src/uucore/src/lib/features/format/mod.rs     |  2 +-
 .../src/lib/features/format/num_format.rs     | 69 +++++++++++++++++--
 src/uucore/src/lib/features/format/spec.rs    | 56 ++-------------
 3 files changed, 70 insertions(+), 57 deletions(-)

diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index 0849ada15f8..d6db5e8c7cd 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -11,7 +11,7 @@
 // spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
 
 mod spec;
-mod num_format;
+pub mod num_format;
 
 use spec::Spec;
 use std::{
diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index 75c18438cc8..3a27ac200f8 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -1,17 +1,60 @@
 use std::io::Write;
 
-use super::{
-    spec::{
-        Case, FloatVariant, ForceDecimal, NumberAlignment, PositiveSign, Prefix, UnsignedIntVariant,
-    },
-    FormatError,
-};
+use super::FormatError;
 
 pub trait Formatter {
     type Input;
     fn fmt(&self, writer: impl Write, x: Self::Input) -> Result<(), FormatError>;
 }
 
+#[derive(Clone, Copy)]
+pub enum UnsignedIntVariant {
+    Decimal,
+    Octal(Prefix),
+    Hexadecimal(Case, Prefix),
+}
+
+#[derive(Clone, Copy)]
+
+pub enum FloatVariant {
+    Decimal,
+    Scientific,
+    Shortest,
+    Hexadecimal,
+}
+
+#[derive(Clone, Copy, PartialEq, Eq)]
+pub enum Case {
+    Lowercase,
+    Uppercase,
+}
+
+#[derive(Clone, Copy, PartialEq, Eq)]
+pub enum Prefix {
+    No,
+    Yes,
+}
+
+#[derive(Clone, Copy, PartialEq, Eq)]
+pub enum ForceDecimal {
+    No,
+    Yes,
+}
+
+#[derive(Clone, Copy)]
+pub enum PositiveSign {
+    None,
+    Plus,
+    Space,
+}
+
+#[derive(Clone, Copy)]
+pub enum NumberAlignment {
+    Left,
+    RightSpace,
+    RightZero,
+}
+
 pub struct SignedInt {
     pub width: usize,
     pub positive_sign: PositiveSign,
@@ -87,6 +130,20 @@ pub struct Float {
     pub precision: usize,
 }
 
+impl Default for Float {
+    fn default() -> Self {
+        Self {
+            variant: FloatVariant::Decimal,
+            case: Case::Lowercase,
+            force_decimal: ForceDecimal::No,
+            width: 0,
+            positive_sign: PositiveSign::None,
+            alignment: NumberAlignment::Left,
+            precision: 2,
+        }
+    }
+}
+
 impl Formatter for Float {
     type Input = f64;
 
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index 4a533d1e10f..80896997007 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -1,7 +1,10 @@
 // spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
 
 use super::{
-    num_format::{self, Formatter},
+    num_format::{
+        self, Case, FloatVariant, ForceDecimal, Formatter, NumberAlignment, PositiveSign, Prefix,
+        UnsignedIntVariant,
+    },
     FormatArgument, FormatError,
 };
 use std::{fmt::Display, io::Write};
@@ -36,54 +39,6 @@ pub enum Spec {
     },
 }
 
-#[derive(Clone, Copy)]
-pub enum UnsignedIntVariant {
-    Decimal,
-    Octal(Prefix),
-    Hexadecimal(Case, Prefix),
-}
-
-#[derive(Clone, Copy)]
-
-pub enum FloatVariant {
-    Decimal,
-    Scientific,
-    Shortest,
-    Hexadecimal,
-}
-
-#[derive(Clone, Copy, PartialEq, Eq)]
-pub enum Case {
-    Lowercase,
-    Uppercase,
-}
-
-#[derive(Clone, Copy, PartialEq, Eq)]
-pub enum Prefix {
-    No,
-    Yes,
-}
-
-#[derive(Clone, Copy, PartialEq, Eq)]
-pub enum ForceDecimal {
-    No,
-    Yes,
-}
-
-#[derive(Clone, Copy)]
-pub enum PositiveSign {
-    None,
-    Plus,
-    Space,
-}
-
-#[derive(Clone, Copy)]
-pub enum NumberAlignment {
-    Left,
-    RightSpace,
-    RightZero,
-}
-
 /// Precision and width specified might use an asterisk to indicate that they are
 /// determined by an argument.
 #[derive(Clone, Copy)]
@@ -295,7 +250,8 @@ impl Spec {
                     width,
                     positive_sign,
                     alignment,
-                }.fmt(writer, *i)
+                }
+                .fmt(writer, *i)
             }
             &Spec::UnsignedInt {
                 variant,

From ee0e2c042bf93062727cf20356d4ebbfaa018291 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Thu, 9 Nov 2023 16:05:38 +0100
Subject: [PATCH 012/429] dd: use num_format::Float directly instead of printf

---
 src/uu/dd/src/progress.rs | 15 +++++++++++----
 1 file changed, 11 insertions(+), 4 deletions(-)

diff --git a/src/uu/dd/src/progress.rs b/src/uu/dd/src/progress.rs
index 1d9b7247d20..269ae5df463 100644
--- a/src/uu/dd/src/progress.rs
+++ b/src/uu/dd/src/progress.rs
@@ -13,8 +13,10 @@ use std::io::Write;
 use std::sync::mpsc;
 use std::time::Duration;
 
-use uucore::format::sprintf;
-use uucore::{error::UResult, format::FormatArgument};
+use uucore::{
+    error::UResult,
+    format::num_format::{FloatVariant, Formatter},
+};
 
 use crate::numbers::{to_magnitude_and_suffix, SuffixType};
 
@@ -152,8 +154,13 @@ impl ProgUpdate {
         let (carriage_return, newline) = if rewrite { ("\r", "") } else { ("", "\n") };
 
         // The duration should be formatted as in `printf %g`.
-        // TODO: remove unwrap and make FormatError implement UError
-        let duration_str = sprintf("%g", &[FormatArgument::Float(duration)])?;
+        let mut duration_str = Vec::new();
+        uucore::format::num_format::Float {
+            variant: FloatVariant::Shortest,
+            ..Default::default()
+        }
+        .fmt(&mut duration_str, duration)?;
+        // We assume that printf will output valid UTF-8
         let duration_str = std::str::from_utf8(&duration_str).unwrap();
 
         // If the number of bytes written is sufficiently large, then

From 6481d63ea4b8cd768d064e0a6769d7cbd4a2803c Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 13 Nov 2023 15:22:49 +0100
Subject: [PATCH 013/429] uucore/format: implement single specifier formats

---
 src/uu/seq/src/seq.rs                         |  58 ++++++---
 src/uucore/src/lib/features/format/mod.rs     |  72 +++++++++++-
 .../src/lib/features/format/num_format.rs     | 111 ++++++++++++++++--
 src/uucore/src/lib/features/format/spec.rs    |   3 +
 4 files changed, 216 insertions(+), 28 deletions(-)

diff --git a/src/uu/seq/src/seq.rs b/src/uu/seq/src/seq.rs
index 217e9042833..bb4d5414ef8 100644
--- a/src/uu/seq/src/seq.rs
+++ b/src/uu/seq/src/seq.rs
@@ -3,13 +3,13 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 // spell-checker:ignore (ToDO) istr chiter argptr ilen extendedbigdecimal extendedbigint numberparse
-use std::io::{stdout, ErrorKind, Write};
+use std::io::{stdout, Write};
 
 use clap::{crate_version, Arg, ArgAction, Command};
-use num_traits::Zero;
+use num_traits::{Zero, ToPrimitive};
 
 use uucore::error::UResult;
-use uucore::format::{printf, FormatArgument};
+use uucore::format::{printf, FormatArgument, Format, num_format};
 use uucore::{format_usage, help_about, help_usage};
 
 mod error;
@@ -119,16 +119,31 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let result = match (first.number, increment.number, last.number) {
         (Number::Int(first), Number::Int(increment), last) => {
             let last = last.round_towards(&first);
+            let format = match options.format {
+                Some(f) => {
+                    let f = Format::<num_format::SignedInt>::parse(f)?;
+                    Some(f)
+                }
+                None => None,
+            };
             print_seq_integers(
                 (first, increment, last),
                 &options.separator,
                 &options.terminator,
                 options.equal_width,
                 padding,
-                options.format,
+                format,
             )
         }
-        (first, increment, last) => print_seq(
+        (first, increment, last) => {
+            let format = match options.format {
+                Some(f) => {
+                    let f = Format::<num_format::Float>::parse(f)?;
+                    Some(f)
+                }
+                None => None,
+            };
+            print_seq(
             (
                 first.into_extended_big_decimal(),
                 increment.into_extended_big_decimal(),
@@ -139,8 +154,9 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
             &options.terminator,
             options.equal_width,
             padding,
-            options.format,
-        ),
+            format,
+            )
+        }
     };
     match result {
         Ok(_) => Ok(()),
@@ -244,7 +260,7 @@ fn print_seq(
     terminator: &str,
     pad: bool,
     padding: usize,
-    format: Option<&str>,
+    format: Option<Format<num_format::Float>>,
 ) -> UResult<()> {
     let stdout = stdout();
     let mut stdout = stdout.lock();
@@ -268,10 +284,16 @@ fn print_seq(
         // it as a string and ultimately writing to `stdout`. We
         // shouldn't have to do so much converting back and forth via
         // strings.
-        match format {
+        match &format {
             Some(f) => {
-                let s = format!("{value}");
-                printf(f, &[FormatArgument::String(s)])?;
+                let float = match &value {
+                    ExtendedBigDecimal::BigDecimal(bd) => bd.to_f64().unwrap(),
+                    ExtendedBigDecimal::Infinity => f64::INFINITY,
+                    ExtendedBigDecimal::MinusInfinity => f64::NEG_INFINITY,
+                    ExtendedBigDecimal::MinusZero => -0.0,
+                    ExtendedBigDecimal::Nan => f64::NAN,
+                };
+                f.fmt(&mut stdout, float)?;
             }
             None => write_value_float(&mut stdout, &value, padding, largest_dec)?,
         }
@@ -306,7 +328,7 @@ fn print_seq_integers(
     terminator: &str,
     pad: bool,
     padding: usize,
-    format: Option<&str>,
+    format: Option<Format<num_format::SignedInt>>,
 ) -> UResult<()> {
     let stdout = stdout();
     let mut stdout = stdout.lock();
@@ -324,10 +346,16 @@ fn print_seq_integers(
         // the current value and writes the result to `stdout`.
         //
         // TODO See similar comment about formatting in `print_seq()`.
-        match format {
+        match &format {
             Some(f) => {
-                let s = format!("{value}");
-                printf(f, &[FormatArgument::String(s)])?;
+                let int = match &value {
+                    ExtendedBigInt::BigInt(bi) => bi.to_i64().unwrap(),
+                    ExtendedBigInt::Infinity => todo!(),
+                    ExtendedBigInt::MinusInfinity => todo!(),
+                    ExtendedBigInt::MinusZero => todo!(),
+                    ExtendedBigInt::Nan => todo!(),
+                };
+                f.fmt(&mut stdout, int)?;
             }
             None => write_value_int(&mut stdout, &value, padding, pad)?,
         }
diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index d6db5e8c7cd..48151be9892 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -10,8 +10,8 @@
 //! parsing errors occur during writing.
 // spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
 
-mod spec;
 pub mod num_format;
+mod spec;
 
 use spec::Spec;
 use std::{
@@ -22,6 +22,8 @@ use std::{
 
 use crate::error::UError;
 
+use self::num_format::Formatter;
+
 #[derive(Debug)]
 pub enum FormatError {
     SpecError,
@@ -33,6 +35,12 @@ pub enum FormatError {
 impl Error for FormatError {}
 impl UError for FormatError {}
 
+impl From<std::io::Error> for FormatError {
+    fn from(value: std::io::Error) -> Self {
+        FormatError::IoError(value)
+    }
+}
+
 impl Display for FormatError {
     fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
         // TODO: Be more precise about these
@@ -181,3 +189,65 @@ pub fn sprintf<'a>(
     printf_writer(&mut writer, format_string, arguments)?;
     Ok(writer)
 }
+
+/// A parsed format for a single float value
+/// 
+/// This is used by `seq`. It can be constructed with [`FloatFormat::parse`]
+/// and can write a value with [`FloatFormat::fmt`].
+/// 
+/// It can only accept a single specification without any asterisk parameters.
+/// If it does get more specifications, it will return an error.
+pub struct Format<F: Formatter> {
+    prefix: Vec<u8>,
+    suffix: Vec<u8>,
+    formatter: F,
+}
+
+impl<F: Formatter> Format<F> {
+    pub fn parse(format_string: impl AsRef<[u8]>) -> Result<Self, FormatError> {
+        let mut iter = parse_iter(format_string.as_ref());
+
+        let mut prefix = Vec::new();
+        let mut spec = None;
+        for item in &mut iter {
+            match item? {
+                FormatItem::Spec(s) => {
+                    spec = Some(s);
+                    break;
+                }
+                FormatItem::Text(t) => prefix.extend_from_slice(&t),
+                FormatItem::Char(c) => prefix.push(c),
+            }
+        }
+
+        let Some(spec) = spec else {
+            return Err(FormatError::SpecError);
+        };
+
+        let formatter = F::try_from_spec(spec)?;
+
+        let mut suffix = Vec::new();
+        for item in &mut iter {
+            match item? {
+                FormatItem::Spec(_) => {
+                    return Err(FormatError::SpecError);
+                }
+                FormatItem::Text(t) => suffix.extend_from_slice(&t),
+                FormatItem::Char(c) => suffix.push(c),
+            }
+        }
+
+        Ok(Self {
+            prefix,
+            suffix,
+            formatter,
+        })
+    }
+
+    pub fn fmt(&self, mut w: impl Write, f: F::Input) -> std::io::Result<()> {
+        w.write_all(&self.prefix)?;
+        self.formatter.fmt(&mut w, f)?;
+        w.write_all(&self.suffix)?;
+        Ok(())
+    }
+}
diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index 3a27ac200f8..fd010bdc029 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -1,10 +1,16 @@
 use std::io::Write;
 
-use super::FormatError;
+use super::{
+    spec::{CanAsterisk, Spec},
+    FormatError,
+};
 
 pub trait Formatter {
     type Input;
-    fn fmt(&self, writer: impl Write, x: Self::Input) -> Result<(), FormatError>;
+    fn fmt(&self, writer: impl Write, x: Self::Input) -> std::io::Result<()>;
+    fn try_from_spec(s: Spec) -> Result<Self, FormatError>
+    where
+        Self: Sized;
 }
 
 #[derive(Clone, Copy)]
@@ -64,14 +70,13 @@ pub struct SignedInt {
 impl Formatter for SignedInt {
     type Input = i64;
 
-    fn fmt(&self, mut writer: impl Write, x: Self::Input) -> Result<(), FormatError> {
+    fn fmt(&self, mut writer: impl Write, x: Self::Input) -> std::io::Result<()> {
         if x >= 0 {
             match self.positive_sign {
                 PositiveSign::None => Ok(()),
                 PositiveSign::Plus => write!(writer, "+"),
                 PositiveSign::Space => write!(writer, " "),
-            }
-            .map_err(FormatError::IoError)?;
+            }?;
         }
 
         match self.alignment {
@@ -79,7 +84,29 @@ impl Formatter for SignedInt {
             NumberAlignment::RightSpace => write!(writer, "{x:>width$}", width = self.width),
             NumberAlignment::RightZero => write!(writer, "{x:0>width$}", width = self.width),
         }
-        .map_err(FormatError::IoError)
+    }
+
+    fn try_from_spec(s: Spec) -> Result<Self, FormatError> {
+        let Spec::SignedInt {
+            width,
+            positive_sign,
+            alignment,
+        } = s
+        else {
+            return Err(FormatError::SpecError);
+        };
+
+        let width = match width {
+            Some(CanAsterisk::Fixed(x)) => x,
+            None => 0,
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+        };
+
+        Ok(Self {
+            width,
+            positive_sign,
+            alignment,
+        })
     }
 }
 
@@ -92,7 +119,7 @@ pub struct UnsignedInt {
 impl Formatter for UnsignedInt {
     type Input = u64;
 
-    fn fmt(&self, mut writer: impl Write, x: Self::Input) -> Result<(), FormatError> {
+    fn fmt(&self, mut writer: impl Write, x: Self::Input) -> std::io::Result<()> {
         let s = match self.variant {
             UnsignedIntVariant::Decimal => format!("{x}"),
             UnsignedIntVariant::Octal(Prefix::No) => format!("{x:o}"),
@@ -116,7 +143,29 @@ impl Formatter for UnsignedInt {
             NumberAlignment::RightSpace => write!(writer, "{s:>width$}", width = self.width),
             NumberAlignment::RightZero => write!(writer, "{s:0>width$}", width = self.width),
         }
-        .map_err(FormatError::IoError)
+    }
+
+    fn try_from_spec(s: Spec) -> Result<Self, FormatError> {
+        let Spec::UnsignedInt {
+            variant,
+            width,
+            alignment,
+        } = s
+        else {
+            return Err(FormatError::SpecError);
+        };
+
+        let width = match width {
+            Some(CanAsterisk::Fixed(x)) => x,
+            None => 0,
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+        };
+
+        Ok(Self {
+            width,
+            variant,
+            alignment,
+        })
     }
 }
 
@@ -147,14 +196,13 @@ impl Default for Float {
 impl Formatter for Float {
     type Input = f64;
 
-    fn fmt(&self, mut writer: impl Write, x: Self::Input) -> Result<(), FormatError> {
+    fn fmt(&self, mut writer: impl Write, x: Self::Input) -> std::io::Result<()> {
         if x.is_sign_positive() {
             match self.positive_sign {
                 PositiveSign::None => Ok(()),
                 PositiveSign::Plus => write!(writer, "+"),
                 PositiveSign::Space => write!(writer, " "),
-            }
-            .map_err(FormatError::IoError)?;
+            }?;
         }
 
         let s = match self.variant {
@@ -177,7 +225,46 @@ impl Formatter for Float {
             NumberAlignment::RightSpace => write!(writer, "{s:>width$}", width = self.width),
             NumberAlignment::RightZero => write!(writer, "{s:0>width$}", width = self.width),
         }
-        .map_err(FormatError::IoError)
+    }
+
+    fn try_from_spec(s: Spec) -> Result<Self, FormatError>
+    where
+        Self: Sized,
+    {
+        let Spec::Float {
+            variant,
+            case,
+            force_decimal,
+            width,
+            positive_sign,
+            alignment,
+            precision,
+        } = s
+        else {
+            return Err(FormatError::SpecError);
+        };
+
+        let width = match width {
+            Some(CanAsterisk::Fixed(x)) => x,
+            None => 0,
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+        };
+
+        let precision = match precision {
+            Some(CanAsterisk::Fixed(x)) => x,
+            None => 0,
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+        };
+
+        Ok(Self {
+            variant,
+            case,
+            force_decimal,
+            width,
+            positive_sign,
+            alignment,
+            precision,
+        })
     }
 }
 
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index 80896997007..9c53669fa9c 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -252,6 +252,7 @@ impl Spec {
                     alignment,
                 }
                 .fmt(writer, *i)
+                .map_err(FormatError::IoError)
             }
             &Spec::UnsignedInt {
                 variant,
@@ -271,6 +272,7 @@ impl Spec {
                     alignment,
                 }
                 .fmt(writer, *i)
+                .map_err(FormatError::IoError)
             }
             &Spec::Float {
                 variant,
@@ -299,6 +301,7 @@ impl Spec {
                     precision,
                 }
                 .fmt(writer, *f)
+                .map_err(FormatError::IoError)
             }
         }
     }

From c4580df2a4cbb4f1cb4e3124779bde43d7b027f8 Mon Sep 17 00:00:00 2001
From: cswn <claraswanson671@gmail.com>
Date: Tue, 14 Nov 2023 18:07:35 +0100
Subject: [PATCH 014/429] split: remove crash macro

---
 src/uu/split/src/platform/unix.rs | 10 +++++++---
 1 file changed, 7 insertions(+), 3 deletions(-)

diff --git a/src/uu/split/src/platform/unix.rs b/src/uu/split/src/platform/unix.rs
index f4adb818834..c2bf7216b57 100644
--- a/src/uu/split/src/platform/unix.rs
+++ b/src/uu/split/src/platform/unix.rs
@@ -7,9 +7,10 @@ use std::io::Write;
 use std::io::{BufWriter, Error, ErrorKind, Result};
 use std::path::Path;
 use std::process::{Child, Command, Stdio};
-use uucore::crash;
+use uucore::error::USimpleError;
 use uucore::fs;
 use uucore::fs::FileInformation;
+use uucore::show;
 
 /// A writer that writes to a shell_process' stdin
 ///
@@ -101,10 +102,13 @@ impl Drop for FilterWriter {
             .expect("Couldn't wait for child process");
         if let Some(return_code) = exit_status.code() {
             if return_code != 0 {
-                crash!(1, "Shell process returned {}", return_code);
+                show!(USimpleError::new(
+                    1,
+                    format!("Shell process returned {}", return_code)
+                ));
             }
         } else {
-            crash!(1, "Shell process terminated by signal")
+            show!(USimpleError::new(1, "Shell process terminated by signal"));
         }
     }
 }

From e2e5ec60cde2a407a2c8a467c1d0057f312e2276 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Tue, 14 Nov 2023 20:05:36 +0000
Subject: [PATCH 015/429] chore(deps): update rust crate itertools to 0.12.0

---
 Cargo.lock | 4 ++--
 Cargo.toml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index d83adfee600..c89c87df41c 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1122,9 +1122,9 @@ dependencies = [
 
 [[package]]
 name = "itertools"
-version = "0.11.0"
+version = "0.12.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "b1c173a5686ce8bfa551b3563d0c2170bf24ca44da99c7ca4bfdab5418c3fe57"
+checksum = "25db6b064527c5d482d0423354fcd07a89a2dfe07b67892e62411946db7f07b0"
 dependencies = [
  "either",
 ]
diff --git a/Cargo.toml b/Cargo.toml
index f313e2b03e4..2f3af2c83d1 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -285,7 +285,7 @@ gcd = "2.3"
 glob = "0.3.1"
 half = "2.3"
 indicatif = "0.17"
-itertools = "0.11.0"
+itertools = "0.12.0"
 libc = "0.2.150"
 lscolors = { version = "0.15.0", default-features = false, features = [
   "nu-ansi-term",

From 6446ef294c1ec0dc9ab9450d659e51dc4b30526f Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Tue, 14 Nov 2023 20:44:19 +0100
Subject: [PATCH 016/429] publishing: check if the current version is already
 there or not

This can happen when a publishing step failed
---
 util/publish.sh | 32 ++++++++++++++++++++++++++++++--
 1 file changed, 30 insertions(+), 2 deletions(-)

diff --git a/util/publish.sh b/util/publish.sh
index 71830f1f915..7207ba7fb91 100755
--- a/util/publish.sh
+++ b/util/publish.sh
@@ -5,6 +5,22 @@ if test "$1" != "--do-it"; then
     ARG="--dry-run --allow-dirty"
 fi
 
+# Function to check if the crate is already published
+is_already_published() {
+    local crate_name=$1
+    local crate_version=$2
+
+    # Use the crates.io API to get the latest version of the crate
+    local latest_published_version
+    latest_published_version=$(curl -s https://crates.io/api/v1/crates/$crate_name | jq -r '.crate.max_version')
+
+    if [ "$latest_published_version" = "$crate_version" ]; then
+        return 0
+    else
+        return 1
+    fi
+}
+
 # Figure out any dependencies between the util via Cargo.toml
 # We store this as edges in a graph with each line:
 # [dependent] [dependency]
@@ -35,12 +51,19 @@ TOTAL_ORDER=$(echo -e $PARTIAL_ORDER | tsort | tac)
 # Remove the ROOT node from the start
 TOTAL_ORDER=${TOTAL_ORDER#ROOT}
 
+CRATE_VERSION=$(grep '^version' Cargo.toml | head -n1 | cut -d '"' -f2)
+
 set -e
 for dir in src/uuhelp_parser/ src/uucore_procs/ src/uucore/ src/uu/stdbuf/src/libstdbuf/; do
     (
         cd "$dir"
+        CRATE_NAME=$(grep '^name =' "Cargo.toml" | head -n1 | cut -d '"' -f2)
         #shellcheck disable=SC2086
-        cargo publish $ARG
+        if ! is_already_published "$CRATE_NAME" "$CRATE_VERSION"; then
+            cargo publish $ARG
+        else
+            echo "Skip: $CRATE_NAME $CRATE_VERSION already published"
+        fi
     )
     sleep 2s
 done
@@ -48,8 +71,13 @@ done
 for p in $TOTAL_ORDER; do
     (
         cd "src/uu/$p"
+        CRATE_NAME=$(grep '^name =' "Cargo.toml" | head -n1 | cut -d '"' -f2)
         #shellcheck disable=SC2086
-        cargo publish $ARG
+        if ! is_already_published "$CRATE_NAME" "$CRATE_VERSION"; then
+            cargo publish $ARG
+        else
+            echo "Skip: $CRATE_NAME $CRATE_VERSION already published"
+        fi
     )
 done
 

From 3f86bc59de6f8c6dbb73faaa81d3ad3fa40c01e7 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 15 Nov 2023 08:31:47 +0100
Subject: [PATCH 017/429] add missing features to uucore

---
 src/uu/dd/Cargo.toml     | 2 +-
 src/uu/printf/Cargo.toml | 2 +-
 src/uu/seq/Cargo.toml    | 2 +-
 3 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/uu/dd/Cargo.toml b/src/uu/dd/Cargo.toml
index 7db05b422f3..d654d829736 100644
--- a/src/uu/dd/Cargo.toml
+++ b/src/uu/dd/Cargo.toml
@@ -18,7 +18,7 @@ path = "src/dd.rs"
 clap = { workspace = true }
 gcd = { workspace = true }
 libc = { workspace = true }
-uucore = { workspace = true, features = ["memo"] }
+uucore = { workspace = true, features = ["memo", "quoting-style"] }
 
 [target.'cfg(any(target_os = "linux"))'.dependencies]
 nix = { workspace = true, features = ["fs"] }
diff --git a/src/uu/printf/Cargo.toml b/src/uu/printf/Cargo.toml
index 1cb05ec09b0..f36eff35e8c 100644
--- a/src/uu/printf/Cargo.toml
+++ b/src/uu/printf/Cargo.toml
@@ -16,7 +16,7 @@ path = "src/printf.rs"
 
 [dependencies]
 clap = { workspace = true }
-uucore = { workspace = true, features = ["memo"] }
+uucore = { workspace = true, features = ["memo", "quoting-style"] }
 
 [[bin]]
 name = "printf"
diff --git a/src/uu/seq/Cargo.toml b/src/uu/seq/Cargo.toml
index 95f761696c2..d4e7cd316c6 100644
--- a/src/uu/seq/Cargo.toml
+++ b/src/uu/seq/Cargo.toml
@@ -20,7 +20,7 @@ bigdecimal = { workspace = true }
 clap = { workspace = true }
 num-bigint = { workspace = true }
 num-traits = { workspace = true }
-uucore = { workspace = true, features = ["memo"] }
+uucore = { workspace = true, features = ["memo", "quoting-style"] }
 
 [[bin]]
 name = "seq"

From 3f177ef97fc4e6f7a17f7565761732d89847fe72 Mon Sep 17 00:00:00 2001
From: "Y.D.X" <73375426+YDX-2147483647@users.noreply.github.com>
Date: Wed, 15 Nov 2023 19:09:46 +0800
Subject: [PATCH 018/429] doc: Fix the markdown highlighting syntax
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

There should be a new line after `[!WARNING]`, according to [community · Discussion #16925](https://github.com/orgs/community/discussions/16925).
---
 CONTRIBUTING.md | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 255ed2c53e3..b10d3d11472 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -14,7 +14,8 @@ check out these documents:
 
 Now follows a very important warning:
 
-> [!WARNING] uutils is original code and cannot contain any code from GNU or
+> [!WARNING]
+> uutils is original code and cannot contain any code from GNU or
 > other implementations. This means that **we cannot accept any changes based on
 > the GNU source code**. To make sure that cannot happen, **you cannot link to
 > the GNU source code** either.

From 94f6702ba52a875d251e869eba55583e61da9ad1 Mon Sep 17 00:00:00 2001
From: cswn <claraswanson671@gmail.com>
Date: Wed, 15 Nov 2023 13:20:22 +0100
Subject: [PATCH 019/429] join: remove crash! macro

---
 src/uu/join/src/join.rs | 20 +++++++++++++-------
 1 file changed, 13 insertions(+), 7 deletions(-)

diff --git a/src/uu/join/src/join.rs b/src/uu/join/src/join.rs
index a48ba3657bd..3f2172da33e 100644
--- a/src/uu/join/src/join.rs
+++ b/src/uu/join/src/join.rs
@@ -21,7 +21,7 @@ use std::os::unix::ffi::OsStrExt;
 use uucore::display::Quotable;
 use uucore::error::{set_exit_code, UError, UResult, USimpleError};
 use uucore::line_ending::LineEnding;
-use uucore::{crash, crash_if_err, format_usage, help_about, help_usage};
+use uucore::{crash_if_err, format_usage, help_about, help_usage};
 
 const ABOUT: &str = help_about!("join.md");
 const USAGE: &str = help_usage!("join.md");
@@ -334,17 +334,23 @@ impl<'a> State<'a> {
         key: usize,
         line_ending: LineEnding,
         print_unpaired: bool,
-    ) -> State<'a> {
+    ) -> Result<State<'a>, JoinError> {
         let f = if name == "-" {
             Box::new(stdin.lock()) as Box<dyn BufRead>
         } else {
             match File::open(name) {
                 Ok(file) => Box::new(BufReader::new(file)) as Box<dyn BufRead>,
-                Err(err) => crash!(1, "{}: {}", name.maybe_quote(), err),
+                Err(err) => {
+                    return Err(JoinError::UnorderedInput(format!(
+                        "{}: {}",
+                        name.maybe_quote(),
+                        err
+                    )));
+                }
             }
         };
 
-        State {
+        Ok(State {
             key,
             file_name: name,
             file_num,
@@ -355,7 +361,7 @@ impl<'a> State<'a> {
             line_num: 0,
             has_failed: false,
             has_unpaired: false,
-        }
+        })
     }
 
     /// Skip the current unpaired line.
@@ -847,7 +853,7 @@ fn exec(file1: &str, file2: &str, settings: Settings) -> Result<(), JoinError> {
         settings.key1,
         settings.line_ending,
         settings.print_unpaired1,
-    );
+    )?;
 
     let mut state2 = State::new(
         FileNum::File2,
@@ -856,7 +862,7 @@ fn exec(file1: &str, file2: &str, settings: Settings) -> Result<(), JoinError> {
         settings.key2,
         settings.line_ending,
         settings.print_unpaired2,
-    );
+    )?;
 
     let input = Input::new(
         settings.separator,

From 5dff5f2f736c44c576adce2dbcbe8275d52ebbd2 Mon Sep 17 00:00:00 2001
From: cswn <claraswanson671@gmail.com>
Date: Wed, 15 Nov 2023 13:52:01 +0100
Subject: [PATCH 020/429] join: rename f variable to file_buf

---
 src/uu/join/src/join.rs | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/uu/join/src/join.rs b/src/uu/join/src/join.rs
index 3f2172da33e..c8008c91c61 100644
--- a/src/uu/join/src/join.rs
+++ b/src/uu/join/src/join.rs
@@ -335,7 +335,7 @@ impl<'a> State<'a> {
         line_ending: LineEnding,
         print_unpaired: bool,
     ) -> Result<State<'a>, JoinError> {
-        let f = if name == "-" {
+        let file_buf = if name == "-" {
             Box::new(stdin.lock()) as Box<dyn BufRead>
         } else {
             match File::open(name) {
@@ -355,7 +355,7 @@ impl<'a> State<'a> {
             file_name: name,
             file_num,
             print_unpaired,
-            lines: f.split(line_ending as u8),
+            lines: file_buf.split(line_ending as u8),
             max_len: 1,
             seq: Vec::new(),
             line_num: 0,

From b3eae16faddf03e5ce83047f244a510932970565 Mon Sep 17 00:00:00 2001
From: ALXD <github@alxd.org>
Date: Wed, 15 Nov 2023 17:40:54 +0100
Subject: [PATCH 021/429] printf: intf: change warning and exit code

---
 .../features/tokenize/num_format/formatters/intf.rs    | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/src/uucore/src/lib/features/tokenize/num_format/formatters/intf.rs b/src/uucore/src/lib/features/tokenize/num_format/formatters/intf.rs
index 11070113c26..767c0c4bb67 100644
--- a/src/uucore/src/lib/features/tokenize/num_format/formatters/intf.rs
+++ b/src/uucore/src/lib/features/tokenize/num_format/formatters/intf.rs
@@ -8,10 +8,11 @@
 //! formatter for unsigned and signed int subs
 //! unsigned int: %X %x (hex u64) %o (octal u64) %u (base ten u64)
 //! signed int: %i %d (both base ten i64)
+use crate::error::set_exit_code;
+use crate::features::tokenize::num_format::num_format::warn_expected_numeric;
+
 use super::super::format_field::FormatField;
-use super::super::formatter::{
-    get_it_at, warn_incomplete_conv, Base, FormatPrimitive, Formatter, InitialPrefix,
-};
+use super::super::formatter::{get_it_at, Base, FormatPrimitive, Formatter, InitialPrefix};
 use std::i64;
 use std::u64;
 
@@ -112,7 +113,8 @@ impl Intf {
                         }
                     }
                     _ => {
-                        warn_incomplete_conv(str_in);
+                        warn_expected_numeric(str_in);
+                        set_exit_code(1);
                         break;
                     }
                 }

From 3cdb0966ae1b86724be8f7b6db2b6f41472169fc Mon Sep 17 00:00:00 2001
From: ALXD <github@alxd.org>
Date: Wed, 15 Nov 2023 17:46:58 +0100
Subject: [PATCH 022/429] printf: add a test for %x with invalid value

---
 tests/by-util/test_printf.rs | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/tests/by-util/test_printf.rs b/tests/by-util/test_printf.rs
index a297dbf6833..ab3505a327b 100644
--- a/tests/by-util/test_printf.rs
+++ b/tests/by-util/test_printf.rs
@@ -258,6 +258,14 @@ fn sub_num_hex_upper() {
         .stdout_only("thirty in hex is 1E");
 }
 
+#[test]
+fn sub_num_hex_non_numerical() {
+    new_ucmd!()
+        .args(&["parameters need to be numbers %X", "%194"])
+        .fails()
+        .code_is(1);
+}
+
 #[test]
 fn sub_num_float() {
     new_ucmd!()

From 212991cd53cba8be58e877ab5b17ea86eb46f20e Mon Sep 17 00:00:00 2001
From: "Y.D.X." <73375426+YDX-2147483647@users.noreply.github.com>
Date: Thu, 16 Nov 2023 12:26:40 +0800
Subject: [PATCH 023/429] doc: Fix a broken link
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`/build.md` is absolute, so the link in https://uutils.github.io/coreutils/book/installation.html turns out to be https://uutils.github.io/build.html instead of https://uutils.github.io/coreutils/book/build.html.

Reference: [Links · Markdown - mdBook Documentation](https://rust-lang.github.io/mdBook/format/markdown.html#links)
---
 docs/src/installation.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/src/installation.md b/docs/src/installation.md
index da124ead977..54b1e23f3f6 100644
--- a/docs/src/installation.md
+++ b/docs/src/installation.md
@@ -6,7 +6,7 @@ This is a list of uutils packages in various distributions and package managers.
 Note that these are packaged by third-parties and the packages might contain
 patches.
 
-You can also [build uutils from source](/build.md).
+You can also [build uutils from source](build.md).
 
 <!-- toc -->
 

From a064c886566f810c3e58b1b1153762e772e35567 Mon Sep 17 00:00:00 2001
From: cswn <claraswanson671@gmail.com>
Date: Thu, 16 Nov 2023 09:35:32 +0100
Subject: [PATCH 024/429] join: replace match with JoinError with
 map_err_context

---
 src/uu/join/src/join.rs | 34 ++++++++--------------------------
 1 file changed, 8 insertions(+), 26 deletions(-)

diff --git a/src/uu/join/src/join.rs b/src/uu/join/src/join.rs
index c8008c91c61..9661138879b 100644
--- a/src/uu/join/src/join.rs
+++ b/src/uu/join/src/join.rs
@@ -19,7 +19,7 @@ use std::num::IntErrorKind;
 #[cfg(unix)]
 use std::os::unix::ffi::OsStrExt;
 use uucore::display::Quotable;
-use uucore::error::{set_exit_code, UError, UResult, USimpleError};
+use uucore::error::{set_exit_code, FromIo, UError, UResult, USimpleError};
 use uucore::line_ending::LineEnding;
 use uucore::{crash_if_err, format_usage, help_about, help_usage};
 
@@ -334,20 +334,12 @@ impl<'a> State<'a> {
         key: usize,
         line_ending: LineEnding,
         print_unpaired: bool,
-    ) -> Result<State<'a>, JoinError> {
+    ) -> UResult<State<'a>> {
         let file_buf = if name == "-" {
             Box::new(stdin.lock()) as Box<dyn BufRead>
         } else {
-            match File::open(name) {
-                Ok(file) => Box::new(BufReader::new(file)) as Box<dyn BufRead>,
-                Err(err) => {
-                    return Err(JoinError::UnorderedInput(format!(
-                        "{}: {}",
-                        name.maybe_quote(),
-                        err
-                    )));
-                }
-            }
+            let file = File::open(name).map_err_context(|| format!("{}", name.maybe_quote()))?;
+            Box::new(BufReader::new(file)) as Box<dyn BufRead>
         };
 
         Ok(State {
@@ -365,12 +357,7 @@ impl<'a> State<'a> {
     }
 
     /// Skip the current unpaired line.
-    fn skip_line(
-        &mut self,
-        writer: &mut impl Write,
-        input: &Input,
-        repr: &Repr,
-    ) -> Result<(), JoinError> {
+    fn skip_line(&mut self, writer: &mut impl Write, input: &Input, repr: &Repr) -> UResult<()> {
         if self.print_unpaired {
             self.print_first_line(writer, repr)?;
         }
@@ -381,7 +368,7 @@ impl<'a> State<'a> {
 
     /// Keep reading line sequence until the key does not change, return
     /// the first line whose key differs.
-    fn extend(&mut self, input: &Input) -> Result<Option<Line>, JoinError> {
+    fn extend(&mut self, input: &Input) -> UResult<Option<Line>> {
         while let Some(line) = self.next_line(input)? {
             let diff = input.compare(self.get_current_key(), line.get_field(self.key));
 
@@ -490,12 +477,7 @@ impl<'a> State<'a> {
         0
     }
 
-    fn finalize(
-        &mut self,
-        writer: &mut impl Write,
-        input: &Input,
-        repr: &Repr,
-    ) -> Result<(), JoinError> {
+    fn finalize(&mut self, writer: &mut impl Write, input: &Input, repr: &Repr) -> UResult<()> {
         if self.has_line() {
             if self.print_unpaired {
                 self.print_first_line(writer, repr)?;
@@ -843,7 +825,7 @@ FILENUM is 1 or 2, corresponding to FILE1 or FILE2",
         )
 }
 
-fn exec(file1: &str, file2: &str, settings: Settings) -> Result<(), JoinError> {
+fn exec(file1: &str, file2: &str, settings: Settings) -> UResult<()> {
     let stdin = stdin();
 
     let mut state1 = State::new(

From 7ff4cb3f4e236724d8bdf0d3a83258cd5daeb228 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 16 Nov 2023 10:40:31 +0100
Subject: [PATCH 025/429] update of the license file to make it generic (#5545)

---
 LICENSE | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/LICENSE b/LICENSE
index 49fdbd4cf5f..21bd44404e3 100644
--- a/LICENSE
+++ b/LICENSE
@@ -1,4 +1,4 @@
-Copyright (c) Jordi Boggiano and many others
+Copyright (c) uutils developers
 
 Permission is hereby granted, free of charge, to any person obtaining a copy of
 this software and associated documentation files (the "Software"), to deal in

From 65dc70b55396c3a00b70143fc84cc7d96cc25539 Mon Sep 17 00:00:00 2001
From: cswn <claraswanson671@gmail.com>
Date: Thu, 16 Nov 2023 12:02:39 +0100
Subject: [PATCH 026/429] join: remove match in uumain and return exec result

---
 src/uu/join/src/join.rs | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/src/uu/join/src/join.rs b/src/uu/join/src/join.rs
index 9661138879b..423af983ec9 100644
--- a/src/uu/join/src/join.rs
+++ b/src/uu/join/src/join.rs
@@ -701,10 +701,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         return Err(USimpleError::new(1, "both files cannot be standard input"));
     }
 
-    match exec(file1, file2, settings) {
-        Ok(_) => Ok(()),
-        Err(e) => Err(USimpleError::new(1, format!("{e}"))),
-    }
+    exec(file1, file2, settings)
 }
 
 pub fn uu_app() -> Command {

From e7d58f673ff9515af11169cd92b6b341d6e8c13f Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 13 Nov 2023 17:37:25 +0100
Subject: [PATCH 027/429] seq: simplify and use new printf implementation

---
 src/uu/seq/src/extendedbigdecimal.rs          |  54 +----
 src/uu/seq/src/extendedbigint.rs              | 214 ------------------
 src/uu/seq/src/number.rs                      |  70 +-----
 src/uu/seq/src/numberparse.rs                 | 127 ++++-------
 src/uu/seq/src/seq.rs                         | 167 +++-----------
 src/uucore/src/lib/features/format/mod.rs     |   4 +-
 .../src/lib/features/format/num_format.rs     |  24 +-
 src/uucore/src/lib/features/format/spec.rs    |  13 +-
 8 files changed, 104 insertions(+), 569 deletions(-)
 delete mode 100644 src/uu/seq/src/extendedbigint.rs

diff --git a/src/uu/seq/src/extendedbigdecimal.rs b/src/uu/seq/src/extendedbigdecimal.rs
index 388046ba368..ecd460ceb73 100644
--- a/src/uu/seq/src/extendedbigdecimal.rs
+++ b/src/uu/seq/src/extendedbigdecimal.rs
@@ -25,13 +25,8 @@ use std::fmt::Display;
 use std::ops::Add;
 
 use bigdecimal::BigDecimal;
-use num_bigint::BigInt;
-use num_bigint::ToBigInt;
-use num_traits::One;
 use num_traits::Zero;
 
-use crate::extendedbigint::ExtendedBigInt;
-
 #[derive(Debug, Clone)]
 pub enum ExtendedBigDecimal {
     /// Arbitrary precision floating point number.
@@ -72,53 +67,14 @@ pub enum ExtendedBigDecimal {
     Nan,
 }
 
-/// The smallest integer greater than or equal to this number.
-fn ceil(x: BigDecimal) -> BigInt {
-    if x.is_integer() {
-        // Unwrapping the Option because it always returns Some
-        x.to_bigint().unwrap()
-    } else {
-        (x + BigDecimal::one().half()).round(0).to_bigint().unwrap()
-    }
-}
-
-/// The largest integer less than or equal to this number.
-fn floor(x: BigDecimal) -> BigInt {
-    if x.is_integer() {
-        // Unwrapping the Option because it always returns Some
-        x.to_bigint().unwrap()
-    } else {
-        (x - BigDecimal::one().half()).round(0).to_bigint().unwrap()
-    }
-}
-
 impl ExtendedBigDecimal {
-    /// The smallest integer greater than or equal to this number.
-    pub fn ceil(self) -> ExtendedBigInt {
-        match self {
-            Self::BigDecimal(x) => ExtendedBigInt::BigInt(ceil(x)),
-            other => From::from(other),
-        }
+    #[cfg(test)]
+    pub fn zero() -> Self {
+        Self::BigDecimal(1.into())
     }
 
-    /// The largest integer less than or equal to this number.
-    pub fn floor(self) -> ExtendedBigInt {
-        match self {
-            Self::BigDecimal(x) => ExtendedBigInt::BigInt(floor(x)),
-            other => From::from(other),
-        }
-    }
-}
-
-impl From<ExtendedBigInt> for ExtendedBigDecimal {
-    fn from(big_int: ExtendedBigInt) -> Self {
-        match big_int {
-            ExtendedBigInt::BigInt(n) => Self::BigDecimal(BigDecimal::from(n)),
-            ExtendedBigInt::Infinity => Self::Infinity,
-            ExtendedBigInt::MinusInfinity => Self::MinusInfinity,
-            ExtendedBigInt::MinusZero => Self::MinusZero,
-            ExtendedBigInt::Nan => Self::Nan,
-        }
+    pub fn one() -> Self {
+        Self::BigDecimal(1.into())
     }
 }
 
diff --git a/src/uu/seq/src/extendedbigint.rs b/src/uu/seq/src/extendedbigint.rs
deleted file mode 100644
index 6828fba2df2..00000000000
--- a/src/uu/seq/src/extendedbigint.rs
+++ /dev/null
@@ -1,214 +0,0 @@
-// This file is part of the uutils coreutils package.
-//
-// For the full copyright and license information, please view the LICENSE
-// file that was distributed with this source code.
-// spell-checker:ignore bigint extendedbigint extendedbigdecimal
-//! An arbitrary precision integer that can also represent infinity, NaN, etc.
-//!
-//! Usually infinity, NaN, and negative zero are only represented for
-//! floating point numbers. The [`ExtendedBigInt`] enumeration provides
-//! a representation of those things with the set of integers. The
-//! finite values are stored as [`BigInt`] instances.
-//!
-//! # Examples
-//!
-//! Addition works for [`ExtendedBigInt`] as it does for floats. For
-//! example, adding infinity to any finite value results in infinity:
-//!
-//! ```rust,ignore
-//! let summand1 = ExtendedBigInt::BigInt(BigInt::zero());
-//! let summand2 = ExtendedBigInt::Infinity;
-//! assert_eq!(summand1 + summand2, ExtendedBigInt::Infinity);
-//! ```
-use std::cmp::Ordering;
-use std::fmt::Display;
-use std::ops::Add;
-
-use num_bigint::BigInt;
-use num_bigint::ToBigInt;
-use num_traits::One;
-use num_traits::Zero;
-
-use crate::extendedbigdecimal::ExtendedBigDecimal;
-
-#[derive(Debug, Clone)]
-pub enum ExtendedBigInt {
-    BigInt(BigInt),
-    Infinity,
-    MinusInfinity,
-    MinusZero,
-    Nan,
-}
-
-impl ExtendedBigInt {
-    /// The integer number one.
-    pub fn one() -> Self {
-        // We would like to implement `num_traits::One`, but it requires
-        // a multiplication implementation, and we don't want to
-        // implement that here.
-        Self::BigInt(BigInt::one())
-    }
-}
-
-impl From<ExtendedBigDecimal> for ExtendedBigInt {
-    fn from(big_decimal: ExtendedBigDecimal) -> Self {
-        match big_decimal {
-            // TODO When can this fail?
-            ExtendedBigDecimal::BigDecimal(x) => Self::BigInt(x.to_bigint().unwrap()),
-            ExtendedBigDecimal::Infinity => Self::Infinity,
-            ExtendedBigDecimal::MinusInfinity => Self::MinusInfinity,
-            ExtendedBigDecimal::MinusZero => Self::MinusZero,
-            ExtendedBigDecimal::Nan => Self::Nan,
-        }
-    }
-}
-
-impl Display for ExtendedBigInt {
-    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
-        match self {
-            Self::BigInt(n) => n.fmt(f),
-            Self::Infinity => f32::INFINITY.fmt(f),
-            Self::MinusInfinity => f32::NEG_INFINITY.fmt(f),
-            Self::MinusZero => "-0".fmt(f),
-            Self::Nan => "nan".fmt(f),
-        }
-    }
-}
-
-impl Zero for ExtendedBigInt {
-    fn zero() -> Self {
-        Self::BigInt(BigInt::zero())
-    }
-    fn is_zero(&self) -> bool {
-        match self {
-            Self::BigInt(n) => n.is_zero(),
-            Self::MinusZero => true,
-            _ => false,
-        }
-    }
-}
-
-impl Add for ExtendedBigInt {
-    type Output = Self;
-
-    fn add(self, other: Self) -> Self {
-        match (self, other) {
-            (Self::BigInt(m), Self::BigInt(n)) => Self::BigInt(m.add(n)),
-            (Self::BigInt(_), Self::MinusInfinity) => Self::MinusInfinity,
-            (Self::BigInt(_), Self::Infinity) => Self::Infinity,
-            (Self::BigInt(_), Self::Nan) => Self::Nan,
-            (Self::BigInt(m), Self::MinusZero) => Self::BigInt(m),
-            (Self::Infinity, Self::BigInt(_)) => Self::Infinity,
-            (Self::Infinity, Self::Infinity) => Self::Infinity,
-            (Self::Infinity, Self::MinusZero) => Self::Infinity,
-            (Self::Infinity, Self::MinusInfinity) => Self::Nan,
-            (Self::Infinity, Self::Nan) => Self::Nan,
-            (Self::MinusInfinity, Self::BigInt(_)) => Self::MinusInfinity,
-            (Self::MinusInfinity, Self::MinusInfinity) => Self::MinusInfinity,
-            (Self::MinusInfinity, Self::MinusZero) => Self::MinusInfinity,
-            (Self::MinusInfinity, Self::Infinity) => Self::Nan,
-            (Self::MinusInfinity, Self::Nan) => Self::Nan,
-            (Self::Nan, _) => Self::Nan,
-            (Self::MinusZero, other) => other,
-        }
-    }
-}
-
-impl PartialEq for ExtendedBigInt {
-    fn eq(&self, other: &Self) -> bool {
-        match (self, other) {
-            (Self::BigInt(m), Self::BigInt(n)) => m.eq(n),
-            (Self::BigInt(_), Self::MinusInfinity) => false,
-            (Self::BigInt(_), Self::Infinity) => false,
-            (Self::BigInt(_), Self::Nan) => false,
-            (Self::BigInt(_), Self::MinusZero) => false,
-            (Self::Infinity, Self::BigInt(_)) => false,
-            (Self::Infinity, Self::Infinity) => true,
-            (Self::Infinity, Self::MinusZero) => false,
-            (Self::Infinity, Self::MinusInfinity) => false,
-            (Self::Infinity, Self::Nan) => false,
-            (Self::MinusInfinity, Self::BigInt(_)) => false,
-            (Self::MinusInfinity, Self::Infinity) => false,
-            (Self::MinusInfinity, Self::MinusZero) => false,
-            (Self::MinusInfinity, Self::MinusInfinity) => true,
-            (Self::MinusInfinity, Self::Nan) => false,
-            (Self::Nan, _) => false,
-            (Self::MinusZero, Self::BigInt(_)) => false,
-            (Self::MinusZero, Self::Infinity) => false,
-            (Self::MinusZero, Self::MinusZero) => true,
-            (Self::MinusZero, Self::MinusInfinity) => false,
-            (Self::MinusZero, Self::Nan) => false,
-        }
-    }
-}
-
-impl PartialOrd for ExtendedBigInt {
-    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
-        match (self, other) {
-            (Self::BigInt(m), Self::BigInt(n)) => m.partial_cmp(n),
-            (Self::BigInt(_), Self::MinusInfinity) => Some(Ordering::Greater),
-            (Self::BigInt(_), Self::Infinity) => Some(Ordering::Less),
-            (Self::BigInt(_), Self::Nan) => None,
-            (Self::BigInt(m), Self::MinusZero) => m.partial_cmp(&BigInt::zero()),
-            (Self::Infinity, Self::BigInt(_)) => Some(Ordering::Greater),
-            (Self::Infinity, Self::Infinity) => Some(Ordering::Equal),
-            (Self::Infinity, Self::MinusZero) => Some(Ordering::Greater),
-            (Self::Infinity, Self::MinusInfinity) => Some(Ordering::Greater),
-            (Self::Infinity, Self::Nan) => None,
-            (Self::MinusInfinity, Self::BigInt(_)) => Some(Ordering::Less),
-            (Self::MinusInfinity, Self::Infinity) => Some(Ordering::Less),
-            (Self::MinusInfinity, Self::MinusZero) => Some(Ordering::Less),
-            (Self::MinusInfinity, Self::MinusInfinity) => Some(Ordering::Equal),
-            (Self::MinusInfinity, Self::Nan) => None,
-            (Self::Nan, _) => None,
-            (Self::MinusZero, Self::BigInt(n)) => BigInt::zero().partial_cmp(n),
-            (Self::MinusZero, Self::Infinity) => Some(Ordering::Less),
-            (Self::MinusZero, Self::MinusZero) => Some(Ordering::Equal),
-            (Self::MinusZero, Self::MinusInfinity) => Some(Ordering::Greater),
-            (Self::MinusZero, Self::Nan) => None,
-        }
-    }
-}
-
-#[cfg(test)]
-mod tests {
-
-    use num_bigint::BigInt;
-    use num_traits::Zero;
-
-    use crate::extendedbigint::ExtendedBigInt;
-
-    #[test]
-    fn test_addition_infinity() {
-        let summand1 = ExtendedBigInt::BigInt(BigInt::zero());
-        let summand2 = ExtendedBigInt::Infinity;
-        assert_eq!(summand1 + summand2, ExtendedBigInt::Infinity);
-    }
-
-    #[test]
-    fn test_addition_minus_infinity() {
-        let summand1 = ExtendedBigInt::BigInt(BigInt::zero());
-        let summand2 = ExtendedBigInt::MinusInfinity;
-        assert_eq!(summand1 + summand2, ExtendedBigInt::MinusInfinity);
-    }
-
-    #[test]
-    fn test_addition_nan() {
-        let summand1 = ExtendedBigInt::BigInt(BigInt::zero());
-        let summand2 = ExtendedBigInt::Nan;
-        let sum = summand1 + summand2;
-        match sum {
-            ExtendedBigInt::Nan => (),
-            _ => unreachable!(),
-        }
-    }
-
-    #[test]
-    fn test_display() {
-        assert_eq!(format!("{}", ExtendedBigInt::BigInt(BigInt::zero())), "0");
-        assert_eq!(format!("{}", ExtendedBigInt::MinusZero), "-0");
-        assert_eq!(format!("{}", ExtendedBigInt::Infinity), "inf");
-        assert_eq!(format!("{}", ExtendedBigInt::MinusInfinity), "-inf");
-        assert_eq!(format!("{}", ExtendedBigInt::Nan), "nan");
-    }
-}
diff --git a/src/uu/seq/src/number.rs b/src/uu/seq/src/number.rs
index 85bc327ff46..4da1146eff6 100644
--- a/src/uu/seq/src/number.rs
+++ b/src/uu/seq/src/number.rs
@@ -12,70 +12,6 @@
 use num_traits::Zero;
 
 use crate::extendedbigdecimal::ExtendedBigDecimal;
-use crate::extendedbigint::ExtendedBigInt;
-
-/// An integral or floating point number.
-#[derive(Debug, PartialEq)]
-pub enum Number {
-    Int(ExtendedBigInt),
-    Float(ExtendedBigDecimal),
-}
-
-impl Number {
-    /// Decide whether this number is zero (either positive or negative).
-    pub fn is_zero(&self) -> bool {
-        // We would like to implement `num_traits::Zero`, but it
-        // requires an addition implementation, and we don't want to
-        // implement that here.
-        match self {
-            Self::Int(n) => n.is_zero(),
-            Self::Float(x) => x.is_zero(),
-        }
-    }
-
-    /// Convert this number into an `ExtendedBigDecimal`.
-    pub fn into_extended_big_decimal(self) -> ExtendedBigDecimal {
-        match self {
-            Self::Int(n) => ExtendedBigDecimal::from(n),
-            Self::Float(x) => x,
-        }
-    }
-
-    /// The integer number one.
-    pub fn one() -> Self {
-        // We would like to implement `num_traits::One`, but it requires
-        // a multiplication implementation, and we don't want to
-        // implement that here.
-        Self::Int(ExtendedBigInt::one())
-    }
-
-    /// Round this number towards the given other number.
-    ///
-    /// If `other` is greater, then round up. If `other` is smaller,
-    /// then round down.
-    pub fn round_towards(self, other: &ExtendedBigInt) -> ExtendedBigInt {
-        match self {
-            // If this number is already an integer, it is already
-            // rounded to the nearest integer in the direction of
-            // `other`.
-            Self::Int(num) => num,
-            // Otherwise, if this number is a float, we need to decide
-            // whether `other` is larger or smaller than it, and thus
-            // whether to round up or round down, respectively.
-            Self::Float(num) => {
-                let other: ExtendedBigDecimal = From::from(other.clone());
-                if other > num {
-                    num.ceil()
-                } else {
-                    // If they are equal, then `self` is already an
-                    // integer, so calling `floor()` does no harm and
-                    // will just return that integer anyway.
-                    num.floor()
-                }
-            }
-        }
-    }
-}
 
 /// A number with a specified number of integer and fractional digits.
 ///
@@ -87,13 +23,13 @@ impl Number {
 /// You can get an instance of this struct by calling [`str::parse`].
 #[derive(Debug)]
 pub struct PreciseNumber {
-    pub number: Number,
+    pub number: ExtendedBigDecimal,
     pub num_integral_digits: usize,
     pub num_fractional_digits: usize,
 }
 
 impl PreciseNumber {
-    pub fn new(number: Number, num_integral_digits: usize, num_fractional_digits: usize) -> Self {
+    pub fn new(number: ExtendedBigDecimal, num_integral_digits: usize, num_fractional_digits: usize) -> Self {
         Self {
             number,
             num_integral_digits,
@@ -106,7 +42,7 @@ impl PreciseNumber {
         // We would like to implement `num_traits::One`, but it requires
         // a multiplication implementation, and we don't want to
         // implement that here.
-        Self::new(Number::one(), 1, 0)
+        Self::new(ExtendedBigDecimal::one(), 1, 0)
     }
 
     /// Decide whether this number is zero (either positive or negative).
diff --git a/src/uu/seq/src/numberparse.rs b/src/uu/seq/src/numberparse.rs
index 3f4b213955f..a82d1e88776 100644
--- a/src/uu/seq/src/numberparse.rs
+++ b/src/uu/seq/src/numberparse.rs
@@ -16,8 +16,6 @@ use num_traits::Num;
 use num_traits::Zero;
 
 use crate::extendedbigdecimal::ExtendedBigDecimal;
-use crate::extendedbigint::ExtendedBigInt;
-use crate::number::Number;
 use crate::number::PreciseNumber;
 
 /// An error returned when parsing a number fails.
@@ -29,8 +27,8 @@ pub enum ParseNumberError {
 }
 
 /// Decide whether a given string and its parsed `BigInt` is negative zero.
-fn is_minus_zero_int(s: &str, n: &BigInt) -> bool {
-    s.starts_with('-') && n == &BigInt::zero()
+fn is_minus_zero_int(s: &str, n: &BigDecimal) -> bool {
+    s.starts_with('-') && n == &BigDecimal::zero()
 }
 
 /// Decide whether a given string and its parsed `BigDecimal` is negative zero.
@@ -53,19 +51,19 @@ fn is_minus_zero_float(s: &str, x: &BigDecimal) -> bool {
 /// assert_eq!(actual, expected);
 /// ```
 fn parse_no_decimal_no_exponent(s: &str) -> Result<PreciseNumber, ParseNumberError> {
-    match s.parse::<BigInt>() {
+    match s.parse::<BigDecimal>() {
         Ok(n) => {
             // If `s` is '-0', then `parse()` returns `BigInt::zero()`,
             // but we need to return `Number::MinusZeroInt` instead.
             if is_minus_zero_int(s, &n) {
                 Ok(PreciseNumber::new(
-                    Number::Int(ExtendedBigInt::MinusZero),
+                    ExtendedBigDecimal::MinusZero,
                     s.len(),
                     0,
                 ))
             } else {
                 Ok(PreciseNumber::new(
-                    Number::Int(ExtendedBigInt::BigInt(n)),
+                    ExtendedBigDecimal::BigDecimal(n),
                     s.len(),
                     0,
                 ))
@@ -79,7 +77,7 @@ fn parse_no_decimal_no_exponent(s: &str) -> Result<PreciseNumber, ParseNumberErr
                 "nan" | "-nan" => return Err(ParseNumberError::Nan),
                 _ => return Err(ParseNumberError::Float),
             };
-            Ok(PreciseNumber::new(Number::Float(float_val), 0, 0))
+            Ok(PreciseNumber::new(float_val, 0, 0))
         }
     }
 }
@@ -125,13 +123,13 @@ fn parse_exponent_no_decimal(s: &str, j: usize) -> Result<PreciseNumber, ParseNu
     if exponent < 0 {
         if is_minus_zero_float(s, &x) {
             Ok(PreciseNumber::new(
-                Number::Float(ExtendedBigDecimal::MinusZero),
+                ExtendedBigDecimal::MinusZero,
                 num_integral_digits,
                 num_fractional_digits,
             ))
         } else {
             Ok(PreciseNumber::new(
-                Number::Float(ExtendedBigDecimal::BigDecimal(x)),
+                ExtendedBigDecimal::BigDecimal(x),
                 num_integral_digits,
                 num_fractional_digits,
             ))
@@ -169,13 +167,13 @@ fn parse_decimal_no_exponent(s: &str, i: usize) -> Result<PreciseNumber, ParseNu
     let num_fractional_digits = s.len() - (i + 1);
     if is_minus_zero_float(s, &x) {
         Ok(PreciseNumber::new(
-            Number::Float(ExtendedBigDecimal::MinusZero),
+            ExtendedBigDecimal::MinusZero,
             num_integral_digits,
             num_fractional_digits,
         ))
     } else {
         Ok(PreciseNumber::new(
-            Number::Float(ExtendedBigDecimal::BigDecimal(x)),
+            ExtendedBigDecimal::BigDecimal(x),
             num_integral_digits,
             num_fractional_digits,
         ))
@@ -239,7 +237,7 @@ fn parse_decimal_and_exponent(
     if num_digits_between_decimal_point_and_e <= exponent {
         if is_minus_zero_float(s, &val) {
             Ok(PreciseNumber::new(
-                Number::Int(ExtendedBigInt::MinusZero),
+                ExtendedBigDecimal::MinusZero,
                 num_integral_digits,
                 num_fractional_digits,
             ))
@@ -251,23 +249,23 @@ fn parse_decimal_and_exponent(
             );
             let expanded = [&s[0..i], &s[i + 1..j], &zeros].concat();
             let n = expanded
-                .parse::<BigInt>()
+                .parse::<BigDecimal>()
                 .map_err(|_| ParseNumberError::Float)?;
             Ok(PreciseNumber::new(
-                Number::Int(ExtendedBigInt::BigInt(n)),
+                ExtendedBigDecimal::BigDecimal(n),
                 num_integral_digits,
                 num_fractional_digits,
             ))
         }
     } else if is_minus_zero_float(s, &val) {
         Ok(PreciseNumber::new(
-            Number::Float(ExtendedBigDecimal::MinusZero),
+            ExtendedBigDecimal::MinusZero,
             num_integral_digits,
             num_fractional_digits,
         ))
     } else {
         Ok(PreciseNumber::new(
-            Number::Float(ExtendedBigDecimal::BigDecimal(val)),
+            ExtendedBigDecimal::BigDecimal(val),
             num_integral_digits,
             num_fractional_digits,
         ))
@@ -303,20 +301,17 @@ fn parse_hexadecimal(s: &str) -> Result<PreciseNumber, ParseNumberError> {
     }
 
     let num = BigInt::from_str_radix(s, 16).map_err(|_| ParseNumberError::Hex)?;
+    let num = BigDecimal::from(num);
 
-    match (is_neg, num == BigInt::zero()) {
-        (true, true) => Ok(PreciseNumber::new(
-            Number::Int(ExtendedBigInt::MinusZero),
-            2,
-            0,
-        )),
+    match (is_neg, num == BigDecimal::zero()) {
+        (true, true) => Ok(PreciseNumber::new(ExtendedBigDecimal::MinusZero, 2, 0)),
         (true, false) => Ok(PreciseNumber::new(
-            Number::Int(ExtendedBigInt::BigInt(-num)),
+            ExtendedBigDecimal::BigDecimal(-num),
             0,
             0,
         )),
         (false, _) => Ok(PreciseNumber::new(
-            Number::Int(ExtendedBigInt::BigInt(num)),
+            ExtendedBigDecimal::BigDecimal(num),
             0,
             0,
         )),
@@ -364,19 +359,14 @@ impl FromStr for PreciseNumber {
 
 #[cfg(test)]
 mod tests {
-
     use bigdecimal::BigDecimal;
-    use num_bigint::BigInt;
-    use num_traits::Zero;
 
     use crate::extendedbigdecimal::ExtendedBigDecimal;
-    use crate::extendedbigint::ExtendedBigInt;
-    use crate::number::Number;
     use crate::number::PreciseNumber;
     use crate::numberparse::ParseNumberError;
 
     /// Convenience function for parsing a [`Number`] and unwrapping.
-    fn parse(s: &str) -> Number {
+    fn parse(s: &str) -> ExtendedBigDecimal {
         s.parse::<PreciseNumber>().unwrap().number
     }
 
@@ -392,40 +382,37 @@ mod tests {
 
     #[test]
     fn test_parse_minus_zero_int() {
-        assert_eq!(parse("-0e0"), Number::Int(ExtendedBigInt::MinusZero));
-        assert_eq!(parse("-0e-0"), Number::Int(ExtendedBigInt::MinusZero));
-        assert_eq!(parse("-0e1"), Number::Int(ExtendedBigInt::MinusZero));
-        assert_eq!(parse("-0e+1"), Number::Int(ExtendedBigInt::MinusZero));
-        assert_eq!(parse("-0.0e1"), Number::Int(ExtendedBigInt::MinusZero));
-        assert_eq!(parse("-0x0"), Number::Int(ExtendedBigInt::MinusZero));
+        assert_eq!(parse("-0e0"), ExtendedBigDecimal::MinusZero);
+        assert_eq!(parse("-0e-0"), ExtendedBigDecimal::MinusZero);
+        assert_eq!(parse("-0e1"), ExtendedBigDecimal::MinusZero);
+        assert_eq!(parse("-0e+1"), ExtendedBigDecimal::MinusZero);
+        assert_eq!(parse("-0.0e1"), ExtendedBigDecimal::MinusZero);
+        assert_eq!(parse("-0x0"), ExtendedBigDecimal::MinusZero);
     }
 
     #[test]
     fn test_parse_minus_zero_float() {
-        assert_eq!(parse("-0.0"), Number::Float(ExtendedBigDecimal::MinusZero));
-        assert_eq!(parse("-0e-1"), Number::Float(ExtendedBigDecimal::MinusZero));
-        assert_eq!(
-            parse("-0.0e-1"),
-            Number::Float(ExtendedBigDecimal::MinusZero)
-        );
+        assert_eq!(parse("-0.0"), ExtendedBigDecimal::MinusZero);
+        assert_eq!(parse("-0e-1"), ExtendedBigDecimal::MinusZero);
+        assert_eq!(parse("-0.0e-1"), ExtendedBigDecimal::MinusZero);
     }
 
     #[test]
     fn test_parse_big_int() {
-        assert_eq!(parse("0"), Number::Int(ExtendedBigInt::zero()));
-        assert_eq!(parse("0.1e1"), Number::Int(ExtendedBigInt::one()));
+        assert_eq!(parse("0"), ExtendedBigDecimal::zero());
+        assert_eq!(parse("0.1e1"), ExtendedBigDecimal::one());
         assert_eq!(
             parse("1.0e1"),
-            Number::Int(ExtendedBigInt::BigInt("10".parse::<BigInt>().unwrap()))
+            ExtendedBigDecimal::BigDecimal("10".parse::<BigDecimal>().unwrap())
         );
     }
 
     #[test]
     fn test_parse_hexadecimal_big_int() {
-        assert_eq!(parse("0x0"), Number::Int(ExtendedBigInt::zero()));
+        assert_eq!(parse("0x0"), ExtendedBigDecimal::zero());
         assert_eq!(
             parse("0x10"),
-            Number::Int(ExtendedBigInt::BigInt("16".parse::<BigInt>().unwrap()))
+            ExtendedBigDecimal::BigDecimal("16".parse::<BigDecimal>().unwrap())
         );
     }
 
@@ -433,56 +420,34 @@ mod tests {
     fn test_parse_big_decimal() {
         assert_eq!(
             parse("0.0"),
-            Number::Float(ExtendedBigDecimal::BigDecimal(
-                "0.0".parse::<BigDecimal>().unwrap()
-            ))
+            ExtendedBigDecimal::BigDecimal("0.0".parse::<BigDecimal>().unwrap())
         );
         assert_eq!(
             parse(".0"),
-            Number::Float(ExtendedBigDecimal::BigDecimal(
-                "0.0".parse::<BigDecimal>().unwrap()
-            ))
+            ExtendedBigDecimal::BigDecimal("0.0".parse::<BigDecimal>().unwrap())
         );
         assert_eq!(
             parse("1.0"),
-            Number::Float(ExtendedBigDecimal::BigDecimal(
-                "1.0".parse::<BigDecimal>().unwrap()
-            ))
+            ExtendedBigDecimal::BigDecimal("1.0".parse::<BigDecimal>().unwrap())
         );
         assert_eq!(
             parse("10e-1"),
-            Number::Float(ExtendedBigDecimal::BigDecimal(
-                "1.0".parse::<BigDecimal>().unwrap()
-            ))
+            ExtendedBigDecimal::BigDecimal("1.0".parse::<BigDecimal>().unwrap())
         );
         assert_eq!(
             parse("-1e-3"),
-            Number::Float(ExtendedBigDecimal::BigDecimal(
-                "-0.001".parse::<BigDecimal>().unwrap()
-            ))
+            ExtendedBigDecimal::BigDecimal("-0.001".parse::<BigDecimal>().unwrap())
         );
     }
 
     #[test]
     fn test_parse_inf() {
-        assert_eq!(parse("inf"), Number::Float(ExtendedBigDecimal::Infinity));
-        assert_eq!(
-            parse("infinity"),
-            Number::Float(ExtendedBigDecimal::Infinity)
-        );
-        assert_eq!(parse("+inf"), Number::Float(ExtendedBigDecimal::Infinity));
-        assert_eq!(
-            parse("+infinity"),
-            Number::Float(ExtendedBigDecimal::Infinity)
-        );
-        assert_eq!(
-            parse("-inf"),
-            Number::Float(ExtendedBigDecimal::MinusInfinity)
-        );
-        assert_eq!(
-            parse("-infinity"),
-            Number::Float(ExtendedBigDecimal::MinusInfinity)
-        );
+        assert_eq!(parse("inf"), ExtendedBigDecimal::Infinity);
+        assert_eq!(parse("infinity"), ExtendedBigDecimal::Infinity);
+        assert_eq!(parse("+inf"), ExtendedBigDecimal::Infinity);
+        assert_eq!(parse("+infinity"), ExtendedBigDecimal::Infinity);
+        assert_eq!(parse("-inf"), ExtendedBigDecimal::MinusInfinity);
+        assert_eq!(parse("-infinity"), ExtendedBigDecimal::MinusInfinity);
     }
 
     #[test]
diff --git a/src/uu/seq/src/seq.rs b/src/uu/seq/src/seq.rs
index bb4d5414ef8..a987405ce15 100644
--- a/src/uu/seq/src/seq.rs
+++ b/src/uu/seq/src/seq.rs
@@ -3,24 +3,21 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 // spell-checker:ignore (ToDO) istr chiter argptr ilen extendedbigdecimal extendedbigint numberparse
-use std::io::{stdout, Write};
+use std::io::{stdout, ErrorKind, Write};
 
 use clap::{crate_version, Arg, ArgAction, Command};
-use num_traits::{Zero, ToPrimitive};
+use num_traits::{ToPrimitive, Zero};
 
-use uucore::error::UResult;
-use uucore::format::{printf, FormatArgument, Format, num_format};
+use uucore::error::{FromIo, UResult};
+use uucore::format::{num_format, Format};
 use uucore::{format_usage, help_about, help_usage};
 
 mod error;
 mod extendedbigdecimal;
-mod extendedbigint;
 mod number;
 mod numberparse;
 use crate::error::SeqError;
 use crate::extendedbigdecimal::ExtendedBigDecimal;
-use crate::extendedbigint::ExtendedBigInt;
-use crate::number::Number;
 use crate::number::PreciseNumber;
 
 const ABOUT: &str = help_about!("seq.md");
@@ -41,11 +38,6 @@ struct SeqOptions<'a> {
     format: Option<&'a str>,
 }
 
-/// A range of integers.
-///
-/// The elements are (first, increment, last).
-type RangeInt = (ExtendedBigInt, ExtendedBigInt, ExtendedBigInt);
-
 /// A range of floats.
 ///
 /// The elements are (first, increment, last).
@@ -116,53 +108,26 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         .num_fractional_digits
         .max(increment.num_fractional_digits);
 
-    let result = match (first.number, increment.number, last.number) {
-        (Number::Int(first), Number::Int(increment), last) => {
-            let last = last.round_towards(&first);
-            let format = match options.format {
-                Some(f) => {
-                    let f = Format::<num_format::SignedInt>::parse(f)?;
-                    Some(f)
-                }
-                None => None,
-            };
-            print_seq_integers(
-                (first, increment, last),
-                &options.separator,
-                &options.terminator,
-                options.equal_width,
-                padding,
-                format,
-            )
-        }
-        (first, increment, last) => {
-            let format = match options.format {
-                Some(f) => {
-                    let f = Format::<num_format::Float>::parse(f)?;
-                    Some(f)
-                }
-                None => None,
-            };
-            print_seq(
-            (
-                first.into_extended_big_decimal(),
-                increment.into_extended_big_decimal(),
-                last.into_extended_big_decimal(),
-            ),
-            largest_dec,
-            &options.separator,
-            &options.terminator,
-            options.equal_width,
-            padding,
-            format,
-            )
+    let format = match options.format {
+        Some(f) => {
+            let f = Format::<num_format::Float>::parse(f)?;
+            Some(f)
         }
+        None => None,
     };
+    let result = print_seq(
+        (first.number, increment.number, last.number),
+        largest_dec,
+        &options.separator,
+        &options.terminator,
+        options.equal_width,
+        padding,
+        format,
+    );
     match result {
         Ok(_) => Ok(()),
-        _ => todo!(),
-        // Err(err) if err.kind() == ErrorKind::BrokenPipe => Ok(()),
-        // Err(e) => Err(e.map_err_context(|| "write error".into())),
+        Err(err) if err.kind() == ErrorKind::BrokenPipe => Ok(()),
+        Err(e) => Err(e.map_err_context(|| "write error".into())),
     }
 }
 
@@ -230,28 +195,6 @@ fn write_value_float(
     write!(writer, "{value_as_str}")
 }
 
-/// Write a big int formatted according to the given parameters.
-fn write_value_int(
-    writer: &mut impl Write,
-    value: &ExtendedBigInt,
-    width: usize,
-    pad: bool,
-) -> std::io::Result<()> {
-    let value_as_str = if pad {
-        if *value == ExtendedBigInt::MinusZero {
-            format!("{value:0<width$}")
-        } else {
-            format!("{value:>0width$}")
-        }
-    } else {
-        format!("{value}")
-    };
-    write!(writer, "{value_as_str}")
-}
-
-// TODO `print_seq()` and `print_seq_integers()` are nearly identical,
-// they could be refactored into a single more general function.
-
 /// Floating point based code path
 fn print_seq(
     range: RangeFloat,
@@ -261,12 +204,16 @@ fn print_seq(
     pad: bool,
     padding: usize,
     format: Option<Format<num_format::Float>>,
-) -> UResult<()> {
+) -> std::io::Result<()> {
     let stdout = stdout();
     let mut stdout = stdout.lock();
     let (first, increment, last) = range;
     let mut value = first;
-    let padding = if pad { padding + 1 + largest_dec } else { 0 };
+    let padding = if pad {
+        padding + if largest_dec > 0 { largest_dec + 1 } else { 0 }
+    } else {
+        0
+    };
     let mut is_first_iteration = true;
     while !done_printing(&value, &increment, &last) {
         if !is_first_iteration {
@@ -307,65 +254,3 @@ fn print_seq(
     stdout.flush()?;
     Ok(())
 }
-
-/// Print an integer sequence.
-///
-/// This function prints a sequence of integers defined by `range`,
-/// which defines the first integer, last integer, and increment of the
-/// range. The `separator` is inserted between each integer and
-/// `terminator` is inserted at the end.
-///
-/// The `pad` parameter indicates whether to pad numbers to the width
-/// given in `padding`.
-///
-/// If `is_first_minus_zero` is `true`, then the `first` parameter is
-/// printed as if it were negative zero, even though no such number
-/// exists as an integer (negative zero only exists for floating point
-/// numbers). Only set this to `true` if `first` is actually zero.
-fn print_seq_integers(
-    range: RangeInt,
-    separator: &str,
-    terminator: &str,
-    pad: bool,
-    padding: usize,
-    format: Option<Format<num_format::SignedInt>>,
-) -> UResult<()> {
-    let stdout = stdout();
-    let mut stdout = stdout.lock();
-    let (first, increment, last) = range;
-    let mut value = first;
-    let mut is_first_iteration = true;
-    while !done_printing(&value, &increment, &last) {
-        if !is_first_iteration {
-            write!(stdout, "{separator}")?;
-        }
-        // If there was an argument `-f FORMAT`, then use that format
-        // template instead of the default formatting strategy.
-        //
-        // The `printf()` function takes in the template and
-        // the current value and writes the result to `stdout`.
-        //
-        // TODO See similar comment about formatting in `print_seq()`.
-        match &format {
-            Some(f) => {
-                let int = match &value {
-                    ExtendedBigInt::BigInt(bi) => bi.to_i64().unwrap(),
-                    ExtendedBigInt::Infinity => todo!(),
-                    ExtendedBigInt::MinusInfinity => todo!(),
-                    ExtendedBigInt::MinusZero => todo!(),
-                    ExtendedBigInt::Nan => todo!(),
-                };
-                f.fmt(&mut stdout, int)?;
-            }
-            None => write_value_int(&mut stdout, &value, padding, pad)?,
-        }
-        // TODO Implement augmenting addition.
-        value = value + increment.clone();
-        is_first_iteration = false;
-    }
-
-    if !is_first_iteration {
-        write!(stdout, "{terminator}")?;
-    }
-    Ok(())
-}
diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index 48151be9892..d6500b20c5a 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -115,7 +115,7 @@ fn parse_iter(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem, FormatError
                     Some(_) => {
                         let spec = match Spec::parse(&mut rest) {
                             Some(spec) => spec,
-                            None => return Some(Err(FormatError::SpecError)),
+                            None => return Some(Err(dbg!(FormatError::SpecError))),
                         };
                         Some(Ok(FormatItem::Spec(spec)))
                     }
@@ -230,7 +230,7 @@ impl<F: Formatter> Format<F> {
         for item in &mut iter {
             match item? {
                 FormatItem::Spec(_) => {
-                    return Err(FormatError::SpecError);
+                    return Err(dbg!(FormatError::SpecError));
                 }
                 FormatItem::Text(t) => suffix.extend_from_slice(&t),
                 FormatItem::Char(c) => suffix.push(c),
diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index fd010bdc029..046249a13d2 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -13,14 +13,14 @@ pub trait Formatter {
         Self: Sized;
 }
 
-#[derive(Clone, Copy)]
+#[derive(Clone, Copy, Debug)]
 pub enum UnsignedIntVariant {
     Decimal,
     Octal(Prefix),
     Hexadecimal(Case, Prefix),
 }
 
-#[derive(Clone, Copy)]
+#[derive(Clone, Copy, Debug)]
 
 pub enum FloatVariant {
     Decimal,
@@ -29,32 +29,32 @@ pub enum FloatVariant {
     Hexadecimal,
 }
 
-#[derive(Clone, Copy, PartialEq, Eq)]
+#[derive(Clone, Copy, Debug, PartialEq, Eq)]
 pub enum Case {
     Lowercase,
     Uppercase,
 }
 
-#[derive(Clone, Copy, PartialEq, Eq)]
+#[derive(Clone, Copy, Debug, PartialEq, Eq)]
 pub enum Prefix {
     No,
     Yes,
 }
 
-#[derive(Clone, Copy, PartialEq, Eq)]
+#[derive(Clone, Copy, Debug, PartialEq, Eq)]
 pub enum ForceDecimal {
     No,
     Yes,
 }
 
-#[derive(Clone, Copy)]
+#[derive(Clone, Copy, Debug)]
 pub enum PositiveSign {
     None,
     Plus,
     Space,
 }
 
-#[derive(Clone, Copy)]
+#[derive(Clone, Copy, Debug)]
 pub enum NumberAlignment {
     Left,
     RightSpace,
@@ -93,7 +93,7 @@ impl Formatter for SignedInt {
             alignment,
         } = s
         else {
-            return Err(FormatError::SpecError);
+            return Err(dbg!(FormatError::SpecError));
         };
 
         let width = match width {
@@ -152,7 +152,7 @@ impl Formatter for UnsignedInt {
             alignment,
         } = s
         else {
-            return Err(FormatError::SpecError);
+            return Err(dbg!(FormatError::SpecError));
         };
 
         let width = match width {
@@ -241,19 +241,19 @@ impl Formatter for Float {
             precision,
         } = s
         else {
-            return Err(FormatError::SpecError);
+            return Err(dbg!(FormatError::SpecError));
         };
 
         let width = match width {
             Some(CanAsterisk::Fixed(x)) => x,
             None => 0,
-            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+            Some(CanAsterisk::Asterisk) => return Err(dbg!(FormatError::SpecError)),
         };
 
         let precision = match precision {
             Some(CanAsterisk::Fixed(x)) => x,
             None => 0,
-            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+            Some(CanAsterisk::Asterisk) => return Err(dbg!(FormatError::SpecError)),
         };
 
         Ok(Self {
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index 9c53669fa9c..abc9b7a875a 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -9,6 +9,7 @@ use super::{
 };
 use std::{fmt::Display, io::Write};
 
+#[derive(Debug)]
 pub enum Spec {
     Char {
         width: Option<CanAsterisk<usize>>,
@@ -41,7 +42,7 @@ pub enum Spec {
 
 /// Precision and width specified might use an asterisk to indicate that they are
 /// determined by an argument.
-#[derive(Clone, Copy)]
+#[derive(Clone, Copy, Debug)]
 pub enum CanAsterisk<T> {
     Fixed(T),
     Asterisk,
@@ -99,6 +100,7 @@ impl Spec {
         let width = eat_asterisk_or_number(rest);
 
         let precision = if let Some(b'.') = rest.get(0) {
+            *rest = &rest[1..];
             Some(eat_asterisk_or_number(rest).unwrap_or(CanAsterisk::Fixed(0)))
         } else {
             None
@@ -134,7 +136,9 @@ impl Spec {
             *rest = &rest[1..];
         }
 
-        Some(match rest.get(0)? {
+        let type_spec = rest.get(0)?;
+        *rest = &rest[1..];
+        Some(match type_spec {
             b'c' => Spec::Char {
                 width,
                 align_left: minus,
@@ -208,7 +212,10 @@ impl Spec {
                     (false, false) => PositiveSign::None,
                 },
             },
-            _ => return None,
+            x => {
+                dbg!("{:b}", x);
+                return dbg!(None)
+            },
         })
     }
 

From 2f9fcf73faad9d60db6f08c2e9ecd57fa845b0bd Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Thu, 16 Nov 2023 16:02:38 +0100
Subject: [PATCH 028/429] clippy: fix warnings introduced by Rust 1.74

---
 src/uu/more/src/more.rs     | 2 +-
 tests/by-util/test_dd.rs    | 4 ++--
 tests/by-util/test_ls.rs    | 6 +++---
 tests/by-util/test_users.rs | 6 ++----
 4 files changed, 8 insertions(+), 10 deletions(-)

diff --git a/src/uu/more/src/more.rs b/src/uu/more/src/more.rs
index 02ed0feea20..b21b2ab1f35 100644
--- a/src/uu/more/src/more.rs
+++ b/src/uu/more/src/more.rs
@@ -88,7 +88,7 @@ impl Options {
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let args = args.collect_lossy();
-    let matches = match uu_app().try_get_matches_from(&args) {
+    let matches = match uu_app().try_get_matches_from(args) {
         Ok(m) => m,
         Err(e) => return Err(e.into()),
     };
diff --git a/tests/by-util/test_dd.rs b/tests/by-util/test_dd.rs
index f560e35261b..d5ac8dc801c 100644
--- a/tests/by-util/test_dd.rs
+++ b/tests/by-util/test_dd.rs
@@ -1470,7 +1470,7 @@ fn test_seek_output_fifo() {
         .args(&["count=0", "seek=1", "of=fifo", "status=noxfer"])
         .run_no_wait();
 
-    std::fs::write(at.plus("fifo"), &vec![0; 512]).unwrap();
+    std::fs::write(at.plus("fifo"), vec![0; 512]).unwrap();
 
     child
         .wait()
@@ -1492,7 +1492,7 @@ fn test_skip_input_fifo() {
         .args(&["count=0", "skip=1", "if=fifo", "status=noxfer"])
         .run_no_wait();
 
-    std::fs::write(at.plus("fifo"), &vec![0; 512]).unwrap();
+    std::fs::write(at.plus("fifo"), vec![0; 512]).unwrap();
 
     child
         .wait()
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index cdd0292e1f2..07ea8c9cd63 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -994,9 +994,9 @@ fn test_ls_long() {
 fn test_ls_long_format() {
     let scene = TestScenario::new(util_name!());
     let at = &scene.fixtures;
-    at.mkdir(&at.plus_as_string("test-long-dir"));
+    at.mkdir(at.plus_as_string("test-long-dir"));
     at.touch(at.plus_as_string("test-long-dir/test-long-file"));
-    at.mkdir(&at.plus_as_string("test-long-dir/test-long-dir"));
+    at.mkdir(at.plus_as_string("test-long-dir/test-long-dir"));
 
     for arg in LONG_ARGS {
         // Assuming sane username do not have spaces within them.
@@ -1971,7 +1971,7 @@ fn test_ls_color() {
         .join("nested_dir")
         .to_string_lossy()
         .to_string();
-    at.mkdir(&nested_dir);
+    at.mkdir(nested_dir);
     at.mkdir("z");
     let nested_file = Path::new("a")
         .join("nested_file")
diff --git a/tests/by-util/test_users.rs b/tests/by-util/test_users.rs
index 766378a9dca..3d87aa9d068 100644
--- a/tests/by-util/test_users.rs
+++ b/tests/by-util/test_users.rs
@@ -21,11 +21,9 @@ fn test_users_check_name() {
     #[cfg(target_os = "linux")]
     let util_name = util_name!();
     #[cfg(target_vendor = "apple")]
-    let util_name = format!("g{}", util_name!());
+    let util_name = &format!("g{}", util_name!());
 
-    // note: clippy::needless_borrow *false positive*
-    #[allow(clippy::needless_borrow)]
-    let expected = TestScenario::new(&util_name)
+    let expected = TestScenario::new(util_name)
         .cmd(util_name)
         .env("LC_ALL", "C")
         .succeeds()

From eaf500637900a47c4e00497aaccccf3d6d7dd5c8 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Thu, 16 Nov 2023 17:00:41 +0100
Subject: [PATCH 029/429] printf: parse arguments and handle escape codes

---
 src/uu/printf/src/printf.rs                   |  23 ++-
 .../src/lib/features/format/argument.rs       |  60 ++++++
 src/uucore/src/lib/features/format/escape.rs  | 100 ++++++++++
 src/uucore/src/lib/features/format/mod.rs     | 186 +++++++++++-------
 .../src/lib/features/format/num_format.rs     |  10 +-
 src/uucore/src/lib/features/format/spec.rs    |  29 ++-
 6 files changed, 317 insertions(+), 91 deletions(-)
 create mode 100644 src/uucore/src/lib/features/format/argument.rs
 create mode 100644 src/uucore/src/lib/features/format/escape.rs

diff --git a/src/uu/printf/src/printf.rs b/src/uu/printf/src/printf.rs
index 6e270ec2645..00d03816e4c 100644
--- a/src/uu/printf/src/printf.rs
+++ b/src/uu/printf/src/printf.rs
@@ -6,9 +6,12 @@
 // spell-checker:ignore (change!) each's
 // spell-checker:ignore (ToDO) LONGHELP FORMATSTRING templating parameterizing formatstr
 
+use std::io::stdout;
+use std::ops::ControlFlow;
+
 use clap::{crate_version, Arg, ArgAction, Command};
 use uucore::error::{UResult, UUsageError};
-use uucore::format::{printf, FormatArgument};
+use uucore::format::{parse_spec_and_escape, FormatArgument};
 use uucore::{format_usage, help_about, help_section, help_usage};
 
 const VERSION: &str = "version";
@@ -30,12 +33,28 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let format_string = matches
         .get_one::<String>(options::FORMATSTRING)
         .ok_or_else(|| UUsageError::new(1, "missing operand"))?;
+
     let values: Vec<_> = match matches.get_many::<String>(options::ARGUMENT) {
         Some(s) => s.map(|s| FormatArgument::Unparsed(s.to_string())).collect(),
         None => vec![],
     };
 
-    printf(format_string, &values)?;
+    let mut args = values.iter().peekable();
+    for item in parse_spec_and_escape(format_string.as_ref()) {
+        match item?.write(stdout(), &mut args)? {
+            ControlFlow::Continue(()) => {}
+            ControlFlow::Break(()) => break,
+        };
+    }
+
+    while args.peek().is_some() {
+        for item in parse_spec_and_escape(format_string.as_ref()) {
+            match item?.write(stdout(), &mut args)? {
+                ControlFlow::Continue(()) => {}
+                ControlFlow::Break(()) => break,
+            };
+        }
+    }
     Ok(())
 }
 
diff --git a/src/uucore/src/lib/features/format/argument.rs b/src/uucore/src/lib/features/format/argument.rs
new file mode 100644
index 00000000000..007f519c2a4
--- /dev/null
+++ b/src/uucore/src/lib/features/format/argument.rs
@@ -0,0 +1,60 @@
+#[derive(Clone, Debug)]
+pub enum FormatArgument {
+    Char(char),
+    String(String),
+    UnsignedInt(u64),
+    SignedInt(i64),
+    Float(f64),
+    /// Special argument that gets coerced into the other variants
+    Unparsed(String),
+}
+
+impl FormatArgument {
+    pub fn get_char(&self) -> Option<char> {
+        match self {
+            Self::Char(c) => Some(*c),
+            Self::Unparsed(s) => {
+                let mut chars = s.chars();
+                let Some(c) = chars.next() else {
+                    return None;
+                };
+                let None = chars.next() else {
+                    return None;
+                };
+                Some(c)
+            }
+            _ => None,
+        }
+    }
+
+    pub fn get_u64(&self) -> Option<u64> {
+        match self {
+            Self::UnsignedInt(n) => Some(*n),
+            Self::Unparsed(s) => s.parse().ok(),
+            _ => None,
+        }
+    }
+    
+    pub fn get_i64(&self) -> Option<i64> {
+        match self {
+            Self::SignedInt(n) => Some(*n),
+            Self::Unparsed(s) => s.parse().ok(),
+            _ => None,
+        }
+    }
+    
+    pub fn get_f64(&self) -> Option<f64> {
+        match self {
+            Self::Float(n) => Some(*n),
+            Self::Unparsed(s) => s.parse().ok(),
+            _ => None,
+        }
+    }
+
+    pub fn get_str(&self) -> Option<&str> {
+        match self {
+            Self::Unparsed(s) | Self::String(s) => Some(s),
+            _ => None,
+        }
+    }
+}
\ No newline at end of file
diff --git a/src/uucore/src/lib/features/format/escape.rs b/src/uucore/src/lib/features/format/escape.rs
new file mode 100644
index 00000000000..b8c21741caf
--- /dev/null
+++ b/src/uucore/src/lib/features/format/escape.rs
@@ -0,0 +1,100 @@
+#[derive(Debug)]
+pub enum EscapedChar {
+    Char(u8),
+    Backslash(u8),
+    End,
+}
+
+#[repr(u8)]
+#[derive(Clone, Copy)]
+enum Base {
+    Oct = 8,
+    Hex = 16,
+}
+
+impl Base {
+    fn max_digits(&self) -> u8 {
+        match self {
+            Self::Oct => 3,
+            Self::Hex => 2,
+        }
+    }
+
+    fn to_digit(&self, c: u8) -> Option<u8> {
+        match self {
+            Base::Oct => {
+                if matches!(c, b'0'..=b'7') {
+                    Some(c - b'0')
+                } else {
+                    None
+                }
+            }
+            Base::Hex => match c {
+                b'0'..=b'9' => Some(c - b'0'),
+                b'A'..=b'F' => Some(c - b'A' + 10),
+                b'a'..=b'f' => Some(c - b'a' + 10),
+                _ => None,
+            },
+        }
+    }
+}
+
+/// Parse the numeric part of the `\xHHH` and `\0NNN` escape sequences
+fn parse_code(input: &mut &[u8], base: Base) -> Option<u8> {
+    // All arithmetic on `ret` needs to be wrapping, because octal input can
+    // take 3 digits, which is 9 bits, and therefore more than what fits in a
+    // `u8`. GNU just seems to wrap these values.
+    // Note that if we instead make `ret` a `u32` and use `char::from_u32` will
+    // yield incorrect results because it will interpret values larger than
+    // `u8::MAX` as unicode.
+    let [c, rest @ ..] = input else { return None };
+    let mut ret = base.to_digit(*c)?;
+    *input = &rest[..];
+
+    for _ in 1..base.max_digits() {
+        let [c, rest @ ..] = input else { break };
+        let Some(n) = base.to_digit(*c) else { break };
+        ret = ret.wrapping_mul(base as u8).wrapping_add(n);
+        *input = &rest[..];
+    }
+
+    Some(ret)
+}
+
+pub fn parse_escape_code(rest: &mut &[u8]) -> EscapedChar {
+    if let [c, new_rest @ ..] = rest {
+        // This is for the \NNN syntax for octal sequences.
+        // Note that '0' is intentionally omitted because that
+        // would be the \0NNN syntax.
+        if let b'1'..=b'7' = c {
+            if let Some(parsed) = parse_code(rest, Base::Oct) {
+                return EscapedChar::Char(parsed);
+            }
+        }
+
+        *rest = &new_rest[..];
+        match c {
+            b'\\' => EscapedChar::Char(b'\\'),
+            b'a' => EscapedChar::Char(b'\x07'),
+            b'b' => EscapedChar::Char(b'\x08'),
+            b'c' => return EscapedChar::End,
+            b'e' => EscapedChar::Char(b'\x1b'),
+            b'f' => EscapedChar::Char(b'\x0c'),
+            b'n' => EscapedChar::Char(b'\n'),
+            b'r' => EscapedChar::Char(b'\r'),
+            b't' => EscapedChar::Char(b'\t'),
+            b'v' => EscapedChar::Char(b'\x0b'),
+            b'x' => {
+                if let Some(c) = parse_code(rest, Base::Hex) {
+                    EscapedChar::Char(c)
+                } else {
+                    EscapedChar::Backslash(b'x')
+                }
+            }
+            b'0' => EscapedChar::Char(parse_code(rest, Base::Oct).unwrap_or(b'\0')),
+            c => EscapedChar::Backslash(*c),
+        }
+    } else {
+        EscapedChar::Char(b'\\')
+    }
+}
diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index d6500b20c5a..8fa8d0717e1 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -8,8 +8,19 @@
 //! [`Format`] struct, which represents a parsed format string. This reduces
 //! the need for parsing a format string multiple times and assures that no
 //! parsing errors occur during writing.
+//!
+//! There are three kinds of parsing that we might want to do:
+//!
+//!  1. Only `printf` specifiers (for e.g. `seq`, `dd`)
+//!  2. Only escape sequences (for e.g. `echo`)
+//!  3. Both `printf` specifiers and escape sequences (for e.g. `printf`)
+//!
+//! This module aims to combine all three use cases.
+
 // spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
 
+mod escape;
+mod argument;
 pub mod num_format;
 mod spec;
 
@@ -18,11 +29,16 @@ use std::{
     error::Error,
     fmt::Display,
     io::{stdout, Write},
+    ops::ControlFlow,
 };
+pub use argument::*;
 
 use crate::error::UError;
 
-use self::num_format::Formatter;
+use self::{
+    escape::{parse_escape_code, EscapedChar},
+    num_format::Formatter,
+};
 
 #[derive(Debug)]
 pub enum FormatError {
@@ -54,80 +70,116 @@ impl Display for FormatError {
 }
 
 /// A single item to format
-enum FormatItem {
+pub enum FormatItem<C: FormatChar> {
     /// A format specifier
     Spec(Spec),
-    /// Some plain text
-    Text(Vec<u8>),
     /// A single character
-    ///
-    /// Added in addition to `Text` as an optimization.
-    Char(u8),
+    Char(C),
+}
+
+pub trait FormatChar {
+    fn write(&self, writer: impl Write) -> std::io::Result<ControlFlow<()>>;
+}
+
+impl FormatChar for u8 {
+    fn write(&self, mut writer: impl Write) -> std::io::Result<ControlFlow<()>> {
+        writer.write(&[*self])?;
+        Ok(ControlFlow::Continue(()))
+    }
 }
 
-#[derive(Clone, Debug)]
-pub enum FormatArgument {
-    Char(char),
-    String(String),
-    UnsignedInt(u64),
-    SignedInt(i64),
-    Float(f64),
-    // Special argument that gets coerced into the other variants
-    Unparsed(String),
+impl FormatChar for EscapedChar {
+    fn write(&self, mut writer: impl Write) -> std::io::Result<ControlFlow<()>> {
+        match self {
+            EscapedChar::Char(c) => {
+                writer.write(&[*c])?;
+            }
+            EscapedChar::Backslash(c) => {
+                writer.write(&[b'\\', *c])?;
+            }
+            EscapedChar::End => return Ok(ControlFlow::Break(())),
+        }
+        Ok(ControlFlow::Continue(()))
+    }
 }
 
-impl FormatItem {
-    fn write<'a>(
+impl<C: FormatChar> FormatItem<C> {
+    pub fn write<'a>(
         &self,
-        mut writer: impl Write,
+        writer: impl Write,
         args: &mut impl Iterator<Item = &'a FormatArgument>,
-    ) -> Result<(), FormatError> {
+    ) -> Result<ControlFlow<()>, FormatError> {
         match self {
-            FormatItem::Spec(spec) => spec.write(writer, args),
-            FormatItem::Text(bytes) => writer.write_all(bytes).map_err(FormatError::IoError),
-            FormatItem::Char(char) => writer.write_all(&[*char]).map_err(FormatError::IoError),
-        }
+            FormatItem::Spec(spec) => spec.write(writer, args)?,
+            FormatItem::Char(c) => return c.write(writer).map_err(FormatError::IoError),
+        };
+        Ok(ControlFlow::Continue(()))
     }
 }
 
-fn parse_iter(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem, FormatError>> + '_ {
-    let mut rest = fmt;
-    std::iter::from_fn(move || {
-        if rest.is_empty() {
-            return None;
+pub fn parse_spec_and_escape(
+    fmt: &[u8],
+) -> impl Iterator<Item = Result<FormatItem<EscapedChar>, FormatError>> + '_ {
+    let mut current = fmt;
+    std::iter::from_fn(move || match current {
+        [] => return None,
+        [b'%', b'%', rest @ ..] => {
+            current = rest;
+            Some(Ok(FormatItem::Char(EscapedChar::Char(b'%'))))
+        }
+        [b'%', rest @ ..] => {
+            current = rest;
+            let spec = match Spec::parse(&mut current) {
+                Some(spec) => spec,
+                None => return Some(Err(FormatError::SpecError)),
+            };
+            Some(Ok(FormatItem::Spec(spec)))
         }
+        [b'\\', rest @ ..] => {
+            current = rest;
+            Some(Ok(FormatItem::Char(parse_escape_code(&mut current))))
+        }
+        [c, rest @ ..] => {
+            current = rest;
+            Some(Ok(FormatItem::Char(EscapedChar::Char(*c))))
+        }
+    })
+}
 
-        match rest.iter().position(|c| *c == b'%') {
-            None => {
-                let final_text = rest;
-                rest = &[];
-                Some(Ok(FormatItem::Text(final_text.into())))
-            }
-            Some(0) => {
-                // Handle the spec
-                rest = &rest[1..];
-                match rest.get(0) {
-                    None => Some(Ok(FormatItem::Char(b'%'))),
-                    Some(b'%') => {
-                        rest = &rest[1..];
-                        Some(Ok(FormatItem::Char(b'%')))
-                    }
-                    Some(_) => {
-                        let spec = match Spec::parse(&mut rest) {
-                            Some(spec) => spec,
-                            None => return Some(Err(dbg!(FormatError::SpecError))),
-                        };
-                        Some(Ok(FormatItem::Spec(spec)))
-                    }
-                }
-            }
-            Some(i) => {
-                // The `after` slice includes the % so it will be handled correctly
-                // in the next iteration.
-                let (before, after) = rest.split_at(i);
-                rest = after;
-                return Some(Ok(FormatItem::Text(before.into())));
-            }
+fn parse_spec_only(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem<u8>, FormatError>> + '_ {
+    let mut current = fmt;
+    std::iter::from_fn(move || match current {
+        [] => return None,
+        [b'%', b'%', rest @ ..] => {
+            current = rest;
+            Some(Ok(FormatItem::Char(b'%')))
+        }
+        [b'%', rest @ ..] => {
+            current = rest;
+            let spec = match Spec::parse(&mut current) {
+                Some(spec) => spec,
+                None => return Some(Err(FormatError::SpecError)),
+            };
+            Some(Ok(FormatItem::Spec(spec)))
+        }
+        [c, rest @ ..] => {
+            current = rest;
+            Some(Ok(FormatItem::Char(*c)))
+        }
+    })
+}
+
+fn parse_escape_only(fmt: &[u8]) -> impl Iterator<Item = Result<EscapedChar, FormatError>> + '_ {
+    let mut current = fmt;
+    std::iter::from_fn(move || match current {
+        [] => return None,
+        [b'\\', rest @ ..] => {
+            current = rest;
+            Some(Ok(parse_escape_code(&mut current)))
+        }
+        [c, rest @ ..] => {
+            current = rest;
+            Some(Ok(EscapedChar::Char(*c)))
         }
     })
 }
@@ -144,7 +196,7 @@ fn parse_iter(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem, FormatError
 /// ```rust
 /// use uucore::format::printf;
 ///
-/// printf("hello %s", &["world".to_string()]).unwrap();
+/// printf("hello %s", &[FormatArgument::String("world")]).unwrap();
 /// // prints "hello world"
 /// ```
 pub fn printf<'a>(
@@ -160,7 +212,7 @@ fn printf_writer<'a>(
     args: impl IntoIterator<Item = &'a FormatArgument>,
 ) -> Result<(), FormatError> {
     let mut args = args.into_iter();
-    for item in parse_iter(format_string.as_ref()) {
+    for item in parse_spec_only(format_string.as_ref()) {
         item?.write(&mut writer, &mut args)?;
     }
     Ok(())
@@ -191,10 +243,10 @@ pub fn sprintf<'a>(
 }
 
 /// A parsed format for a single float value
-/// 
+///
 /// This is used by `seq`. It can be constructed with [`FloatFormat::parse`]
 /// and can write a value with [`FloatFormat::fmt`].
-/// 
+///
 /// It can only accept a single specification without any asterisk parameters.
 /// If it does get more specifications, it will return an error.
 pub struct Format<F: Formatter> {
@@ -205,7 +257,7 @@ pub struct Format<F: Formatter> {
 
 impl<F: Formatter> Format<F> {
     pub fn parse(format_string: impl AsRef<[u8]>) -> Result<Self, FormatError> {
-        let mut iter = parse_iter(format_string.as_ref());
+        let mut iter = parse_spec_only(format_string.as_ref());
 
         let mut prefix = Vec::new();
         let mut spec = None;
@@ -215,7 +267,6 @@ impl<F: Formatter> Format<F> {
                     spec = Some(s);
                     break;
                 }
-                FormatItem::Text(t) => prefix.extend_from_slice(&t),
                 FormatItem::Char(c) => prefix.push(c),
             }
         }
@@ -230,9 +281,8 @@ impl<F: Formatter> Format<F> {
         for item in &mut iter {
             match item? {
                 FormatItem::Spec(_) => {
-                    return Err(dbg!(FormatError::SpecError));
+                    return Err(FormatError::SpecError);
                 }
-                FormatItem::Text(t) => suffix.extend_from_slice(&t),
                 FormatItem::Char(c) => suffix.push(c),
             }
         }
diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index 046249a13d2..339b522091d 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -93,7 +93,7 @@ impl Formatter for SignedInt {
             alignment,
         } = s
         else {
-            return Err(dbg!(FormatError::SpecError));
+            return Err(FormatError::SpecError);
         };
 
         let width = match width {
@@ -152,7 +152,7 @@ impl Formatter for UnsignedInt {
             alignment,
         } = s
         else {
-            return Err(dbg!(FormatError::SpecError));
+            return Err(FormatError::SpecError);
         };
 
         let width = match width {
@@ -241,19 +241,19 @@ impl Formatter for Float {
             precision,
         } = s
         else {
-            return Err(dbg!(FormatError::SpecError));
+            return Err(FormatError::SpecError);
         };
 
         let width = match width {
             Some(CanAsterisk::Fixed(x)) => x,
             None => 0,
-            Some(CanAsterisk::Asterisk) => return Err(dbg!(FormatError::SpecError)),
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
         };
 
         let precision = match precision {
             Some(CanAsterisk::Fixed(x)) => x,
             None => 0,
-            Some(CanAsterisk::Asterisk) => return Err(dbg!(FormatError::SpecError)),
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
         };
 
         Ok(Self {
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index abc9b7a875a..258005bb5e6 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -212,10 +212,7 @@ impl Spec {
                     (false, false) => PositiveSign::None,
                 },
             },
-            x => {
-                dbg!("{:b}", x);
-                return dbg!(None)
-            },
+            _ => return None,
         })
     }
 
@@ -228,16 +225,16 @@ impl Spec {
             &Spec::Char { width, align_left } => {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
                 let arg = next_arg(&mut args)?;
-                match arg {
-                    FormatArgument::Char(c) => write_padded(writer, c, width, false, align_left),
+                match arg.get_char() {
+                    Some(c) => write_padded(writer, c, width, false, align_left),
                     _ => Err(FormatError::InvalidArgument(arg.clone())),
                 }
             }
             &Spec::String { width, align_left } => {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
                 let arg = next_arg(&mut args)?;
-                match arg {
-                    FormatArgument::String(s) => write_padded(writer, s, width, false, align_left),
+                match arg.get_str() {
+                    Some(s) => write_padded(writer, s, width, false, align_left),
                     _ => Err(FormatError::InvalidArgument(arg.clone())),
                 }
             }
@@ -249,7 +246,7 @@ impl Spec {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
 
                 let arg = next_arg(&mut args)?;
-                let FormatArgument::SignedInt(i) = arg else {
+                let Some(i) = arg.get_i64() else {
                     return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
@@ -258,7 +255,7 @@ impl Spec {
                     positive_sign,
                     alignment,
                 }
-                .fmt(writer, *i)
+                .fmt(writer, i)
                 .map_err(FormatError::IoError)
             }
             &Spec::UnsignedInt {
@@ -269,7 +266,7 @@ impl Spec {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
 
                 let arg = next_arg(args)?;
-                let FormatArgument::UnsignedInt(i) = arg else {
+                let Some(i) = arg.get_u64() else {
                     return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
@@ -278,7 +275,7 @@ impl Spec {
                     width,
                     alignment,
                 }
-                .fmt(writer, *i)
+                .fmt(writer, i)
                 .map_err(FormatError::IoError)
             }
             &Spec::Float {
@@ -294,7 +291,7 @@ impl Spec {
                 let precision = resolve_asterisk(precision, &mut args)?.unwrap_or(6);
 
                 let arg = next_arg(args)?;
-                let FormatArgument::Float(f) = arg else {
+                let Some(f) = arg.get_f64() else {
                     return Err(FormatError::InvalidArgument(arg.clone()));
                 };
 
@@ -307,7 +304,7 @@ impl Spec {
                     alignment,
                     precision,
                 }
-                .fmt(writer, *f)
+                .fmt(writer, f)
                 .map_err(FormatError::IoError)
             }
         }
@@ -322,8 +319,8 @@ fn resolve_asterisk<'a>(
         None => None,
         Some(CanAsterisk::Asterisk) => {
             let arg = next_arg(args)?;
-            match arg {
-                FormatArgument::UnsignedInt(u) => match usize::try_from(*u) {
+            match arg.get_u64() {
+                Some(u) => match usize::try_from(u) {
                     Ok(u) => Some(u),
                     Err(_) => return Err(FormatError::InvalidArgument(arg.clone())),
                 },

From a45ff8ca73060939983379f5d973ac3da4c75330 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 17 Nov 2023 14:39:39 +0100
Subject: [PATCH 030/429] printf: more flexible parsing of unparsed arguments

---
 .../src/lib/features/format/argument.rs       | 40 ++++++++++++++++---
 1 file changed, 34 insertions(+), 6 deletions(-)

diff --git a/src/uucore/src/lib/features/format/argument.rs b/src/uucore/src/lib/features/format/argument.rs
index 007f519c2a4..644546c38b7 100644
--- a/src/uucore/src/lib/features/format/argument.rs
+++ b/src/uucore/src/lib/features/format/argument.rs
@@ -30,23 +30,51 @@ impl FormatArgument {
     pub fn get_u64(&self) -> Option<u64> {
         match self {
             Self::UnsignedInt(n) => Some(*n),
-            Self::Unparsed(s) => s.parse().ok(),
+            Self::Unparsed(s) => {
+                if let Some(s) = s.strip_prefix("0x") {
+                    u64::from_str_radix(s, 16).ok()
+                } else if let Some(s) = s.strip_prefix("0") {
+                    u64::from_str_radix(s, 8).ok()
+                } else if let Some(s) = s.strip_prefix('\'') {
+                    Some(s.chars().next()? as u64)
+                } else {
+                    s.parse().ok()
+                }
+            }
             _ => None,
         }
     }
-    
+
     pub fn get_i64(&self) -> Option<i64> {
         match self {
             Self::SignedInt(n) => Some(*n),
-            Self::Unparsed(s) => s.parse().ok(),
+            Self::Unparsed(s) => {
+                if let Some(s) = s.strip_prefix("0x") {
+                    i64::from_str_radix(s, 16).ok()
+                } else if let Some(s) = s.strip_prefix("0") {
+                    i64::from_str_radix(s, 8).ok()
+                } else if let Some(s) = s.strip_prefix('\'') {
+                    Some(s.chars().next()? as i64)
+                } else {
+                    s.parse().ok()
+                }
+            }
             _ => None,
         }
     }
-    
+
     pub fn get_f64(&self) -> Option<f64> {
         match self {
             Self::Float(n) => Some(*n),
-            Self::Unparsed(s) => s.parse().ok(),
+            Self::Unparsed(s) => {
+                if s.starts_with("0x") || s.starts_with("-0x") {
+                    unimplemented!("Hexadecimal floats are unimplemented!")
+                } else if let Some(s) = s.strip_prefix('\'') {
+                    Some(s.chars().next()? as u64 as f64)
+                } else {
+                    s.parse().ok()
+                }
+            }
             _ => None,
         }
     }
@@ -57,4 +85,4 @@ impl FormatArgument {
             _ => None,
         }
     }
-}
\ No newline at end of file
+}

From cd0c24af07d1412a746c5dbfe8a3df0a8cb56191 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 17 Nov 2023 14:41:14 +0100
Subject: [PATCH 031/429] printf: implement %b

---
 src/uucore/src/lib/features/format/mod.rs  |  6 +--
 src/uucore/src/lib/features/format/spec.rs | 43 +++++++++++++++++++---
 2 files changed, 40 insertions(+), 9 deletions(-)

diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index 8fa8d0717e1..7417d48fad5 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -169,17 +169,17 @@ fn parse_spec_only(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem<u8>, Fo
     })
 }
 
-fn parse_escape_only(fmt: &[u8]) -> impl Iterator<Item = Result<EscapedChar, FormatError>> + '_ {
+fn parse_escape_only(fmt: &[u8]) -> impl Iterator<Item = EscapedChar> + '_ {
     let mut current = fmt;
     std::iter::from_fn(move || match current {
         [] => return None,
         [b'\\', rest @ ..] => {
             current = rest;
-            Some(Ok(parse_escape_code(&mut current)))
+            Some(parse_escape_code(&mut current))
         }
         [c, rest @ ..] => {
             current = rest;
-            Some(Ok(EscapedChar::Char(*c)))
+            Some(EscapedChar::Char(*c))
         }
     })
 }
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index 258005bb5e6..dc55bc653e6 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -5,9 +5,9 @@ use super::{
         self, Case, FloatVariant, ForceDecimal, Formatter, NumberAlignment, PositiveSign, Prefix,
         UnsignedIntVariant,
     },
-    FormatArgument, FormatError,
+    parse_escape_only, FormatArgument, FormatChar, FormatError,
 };
-use std::{fmt::Display, io::Write};
+use std::{fmt::Display, io::Write, ops::ControlFlow};
 
 #[derive(Debug)]
 pub enum Spec {
@@ -17,6 +17,7 @@ pub enum Spec {
     },
     String {
         width: Option<CanAsterisk<usize>>,
+        parse_escape: bool,
         align_left: bool,
     },
     SignedInt {
@@ -145,6 +146,12 @@ impl Spec {
             },
             b's' => Spec::String {
                 width,
+                parse_escape: false,
+                align_left: minus,
+            },
+            b'b' => Spec::String {
+                width,
+                parse_escape: true,
                 align_left: minus,
             },
             b'd' | b'i' => Spec::SignedInt {
@@ -230,12 +237,36 @@ impl Spec {
                     _ => Err(FormatError::InvalidArgument(arg.clone())),
                 }
             }
-            &Spec::String { width, align_left } => {
+            &Spec::String {
+                width,
+                parse_escape,
+                align_left,
+            } => {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
                 let arg = next_arg(&mut args)?;
-                match arg.get_str() {
-                    Some(s) => write_padded(writer, s, width, false, align_left),
-                    _ => Err(FormatError::InvalidArgument(arg.clone())),
+                let Some(s) = arg.get_str() else {
+                    return Err(FormatError::InvalidArgument(arg.clone()));
+                };
+                if parse_escape {
+                    let mut parsed = Vec::new();
+                    for c in parse_escape_only(s.as_bytes()) {
+                        match c.write(&mut parsed)? {
+                            ControlFlow::Continue(()) => {}
+                            ControlFlow::Break(()) => {
+                                // TODO: This should break the _entire execution_ of printf
+                                break;
+                            }
+                        };
+                    }
+                    write_padded(
+                        writer,
+                        std::str::from_utf8(&parsed).expect("TODO: Accept invalid utf8"),
+                        width,
+                        false,
+                        align_left,
+                    )
+                } else {
+                    write_padded(writer, s, width, false, align_left)
                 }
             }
             &Spec::SignedInt {

From f83e0d1b04a55feaf7a4dbb810c9dda7a007dc40 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 17 Nov 2023 14:41:42 +0100
Subject: [PATCH 032/429] printf: accept multiple length parameters

---
 src/uucore/src/lib/features/format/spec.rs | 63 +++++++++++++---------
 1 file changed, 37 insertions(+), 26 deletions(-)

diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index dc55bc653e6..0f48cdafe9f 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -107,34 +107,45 @@ impl Spec {
             None
         };
 
-        let length = rest.get(0).and_then(|c| {
-            Some(match c {
-                b'h' => {
-                    if let Some(b'h') = rest.get(1) {
-                        *rest = &rest[1..];
-                        Length::Char
-                    } else {
-                        Length::Short
+        // Parse 0..N length options, keep the last one
+        // Even though it is just ignored. We might want to use it later and we
+        // should parse those characters.
+        //
+        // TODO: This needs to be configurable: `seq` accepts only one length
+        //       param
+        let mut _length = None;
+        loop {
+            let new_length = rest.get(0).and_then(|c| {
+                Some(match c {
+                    b'h' => {
+                        if let Some(b'h') = rest.get(1) {
+                            *rest = &rest[1..];
+                            Length::Char
+                        } else {
+                            Length::Short
+                        }
                     }
-                }
-                b'l' => {
-                    if let Some(b'l') = rest.get(1) {
-                        *rest = &rest[1..];
-                        Length::Long
-                    } else {
-                        Length::LongLong
+                    b'l' => {
+                        if let Some(b'l') = rest.get(1) {
+                            *rest = &rest[1..];
+                            Length::Long
+                        } else {
+                            Length::LongLong
+                        }
                     }
-                }
-                b'j' => Length::IntMaxT,
-                b'z' => Length::SizeT,
-                b't' => Length::PtfDiffT,
-                b'L' => Length::LongDouble,
-                _ => return None,
-            })
-        });
-
-        if length.is_some() {
-            *rest = &rest[1..];
+                    b'j' => Length::IntMaxT,
+                    b'z' => Length::SizeT,
+                    b't' => Length::PtfDiffT,
+                    b'L' => Length::LongDouble,
+                    _ => return None,
+                })
+            });
+            if new_length.is_some() {
+                *rest = &rest[1..];
+                _length = new_length;
+            } else {
+                break;
+            }
         }
 
         let type_spec = rest.get(0)?;

From f3da0817a57d740a527d07b5a74368ed41fd3d08 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 17 Nov 2023 14:42:52 +0100
Subject: [PATCH 033/429] printf: support precision for integers

---
 .../src/lib/features/format/num_format.rs     | 32 ++++++++++++++++---
 src/uucore/src/lib/features/format/spec.rs    | 10 ++++++
 2 files changed, 38 insertions(+), 4 deletions(-)

diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index 339b522091d..fab81c456fc 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -63,6 +63,7 @@ pub enum NumberAlignment {
 
 pub struct SignedInt {
     pub width: usize,
+    pub precision: usize,
     pub positive_sign: PositiveSign,
     pub alignment: NumberAlignment,
 }
@@ -79,16 +80,19 @@ impl Formatter for SignedInt {
             }?;
         }
 
+        let s = format!("{:0width$}", x, width = self.precision);
+
         match self.alignment {
-            NumberAlignment::Left => write!(writer, "{x:<width$}", width = self.width),
-            NumberAlignment::RightSpace => write!(writer, "{x:>width$}", width = self.width),
-            NumberAlignment::RightZero => write!(writer, "{x:0>width$}", width = self.width),
+            NumberAlignment::Left => write!(writer, "{s:<width$}", width = self.width),
+            NumberAlignment::RightSpace => write!(writer, "{s:>width$}", width = self.width),
+            NumberAlignment::RightZero => write!(writer, "{s:0>width$}", width = self.width),
         }
     }
 
     fn try_from_spec(s: Spec) -> Result<Self, FormatError> {
         let Spec::SignedInt {
             width,
+            precision,
             positive_sign,
             alignment,
         } = s
@@ -102,8 +106,15 @@ impl Formatter for SignedInt {
             Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
         };
 
+        let precision = match precision {
+            Some(CanAsterisk::Fixed(x)) => x,
+            None => 0,
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+        };
+
         Ok(Self {
             width,
+            precision,
             positive_sign,
             alignment,
         })
@@ -113,6 +124,7 @@ impl Formatter for SignedInt {
 pub struct UnsignedInt {
     pub variant: UnsignedIntVariant,
     pub width: usize,
+    pub precision: usize,
     pub alignment: NumberAlignment,
 }
 
@@ -120,7 +132,7 @@ impl Formatter for UnsignedInt {
     type Input = u64;
 
     fn fmt(&self, mut writer: impl Write, x: Self::Input) -> std::io::Result<()> {
-        let s = match self.variant {
+        let mut s = match self.variant {
             UnsignedIntVariant::Decimal => format!("{x}"),
             UnsignedIntVariant::Octal(Prefix::No) => format!("{x:o}"),
             UnsignedIntVariant::Octal(Prefix::Yes) => format!("{x:#o}"),
@@ -138,6 +150,10 @@ impl Formatter for UnsignedInt {
             }
         };
 
+        if self.precision > s.len() {
+            s = format!("{:0width$}", s, width = self.precision)
+        }
+
         match self.alignment {
             NumberAlignment::Left => write!(writer, "{s:<width$}", width = self.width),
             NumberAlignment::RightSpace => write!(writer, "{s:>width$}", width = self.width),
@@ -149,6 +165,7 @@ impl Formatter for UnsignedInt {
         let Spec::UnsignedInt {
             variant,
             width,
+            precision,
             alignment,
         } = s
         else {
@@ -161,8 +178,15 @@ impl Formatter for UnsignedInt {
             Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
         };
 
+        let precision = match precision {
+            Some(CanAsterisk::Fixed(x)) => x,
+            None => 0,
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+        };
+
         Ok(Self {
             width,
+            precision,
             variant,
             alignment,
         })
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index 0f48cdafe9f..06f0ca1d6e7 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -22,12 +22,14 @@ pub enum Spec {
     },
     SignedInt {
         width: Option<CanAsterisk<usize>>,
+        precision: Option<CanAsterisk<usize>>,
         positive_sign: PositiveSign,
         alignment: NumberAlignment,
     },
     UnsignedInt {
         variant: UnsignedIntVariant,
         width: Option<CanAsterisk<usize>>,
+        precision: Option<CanAsterisk<usize>>,
         alignment: NumberAlignment,
     },
     Float {
@@ -167,6 +169,7 @@ impl Spec {
             },
             b'd' | b'i' => Spec::SignedInt {
                 width,
+                precision,
                 alignment: match (minus, zero) {
                     (true, _) => NumberAlignment::Left,
                     (false, true) => NumberAlignment::RightZero,
@@ -197,6 +200,7 @@ impl Spec {
                 };
                 Spec::UnsignedInt {
                     variant,
+                    precision,
                     width,
                     alignment,
                 }
@@ -282,10 +286,12 @@ impl Spec {
             }
             &Spec::SignedInt {
                 width,
+                precision,
                 positive_sign,
                 alignment,
             } => {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
+                let precision = resolve_asterisk(precision, &mut args)?.unwrap_or(0);
 
                 let arg = next_arg(&mut args)?;
                 let Some(i) = arg.get_i64() else {
@@ -294,6 +300,7 @@ impl Spec {
 
                 num_format::SignedInt {
                     width,
+                    precision,
                     positive_sign,
                     alignment,
                 }
@@ -303,9 +310,11 @@ impl Spec {
             &Spec::UnsignedInt {
                 variant,
                 width,
+                precision,
                 alignment,
             } => {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
+                let precision = resolve_asterisk(precision, &mut args)?.unwrap_or(0);
 
                 let arg = next_arg(args)?;
                 let Some(i) = arg.get_u64() else {
@@ -314,6 +323,7 @@ impl Spec {
 
                 num_format::UnsignedInt {
                     variant,
+                    precision,
                     width,
                     alignment,
                 }

From 76eca8d9996cd96751a1ab8a0e7577bff967fd6a Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 17 Nov 2023 14:43:25 +0100
Subject: [PATCH 034/429] uucore/format: fix doctests

---
 src/uucore/src/lib/features/format/mod.rs | 11 ++++++-----
 1 file changed, 6 insertions(+), 5 deletions(-)

diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index 7417d48fad5..47e6fa4cc0b 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -194,9 +194,9 @@ fn parse_escape_only(fmt: &[u8]) -> impl Iterator<Item = EscapedChar> + '_ {
 /// # Examples
 ///
 /// ```rust
-/// use uucore::format::printf;
+/// use uucore::format::{printf, FormatArgument};
 ///
-/// printf("hello %s", &[FormatArgument::String("world")]).unwrap();
+/// printf("hello %s", &[FormatArgument::String("world".into())]).unwrap();
 /// // prints "hello world"
 /// ```
 pub fn printf<'a>(
@@ -228,10 +228,11 @@ fn printf_writer<'a>(
 /// # Examples
 ///
 /// ```rust
-/// use uucore::format::sprintf;
+/// use uucore::format::{sprintf, FormatArgument};
 ///
-/// let s = sprintf("hello %s", &["world".to_string()]).unwrap();
-/// assert_eq!(s, "hello world".to_string());
+/// let s = sprintf("hello %s", &[FormatArgument::String("world".into())]).unwrap();
+/// let s = std::str::from_utf8(&s).unwrap();
+/// assert_eq!(s, "hello world");
 /// ```
 pub fn sprintf<'a>(
     format_string: impl AsRef<[u8]>,

From 4aafb3f88ba2e3113df29ab264fe507ab78fdfb1 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 17 Nov 2023 14:46:00 +0100
Subject: [PATCH 035/429] printf: exit correctly on \c

---
 src/uu/printf/src/printf.rs | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/uu/printf/src/printf.rs b/src/uu/printf/src/printf.rs
index 00d03816e4c..663411b8952 100644
--- a/src/uu/printf/src/printf.rs
+++ b/src/uu/printf/src/printf.rs
@@ -43,7 +43,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     for item in parse_spec_and_escape(format_string.as_ref()) {
         match item?.write(stdout(), &mut args)? {
             ControlFlow::Continue(()) => {}
-            ControlFlow::Break(()) => break,
+            ControlFlow::Break(()) => return Ok(()),
         };
     }
 
@@ -51,7 +51,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         for item in parse_spec_and_escape(format_string.as_ref()) {
             match item?.write(stdout(), &mut args)? {
                 ControlFlow::Continue(()) => {}
-                ControlFlow::Break(()) => break,
+                ControlFlow::Break(()) => return Ok(()),
             };
         }
     }

From 955640aac8a9b1b40932bf6f282ea48ce30398b8 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 17 Nov 2023 14:46:38 +0100
Subject: [PATCH 036/429] printf: fix and test float formatting

---
 .../src/lib/features/format/num_format.rs     | 205 +++++++++++++++++-
 tests/by-util/test_printf.rs                  |   2 +-
 2 files changed, 198 insertions(+), 9 deletions(-)

diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index fab81c456fc..49edecce085 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -329,8 +329,24 @@ fn format_float_scientific(
         return format_float_nonfinite(f, case);
     }
 
-    let exponent: i32 = f.log10().floor() as i32;
-    let normalized = f / 10.0_f64.powi(exponent);
+    if f == 0.0 {
+        return if force_decimal == ForceDecimal::Yes && precision == 0 {
+            "0.e+00".into()
+        } else {
+            format!("{:.*}e+00", precision, 0.0)
+        };
+    }
+
+    
+    let mut exponent: i32 = f.log10().floor() as i32;
+    let mut normalized = f / 10.0_f64.powi(exponent);
+
+    // If the normalized value will be rounded to a value greater than 10
+    // we need to correct.
+    if (normalized * 10_f64.powi(precision as i32)).round() / 10_f64.powi(precision as i32)  >= 10.0 {
+        normalized /= 10.0;
+        exponent += 1;
+    }
 
     let additional_dot = if precision == 0 && ForceDecimal::Yes == force_decimal {
         "."
@@ -349,20 +365,89 @@ fn format_float_scientific(
     )
 }
 
-// TODO: This could be optimized. It's not terribly important though.
 fn format_float_shortest(
     f: f64,
     precision: usize,
     case: Case,
     force_decimal: ForceDecimal,
 ) -> String {
-    let a = format_float_decimal(f, precision, case, force_decimal);
-    let b = format_float_scientific(f, precision, case, force_decimal);
+    // If the float is NaN, -Nan, Inf or -Inf, format like any other float
+    if !f.is_finite() {
+        return format_float_nonfinite(f, case);
+    }
 
-    if a.len() > b.len() {
-        b
+    // Precision here is about how many digits should be displayed
+    // instead of how many digits for the fractional part, this means that if
+    // we pass this to rust's format string, it's always gonna be one less.
+    let precision = precision.saturating_sub(1);
+
+    if f == 0.0 {
+        return match (force_decimal, precision) {
+            (ForceDecimal::Yes, 0) => "0.".into(),
+            (ForceDecimal::Yes, _) => {
+                format!("{:.*}", precision, 0.0)
+            }
+            (ForceDecimal::No, _) => "0".into(),
+        };
+    }
+
+    let mut exponent = f.log10().floor() as i32;
+    if f != 0.0 && exponent <= -4 || exponent > precision as i32 {
+        // Scientific-ish notation (with a few differences)
+        let mut normalized = f / 10.0_f64.powi(exponent);
+
+        // If the normalized value will be rounded to a value greater than 10
+        // we need to correct.
+        if (normalized * 10_f64.powi(precision as i32)).round() / 10_f64.powi(precision as i32)  >= 10.0 {
+            normalized /= 10.0;
+            exponent += 1;
+        }
+
+        let additional_dot = if precision == 0 && ForceDecimal::Yes == force_decimal {
+            "."
+        } else {
+            ""
+        };
+
+        let mut normalized = format!("{normalized:.*}", precision);
+
+        if force_decimal == ForceDecimal::No {
+            while normalized.ends_with('0') {
+                normalized.pop();
+            }
+            if normalized.ends_with('.') {
+                normalized.pop();
+            }
+        }
+
+        let exp_char = match case {
+            Case::Lowercase => 'e',
+            Case::Uppercase => 'E',
+        };
+
+        format!("{normalized}{additional_dot}{exp_char}{exponent:+03}")
     } else {
-        a
+        // Decimal-ish notation with a few differences:
+        //  - The precision works differently and specifies the total number
+        //    of digits instead of the digits in the fractional part.
+        //  - If we don't force the decimal, '0' and `.` are trimmed.
+        let decimal_places = (precision as i32).saturating_sub(exponent) as usize;
+        let mut formatted = if decimal_places == 0 && force_decimal == ForceDecimal::Yes {
+            format!("{f:.0}.")
+        } else {
+            format!("{f:.*}", decimal_places)
+        };
+
+        if force_decimal == ForceDecimal::No {
+            while formatted.ends_with('0') {
+                formatted.pop();
+            }
+            if formatted.ends_with('.') {
+                formatted.pop();
+            }
+        }
+
+        formatted
     }
 }
 
@@ -398,3 +483,107 @@ fn format_float_hexadecimal(
 
     return s;
 }
+
+#[cfg(test)]
+mod test {
+    use crate::format::num_format::{Case, ForceDecimal};
+
+    #[test]
+    fn decimal_float() {
+        use super::format_float_decimal;
+        let f = |x| format_float_decimal(x, 6, Case::Lowercase, ForceDecimal::No);
+        assert_eq!(f(0.0), "0.000000");
+        assert_eq!(f(1.0), "1.000000");
+        assert_eq!(f(100.0), "100.000000");
+        assert_eq!(f(123456.789), "123456.789000");
+        assert_eq!(f(12.3456789), "12.345679");
+        assert_eq!(f(1000000.0), "1000000.000000");
+        assert_eq!(f(99999999.0), "99999999.000000");
+        assert_eq!(f(1.9999995), "1.999999");
+        assert_eq!(f(1.9999996), "2.000000");
+    }
+
+    #[test]
+    fn scientific_float() {
+        use super::format_float_scientific;
+        let f = |x| format_float_scientific(x, 6, Case::Lowercase, ForceDecimal::No);
+        assert_eq!(f(0.0), "0.000000e+00");
+        assert_eq!(f(1.0), "1.000000e+00");
+        assert_eq!(f(100.0), "1.000000e+02");
+        assert_eq!(f(123456.789), "1.234568e+05");
+        assert_eq!(f(12.3456789), "1.234568e+01");
+        assert_eq!(f(1000000.0), "1.000000e+06");
+        assert_eq!(f(99999999.0), "1.000000e+08");
+    }
+
+    #[test]
+    fn scientific_float_zero_precision() {
+        use super::format_float_scientific;
+
+        let f = |x| format_float_scientific(x, 0, Case::Lowercase, ForceDecimal::No);
+        assert_eq!(f(0.0), "0e+00");
+        assert_eq!(f(1.0), "1e+00");
+        assert_eq!(f(100.0), "1e+02");
+        assert_eq!(f(123456.789), "1e+05");
+        assert_eq!(f(12.3456789), "1e+01");
+        assert_eq!(f(1000000.0), "1e+06");
+        assert_eq!(f(99999999.0), "1e+08");
+
+        let f = |x| format_float_scientific(x, 0, Case::Lowercase, ForceDecimal::Yes);
+        assert_eq!(f(0.0), "0.e+00");
+        assert_eq!(f(1.0), "1.e+00");
+        assert_eq!(f(100.0), "1.e+02");
+        assert_eq!(f(123456.789), "1.e+05");
+        assert_eq!(f(12.3456789), "1.e+01");
+        assert_eq!(f(1000000.0), "1.e+06");
+        assert_eq!(f(99999999.0), "1.e+08");
+    }
+
+    #[test]
+    fn shortest_float() {
+        use super::format_float_shortest;
+        let f = |x| format_float_shortest(x, 6, Case::Lowercase, ForceDecimal::No);
+        assert_eq!(f(0.0), "0");
+        assert_eq!(f(1.0), "1");
+        assert_eq!(f(100.0), "100");
+        assert_eq!(f(123456.789), "123457");
+        assert_eq!(f(12.3456789), "12.3457");
+        assert_eq!(f(1000000.0), "1e+06");
+        assert_eq!(f(99999999.0), "1e+08");
+    }
+
+    #[test]
+    fn shortest_float_force_decimal() {
+        use super::format_float_shortest;
+        let f = |x| format_float_shortest(x, 6, Case::Lowercase, ForceDecimal::Yes);
+        assert_eq!(f(0.0), "0.00000");
+        assert_eq!(f(1.0), "1.00000");
+        assert_eq!(f(100.0), "100.000");
+        assert_eq!(f(123456.789), "123457.");
+        assert_eq!(f(12.3456789), "12.3457");
+        assert_eq!(f(1000000.0), "1.00000e+06");
+        assert_eq!(f(99999999.0), "1.00000e+08");
+    }
+
+    #[test]
+    fn shortest_float_force_decimal_zero_precision() {
+        use super::format_float_shortest;
+        let f = |x| format_float_shortest(x, 0, Case::Lowercase, ForceDecimal::No);
+        assert_eq!(f(0.0), "0");
+        assert_eq!(f(1.0), "1");
+        assert_eq!(f(100.0), "1e+02");
+        assert_eq!(f(123456.789), "1e+05");
+        assert_eq!(f(12.3456789), "1e+01");
+        assert_eq!(f(1000000.0), "1e+06");
+        assert_eq!(f(99999999.0), "1e+08");
+        
+        let f = |x| format_float_shortest(x, 0, Case::Lowercase, ForceDecimal::Yes);
+        assert_eq!(f(0.0), "0.");
+        assert_eq!(f(1.0), "1.");
+        assert_eq!(f(100.0), "1.e+02");
+        assert_eq!(f(123456.789), "1.e+05");
+        assert_eq!(f(12.3456789), "1.e+01");
+        assert_eq!(f(1000000.0), "1.e+06");
+        assert_eq!(f(99999999.0), "1.e+08");
+    }
+}
diff --git a/tests/by-util/test_printf.rs b/tests/by-util/test_printf.rs
index d7ba5679ecf..5a74aa724e4 100644
--- a/tests/by-util/test_printf.rs
+++ b/tests/by-util/test_printf.rs
@@ -251,7 +251,7 @@ fn sub_num_float_e_no_round() {
 #[test]
 fn sub_num_float_round() {
     new_ucmd!()
-        .args(&["two is %f", "1.9999995"])
+        .args(&["two is %f", "1.9999996"])
         .succeeds()
         .stdout_only("two is 2.000000");
 }

From fef84f72030fdd13065bd6735b1b01a40a36e52f Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 17 Nov 2023 14:47:08 +0100
Subject: [PATCH 037/429] printf: add emoji character test

---
 tests/by-util/test_printf.rs | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/tests/by-util/test_printf.rs b/tests/by-util/test_printf.rs
index 5a74aa724e4..7573b5fb983 100644
--- a/tests/by-util/test_printf.rs
+++ b/tests/by-util/test_printf.rs
@@ -190,6 +190,11 @@ fn sub_num_int_char_const_in() {
         .args(&["ninety seven is %i", "'a"])
         .succeeds()
         .stdout_only("ninety seven is 97");
+
+    new_ucmd!()
+        .args(&["emoji is %i", "'🙃"])
+        .succeeds()
+        .stdout_only("emoji is 128579");
 }
 
 #[test]

From ce18e0ab9702c73d778b6b4bb9218926562c83fa Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 17 Nov 2023 14:47:41 +0100
Subject: [PATCH 038/429] printf: ignore hexadecimal floats test

This can be un-ignored when it is implemented
---
 tests/by-util/test_printf.rs | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/by-util/test_printf.rs b/tests/by-util/test_printf.rs
index 7573b5fb983..436bc498b7c 100644
--- a/tests/by-util/test_printf.rs
+++ b/tests/by-util/test_printf.rs
@@ -376,6 +376,7 @@ fn sub_float_dec_places() {
 }
 
 #[test]
+#[ignore = "hexadecimal floats are unimplemented"]
 fn sub_float_hex_in() {
     new_ucmd!()
         .args(&["%f", "0xF1.1F"])

From 5f2374b33960f42fd1cb575ee4801ef50f342cf8 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 17 Nov 2023 14:57:09 +0100
Subject: [PATCH 039/429] printf: fix negative hex argument parsing

---
 src/uucore/src/lib/features/format/argument.rs | 10 +++++++---
 1 file changed, 7 insertions(+), 3 deletions(-)

diff --git a/src/uucore/src/lib/features/format/argument.rs b/src/uucore/src/lib/features/format/argument.rs
index 644546c38b7..120b59aa4b5 100644
--- a/src/uucore/src/lib/features/format/argument.rs
+++ b/src/uucore/src/lib/features/format/argument.rs
@@ -49,9 +49,13 @@ impl FormatArgument {
         match self {
             Self::SignedInt(n) => Some(*n),
             Self::Unparsed(s) => {
-                if let Some(s) = s.strip_prefix("0x") {
-                    i64::from_str_radix(s, 16).ok()
-                } else if let Some(s) = s.strip_prefix("0") {
+                // For hex, we parse `u64` because we do not allow another
+                // minus sign. We might need to do more precise parsing here.
+                if let Some(s) = s.strip_prefix("-0x") {
+                    Some(- (u64::from_str_radix(s, 16).ok()? as i64))
+                } else if let Some(s) = s.strip_prefix("0x") {
+                    Some(u64::from_str_radix(s, 16).ok()? as i64)
+                } else if s.starts_with("-0") || s.starts_with('0') {
                     i64::from_str_radix(s, 8).ok()
                 } else if let Some(s) = s.strip_prefix('\'') {
                     Some(s.chars().next()? as i64)

From eb00c195c6c9e014c89d53b7d0e6feade507da8d Mon Sep 17 00:00:00 2001
From: Yury Zhytkou <54360928+zhitkoff@users.noreply.github.com>
Date: Fri, 17 Nov 2023 11:19:10 -0500
Subject: [PATCH 040/429] split: pass GNU tests/b-chunk.sh (#5475)

---------

Co-authored-by: Terts Diepraam <terts.diepraam@gmail.com>
Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Co-authored-by: Brandon Elam Barker <brandon.barker@gmail.com>
Co-authored-by: Kostiantyn Hryshchuk <statheres@gmail.com>
Co-authored-by: renovate[bot] <29139614+renovate[bot]@users.noreply.github.com>
---
 src/uu/split/src/split.rs   | 669 +++++++++++++++++++-----------------
 tests/by-util/test_split.rs | 130 ++++---
 2 files changed, 435 insertions(+), 364 deletions(-)

diff --git a/src/uu/split/src/split.rs b/src/uu/split/src/split.rs
index 17a783d72f2..592e4eedde9 100644
--- a/src/uu/split/src/split.rs
+++ b/src/uu/split/src/split.rs
@@ -18,11 +18,12 @@ use std::ffi::OsString;
 use std::fmt;
 use std::fs::{metadata, File};
 use std::io;
-use std::io::{stdin, BufRead, BufReader, BufWriter, ErrorKind, Read, Write};
+use std::io::{stdin, BufRead, BufReader, BufWriter, ErrorKind, Read, Seek, SeekFrom, Write};
 use std::path::Path;
 use std::u64;
 use uucore::display::Quotable;
 use uucore::error::{FromIo, UIoError, UResult, USimpleError, UUsageError};
+use uucore::parse_size::parse_size_u64;
 
 use uucore::uio_error;
 use uucore::{format_usage, help_about, help_section, help_usage};
@@ -40,11 +41,20 @@ static OPT_HEX_SUFFIXES_SHORT: &str = "-x";
 static OPT_SUFFIX_LENGTH: &str = "suffix-length";
 static OPT_VERBOSE: &str = "verbose";
 static OPT_SEPARATOR: &str = "separator";
-//The ---io and ---io-blksize parameters are consumed and ignored.
-//The parameter is included to make GNU coreutils tests pass.
-static OPT_IO: &str = "-io";
-static OPT_IO_BLKSIZE: &str = "-io-blksize";
 static OPT_ELIDE_EMPTY_FILES: &str = "elide-empty-files";
+static OPT_IO_BLKSIZE: &str = "-io-blksize";
+// Cap ---io-blksize value
+// For 64bit systems the max value is the same as in GNU
+// and is equivalent of `i32::MAX >> 20 << 20` operation.
+// On 32bit systems however, even though it fits within `u32` and `i32`,
+// it causes rust-lang `library/alloc/src/raw_vec.rs` to panic with 'capacity overflow' error.
+// Could be due to how `std::io::BufReader` handles internal buffers.
+// So we use much smaller value for those
+static OPT_IO_BLKSIZE_MAX: usize = if usize::BITS >= 64 {
+    2_146_435_072
+} else {
+    1_000_000_000
+};
 
 static ARG_INPUT: &str = "input";
 static ARG_PREFIX: &str = "prefix";
@@ -311,7 +321,6 @@ pub fn uu_app() -> Command {
         .arg(
             Arg::new(OPT_NUMERIC_SUFFIXES)
                 .long(OPT_NUMERIC_SUFFIXES)
-                .alias("numeric")
                 .require_equals(true)
                 .num_args(0..=1)
                 .overrides_with_all([
@@ -338,7 +347,6 @@ pub fn uu_app() -> Command {
         .arg(
             Arg::new(OPT_HEX_SUFFIXES)
                 .long(OPT_HEX_SUFFIXES)
-                .alias("hex")
                 .require_equals(true)
                 .num_args(0..=1)
                 .overrides_with_all([
@@ -373,12 +381,6 @@ pub fn uu_app() -> Command {
                 .action(ArgAction::Append)
                 .help("use SEP instead of newline as the record separator; '\\0' (zero) specifies the NUL character"),
         )
-        .arg(
-            Arg::new(OPT_IO)
-                .long("io")
-                .alias(OPT_IO)
-                .hide(true),
-        )
         .arg(
             Arg::new(OPT_IO_BLKSIZE)
                 .long("io-blksize")
@@ -419,6 +421,7 @@ struct Settings {
     /// chunks. If this is `false`, then empty files will not be
     /// created.
     elide_empty_files: bool,
+    io_blksize: Option<usize>,
 }
 
 /// An error when parsing settings from command-line arguments.
@@ -441,6 +444,9 @@ enum SettingsError {
     /// r/K/N
     FilterWithKthChunkNumber,
 
+    /// Invalid IO block size
+    InvalidIOBlockSize(String),
+
     /// The `--filter` option is not supported on Windows.
     #[cfg(windows)]
     NotSupported,
@@ -471,6 +477,7 @@ impl fmt::Display for SettingsError {
             Self::FilterWithKthChunkNumber => {
                 write!(f, "--filter does not process a chunk extracted to stdout")
             }
+            Self::InvalidIOBlockSize(s) => write!(f, "invalid IO block size: {}", s.quote()),
             #[cfg(windows)]
             Self::NotSupported => write!(
                 f,
@@ -499,12 +506,29 @@ impl Settings {
                 match first.as_str() {
                     "\\0" => b'\0',
                     s if s.as_bytes().len() == 1 => s.as_bytes()[0],
-                    s => return Err(SettingsError::MultiCharacterSeparator(s.to_owned())),
+                    s => return Err(SettingsError::MultiCharacterSeparator(s.to_string())),
                 }
             }
             None => b'\n',
         };
 
+        let io_blksize: Option<usize> = if let Some(s) = matches.get_one::<String>(OPT_IO_BLKSIZE) {
+            match parse_size_u64(s) {
+                Ok(n) => {
+                    let n: usize = n
+                        .try_into()
+                        .map_err(|_| SettingsError::InvalidIOBlockSize(s.to_string()))?;
+                    if n > OPT_IO_BLKSIZE_MAX {
+                        return Err(SettingsError::InvalidIOBlockSize(s.to_string()));
+                    }
+                    Some(n)
+                }
+                _ => return Err(SettingsError::InvalidIOBlockSize(s.to_string())),
+            }
+        } else {
+            None
+        };
+
         let result = Self {
             prefix: matches.get_one::<String>(ARG_PREFIX).unwrap().clone(),
             suffix,
@@ -514,6 +538,7 @@ impl Settings {
             verbose: matches.value_source(OPT_VERBOSE) == Some(ValueSource::CommandLine),
             separator,
             elide_empty_files: matches.get_flag(OPT_ELIDE_EMPTY_FILES),
+            io_blksize,
         };
 
         #[cfg(windows)]
@@ -591,6 +616,93 @@ fn custom_write_all<T: Write>(
     }
 }
 
+/// Get the size of the input file in bytes
+/// Used only for subset of `--number=CHUNKS` strategy, as there is a need
+/// to determine input file size upfront in order to know chunk size
+/// to be written into each of N files/chunks:
+/// * N       split into N files based on size of input
+/// * K/N     output Kth of N to stdout
+/// * l/N     split into N files without splitting lines/records
+/// * l/K/N   output Kth of N to stdout without splitting lines/records
+///
+/// For most files the size will be determined by either reading entire file content into a buffer
+/// or by `len()` function of [`std::fs::metadata`].
+///
+/// However, for some files which report filesystem metadata size that does not match
+/// their actual content size, we will need to attempt to find the end of file
+/// with direct `seek()` on [`std::fs::File`].
+///
+/// For STDIN stream - read into a buffer up to a limit
+/// If input stream does not EOF before that - return an error
+/// (i.e. "infinite" input as in `cat /dev/zero | split ...`, `yes | split ...` etc.).
+///
+/// Note: The `buf` might end up with either partial or entire input content.
+fn get_input_size<R>(
+    input: &String,
+    reader: &mut R,
+    buf: &mut Vec<u8>,
+    io_blksize: &Option<usize>,
+) -> std::io::Result<u64>
+where
+    R: BufRead,
+{
+    // Set read limit to io_blksize if specified
+    // Otherwise to OPT_IO_BLKSIZE_MAX
+    let read_limit = io_blksize.unwrap_or(OPT_IO_BLKSIZE_MAX) as u64;
+
+    // Try to read into buffer up to a limit
+    let num_bytes = reader
+        .by_ref()
+        .take(read_limit)
+        .read_to_end(buf)
+        .map(|n| n as u64)?;
+
+    if num_bytes < read_limit {
+        // Finite file or STDIN stream that fits entirely
+        // into a buffer within the limit
+        // Note: files like /dev/null or similar,
+        // empty STDIN stream,
+        // and files with true file size 0
+        // will also fit here
+        Ok(num_bytes)
+    } else if input == "-" {
+        // STDIN stream that did not fit all content into a buffer
+        // Most likely continuous/infinite input stream
+        return Err(io::Error::new(
+            ErrorKind::Other,
+            format!("{}: cannot determine input size", input),
+        ));
+    } else {
+        // Could be that file size is larger than set read limit
+        // Get the file size from filesystem metadata
+        let metadata = metadata(input)?;
+        let metadata_size = metadata.len();
+        if num_bytes <= metadata_size {
+            Ok(metadata_size)
+        } else {
+            // Could be a file from locations like /dev, /sys, /proc or similar
+            // which report filesystem metadata size that does not match
+            // their actual content size
+            // Attempt direct `seek()` for the end of a file
+            let mut tmp_fd = File::open(Path::new(input))?;
+            let end = tmp_fd.seek(SeekFrom::End(0))?;
+            if end > 0 {
+                Ok(end)
+            } else {
+                // Edge case of either "infinite" file (i.e. /dev/zero)
+                // or some other "special" non-standard file type
+                // Give up and return an error
+                // TODO It might be possible to do more here
+                // to address all possible file types and edge cases
+                return Err(io::Error::new(
+                    ErrorKind::Other,
+                    format!("{}: cannot determine file size", input),
+                ));
+            }
+        }
+    }
+}
+
 /// Write a certain number of bytes to one file, then move on to another one.
 ///
 /// This struct maintains an underlying writer representing the
@@ -1018,155 +1130,110 @@ impl<'a> Write for LineBytesChunkWriter<'a> {
     }
 }
 
-/// Split a file into a specific number of chunks by byte.
+/// Split a file or STDIN into a specific number of chunks by byte.
+/// If in Kth chunk of N mode - print the k-th chunk to STDOUT.
 ///
-/// This function always creates one output file for each chunk, even
+/// When file size cannot be evenly divided into the number of chunks of the same size,
+/// the first X chunks are 1 byte longer than the rest,
+/// where X is a modulus reminder of (file size % number of chunks)
+///
+/// In Kth chunk of N mode - writes to stdout the contents of the chunk identified by `kth_chunk`
+///
+/// In N chunks mode - this function always creates one output file for each chunk, even
 /// if there is an error reading or writing one of the chunks or if
-/// the input file is truncated. However, if the `filter` option is
-/// being used, then no files are created.
+/// the input file is truncated. However, if the `--filter` option is
+/// being used, then files will only be created if `$FILE` variable was used
+/// in filter command,
+/// i.e. `split -n 10 --filter='head -c1 > $FILE' in`
 ///
 /// # Errors
 ///
 /// This function returns an error if there is a problem reading from
-/// `reader` or writing to one of the output files.
+/// `reader` or writing to one of the output files or stdout.
+///
+/// # See also
+///
+/// * [`n_chunks_by_line`], which splits its input into a specific number of chunks by line.
 ///
 /// Implements `--number=CHUNKS`
 /// Where CHUNKS
 /// * N
-fn split_into_n_chunks_by_byte<R>(
+/// * K/N
+fn n_chunks_by_byte<R>(
     settings: &Settings,
     reader: &mut R,
     num_chunks: u64,
+    kth_chunk: Option<u64>,
 ) -> UResult<()>
 where
-    R: Read,
+    R: BufRead,
 {
-    // Get the size of the input file in bytes and compute the number
-    // of bytes per chunk.
-    //
+    // Get the size of the input in bytes
+    let initial_buf = &mut Vec::new();
+    let mut num_bytes = get_input_size(&settings.input, reader, initial_buf, &settings.io_blksize)?;
+    let mut reader = initial_buf.chain(reader);
+
+    // If input file is empty and we would not have determined the Kth chunk
+    // in the Kth chunk of N chunk mode, then terminate immediately.
+    // This happens on `split -n 3/10 /dev/null`, for example.
+    if kth_chunk.is_some() && num_bytes == 0 {
+        return Ok(());
+    }
+
     // If the requested number of chunks exceeds the number of bytes
-    // in the file *and* the `elide_empty_files` parameter is enabled,
-    // then behave as if the number of chunks was set to the number of
-    // bytes in the file. This ensures that we don't write empty
-    // files. Otherwise, just write the `num_chunks - num_bytes` empty
-    // files.
-    let metadata = metadata(&settings.input).map_err(|_| {
-        USimpleError::new(1, format!("{}: cannot determine file size", settings.input))
-    })?;
-
-    let num_bytes = metadata.len();
-    let will_have_empty_files = settings.elide_empty_files && num_chunks > num_bytes;
-    let (num_chunks, chunk_size) = if will_have_empty_files {
-        let num_chunks = num_bytes;
-        let chunk_size = 1;
-        (num_chunks, chunk_size)
+    // in the input:
+    // * in Kth chunk of N mode - just write empty byte string to stdout
+    //   NOTE: the `elide_empty_files` parameter is ignored here
+    //   as we do not generate any files
+    //   and instead writing to stdout
+    // * In N chunks mode - if the `elide_empty_files` parameter is enabled,
+    //   then behave as if the number of chunks was set to the number of
+    //   bytes in the file. This ensures that we don't write empty
+    //   files. Otherwise, just write the `num_chunks - num_bytes` empty files.
+    let num_chunks = if kth_chunk.is_none() && settings.elide_empty_files && num_chunks > num_bytes
+    {
+        num_bytes
     } else {
-        let chunk_size = (num_bytes / (num_chunks)).max(1);
-        (num_chunks, chunk_size)
+        num_chunks
     };
 
     // If we would have written zero chunks of output, then terminate
     // immediately. This happens on `split -e -n 3 /dev/null`, for
     // example.
-    if num_chunks == 0 || num_bytes == 0 {
+    if num_chunks == 0 {
         return Ok(());
     }
 
-    let num_chunks: usize = num_chunks
-        .try_into()
-        .map_err(|_| USimpleError::new(1, "Number of chunks too big"))?;
-
-    // This object is responsible for creating the filename for each chunk.
-    let mut filename_iterator = FilenameIterator::new(&settings.prefix, &settings.suffix)?;
-
-    // Create one writer for each chunk. This will create each
-    // of the underlying files (if not in `--filter` mode).
+    // In Kth chunk of N mode - we will write to stdout instead of to a file.
+    let mut stdout_writer = std::io::stdout().lock();
+    // In N chunks mode - we will write to `num_chunks` files
     let mut writers = vec![];
-    for _ in 0..num_chunks {
-        let filename = filename_iterator
-            .next()
-            .ok_or_else(|| USimpleError::new(1, "output file suffixes exhausted"))?;
-        let writer = settings.instantiate_current_writer(filename.as_str())?;
-        writers.push(writer);
-    }
-
-    // Write `chunk_size` bytes from the reader into each writer
-    // except the last.
-    //
-    // The last writer gets all remaining bytes so that if the number
-    // of bytes in the input file was not evenly divisible by
-    // `num_chunks`, we don't leave any bytes behind.
-    for writer in writers.iter_mut().take(num_chunks - 1) {
-        match io::copy(&mut reader.by_ref().take(chunk_size), writer) {
-            Ok(_) => continue,
-            Err(e) if ignorable_io_error(&e, settings) => continue,
-            Err(e) => return Err(uio_error!(e, "input/output error")),
-        };
-    }
-
-    // Write all the remaining bytes to the last chunk.
-    let i = num_chunks - 1;
-    let last_chunk_size = num_bytes - (chunk_size * (num_chunks as u64 - 1));
-    match io::copy(&mut reader.by_ref().take(last_chunk_size), &mut writers[i]) {
-        Ok(_) => Ok(()),
-        Err(e) if ignorable_io_error(&e, settings) => Ok(()),
-        Err(e) => Err(uio_error!(e, "input/output error")),
-    }
-}
 
-/// Print the k-th chunk of a file to stdout, splitting by byte.
-///
-/// This function is like [`split_into_n_chunks_by_byte`], but instead
-/// of writing each chunk to its own file, it only writes to stdout
-/// the contents of the chunk identified by `chunk_number`
-///
-/// # Errors
-///
-/// This function returns an error if there is a problem reading from
-/// `reader` or writing to stdout.
-///
-/// Implements `--number=CHUNKS`
-/// Where CHUNKS
-/// * K/N
-fn kth_chunks_by_byte<R>(
-    settings: &Settings,
-    reader: &mut R,
-    chunk_number: u64,
-    num_chunks: u64,
-) -> UResult<()>
-where
-    R: BufRead,
-{
-    // Get the size of the input file in bytes and compute the number
-    // of bytes per chunk.
-    //
-    // If the requested number of chunks exceeds the number of bytes
-    // in the file - just write empty byte string to stdout
-    // NOTE: the `elide_empty_files` parameter is ignored here
-    // as we do not generate any files
-    // and instead writing to stdout
-    let metadata = metadata(&settings.input).map_err(|_| {
-        USimpleError::new(1, format!("{}: cannot determine file size", settings.input))
-    })?;
-
-    let num_bytes = metadata.len();
-    // If input file is empty and we would have written zero chunks of output,
-    // then terminate immediately.
-    // This happens on `split -e -n 3 /dev/null`, for example.
-    if num_bytes == 0 {
-        return Ok(());
+    // Calculate chunk size base and modulo reminder
+    // to be used in calculating chunk_size later on
+    let chunk_size_base = num_bytes / num_chunks;
+    let chunk_size_reminder = num_bytes % num_chunks;
+
+    // If in N chunks mode
+    // Create one writer for each chunk.
+    // This will create each of the underlying files
+    // or stdin pipes to child shell/command processes if in `--filter` mode
+    if kth_chunk.is_none() {
+        // This object is responsible for creating the filename for each chunk.
+        let mut filename_iterator = FilenameIterator::new(&settings.prefix, &settings.suffix)
+            .map_err(|e| io::Error::new(ErrorKind::Other, format!("{e}")))?;
+        for _ in 0..num_chunks {
+            let filename = filename_iterator
+                .next()
+                .ok_or_else(|| USimpleError::new(1, "output file suffixes exhausted"))?;
+            let writer = settings.instantiate_current_writer(filename.as_str())?;
+            writers.push(writer);
+        }
     }
 
-    // Write to stdout instead of to a file.
-    let stdout = std::io::stdout();
-    let mut writer = stdout.lock();
-
-    let chunk_size = (num_bytes / (num_chunks)).max(1);
-    let mut num_bytes: usize = num_bytes.try_into().unwrap();
-
-    let mut i = 1;
-    loop {
-        let buf: &mut Vec<u8> = &mut vec![];
+    for i in 1_u64..=num_chunks {
+        let chunk_size = chunk_size_base + (chunk_size_reminder > i - 1) as u64;
+        let buf = &mut Vec::new();
         if num_bytes > 0 {
             // Read `chunk_size` bytes from the reader into `buf`
             // except the last.
@@ -1176,15 +1243,17 @@ where
             // `num_chunks`, we don't leave any bytes behind.
             let limit = {
                 if i == num_chunks {
-                    num_bytes.try_into().unwrap()
+                    num_bytes
                 } else {
                     chunk_size
                 }
             };
+
             let n_bytes_read = reader.by_ref().take(limit).read_to_end(buf);
+
             match n_bytes_read {
                 Ok(n_bytes) => {
-                    num_bytes -= n_bytes;
+                    num_bytes -= n_bytes as u64;
                 }
                 Err(error) => {
                     return Err(USimpleError::new(
@@ -1193,11 +1262,20 @@ where
                     ));
                 }
             }
-            if i == chunk_number {
-                writer.write_all(buf)?;
-                break;
+
+            match kth_chunk {
+                Some(chunk_number) => {
+                    if i == chunk_number {
+                        stdout_writer.write_all(buf)?;
+                        break;
+                    }
+                }
+                None => {
+                    let idx = (i - 1) as usize;
+                    let writer = writers.get_mut(idx).unwrap();
+                    writer.write_all(buf)?;
+                }
             }
-            i += 1;
         } else {
             break;
         }
@@ -1205,12 +1283,17 @@ where
     Ok(())
 }
 
-/// Split a file into a specific number of chunks by line.
+/// Split a file or STDIN into a specific number of chunks by line.
+/// If in Kth chunk of N mode - print the k-th chunk to STDOUT.
+///
+/// In Kth chunk of N mode - writes to stdout the contents of the chunk identified by `kth_chunk`
 ///
-/// This function always creates one output file for each chunk, even
+/// In N chunks mode - this function always creates one output file for each chunk, even
 /// if there is an error reading or writing one of the chunks or if
-/// the input file is truncated. However, if the `filter` option is
-/// being used, then no files are created.
+/// the input file is truncated. However, if the `--filter` option is
+/// being used, then files will only be created if `$FILE` variable was used
+/// in filter command,
+/// i.e. `split -n l/10 --filter='head -c1 > $FILE' in`
 ///
 /// # Errors
 ///
@@ -1219,119 +1302,82 @@ where
 ///
 /// # See also
 ///
-/// * [`kth_chunk_by_line`], which splits its input in the same way,
-///   but writes only one specified chunk to stdout.
+/// * [`n_chunks_by_byte`], which splits its input into a specific number of chunks by byte.
 ///
 /// Implements `--number=CHUNKS`
 /// Where CHUNKS
 /// * l/N
-fn split_into_n_chunks_by_line<R>(
+/// * l/K/N
+fn n_chunks_by_line<R>(
     settings: &Settings,
     reader: &mut R,
     num_chunks: u64,
+    kth_chunk: Option<u64>,
 ) -> UResult<()>
 where
     R: BufRead,
 {
-    // Get the size of the input file in bytes and compute the number
+    // Get the size of the input in bytes and compute the number
     // of bytes per chunk.
-    let metadata = metadata(&settings.input).map_err(|_| {
-        USimpleError::new(1, format!("{}: cannot determine file size", settings.input))
-    })?;
-    let num_bytes = metadata.len();
+    let initial_buf = &mut Vec::new();
+    let num_bytes = get_input_size(&settings.input, reader, initial_buf, &settings.io_blksize)?;
+    let reader = initial_buf.chain(reader);
     let chunk_size = (num_bytes / num_chunks) as usize;
 
-    // This object is responsible for creating the filename for each chunk.
-    let mut filename_iterator = FilenameIterator::new(&settings.prefix, &settings.suffix)?;
-
-    // Create one writer for each chunk. This will create each
-    // of the underlying files (if not in `--filter` mode).
-    let mut writers = vec![];
-    for _ in 0..num_chunks {
-        let filename = filename_iterator
-            .next()
-            .ok_or_else(|| USimpleError::new(1, "output file suffixes exhausted"))?;
-        let writer = settings.instantiate_current_writer(filename.as_str())?;
-        writers.push(writer);
+    // If input file is empty and we would not have determined the Kth chunk
+    // in the Kth chunk of N chunk mode, then terminate immediately.
+    // This happens on `split -n l/3/10 /dev/null`, for example.
+    if kth_chunk.is_some() && num_bytes == 0 {
+        return Ok(());
     }
 
-    let mut num_bytes_remaining_in_current_chunk = chunk_size;
-    let mut i = 0;
-    let sep = settings.separator;
-    for line_result in reader.split(sep) {
-        let line = line_result.unwrap();
-        let maybe_writer = writers.get_mut(i);
-        let writer = maybe_writer.unwrap();
-        let bytes = line.as_slice();
-        custom_write_all(bytes, writer, settings)?;
-        custom_write_all(&[sep], writer, settings)?;
+    // In Kth chunk of N mode - we will write to stdout instead of to a file.
+    let mut stdout_writer = std::io::stdout().lock();
+    // In N chunks mode - we will write to `num_chunks` files
+    let mut writers = vec![];
 
-        // Add one byte for the separator character.
-        let num_bytes = bytes.len() + 1;
-        if num_bytes > num_bytes_remaining_in_current_chunk {
-            num_bytes_remaining_in_current_chunk = chunk_size;
-            i += 1;
-        } else {
-            num_bytes_remaining_in_current_chunk -= num_bytes;
+    // If in N chunks mode
+    // Create one writer for each chunk.
+    // This will create each of the underlying files
+    // or stdin pipes to child shell/command processes if in `--filter` mode
+    if kth_chunk.is_none() {
+        // This object is responsible for creating the filename for each chunk.
+        let mut filename_iterator = FilenameIterator::new(&settings.prefix, &settings.suffix)
+            .map_err(|e| io::Error::new(ErrorKind::Other, format!("{e}")))?;
+        for _ in 0..num_chunks {
+            let filename = filename_iterator
+                .next()
+                .ok_or_else(|| USimpleError::new(1, "output file suffixes exhausted"))?;
+            let writer = settings.instantiate_current_writer(filename.as_str())?;
+            writers.push(writer);
         }
     }
 
-    Ok(())
-}
-
-/// Print the k-th chunk of a file, splitting by line.
-///
-/// This function is like [`split_into_n_chunks_by_line`], but instead
-/// of writing each chunk to its own file, it only writes to stdout
-/// the contents of the chunk identified by `chunk_number`.
-///
-/// # Errors
-///
-/// This function returns an error if there is a problem reading from
-/// `reader` or writing to one of the output files.
-///
-/// # See also
-///
-/// * [`split_into_n_chunks_by_line`], which splits its input in the
-///   same way, but writes each chunk to its own file.
-///
-/// Implements `--number=CHUNKS`
-/// Where CHUNKS
-/// * l/K/N
-fn kth_chunk_by_line<R>(
-    settings: &Settings,
-    reader: &mut R,
-    chunk_number: u64,
-    num_chunks: u64,
-) -> UResult<()>
-where
-    R: BufRead,
-{
-    // Get the size of the input file in bytes and compute the number
-    // of bytes per chunk.
-    let metadata = metadata(&settings.input).map_err(|_| {
-        USimpleError::new(1, format!("{}: cannot determine file size", settings.input))
-    })?;
-    let num_bytes = metadata.len();
-    let chunk_size = (num_bytes / num_chunks) as usize;
-
-    // Write to stdout instead of to a file.
-    let stdout = std::io::stdout();
-    let mut writer = stdout.lock();
-
     let mut num_bytes_remaining_in_current_chunk = chunk_size;
     let mut i = 1;
     let sep = settings.separator;
+
     for line_result in reader.split(sep) {
-        let line = line_result?;
+        // add separator back in at the end of the line
+        let mut line = line_result?;
+        line.push(sep);
         let bytes = line.as_slice();
-        if i == chunk_number {
-            writer.write_all(bytes)?;
-            writer.write_all(&[sep])?;
+
+        match kth_chunk {
+            Some(chunk_number) => {
+                if i == chunk_number {
+                    stdout_writer.write_all(bytes)?;
+                }
+            }
+            None => {
+                let idx = (i - 1) as usize;
+                let maybe_writer = writers.get_mut(idx);
+                let writer = maybe_writer.unwrap();
+                custom_write_all(bytes, writer, settings)?;
+            }
         }
 
-        // Add one byte for the separator character.
-        let num_bytes = bytes.len() + 1;
+        let num_bytes = bytes.len();
         if num_bytes >= num_bytes_remaining_in_current_chunk {
             num_bytes_remaining_in_current_chunk = chunk_size;
             i += 1;
@@ -1339,21 +1385,27 @@ where
             num_bytes_remaining_in_current_chunk -= num_bytes;
         }
 
-        if i > chunk_number {
-            break;
+        if let Some(chunk_number) = kth_chunk {
+            if i > chunk_number {
+                break;
+            }
         }
     }
 
     Ok(())
 }
 
-/// Split a file into a specific number of chunks by line, but
+/// Split a file or STDIN into a specific number of chunks by line, but
 /// assign lines via round-robin
 ///
-/// This function always creates one output file for each chunk, even
+/// In Kth chunk of N mode - writes to stdout the contents of the chunk identified by `kth_chunk`
+///
+/// In N chunks mode - this function always creates one output file for each chunk, even
 /// if there is an error reading or writing one of the chunks or if
-/// the input file is truncated. However, if the `filter` option is
-/// being used, then no files are created.
+/// the input file is truncated. However, if the `--filter` option is
+/// being used, then files will only be created if `$FILE` variable was used
+/// in filter command,
+/// i.e. `split -n r/10 --filter='head -c1 > $FILE' in`
 ///
 /// # Errors
 ///
@@ -1362,50 +1414,73 @@ where
 ///
 /// # See also
 ///
-/// * [`split_into_n_chunks_by_line`], which splits its input in the same way,
-///   but without round robin distribution.
+/// * [`n_chunks_by_line`], which splits its input into a specific number of chunks by line.
 ///
 /// Implements `--number=CHUNKS`
 /// Where CHUNKS
 /// * r/N
-fn split_into_n_chunks_by_line_round_robin<R>(
+/// * r/K/N
+fn n_chunks_by_line_round_robin<R>(
     settings: &Settings,
     reader: &mut R,
     num_chunks: u64,
+    kth_chunk: Option<u64>,
 ) -> UResult<()>
 where
     R: BufRead,
 {
-    // This object is responsible for creating the filename for each chunk.
-    let mut filename_iterator = FilenameIterator::new(&settings.prefix, &settings.suffix)
-        .map_err(|e| io::Error::new(ErrorKind::Other, format!("{e}")))?;
-
-    // Create one writer for each chunk. This will create each
-    // of the underlying files (if not in `--filter` mode).
+    // In Kth chunk of N mode - we will write to stdout instead of to a file.
+    let mut stdout_writer = std::io::stdout().lock();
+    // In N chunks mode - we will write to `num_chunks` files
     let mut writers = vec![];
-    for _ in 0..num_chunks {
-        let filename = filename_iterator
-            .next()
-            .ok_or_else(|| io::Error::new(ErrorKind::Other, "output file suffixes exhausted"))?;
-        let writer = settings.instantiate_current_writer(filename.as_str())?;
-        writers.push(writer);
+
+    // If in N chunks mode
+    // Create one writer for each chunk.
+    // This will create each of the underlying files
+    // or stdin pipes to child shell/command processes if in `--filter` mode
+    if kth_chunk.is_none() {
+        // This object is responsible for creating the filename for each chunk.
+        let mut filename_iterator = FilenameIterator::new(&settings.prefix, &settings.suffix)
+            .map_err(|e| io::Error::new(ErrorKind::Other, format!("{e}")))?;
+        for _ in 0..num_chunks {
+            let filename = filename_iterator
+                .next()
+                .ok_or_else(|| USimpleError::new(1, "output file suffixes exhausted"))?;
+            let writer = settings.instantiate_current_writer(filename.as_str())?;
+            writers.push(writer);
+        }
     }
 
     let num_chunks: usize = num_chunks.try_into().unwrap();
     let sep = settings.separator;
     let mut closed_writers = 0;
     for (i, line_result) in reader.split(sep).enumerate() {
-        let maybe_writer = writers.get_mut(i % num_chunks);
-        let writer = maybe_writer.unwrap();
-        let mut line = line_result.unwrap();
+        // add separator back in at the end of the line
+        let mut line = line_result?;
         line.push(sep);
         let bytes = line.as_slice();
-        let writer_stdin_open = custom_write_all(bytes, writer, settings)?;
-        if !writer_stdin_open {
-            closed_writers += 1;
-            if closed_writers == num_chunks {
-                // all writers are closed - stop reading
-                break;
+
+        match kth_chunk {
+            Some(chunk_number) => {
+                // The `.enumerate()` method returns index `i` starting with 0,
+                // but chunk number is given as a 1-indexed number,
+                // so compare to `chunk_number - 1`
+                if (i % num_chunks) == (chunk_number - 1) as usize {
+                    stdout_writer.write_all(bytes)?;
+                }
+            }
+            None => {
+                let maybe_writer = writers.get_mut(i % num_chunks);
+                let writer = maybe_writer.unwrap();
+
+                let writer_stdin_open = custom_write_all(bytes, writer, settings)?;
+                if !writer_stdin_open {
+                    closed_writers += 1;
+                    if closed_writers == num_chunks {
+                        // all writers are closed - stop reading
+                        break;
+                    }
+                }
             }
         }
     }
@@ -1413,62 +1488,9 @@ where
     Ok(())
 }
 
-/// Print the k-th chunk of a file, splitting by line, but
-/// assign lines via round-robin to the specified number of output
-/// chunks, but output only the *k*th chunk.
-///
-/// This function is like [`kth_chunk_by_line`], as it only writes to stdout and
-/// prints out only *k*th chunk
-/// It is also like [`split_into_n_chunks_by_line_round_robin`], as it is assigning chunks
-/// using round robin distribution
-///
-/// # Errors
-///
-/// This function returns an error if there is a problem reading from
-/// `reader` or writing to one of the output files.
-///
-/// # See also
-///
-/// * [`split_into_n_chunks_by_line_round_robin`], which splits its input in the
-///   same way, but writes each chunk to its own file.
-///
-/// Implements `--number=CHUNKS`
-/// Where CHUNKS
-/// * r/K/N
-fn kth_chunk_by_line_round_robin<R>(
-    settings: &Settings,
-    reader: &mut R,
-    chunk_number: u64,
-    num_chunks: u64,
-) -> UResult<()>
-where
-    R: BufRead,
-{
-    // Write to stdout instead of to a file.
-    let stdout = std::io::stdout();
-    let mut writer = stdout.lock();
-
-    let num_chunks: usize = num_chunks.try_into().unwrap();
-    let chunk_number: usize = chunk_number.try_into().unwrap();
-    let sep = settings.separator;
-    // The chunk number is given as a 1-indexed number, but it
-    // is a little easier to deal with a 0-indexed number
-    // since `.enumerate()` returns index `i` starting with 0
-    let chunk_number = chunk_number - 1;
-    for (i, line_result) in reader.split(sep).enumerate() {
-        let line = line_result?;
-        let bytes = line.as_slice();
-        if (i % num_chunks) == chunk_number {
-            writer.write_all(bytes)?;
-            writer.write_all(&[sep])?;
-        }
-    }
-    Ok(())
-}
-
 #[allow(clippy::cognitive_complexity)]
 fn split(settings: &Settings) -> UResult<()> {
-    let mut reader = BufReader::new(if settings.input == "-" {
+    let r_box = if settings.input == "-" {
         Box::new(stdin()) as Box<dyn Read>
     } else {
         let r = File::open(Path::new(&settings.input)).map_err_context(|| {
@@ -1478,26 +1500,33 @@ fn split(settings: &Settings) -> UResult<()> {
             )
         })?;
         Box::new(r) as Box<dyn Read>
-    });
+    };
+    let mut reader = if let Some(c) = settings.io_blksize {
+        BufReader::with_capacity(c, r_box)
+    } else {
+        BufReader::new(r_box)
+    };
 
     match settings.strategy {
         Strategy::Number(NumberType::Bytes(num_chunks)) => {
-            split_into_n_chunks_by_byte(settings, &mut reader, num_chunks)
+            // split_into_n_chunks_by_byte(settings, &mut reader, num_chunks)
+            n_chunks_by_byte(settings, &mut reader, num_chunks, None)
         }
         Strategy::Number(NumberType::KthBytes(chunk_number, num_chunks)) => {
-            kth_chunks_by_byte(settings, &mut reader, chunk_number, num_chunks)
+            // kth_chunks_by_byte(settings, &mut reader, chunk_number, num_chunks)
+            n_chunks_by_byte(settings, &mut reader, num_chunks, Some(chunk_number))
         }
         Strategy::Number(NumberType::Lines(num_chunks)) => {
-            split_into_n_chunks_by_line(settings, &mut reader, num_chunks)
+            n_chunks_by_line(settings, &mut reader, num_chunks, None)
         }
         Strategy::Number(NumberType::KthLines(chunk_number, num_chunks)) => {
-            kth_chunk_by_line(settings, &mut reader, chunk_number, num_chunks)
+            n_chunks_by_line(settings, &mut reader, num_chunks, Some(chunk_number))
         }
         Strategy::Number(NumberType::RoundRobin(num_chunks)) => {
-            split_into_n_chunks_by_line_round_robin(settings, &mut reader, num_chunks)
+            n_chunks_by_line_round_robin(settings, &mut reader, num_chunks, None)
         }
         Strategy::Number(NumberType::KthRoundRobin(chunk_number, num_chunks)) => {
-            kth_chunk_by_line_round_robin(settings, &mut reader, chunk_number, num_chunks)
+            n_chunks_by_line_round_robin(settings, &mut reader, num_chunks, Some(chunk_number))
         }
         Strategy::Lines(chunk_size) => {
             let mut writer = LineChunkWriter::new(chunk_size, settings)?;
diff --git a/tests/by-util/test_split.rs b/tests/by-util/test_split.rs
index aec6f059441..0ae2af5cb92 100644
--- a/tests/by-util/test_split.rs
+++ b/tests/by-util/test_split.rs
@@ -2,7 +2,7 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
-// spell-checker:ignore xzaaa sixhundredfiftyonebytes ninetyonebytes threebytes asciilowercase fghij klmno pqrst uvwxyz fivelines twohundredfortyonebytes onehundredlines nbbbb dxen ncccc
+// spell-checker:ignore xzaaa sixhundredfiftyonebytes ninetyonebytes threebytes asciilowercase ghijkl mnopq rstuv wxyz fivelines twohundredfortyonebytes onehundredlines nbbbb dxen ncccc
 
 use crate::common::util::{AtPath, TestScenario};
 use rand::{thread_rng, Rng, SeedableRng};
@@ -704,54 +704,41 @@ fn test_split_overflow_bytes_size() {
     assert_eq!(glob.collate(), at.read_bytes(name));
 }
 
-#[test]
-#[cfg(target_pointer_width = "32")]
-fn test_split_chunks_num_chunks_oversized_32() {
-    let scene = TestScenario::new(util_name!());
-    let at = &scene.fixtures;
-    at.touch("file");
-    scene
-        .ucmd()
-        .args(&["--number", "5000000000", "sixhundredfiftyonebytes.txt"])
-        .fails()
-        .code_is(1)
-        .stderr_only("split: Number of chunks too big\n");
-}
-
 #[test]
 fn test_split_stdin_num_chunks() {
-    new_ucmd!()
-        .args(&["--number=1"])
-        .fails()
-        .code_is(1)
-        .stderr_only("split: -: cannot determine file size\n");
+    let (at, mut ucmd) = at_and_ucmd!();
+    ucmd.args(&["--number=1"]).pipe_in("").succeeds();
+    assert_eq!(file_read(&at, "xaa"), "");
+    assert!(!at.plus("xab").exists());
 }
 
 #[test]
 fn test_split_stdin_num_kth_chunk() {
     new_ucmd!()
         .args(&["--number=1/2"])
-        .fails()
-        .code_is(1)
-        .stderr_only("split: -: cannot determine file size\n");
+        .pipe_in("1\n2\n3\n4\n5\n")
+        .succeeds()
+        .stdout_only("1\n2\n3");
 }
 
 #[test]
 fn test_split_stdin_num_line_chunks() {
-    new_ucmd!()
-        .args(&["--number=l/2"])
-        .fails()
-        .code_is(1)
-        .stderr_only("split: -: cannot determine file size\n");
+    let (at, mut ucmd) = at_and_ucmd!();
+    ucmd.args(&["--number=l/2"])
+        .pipe_in("1\n2\n3\n4\n5\n")
+        .succeeds();
+    assert_eq!(file_read(&at, "xaa"), "1\n2\n3\n");
+    assert_eq!(file_read(&at, "xab"), "4\n5\n");
+    assert!(!at.plus("xac").exists());
 }
 
 #[test]
 fn test_split_stdin_num_kth_line_chunk() {
     new_ucmd!()
         .args(&["--number=l/2/5"])
-        .fails()
-        .code_is(1)
-        .stderr_only("split: -: cannot determine file size\n");
+        .pipe_in("1\n2\n3\n4\n5\n")
+        .succeeds()
+        .stdout_only("2\n");
 }
 
 fn file_read(at: &AtPath, filename: &str) -> String {
@@ -912,6 +899,14 @@ fn test_suffixes_exhausted() {
         .stderr_only("split: output file suffixes exhausted\n");
 }
 
+#[test]
+fn test_suffix_length_req() {
+    new_ucmd!()
+        .args(&["-n", "100", "-a", "1", "asciilowercase.txt"])
+        .fails()
+        .stderr_only("split: the suffix length needs to be at least 2\n");
+}
+
 #[test]
 fn test_verbose() {
     new_ucmd!()
@@ -937,11 +932,11 @@ fn test_number_n() {
         s
     };
     ucmd.args(&["-n", "5", "asciilowercase.txt"]).succeeds();
-    assert_eq!(file_read("xaa"), "abcde");
-    assert_eq!(file_read("xab"), "fghij");
-    assert_eq!(file_read("xac"), "klmno");
-    assert_eq!(file_read("xad"), "pqrst");
-    assert_eq!(file_read("xae"), "uvwxyz\n");
+    assert_eq!(file_read("xaa"), "abcdef");
+    assert_eq!(file_read("xab"), "ghijkl");
+    assert_eq!(file_read("xac"), "mnopq");
+    assert_eq!(file_read("xad"), "rstuv");
+    assert_eq!(file_read("xae"), "wxyz\n");
     #[cfg(unix)]
     new_ucmd!()
         .args(&["--number=100", "/dev/null"])
@@ -954,11 +949,11 @@ fn test_number_kth_of_n() {
     new_ucmd!()
         .args(&["--number=3/5", "asciilowercase.txt"])
         .succeeds()
-        .stdout_only("klmno");
+        .stdout_only("mnopq");
     new_ucmd!()
         .args(&["--number=5/5", "asciilowercase.txt"])
         .succeeds()
-        .stdout_only("uvwxyz\n");
+        .stdout_only("wxyz\n");
     new_ucmd!()
         .args(&["-e", "--number=99/100", "asciilowercase.txt"])
         .succeeds()
@@ -1046,11 +1041,11 @@ fn test_split_number_with_io_blksize() {
     };
     ucmd.args(&["-n", "5", "asciilowercase.txt", "---io-blksize", "1024"])
         .succeeds();
-    assert_eq!(file_read("xaa"), "abcde");
-    assert_eq!(file_read("xab"), "fghij");
-    assert_eq!(file_read("xac"), "klmno");
-    assert_eq!(file_read("xad"), "pqrst");
-    assert_eq!(file_read("xae"), "uvwxyz\n");
+    assert_eq!(file_read("xaa"), "abcdef");
+    assert_eq!(file_read("xab"), "ghijkl");
+    assert_eq!(file_read("xac"), "mnopq");
+    assert_eq!(file_read("xad"), "rstuv");
+    assert_eq!(file_read("xae"), "wxyz\n");
 }
 
 #[test]
@@ -1065,6 +1060,32 @@ fn test_split_default_with_io_blksize() {
     assert_eq!(glob.collate(), at.read_bytes(name));
 }
 
+#[test]
+fn test_split_invalid_io_blksize() {
+    new_ucmd!()
+        .args(&["---io-blksize=XYZ", "threebytes.txt"])
+        .fails()
+        .stderr_only("split: invalid IO block size: 'XYZ'\n");
+    new_ucmd!()
+        .args(&["---io-blksize=5000000000", "threebytes.txt"])
+        .fails()
+        .stderr_only("split: invalid IO block size: '5000000000'\n");
+    #[cfg(target_pointer_width = "32")]
+    new_ucmd!()
+        .args(&["---io-blksize=2146435072", "threebytes.txt"])
+        .fails()
+        .stderr_only("split: invalid IO block size: '2146435072'\n");
+}
+
+#[test]
+fn test_split_number_oversized_stdin() {
+    new_ucmd!()
+        .args(&["--number=3", "---io-blksize=600"])
+        .pipe_in_fixture("sixhundredfiftyonebytes.txt")
+        .fails()
+        .stderr_only("split: -: cannot determine input size\n");
+}
+
 #[test]
 fn test_invalid_suffix_length() {
     new_ucmd!()
@@ -1157,6 +1178,18 @@ fn test_elide_dev_null() {
     assert!(!at.plus("xac").exists());
 }
 
+#[test]
+#[cfg(unix)]
+fn test_dev_zero() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    ucmd.args(&["-n", "3", "/dev/zero"])
+        .fails()
+        .stderr_only("split: /dev/zero: cannot determine file size\n");
+    assert!(!at.plus("xaa").exists());
+    assert!(!at.plus("xab").exists());
+    assert!(!at.plus("xac").exists());
+}
+
 #[test]
 fn test_lines() {
     let (at, mut ucmd) = at_and_ucmd!();
@@ -1182,6 +1215,15 @@ fn test_lines_kth() {
         .stdout_only("20\n21\n22\n23\n24\n25\n26\n27\n28\n29\n");
 }
 
+#[test]
+#[cfg(unix)]
+fn test_lines_kth_dev_null() {
+    new_ucmd!()
+        .args(&["-n", "l/3/10", "/dev/null"])
+        .succeeds()
+        .stdout_only("");
+}
+
 #[test]
 fn test_line_bytes() {
     let (at, mut ucmd) = at_and_ucmd!();
@@ -1321,7 +1363,7 @@ fn test_numeric_suffix() {
 }
 
 #[test]
-fn test_numeric_suffix_alias() {
+fn test_numeric_suffix_inferred() {
     let (at, mut ucmd) = at_and_ucmd!();
     ucmd.args(&["-n", "4", "--numeric=9", "threebytes.txt"])
         .succeeds()

From 8e796d3bb679bf7c064baca79b2ee0664b90762e Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sun, 19 Nov 2023 15:10:28 +0100
Subject: [PATCH 041/429] mv: fix issue with -T and dest ending with "/"

---
 src/uu/mv/src/mv.rs      |  2 +-
 tests/by-util/test_mv.rs | 26 ++++++++++++++++++++++++++
 2 files changed, 27 insertions(+), 1 deletion(-)

diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index 036024f9907..f0529af7e6c 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -341,7 +341,7 @@ fn handle_two_paths(source: &Path, target: &Path, opts: &Options) -> UResult<()>
 
     let target_is_dir = target.is_dir();
 
-    if path_ends_with_terminator(target) && !target_is_dir {
+    if path_ends_with_terminator(target) && !target_is_dir && !opts.no_target_dir {
         return Err(MvError::FailedToAccessNotADirectory(target.quote().to_string()).into());
     }
 
diff --git a/tests/by-util/test_mv.rs b/tests/by-util/test_mv.rs
index c54d24ea906..571de769125 100644
--- a/tests/by-util/test_mv.rs
+++ b/tests/by-util/test_mv.rs
@@ -1158,6 +1158,32 @@ fn test_mv_overwrite_dir() {
     assert!(at.dir_exists(dir_b));
 }
 
+#[test]
+fn test_mv_no_target_dir_with_dest_not_existing() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    let dir_a = "a";
+    let dir_b = "b";
+
+    at.mkdir(dir_a);
+    ucmd.arg("-T").arg(dir_a).arg(dir_b).succeeds().no_output();
+
+    assert!(!at.dir_exists(dir_a));
+    assert!(at.dir_exists(dir_b));
+}
+
+#[test]
+fn test_mv_no_target_dir_with_dest_not_existing_and_ending_with_slash() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    let dir_a = "a";
+    let dir_b = "b/";
+
+    at.mkdir(dir_a);
+    ucmd.arg("-T").arg(dir_a).arg(dir_b).succeeds().no_output();
+
+    assert!(!at.dir_exists(dir_a));
+    assert!(at.dir_exists(dir_b));
+}
+
 #[test]
 fn test_mv_overwrite_nonempty_dir() {
     let (at, mut ucmd) = at_and_ucmd!();

From 285e580b6eb9475e5d61645594b7a75c13073eed Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sun, 19 Nov 2023 15:59:38 +0100
Subject: [PATCH 042/429] cp: improve error msg if -r is not specified

---
 src/uu/cp/src/copydir.rs | 2 +-
 tests/by-util/test_cp.rs | 4 +++-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/src/uu/cp/src/copydir.rs b/src/uu/cp/src/copydir.rs
index 763d66c0b03..a903ed2aaff 100644
--- a/src/uu/cp/src/copydir.rs
+++ b/src/uu/cp/src/copydir.rs
@@ -324,7 +324,7 @@ pub(crate) fn copy_directory(
     source_in_command_line: bool,
 ) -> CopyResult<()> {
     if !options.recursive {
-        return Err(format!("omitting directory {}", root.quote()).into());
+        return Err(format!("-r not specified; omitting directory {}", root.quote()).into());
     }
 
     // if no-dereference is enabled and this is a symlink, copy it as a file
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index c8761fab8fb..14b68da3718 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -131,7 +131,9 @@ fn test_cp_directory_not_recursive() {
         .arg(TEST_COPY_TO_FOLDER)
         .arg(TEST_HELLO_WORLD_DEST)
         .fails()
-        .stderr_contains("omitting directory");
+        .stderr_is(format!(
+            "cp: -r not specified; omitting directory '{TEST_COPY_TO_FOLDER}'\n"
+        ));
 }
 
 #[test]

From 58087df02a30bb4c7d6e474dfeee20b9faa51b93 Mon Sep 17 00:00:00 2001
From: clara swanson <69856940+cswn@users.noreply.github.com>
Date: Mon, 20 Nov 2023 10:16:18 +0100
Subject: [PATCH 043/429] stdbuf: remove crash macro (#5549)

* stdbuf: remove crash! macro

* stdbuf: change target_vendor back to apple

* tests/stdbuf: change stderr_only to usage_error in test_stdbuf_invalid_mode_fails

* stdbuf: add exit code to check_option

* stdbuf: remove set_exit_code line from error
---
 src/uu/stdbuf/src/stdbuf.rs  | 29 +++++++++++++++--------------
 tests/by-util/test_stdbuf.rs |  2 +-
 2 files changed, 16 insertions(+), 15 deletions(-)

diff --git a/src/uu/stdbuf/src/stdbuf.rs b/src/uu/stdbuf/src/stdbuf.rs
index 8578282752e..38c4451ca50 100644
--- a/src/uu/stdbuf/src/stdbuf.rs
+++ b/src/uu/stdbuf/src/stdbuf.rs
@@ -7,7 +7,7 @@
 
 use clap::{crate_version, Arg, ArgAction, ArgMatches, Command};
 use std::fs::File;
-use std::io::{self, Write};
+use std::io::Write;
 use std::os::unix::process::ExitStatusExt;
 use std::path::PathBuf;
 use std::process;
@@ -15,7 +15,7 @@ use tempfile::tempdir;
 use tempfile::TempDir;
 use uucore::error::{FromIo, UResult, USimpleError, UUsageError};
 use uucore::parse_size::parse_size_u64;
-use uucore::{crash, format_usage, help_about, help_section, help_usage};
+use uucore::{format_usage, help_about, help_section, help_usage};
 
 const ABOUT: &str = help_about!("stdbuf.md");
 const USAGE: &str = help_usage!("stdbuf.md");
@@ -66,13 +66,13 @@ struct ProgramOptionsError(String);
     target_os = "netbsd",
     target_os = "dragonflybsd"
 ))]
-fn preload_strings() -> (&'static str, &'static str) {
-    ("LD_PRELOAD", "so")
+fn preload_strings() -> UResult<(&'static str, &'static str)> {
+    Ok(("LD_PRELOAD", "so"))
 }
 
 #[cfg(target_vendor = "apple")]
-fn preload_strings() -> (&'static str, &'static str) {
-    ("DYLD_LIBRARY_PATH", "dylib")
+fn preload_strings() -> UResult<(&'static str, &'static str)> {
+    Ok(("DYLD_LIBRARY_PATH", "dylib"))
 }
 
 #[cfg(not(any(
@@ -83,10 +83,11 @@ fn preload_strings() -> (&'static str, &'static str) {
     target_os = "dragonflybsd",
     target_vendor = "apple"
 )))]
-fn preload_strings() -> (&'static str, &'static str) {
-    use uucore::crash;
-
-    crash!(1, "Command not supported for this operating system!")
+fn preload_strings() -> UResult<(&'static str, &'static str)> {
+    Err(USimpleError::new(
+        1,
+        "Command not supported for this operating system!",
+    ))
 }
 
 fn check_option(matches: &ArgMatches, name: &str) -> Result<BufferType, ProgramOptionsError> {
@@ -102,7 +103,7 @@ fn check_option(matches: &ArgMatches, name: &str) -> Result<BufferType, ProgramO
                 }
             }
             x => parse_size_u64(x).map_or_else(
-                |e| crash!(125, "invalid mode {}", e),
+                |e| Err(ProgramOptionsError(format!("invalid mode {e}"))),
                 |m| {
                     Ok(BufferType::Size(m.try_into().map_err(|_| {
                         ProgramOptionsError(format!(
@@ -128,8 +129,8 @@ fn set_command_env(command: &mut process::Command, buffer_name: &str, buffer_typ
     }
 }
 
-fn get_preload_env(tmp_dir: &TempDir) -> io::Result<(String, PathBuf)> {
-    let (preload, extension) = preload_strings();
+fn get_preload_env(tmp_dir: &TempDir) -> UResult<(String, PathBuf)> {
+    let (preload, extension) = preload_strings()?;
     let inject_path = tmp_dir.path().join("libstdbuf").with_extension(extension);
 
     let mut file = File::create(&inject_path)?;
@@ -151,7 +152,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let command_params: Vec<&str> = command_values.map(|s| s.as_ref()).collect();
 
     let tmp_dir = tempdir().unwrap();
-    let (preload_env, libstdbuf) = get_preload_env(&tmp_dir).map_err_context(String::new)?;
+    let (preload_env, libstdbuf) = get_preload_env(&tmp_dir)?;
     command.env(preload_env, libstdbuf);
     set_command_env(&mut command, "_STDBUF_I", &options.stdin);
     set_command_env(&mut command, "_STDBUF_O", &options.stdout);
diff --git a/tests/by-util/test_stdbuf.rs b/tests/by-util/test_stdbuf.rs
index 9a67dad9e37..50de4c54696 100644
--- a/tests/by-util/test_stdbuf.rs
+++ b/tests/by-util/test_stdbuf.rs
@@ -65,7 +65,7 @@ fn test_stdbuf_invalid_mode_fails() {
             .args(&[*option, "1024R", "head"])
             .fails()
             .code_is(125)
-            .stderr_only("stdbuf: invalid mode '1024R': Value too large for defined data type\n");
+            .usage_error("invalid mode '1024R': Value too large for defined data type");
         #[cfg(not(target_pointer_width = "128"))]
         new_ucmd!()
             .args(&[*option, "1Y", "head"])

From c43ee01d1920eeeb98d2cc38f61ef217ef89cf12 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 20 Nov 2023 12:38:26 +0100
Subject: [PATCH 044/429] printf: allow precision in string

---
 src/uucore/src/lib/features/format/spec.rs | 23 ++++++++++++++++++++--
 1 file changed, 21 insertions(+), 2 deletions(-)

diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index 06f0ca1d6e7..0cd0f03b4c3 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -17,6 +17,7 @@ pub enum Spec {
     },
     String {
         width: Option<CanAsterisk<usize>>,
+        precision: Option<CanAsterisk<usize>>,
         parse_escape: bool,
         align_left: bool,
     },
@@ -159,11 +160,13 @@ impl Spec {
             },
             b's' => Spec::String {
                 width,
+                precision,
                 parse_escape: false,
                 align_left: minus,
             },
             b'b' => Spec::String {
                 width,
+                precision,
                 parse_escape: true,
                 align_left: minus,
             },
@@ -254,10 +257,12 @@ impl Spec {
             }
             &Spec::String {
                 width,
+                precision,
                 parse_escape,
                 align_left,
             } => {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
+                let precision = resolve_asterisk(precision, &mut args)?;
                 let arg = next_arg(&mut args)?;
                 let Some(s) = arg.get_str() else {
                     return Err(FormatError::InvalidArgument(arg.clone()));
@@ -273,15 +278,29 @@ impl Spec {
                             }
                         };
                     }
+                    // GNU does do this truncation on a byte level, see for instance:
+                    //     printf "%.1s" 🙃
+                    //     > �
+                    // For now, we let printf panic when we truncate within a code point.
+                    // TODO: We need to not use Rust's formatting for aligning the output,
+                    // so that we can just write bytes to stdout without panicking.
+                    let truncated = match precision {
+                        Some(p) if p < parsed.len() => &parsed[..p],
+                        _ => &parsed,
+                    };
                     write_padded(
                         writer,
-                        std::str::from_utf8(&parsed).expect("TODO: Accept invalid utf8"),
+                        std::str::from_utf8(&truncated).expect("TODO: Accept invalid utf8"),
                         width,
                         false,
                         align_left,
                     )
                 } else {
-                    write_padded(writer, s, width, false, align_left)
+                    let truncated = match precision {
+                        Some(p) if p < s.len() => &s[..p],
+                        _ => s,
+                    };
+                    write_padded(writer, truncated, width, false, align_left)
                 }
             }
             &Spec::SignedInt {

From 066d8ba73d0a08eb47c1fea9e1d446b47fbca1f6 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 20 Nov 2023 13:25:20 +0100
Subject: [PATCH 045/429] printf: coerce missing and invalid arguments to 0

---
 .../src/lib/features/format/argument.rs       | 113 ++++++++++--------
 src/uucore/src/lib/features/format/spec.rs    |  52 ++------
 2 files changed, 75 insertions(+), 90 deletions(-)

diff --git a/src/uucore/src/lib/features/format/argument.rs b/src/uucore/src/lib/features/format/argument.rs
index 120b59aa4b5..96cfeddf3f6 100644
--- a/src/uucore/src/lib/features/format/argument.rs
+++ b/src/uucore/src/lib/features/format/argument.rs
@@ -9,84 +9,103 @@ pub enum FormatArgument {
     Unparsed(String),
 }
 
-impl FormatArgument {
-    pub fn get_char(&self) -> Option<char> {
-        match self {
-            Self::Char(c) => Some(*c),
-            Self::Unparsed(s) => {
+pub trait ArgumentIter<'a>: Iterator<Item = &'a FormatArgument> {
+    fn get_char(&mut self) -> char;
+    fn get_i64(&mut self) -> i64;
+    fn get_u64(&mut self) -> u64;
+    fn get_f64(&mut self) -> f64;
+    fn get_str(&mut self) -> &'a str;
+}
+
+impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
+    fn get_char(&mut self) -> char {
+        let Some(next) = self.next() else {
+            return '\0';
+        };
+        match next {
+            FormatArgument::Char(c) => *c,
+            FormatArgument::Unparsed(s) => {
                 let mut chars = s.chars();
                 let Some(c) = chars.next() else {
-                    return None;
+                    return '\0';
                 };
                 let None = chars.next() else {
-                    return None;
+                    return '\0';
                 };
-                Some(c)
+                c
             }
-            _ => None,
+            _ => '\0',
         }
     }
 
-    pub fn get_u64(&self) -> Option<u64> {
-        match self {
-            Self::UnsignedInt(n) => Some(*n),
-            Self::Unparsed(s) => {
-                if let Some(s) = s.strip_prefix("0x") {
-                    u64::from_str_radix(s, 16).ok()
-                } else if let Some(s) = s.strip_prefix("0") {
-                    u64::from_str_radix(s, 8).ok()
-                } else if let Some(s) = s.strip_prefix('\'') {
-                    Some(s.chars().next()? as u64)
-                } else {
-                    s.parse().ok()
-                }
+    fn get_u64(&mut self) -> u64 {
+        let Some(next) = self.next() else {
+            return 0;
+        };
+        match next {
+            FormatArgument::UnsignedInt(n) => *n,
+            FormatArgument::Unparsed(s) => if let Some(s) = s.strip_prefix("0x") {
+                u64::from_str_radix(s, 16).ok()
+            } else if let Some(s) = s.strip_prefix("0") {
+                u64::from_str_radix(s, 8).ok()
+            } else if let Some(s) = s.strip_prefix('\'') {
+                s.chars().next().map(|c| c as u64)
+            } else {
+                s.parse().ok()
             }
-            _ => None,
+            .unwrap_or(0),
+            _ => 0,
         }
     }
 
-    pub fn get_i64(&self) -> Option<i64> {
-        match self {
-            Self::SignedInt(n) => Some(*n),
-            Self::Unparsed(s) => {
+    fn get_i64(&mut self) -> i64 {
+        let Some(next) = self.next() else {
+            return 0;
+        };
+        match next {
+            FormatArgument::SignedInt(n) => *n,
+            FormatArgument::Unparsed(s) => {
                 // For hex, we parse `u64` because we do not allow another
                 // minus sign. We might need to do more precise parsing here.
                 if let Some(s) = s.strip_prefix("-0x") {
-                    Some(- (u64::from_str_radix(s, 16).ok()? as i64))
+                    u64::from_str_radix(s, 16).ok().map(|x| -(x as i64))
                 } else if let Some(s) = s.strip_prefix("0x") {
-                    Some(u64::from_str_radix(s, 16).ok()? as i64)
+                    u64::from_str_radix(s, 16).ok().map(|x| x as i64)
                 } else if s.starts_with("-0") || s.starts_with('0') {
                     i64::from_str_radix(s, 8).ok()
                 } else if let Some(s) = s.strip_prefix('\'') {
-                    Some(s.chars().next()? as i64)
+                    s.chars().next().map(|x| x as i64)
                 } else {
                     s.parse().ok()
                 }
+                .unwrap_or(0)
             }
-            _ => None,
+            _ => 0,
         }
     }
 
-    pub fn get_f64(&self) -> Option<f64> {
-        match self {
-            Self::Float(n) => Some(*n),
-            Self::Unparsed(s) => {
-                if s.starts_with("0x") || s.starts_with("-0x") {
-                    unimplemented!("Hexadecimal floats are unimplemented!")
-                } else if let Some(s) = s.strip_prefix('\'') {
-                    Some(s.chars().next()? as u64 as f64)
-                } else {
-                    s.parse().ok()
-                }
+    fn get_f64(&mut self) -> f64 {
+        let Some(next) = self.next() else {
+            return 0.0;
+        };
+        match next {
+            FormatArgument::Float(n) => *n,
+            FormatArgument::Unparsed(s) => if s.starts_with("0x") || s.starts_with("-0x") {
+                unimplemented!("Hexadecimal floats are unimplemented!")
+            } else if let Some(s) = s.strip_prefix('\'') {
+                s.chars().next().map(|x| x as u64 as f64)
+            } else {
+                s.parse().ok()
             }
-            _ => None,
+            .unwrap_or(0.0),
+            _ => 0.0,
         }
     }
 
-    pub fn get_str(&self) -> Option<&str> {
-        match self {
-            Self::Unparsed(s) | Self::String(s) => Some(s),
-            _ => None,
+    fn get_str(&mut self) -> &'a str {
+        match self.next() {
+            Some(FormatArgument::Unparsed(s) | FormatArgument::String(s)) => s,
+            _ => "",
         }
     }
 }
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index 0cd0f03b4c3..23c68c06669 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -5,7 +5,7 @@ use super::{
         self, Case, FloatVariant, ForceDecimal, Formatter, NumberAlignment, PositiveSign, Prefix,
         UnsignedIntVariant,
     },
-    parse_escape_only, FormatArgument, FormatChar, FormatError,
+    parse_escape_only, ArgumentIter, FormatChar, FormatError,
 };
 use std::{fmt::Display, io::Write, ops::ControlFlow};
 
@@ -244,16 +244,12 @@ impl Spec {
     pub fn write<'a>(
         &self,
         writer: impl Write,
-        mut args: impl Iterator<Item = &'a FormatArgument>,
+        mut args: impl ArgumentIter<'a>,
     ) -> Result<(), FormatError> {
         match self {
             &Spec::Char { width, align_left } => {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
-                let arg = next_arg(&mut args)?;
-                match arg.get_char() {
-                    Some(c) => write_padded(writer, c, width, false, align_left),
-                    _ => Err(FormatError::InvalidArgument(arg.clone())),
-                }
+                write_padded(writer, args.get_char(), width, false, align_left)
             }
             &Spec::String {
                 width,
@@ -263,10 +259,7 @@ impl Spec {
             } => {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
                 let precision = resolve_asterisk(precision, &mut args)?;
-                let arg = next_arg(&mut args)?;
-                let Some(s) = arg.get_str() else {
-                    return Err(FormatError::InvalidArgument(arg.clone()));
-                };
+                let s = args.get_str();
                 if parse_escape {
                     let mut parsed = Vec::new();
                     for c in parse_escape_only(s.as_bytes()) {
@@ -311,11 +304,7 @@ impl Spec {
             } => {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
                 let precision = resolve_asterisk(precision, &mut args)?.unwrap_or(0);
-
-                let arg = next_arg(&mut args)?;
-                let Some(i) = arg.get_i64() else {
-                    return Err(FormatError::InvalidArgument(arg.clone()));
-                };
+                let i = args.get_i64();
 
                 num_format::SignedInt {
                     width,
@@ -334,11 +323,7 @@ impl Spec {
             } => {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
                 let precision = resolve_asterisk(precision, &mut args)?.unwrap_or(0);
-
-                let arg = next_arg(args)?;
-                let Some(i) = arg.get_u64() else {
-                    return Err(FormatError::InvalidArgument(arg.clone()));
-                };
+                let i = args.get_u64();
 
                 num_format::UnsignedInt {
                     variant,
@@ -360,11 +345,7 @@ impl Spec {
             } => {
                 let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
                 let precision = resolve_asterisk(precision, &mut args)?.unwrap_or(6);
-
-                let arg = next_arg(args)?;
-                let Some(f) = arg.get_f64() else {
-                    return Err(FormatError::InvalidArgument(arg.clone()));
-                };
+                let f = args.get_f64();
 
                 num_format::Float {
                     variant,
@@ -384,30 +365,15 @@ impl Spec {
 
 fn resolve_asterisk<'a>(
     option: Option<CanAsterisk<usize>>,
-    args: impl Iterator<Item = &'a FormatArgument>,
+    mut args: impl ArgumentIter<'a>,
 ) -> Result<Option<usize>, FormatError> {
     Ok(match option {
         None => None,
-        Some(CanAsterisk::Asterisk) => {
-            let arg = next_arg(args)?;
-            match arg.get_u64() {
-                Some(u) => match usize::try_from(u) {
-                    Ok(u) => Some(u),
-                    Err(_) => return Err(FormatError::InvalidArgument(arg.clone())),
-                },
-                _ => return Err(FormatError::InvalidArgument(arg.clone())),
-            }
-        }
+        Some(CanAsterisk::Asterisk) => Some(usize::try_from(args.get_u64()).ok().unwrap_or(0)),
         Some(CanAsterisk::Fixed(w)) => Some(w),
     })
 }
 
-fn next_arg<'a>(
-    mut arguments: impl Iterator<Item = &'a FormatArgument>,
-) -> Result<&'a FormatArgument, FormatError> {
-    arguments.next().ok_or(FormatError::NoMoreArguments)
-}
-
 fn write_padded(
     mut writer: impl Write,
     text: impl Display,

From 68d036c9a299282f77143728063f2c7d52b67c5b Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 20 Nov 2023 13:45:02 +0100
Subject: [PATCH 046/429] printf: basic support for unicode escape sequences

---
 src/uucore/src/lib/features/format/escape.rs | 49 ++++++++++++++------
 src/uucore/src/lib/features/format/mod.rs    | 15 +++---
 2 files changed, 44 insertions(+), 20 deletions(-)

diff --git a/src/uucore/src/lib/features/format/escape.rs b/src/uucore/src/lib/features/format/escape.rs
index b8c21741caf..1e06a8176dd 100644
--- a/src/uucore/src/lib/features/format/escape.rs
+++ b/src/uucore/src/lib/features/format/escape.rs
@@ -1,6 +1,7 @@
 #[derive(Debug)]
 pub enum EscapedChar {
-    Char(u8),
+    Byte(u8),
+    Char(char),
     Backslash(u8),
     End,
 }
@@ -61,6 +62,24 @@ fn parse_code(input: &mut &[u8], base: Base) -> Option<u8> {
     Some(ret)
 }
 
+/// Parse `\uHHHH` and `\UHHHHHHHH`
+// TODO: This should print warnings and possibly halt execution when it fails to parse
+// TODO: If the character cannot be converted to u32, the input should be printed.
+fn parse_unicode(input: &mut &[u8], digits: u8) -> Option<char> {
+    let (c, rest) = input.split_first()?;
+    let mut ret = Base::Hex.to_digit(*c)? as u32;
+    *input = &rest[..];
+
+    for _ in 1..digits {
+        let (c, rest) = input.split_first()?;
+        let n = Base::Hex.to_digit(*c)?;
+        ret = ret.wrapping_mul(Base::Hex as u32).wrapping_add(n as u32);
+        *input = &rest[..];
+    }
+
+    char::from_u32(ret)
+}
+
 pub fn parse_escape_code(rest: &mut &[u8]) -> EscapedChar {
     if let [c, new_rest @ ..] = rest {
         // This is for the \NNN syntax for octal sequences.
@@ -68,33 +87,35 @@ pub fn parse_escape_code(rest: &mut &[u8]) -> EscapedChar {
         // would be the \0NNN syntax.
         if let b'1'..=b'7' = c {
             if let Some(parsed) = parse_code(rest, Base::Oct) {
-                return EscapedChar::Char(parsed);
+                return EscapedChar::Byte(parsed);
             }
         }
 
         *rest = &new_rest[..];
         match c {
-            b'\\' => EscapedChar::Char(b'\\'),
-            b'a' => EscapedChar::Char(b'\x07'),
-            b'b' => EscapedChar::Char(b'\x08'),
+            b'\\' => EscapedChar::Byte(b'\\'),
+            b'a' => EscapedChar::Byte(b'\x07'),
+            b'b' => EscapedChar::Byte(b'\x08'),
             b'c' => return EscapedChar::End,
-            b'e' => EscapedChar::Char(b'\x1b'),
-            b'f' => EscapedChar::Char(b'\x0c'),
-            b'n' => EscapedChar::Char(b'\n'),
-            b'r' => EscapedChar::Char(b'\r'),
-            b't' => EscapedChar::Char(b'\t'),
-            b'v' => EscapedChar::Char(b'\x0b'),
+            b'e' => EscapedChar::Byte(b'\x1b'),
+            b'f' => EscapedChar::Byte(b'\x0c'),
+            b'n' => EscapedChar::Byte(b'\n'),
+            b'r' => EscapedChar::Byte(b'\r'),
+            b't' => EscapedChar::Byte(b'\t'),
+            b'v' => EscapedChar::Byte(b'\x0b'),
             b'x' => {
                 if let Some(c) = parse_code(rest, Base::Hex) {
-                    EscapedChar::Char(c)
+                    EscapedChar::Byte(c)
                 } else {
                     EscapedChar::Backslash(b'x')
                 }
             }
-            b'0' => EscapedChar::Char(parse_code(rest, Base::Oct).unwrap_or(b'\0')),
+            b'0' => EscapedChar::Byte(parse_code(rest, Base::Oct).unwrap_or(b'\0')),
+            b'u' => EscapedChar::Char(parse_unicode(rest, 4).unwrap_or('\0')),
+            b'U' => EscapedChar::Char(parse_unicode(rest, 8).unwrap_or('\0')),
             c => EscapedChar::Backslash(*c),
         }
     } else {
-        EscapedChar::Char(b'\\')
+        EscapedChar::Byte(b'\\')
     }
 }
diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index 47e6fa4cc0b..cfa9a034fd7 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -19,11 +19,12 @@
 
 // spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
 
-mod escape;
 mod argument;
+mod escape;
 pub mod num_format;
 mod spec;
 
+pub use argument::*;
 use spec::Spec;
 use std::{
     error::Error,
@@ -31,7 +32,6 @@ use std::{
     io::{stdout, Write},
     ops::ControlFlow,
 };
-pub use argument::*;
 
 use crate::error::UError;
 
@@ -91,9 +91,12 @@ impl FormatChar for u8 {
 impl FormatChar for EscapedChar {
     fn write(&self, mut writer: impl Write) -> std::io::Result<ControlFlow<()>> {
         match self {
-            EscapedChar::Char(c) => {
+            EscapedChar::Byte(c) => {
                 writer.write(&[*c])?;
             }
+            EscapedChar::Char(c) => {
+                write!(writer, "{c}")?;
+            }
             EscapedChar::Backslash(c) => {
                 writer.write(&[b'\\', *c])?;
             }
@@ -125,7 +128,7 @@ pub fn parse_spec_and_escape(
         [] => return None,
         [b'%', b'%', rest @ ..] => {
             current = rest;
-            Some(Ok(FormatItem::Char(EscapedChar::Char(b'%'))))
+            Some(Ok(FormatItem::Char(EscapedChar::Byte(b'%'))))
         }
         [b'%', rest @ ..] => {
             current = rest;
@@ -141,7 +144,7 @@ pub fn parse_spec_and_escape(
         }
         [c, rest @ ..] => {
             current = rest;
-            Some(Ok(FormatItem::Char(EscapedChar::Char(*c))))
+            Some(Ok(FormatItem::Char(EscapedChar::Byte(*c))))
         }
     })
 }
@@ -179,7 +182,7 @@ fn parse_escape_only(fmt: &[u8]) -> impl Iterator<Item = EscapedChar> + '_ {
         }
         [c, rest @ ..] => {
             current = rest;
-            Some(EscapedChar::Char(*c))
+            Some(EscapedChar::Byte(*c))
         }
     })
 }

From 90b61a8c5cb5768f93ef935cb6ee4c6d328ab128 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 20 Nov 2023 22:17:57 +0100
Subject: [PATCH 047/429] fuzzing: add a variable to state if we know it fails
 or not

---
 .github/workflows/fuzzing.yml | 30 ++++++++++++++----------------
 1 file changed, 14 insertions(+), 16 deletions(-)

diff --git a/.github/workflows/fuzzing.yml b/.github/workflows/fuzzing.yml
index e7a9cb1e329..cbb0574dee2 100644
--- a/.github/workflows/fuzzing.yml
+++ b/.github/workflows/fuzzing.yml
@@ -37,16 +37,13 @@ jobs:
     strategy:
       matrix:
         test-target:
-          [
-            fuzz_date,
-            fuzz_test,
-            fuzz_expr,
-            fuzz_parse_glob,
-            fuzz_parse_size,
-            fuzz_parse_time,
-            # adding more fuzz tests here.
-            # e.g. fuzz_test_a,
-          ]
+          - { name: fuzz_test, should_pass: true }
+          # https://github.com/uutils/coreutils/issues/5311
+          - { name: fuzz_date, should_pass: false }
+          - { name: fuzz_expr, should_pass: true }
+          - { name: fuzz_parse_glob, should_pass: true }
+          - { name: fuzz_parse_size, should_pass: true }
+          - { name: fuzz_parse_time, should_pass: true }
     steps:
     - uses: actions/checkout@v4
     - uses: dtolnay/rust-toolchain@nightly
@@ -59,16 +56,17 @@ jobs:
     - name: Restore Cached Corpus
       uses: actions/cache/restore@v3
       with:
-        key: corpus-cache-${{ matrix.test-target }}
+        key: corpus-cache-${{ matrix.test-target.name }}
         path: |
-          fuzz/corpus/${{ matrix.test-target }}
-    - name: Run ${{ matrix.test-target }} for XX seconds
+          fuzz/corpus/${{ matrix.test-target.name }}
+    - name: Run ${{ matrix.test-target.name }} for XX seconds
       shell: bash
+      continue-on-error: ${{ !matrix.test-target.name.should_pass }}
       run: |
-        cargo +nightly fuzz run ${{ matrix.test-target }} -- -max_total_time=${{ env.RUN_FOR }} -detect_leaks=0
+        cargo +nightly fuzz run ${{ matrix.test-target.name }} -- -max_total_time=${{ env.RUN_FOR }} -detect_leaks=0
     - name: Save Corpus Cache
       uses: actions/cache/save@v3
       with:
-        key: corpus-cache-${{ matrix.test-target }}
+        key: corpus-cache-${{ matrix.test-target.name }}
         path: |
-          fuzz/corpus/${{ matrix.test-target }}
+          fuzz/corpus/${{ matrix.test-target.name }}

From 5c04283d6ee1a3fc7d4f7f88476809e760933f3c Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 20 Nov 2023 13:54:58 +0100
Subject: [PATCH 048/429] printf: address fmt, clippy, spelling and failing
 test

---
 src/uu/printf/src/printf.rs                   |  17 +-
 src/uu/seq/src/extendedbigdecimal.rs          |   2 +-
 src/uu/seq/src/number.rs                      |  12 +-
 src/uu/seq/src/seq.rs                         |   4 +-
 .../src/lib/features/format/argument.rs       |  65 ++-
 src/uucore/src/lib/features/format/escape.rs  |  29 +-
 src/uucore/src/lib/features/format/mod.rs     |  65 +--
 .../src/lib/features/format/num_format.rs     | 116 +++---
 src/uucore/src/lib/features/format/spec.rs    | 380 ++++++++++--------
 9 files changed, 379 insertions(+), 311 deletions(-)

diff --git a/src/uu/printf/src/printf.rs b/src/uu/printf/src/printf.rs
index 663411b8952..cfb0315cfb0 100644
--- a/src/uu/printf/src/printf.rs
+++ b/src/uu/printf/src/printf.rs
@@ -10,9 +10,9 @@ use std::io::stdout;
 use std::ops::ControlFlow;
 
 use clap::{crate_version, Arg, ArgAction, Command};
-use uucore::error::{UResult, UUsageError};
+use uucore::error::{UError, UResult, UUsageError};
 use uucore::format::{parse_spec_and_escape, FormatArgument};
-use uucore::{format_usage, help_about, help_section, help_usage};
+use uucore::{format_usage, help_about, help_section, help_usage, show};
 
 const VERSION: &str = "version";
 const HELP: &str = "help";
@@ -49,10 +49,15 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     while args.peek().is_some() {
         for item in parse_spec_and_escape(format_string.as_ref()) {
-            match item?.write(stdout(), &mut args)? {
-                ControlFlow::Continue(()) => {}
-                ControlFlow::Break(()) => return Ok(()),
-            };
+            match item {
+                Ok(item) => {
+                    match item.write(stdout(), &mut args)? {
+                        ControlFlow::Continue(()) => {}
+                        ControlFlow::Break(()) => return Ok(()),
+                    };
+                }
+                Err(e) => show!(e),
+            }
         }
     }
     Ok(())
diff --git a/src/uu/seq/src/extendedbigdecimal.rs b/src/uu/seq/src/extendedbigdecimal.rs
index ecd460ceb73..4f9a0415218 100644
--- a/src/uu/seq/src/extendedbigdecimal.rs
+++ b/src/uu/seq/src/extendedbigdecimal.rs
@@ -70,7 +70,7 @@ pub enum ExtendedBigDecimal {
 impl ExtendedBigDecimal {
     #[cfg(test)]
     pub fn zero() -> Self {
-        Self::BigDecimal(1.into())
+        Self::BigDecimal(0.into())
     }
 
     pub fn one() -> Self {
diff --git a/src/uu/seq/src/number.rs b/src/uu/seq/src/number.rs
index 4da1146eff6..182431a9210 100644
--- a/src/uu/seq/src/number.rs
+++ b/src/uu/seq/src/number.rs
@@ -3,12 +3,6 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 // spell-checker:ignore extendedbigdecimal extendedbigint
-//! A type to represent the possible start, increment, and end values for seq.
-//!
-//! The [`Number`] enumeration represents the possible values for the
-//! start, increment, and end values for `seq`. These may be integers,
-//! floating point numbers, negative zero, etc. A [`Number`] can be
-//! parsed from a string by calling [`str::parse`].
 use num_traits::Zero;
 
 use crate::extendedbigdecimal::ExtendedBigDecimal;
@@ -29,7 +23,11 @@ pub struct PreciseNumber {
 }
 
 impl PreciseNumber {
-    pub fn new(number: ExtendedBigDecimal, num_integral_digits: usize, num_fractional_digits: usize) -> Self {
+    pub fn new(
+        number: ExtendedBigDecimal,
+        num_integral_digits: usize,
+        num_fractional_digits: usize,
+    ) -> Self {
         Self {
             number,
             num_integral_digits,
diff --git a/src/uu/seq/src/seq.rs b/src/uu/seq/src/seq.rs
index a987405ce15..05338864545 100644
--- a/src/uu/seq/src/seq.rs
+++ b/src/uu/seq/src/seq.rs
@@ -122,7 +122,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         &options.terminator,
         options.equal_width,
         padding,
-        format,
+        &format,
     );
     match result {
         Ok(_) => Ok(()),
@@ -203,7 +203,7 @@ fn print_seq(
     terminator: &str,
     pad: bool,
     padding: usize,
-    format: Option<Format<num_format::Float>>,
+    format: &Option<Format<num_format::Float>>,
 ) -> std::io::Result<()> {
     let stdout = stdout();
     let mut stdout = stdout.lock();
diff --git a/src/uucore/src/lib/features/format/argument.rs b/src/uucore/src/lib/features/format/argument.rs
index 96cfeddf3f6..6370c4177e8 100644
--- a/src/uucore/src/lib/features/format/argument.rs
+++ b/src/uucore/src/lib/features/format/argument.rs
@@ -1,3 +1,7 @@
+use os_display::Quotable;
+
+use crate::{error::set_exit_code, show_warning};
+
 #[derive(Clone, Debug)]
 pub enum FormatArgument {
     Char(char),
@@ -44,16 +48,25 @@ impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
         };
         match next {
             FormatArgument::UnsignedInt(n) => *n,
-            FormatArgument::Unparsed(s) => if let Some(s) = s.strip_prefix("0x") {
-                u64::from_str_radix(s, 16).ok()
-            } else if let Some(s) = s.strip_prefix("0") {
-                u64::from_str_radix(s, 8).ok()
-            } else if let Some(s) = s.strip_prefix('\'') {
-                s.chars().next().map(|c| c as u64)
-            } else {
-                s.parse().ok()
+            FormatArgument::Unparsed(s) => {
+                let opt = if let Some(s) = s.strip_prefix("0x") {
+                    u64::from_str_radix(s, 16).ok()
+                } else if let Some(s) = s.strip_prefix('0') {
+                    u64::from_str_radix(s, 8).ok()
+                } else if let Some(s) = s.strip_prefix('\'') {
+                    s.chars().next().map(|c| c as u64)
+                } else {
+                    s.parse().ok()
+                };
+                match opt {
+                    Some(n) => n,
+                    None => {
+                        show_warning!("{}: expected a numeric value", s.quote());
+                        set_exit_code(1);
+                        0
+                    }
+                }
             }
-            .unwrap_or(0),
             _ => 0,
         }
     }
@@ -67,7 +80,7 @@ impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
             FormatArgument::Unparsed(s) => {
                 // For hex, we parse `u64` because we do not allow another
                 // minus sign. We might need to do more precise parsing here.
-                if let Some(s) = s.strip_prefix("-0x") {
+                let opt = if let Some(s) = s.strip_prefix("-0x") {
                     u64::from_str_radix(s, 16).ok().map(|x| -(x as i64))
                 } else if let Some(s) = s.strip_prefix("0x") {
                     u64::from_str_radix(s, 16).ok().map(|x| x as i64)
@@ -77,8 +90,15 @@ impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
                     s.chars().next().map(|x| x as i64)
                 } else {
                     s.parse().ok()
+                };
+                match opt {
+                    Some(n) => n,
+                    None => {
+                        show_warning!("{}: expected a numeric value", s.quote());
+                        set_exit_code(1);
+                        0
+                    }
                 }
-                .unwrap_or(0)
             }
             _ => 0,
         }
@@ -90,14 +110,23 @@ impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
         };
         match next {
             FormatArgument::Float(n) => *n,
-            FormatArgument::Unparsed(s) => if s.starts_with("0x") || s.starts_with("-0x") {
-                unimplemented!("Hexadecimal floats are unimplemented!")
-            } else if let Some(s) = s.strip_prefix('\'') {
-                s.chars().next().map(|x| x as u64 as f64)
-            } else {
-                s.parse().ok()
+            FormatArgument::Unparsed(s) => {
+                let opt = if s.starts_with("0x") || s.starts_with("-0x") {
+                    unimplemented!("Hexadecimal floats are unimplemented!")
+                } else if let Some(s) = s.strip_prefix('\'') {
+                    s.chars().next().map(|x| x as u64 as f64)
+                } else {
+                    s.parse().ok()
+                };
+                match opt {
+                    Some(n) => n,
+                    None => {
+                        show_warning!("{}: expected a numeric value", s.quote());
+                        set_exit_code(1);
+                        0.0
+                    }
+                }
             }
-            .unwrap_or(0.0),
             _ => 0.0,
         }
     }
diff --git a/src/uucore/src/lib/features/format/escape.rs b/src/uucore/src/lib/features/format/escape.rs
index 1e06a8176dd..188dd1892b5 100644
--- a/src/uucore/src/lib/features/format/escape.rs
+++ b/src/uucore/src/lib/features/format/escape.rs
@@ -21,16 +21,16 @@ impl Base {
         }
     }
 
-    fn to_digit(&self, c: u8) -> Option<u8> {
+    fn convert_digit(&self, c: u8) -> Option<u8> {
         match self {
-            Base::Oct => {
+            Self::Oct => {
                 if matches!(c, b'0'..=b'7') {
                     Some(c - b'0')
                 } else {
                     None
                 }
             }
-            Base::Hex => match c {
+            Self::Hex => match c {
                 b'0'..=b'9' => Some(c - b'0'),
                 b'A'..=b'F' => Some(c - b'A' + 10),
                 b'a'..=b'f' => Some(c - b'a' + 10),
@@ -49,32 +49,35 @@ fn parse_code(input: &mut &[u8], base: Base) -> Option<u8> {
     // yield incorrect results because it will interpret values larger than
     // `u8::MAX` as unicode.
     let [c, rest @ ..] = input else { return None };
-    let mut ret = base.to_digit(*c)?;
-    *input = &rest[..];
+    let mut ret = base.convert_digit(*c)?;
+    *input = rest;
 
     for _ in 1..base.max_digits() {
         let [c, rest @ ..] = input else { break };
-        let Some(n) = base.to_digit(*c) else { break };
+        let Some(n) = base.convert_digit(*c) else {
+            break;
+        };
         ret = ret.wrapping_mul(base as u8).wrapping_add(n);
-        *input = &rest[..];
+        *input = rest;
     }
 
     Some(ret)
 }
 
+// spell-checker:disable-next
 /// Parse `\uHHHH` and `\UHHHHHHHH`
 // TODO: This should print warnings and possibly halt execution when it fails to parse
 // TODO: If the character cannot be converted to u32, the input should be printed.
 fn parse_unicode(input: &mut &[u8], digits: u8) -> Option<char> {
     let (c, rest) = input.split_first()?;
-    let mut ret = Base::Hex.to_digit(*c)? as u32;
-    *input = &rest[..];
+    let mut ret = Base::Hex.convert_digit(*c)? as u32;
+    *input = rest;
 
     for _ in 1..digits {
         let (c, rest) = input.split_first()?;
-        let n = Base::Hex.to_digit(*c)?;
+        let n = Base::Hex.convert_digit(*c)?;
         ret = ret.wrapping_mul(Base::Hex as u32).wrapping_add(n as u32);
-        *input = &rest[..];
+        *input = rest;
     }
 
     char::from_u32(ret)
@@ -91,12 +94,12 @@ pub fn parse_escape_code(rest: &mut &[u8]) -> EscapedChar {
             }
         }
 
-        *rest = &new_rest[..];
+        *rest = new_rest;
         match c {
             b'\\' => EscapedChar::Byte(b'\\'),
             b'a' => EscapedChar::Byte(b'\x07'),
             b'b' => EscapedChar::Byte(b'\x08'),
-            b'c' => return EscapedChar::End,
+            b'c' => EscapedChar::End,
             b'e' => EscapedChar::Byte(b'\x1b'),
             b'f' => EscapedChar::Byte(b'\x0c'),
             b'n' => EscapedChar::Byte(b'\n'),
diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index cfa9a034fd7..9045b8b90c3 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -42,10 +42,13 @@ use self::{
 
 #[derive(Debug)]
 pub enum FormatError {
-    SpecError,
+    SpecError(Vec<u8>),
     IoError(std::io::Error),
     NoMoreArguments,
     InvalidArgument(FormatArgument),
+    TooManySpecs,
+    NeedAtLeastOneSpec,
+    WrongSpecType,
 }
 
 impl Error for FormatError {}
@@ -53,18 +56,26 @@ impl UError for FormatError {}
 
 impl From<std::io::Error> for FormatError {
     fn from(value: std::io::Error) -> Self {
-        FormatError::IoError(value)
+        Self::IoError(value)
     }
 }
 
 impl Display for FormatError {
     fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
-        // TODO: Be more precise about these
         match self {
-            FormatError::SpecError => write!(f, "invalid spec"),
-            FormatError::IoError(_) => write!(f, "io error"),
-            FormatError::NoMoreArguments => write!(f, "no more arguments"),
-            FormatError::InvalidArgument(_) => write!(f, "invalid argument"),
+            Self::SpecError(s) => write!(
+                f,
+                "%{}: invalid conversion specification",
+                String::from_utf8_lossy(s)
+            ),
+            // TODO: The next two should print the spec as well
+            Self::TooManySpecs => write!(f, "format has too many % directives"),
+            Self::NeedAtLeastOneSpec => write!(f, "format has no % directive"),
+            // TODO: Error message below needs some work
+            Self::WrongSpecType => write!(f, "wrong % directive type was given"),
+            Self::IoError(_) => write!(f, "io error"),
+            Self::NoMoreArguments => write!(f, "no more arguments"),
+            Self::InvalidArgument(_) => write!(f, "invalid argument"),
         }
     }
 }
@@ -83,7 +94,7 @@ pub trait FormatChar {
 
 impl FormatChar for u8 {
     fn write(&self, mut writer: impl Write) -> std::io::Result<ControlFlow<()>> {
-        writer.write(&[*self])?;
+        writer.write_all(&[*self])?;
         Ok(ControlFlow::Continue(()))
     }
 }
@@ -91,16 +102,16 @@ impl FormatChar for u8 {
 impl FormatChar for EscapedChar {
     fn write(&self, mut writer: impl Write) -> std::io::Result<ControlFlow<()>> {
         match self {
-            EscapedChar::Byte(c) => {
-                writer.write(&[*c])?;
+            Self::Byte(c) => {
+                writer.write_all(&[*c])?;
             }
-            EscapedChar::Char(c) => {
+            Self::Char(c) => {
                 write!(writer, "{c}")?;
             }
-            EscapedChar::Backslash(c) => {
-                writer.write(&[b'\\', *c])?;
+            Self::Backslash(c) => {
+                writer.write_all(&[b'\\', *c])?;
             }
-            EscapedChar::End => return Ok(ControlFlow::Break(())),
+            Self::End => return Ok(ControlFlow::Break(())),
         }
         Ok(ControlFlow::Continue(()))
     }
@@ -113,8 +124,8 @@ impl<C: FormatChar> FormatItem<C> {
         args: &mut impl Iterator<Item = &'a FormatArgument>,
     ) -> Result<ControlFlow<()>, FormatError> {
         match self {
-            FormatItem::Spec(spec) => spec.write(writer, args)?,
-            FormatItem::Char(c) => return c.write(writer).map_err(FormatError::IoError),
+            Self::Spec(spec) => spec.write(writer, args)?,
+            Self::Char(c) => return c.write(writer).map_err(FormatError::IoError),
         };
         Ok(ControlFlow::Continue(()))
     }
@@ -125,7 +136,7 @@ pub fn parse_spec_and_escape(
 ) -> impl Iterator<Item = Result<FormatItem<EscapedChar>, FormatError>> + '_ {
     let mut current = fmt;
     std::iter::from_fn(move || match current {
-        [] => return None,
+        [] => None,
         [b'%', b'%', rest @ ..] => {
             current = rest;
             Some(Ok(FormatItem::Char(EscapedChar::Byte(b'%'))))
@@ -133,8 +144,8 @@ pub fn parse_spec_and_escape(
         [b'%', rest @ ..] => {
             current = rest;
             let spec = match Spec::parse(&mut current) {
-                Some(spec) => spec,
-                None => return Some(Err(FormatError::SpecError)),
+                Ok(spec) => spec,
+                Err(slice) => return Some(Err(FormatError::SpecError(slice.to_vec()))),
             };
             Some(Ok(FormatItem::Spec(spec)))
         }
@@ -152,7 +163,7 @@ pub fn parse_spec_and_escape(
 fn parse_spec_only(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem<u8>, FormatError>> + '_ {
     let mut current = fmt;
     std::iter::from_fn(move || match current {
-        [] => return None,
+        [] => None,
         [b'%', b'%', rest @ ..] => {
             current = rest;
             Some(Ok(FormatItem::Char(b'%')))
@@ -160,8 +171,8 @@ fn parse_spec_only(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem<u8>, Fo
         [b'%', rest @ ..] => {
             current = rest;
             let spec = match Spec::parse(&mut current) {
-                Some(spec) => spec,
-                None => return Some(Err(FormatError::SpecError)),
+                Ok(spec) => spec,
+                Err(slice) => return Some(Err(FormatError::SpecError(slice.to_vec()))),
             };
             Some(Ok(FormatItem::Spec(spec)))
         }
@@ -175,7 +186,7 @@ fn parse_spec_only(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem<u8>, Fo
 fn parse_escape_only(fmt: &[u8]) -> impl Iterator<Item = EscapedChar> + '_ {
     let mut current = fmt;
     std::iter::from_fn(move || match current {
-        [] => return None,
+        [] => None,
         [b'\\', rest @ ..] => {
             current = rest;
             Some(parse_escape_code(&mut current))
@@ -248,8 +259,8 @@ pub fn sprintf<'a>(
 
 /// A parsed format for a single float value
 ///
-/// This is used by `seq`. It can be constructed with [`FloatFormat::parse`]
-/// and can write a value with [`FloatFormat::fmt`].
+/// This is used by `seq`. It can be constructed with [`Format::parse`]
+/// and can write a value with [`Format::fmt`].
 ///
 /// It can only accept a single specification without any asterisk parameters.
 /// If it does get more specifications, it will return an error.
@@ -276,7 +287,7 @@ impl<F: Formatter> Format<F> {
         }
 
         let Some(spec) = spec else {
-            return Err(FormatError::SpecError);
+            return Err(FormatError::NeedAtLeastOneSpec);
         };
 
         let formatter = F::try_from_spec(spec)?;
@@ -285,7 +296,7 @@ impl<F: Formatter> Format<F> {
         for item in &mut iter {
             match item? {
                 FormatItem::Spec(_) => {
-                    return Err(FormatError::SpecError);
+                    return Err(FormatError::TooManySpecs);
                 }
                 FormatItem::Char(c) => suffix.push(c),
             }
diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index 49edecce085..c9a2b8c166f 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -97,19 +97,19 @@ impl Formatter for SignedInt {
             alignment,
         } = s
         else {
-            return Err(FormatError::SpecError);
+            return Err(FormatError::WrongSpecType);
         };
 
         let width = match width {
             Some(CanAsterisk::Fixed(x)) => x,
             None => 0,
-            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::WrongSpecType),
         };
 
         let precision = match precision {
             Some(CanAsterisk::Fixed(x)) => x,
             None => 0,
-            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::WrongSpecType),
         };
 
         Ok(Self {
@@ -151,7 +151,7 @@ impl Formatter for UnsignedInt {
         };
 
         if self.precision > s.len() {
-            s = format!("{:0width$}", s, width = self.precision)
+            s = format!("{:0width$}", s, width = self.precision);
         }
 
         match self.alignment {
@@ -169,19 +169,19 @@ impl Formatter for UnsignedInt {
             alignment,
         } = s
         else {
-            return Err(FormatError::SpecError);
+            return Err(FormatError::WrongSpecType);
         };
 
         let width = match width {
             Some(CanAsterisk::Fixed(x)) => x,
             None => 0,
-            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::WrongSpecType),
         };
 
         let precision = match precision {
             Some(CanAsterisk::Fixed(x)) => x,
             None => 0,
-            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::WrongSpecType),
         };
 
         Ok(Self {
@@ -212,7 +212,7 @@ impl Default for Float {
             width: 0,
             positive_sign: PositiveSign::None,
             alignment: NumberAlignment::Left,
-            precision: 2,
+            precision: 6,
         }
     }
 }
@@ -229,19 +229,23 @@ impl Formatter for Float {
             }?;
         }
 
-        let s = match self.variant {
-            FloatVariant::Decimal => {
-                format_float_decimal(x, self.precision, self.case, self.force_decimal)
-            }
-            FloatVariant::Scientific => {
-                format_float_scientific(x, self.precision, self.case, self.force_decimal)
-            }
-            FloatVariant::Shortest => {
-                format_float_shortest(x, self.precision, self.case, self.force_decimal)
-            }
-            FloatVariant::Hexadecimal => {
-                format_float_hexadecimal(x, self.precision, self.case, self.force_decimal)
+        let s = if x.is_finite() {
+            match self.variant {
+                FloatVariant::Decimal => {
+                    format_float_decimal(x, self.precision, self.force_decimal)
+                }
+                FloatVariant::Scientific => {
+                    format_float_scientific(x, self.precision, self.case, self.force_decimal)
+                }
+                FloatVariant::Shortest => {
+                    format_float_shortest(x, self.precision, self.case, self.force_decimal)
+                }
+                FloatVariant::Hexadecimal => {
+                    format_float_hexadecimal(x, self.precision, self.case, self.force_decimal)
+                }
             }
+        } else {
+            format_float_non_finite(x, self.case)
         };
 
         match self.alignment {
@@ -265,19 +269,19 @@ impl Formatter for Float {
             precision,
         } = s
         else {
-            return Err(FormatError::SpecError);
+            return Err(FormatError::WrongSpecType);
         };
 
         let width = match width {
             Some(CanAsterisk::Fixed(x)) => x,
             None => 0,
-            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::WrongSpecType),
         };
 
         let precision = match precision {
             Some(CanAsterisk::Fixed(x)) => x,
             None => 0,
-            Some(CanAsterisk::Asterisk) => return Err(FormatError::SpecError),
+            Some(CanAsterisk::Asterisk) => return Err(FormatError::WrongSpecType),
         };
 
         Ok(Self {
@@ -292,25 +296,16 @@ impl Formatter for Float {
     }
 }
 
-fn format_float_nonfinite(f: f64, case: Case) -> String {
+fn format_float_non_finite(f: f64, case: Case) -> String {
     debug_assert!(!f.is_finite());
     let mut s = format!("{f}");
     if case == Case::Uppercase {
         s.make_ascii_uppercase();
     }
-    return s;
+    s
 }
 
-fn format_float_decimal(
-    f: f64,
-    precision: usize,
-    case: Case,
-    force_decimal: ForceDecimal,
-) -> String {
-    if !f.is_finite() {
-        return format_float_nonfinite(f, case);
-    }
-
+fn format_float_decimal(f: f64, precision: usize, force_decimal: ForceDecimal) -> String {
     if precision == 0 && force_decimal == ForceDecimal::Yes {
         format!("{f:.0}.")
     } else {
@@ -324,11 +319,6 @@ fn format_float_scientific(
     case: Case,
     force_decimal: ForceDecimal,
 ) -> String {
-    // If the float is NaN, -Nan, Inf or -Inf, format like any other float
-    if !f.is_finite() {
-        return format_float_nonfinite(f, case);
-    }
-
     if f == 0.0 {
         return if force_decimal == ForceDecimal::Yes && precision == 0 {
             "0.e+00".into()
@@ -337,13 +327,13 @@ fn format_float_scientific(
         };
     }
 
-    
     let mut exponent: i32 = f.log10().floor() as i32;
     let mut normalized = f / 10.0_f64.powi(exponent);
 
     // If the normalized value will be rounded to a value greater than 10
     // we need to correct.
-    if (normalized * 10_f64.powi(precision as i32)).round() / 10_f64.powi(precision as i32)  >= 10.0 {
+    if (normalized * 10_f64.powi(precision as i32)).round() / 10_f64.powi(precision as i32) >= 10.0
+    {
         normalized /= 10.0;
         exponent += 1;
     }
@@ -371,11 +361,6 @@ fn format_float_shortest(
     case: Case,
     force_decimal: ForceDecimal,
 ) -> String {
-    // If the float is NaN, -Nan, Inf or -Inf, format like any other float
-    if !f.is_finite() {
-        return format_float_nonfinite(f, case);
-    }
-
     // Precision here is about how many digits should be displayed
     // instead of how many digits for the fractional part, this means that if
     // we pass this to rust's format string, it's always gonna be one less.
@@ -398,7 +383,9 @@ fn format_float_shortest(
 
         // If the normalized value will be rounded to a value greater than 10
         // we need to correct.
-        if (normalized * 10_f64.powi(precision as i32)).round() / 10_f64.powi(precision as i32)  >= 10.0 {
+        if (normalized * 10_f64.powi(precision as i32)).round() / 10_f64.powi(precision as i32)
+            >= 10.0
+        {
             normalized /= 10.0;
             exponent += 1;
         }
@@ -412,12 +399,7 @@ fn format_float_shortest(
         let mut normalized = format!("{normalized:.*}", precision);
 
         if force_decimal == ForceDecimal::No {
-            while normalized.ends_with('0') {
-                normalized.pop();
-            }
-            if normalized.ends_with('.') {
-                normalized.pop();
-            }
+            strip_zeros_and_dot(&mut normalized);
         }
 
         let exp_char = match case {
@@ -439,12 +421,7 @@ fn format_float_shortest(
         };
 
         if force_decimal == ForceDecimal::No {
-            while formatted.ends_with('0') {
-                formatted.pop();
-            }
-            if formatted.ends_with('.') {
-                formatted.pop();
-            }
+            strip_zeros_and_dot(&mut formatted);
         }
 
         formatted
@@ -457,10 +434,6 @@ fn format_float_hexadecimal(
     case: Case,
     force_decimal: ForceDecimal,
 ) -> String {
-    if !f.is_finite() {
-        return format_float_nonfinite(f, case);
-    }
-
     let (first_digit, mantissa, exponent) = if f == 0.0 {
         (0, 0, 0)
     } else {
@@ -481,7 +454,16 @@ fn format_float_hexadecimal(
         s.make_ascii_uppercase();
     }
 
-    return s;
+    s
+}
+
+fn strip_zeros_and_dot(s: &mut String) {
+    while s.ends_with('0') {
+        s.pop();
+    }
+    if s.ends_with('.') {
+        s.pop();
+    }
 }
 
 #[cfg(test)]
@@ -491,7 +473,7 @@ mod test {
     #[test]
     fn decimal_float() {
         use super::format_float_decimal;
-        let f = |x| format_float_decimal(x, 6, Case::Lowercase, ForceDecimal::No);
+        let f = |x| format_float_decimal(x, 6, ForceDecimal::No);
         assert_eq!(f(0.0), "0.000000");
         assert_eq!(f(1.0), "1.000000");
         assert_eq!(f(100.0), "100.000000");
@@ -576,7 +558,7 @@ mod test {
         assert_eq!(f(12.3456789), "1e+01");
         assert_eq!(f(1000000.0), "1e+06");
         assert_eq!(f(99999999.0), "1e+08");
-        
+
         let f = |x| format_float_shortest(x, 0, Case::Lowercase, ForceDecimal::Yes);
         assert_eq!(f(0.0), "0.");
         assert_eq!(f(1.0), "1.");
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index 23c68c06669..e74b6f8660f 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -1,4 +1,6 @@
-// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
+// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety intmax ptrdiff
+
+use crate::quoting_style::{escape_name, QuotingStyle};
 
 use super::{
     num_format::{
@@ -16,11 +18,12 @@ pub enum Spec {
         align_left: bool,
     },
     String {
-        width: Option<CanAsterisk<usize>>,
         precision: Option<CanAsterisk<usize>>,
-        parse_escape: bool,
+        width: Option<CanAsterisk<usize>>,
         align_left: bool,
     },
+    EscapedString,
+    QuotedString,
     SignedInt {
         width: Option<CanAsterisk<usize>>,
         precision: Option<CanAsterisk<usize>>,
@@ -76,12 +79,14 @@ enum Length {
 }
 
 impl Spec {
-    pub fn parse(rest: &mut &[u8]) -> Option<Self> {
+    pub fn parse<'a>(rest: &mut &'a [u8]) -> Result<Self, &'a [u8]> {
         // Based on the C++ reference, the spec format looks like:
         //
         //   %[flags][width][.precision][length]specifier
         //
         // However, we have already parsed the '%'.
+        let mut index = 0;
+        let start = *rest;
 
         let mut minus = false;
         let mut plus = false;
@@ -89,111 +94,101 @@ impl Spec {
         let mut hash = false;
         let mut zero = false;
 
-        while let Some(x @ (b'-' | b'+' | b' ' | b'#' | b'0')) = rest.get(0) {
+        while let Some(x) = rest.get(index) {
             match x {
                 b'-' => minus = true,
                 b'+' => plus = true,
                 b' ' => space = true,
                 b'#' => hash = true,
                 b'0' => zero = true,
-                _ => unreachable!(),
+                _ => break,
             }
-            *rest = &rest[1..]
+            index += 1;
         }
 
-        let width = eat_asterisk_or_number(rest);
+        let alignment = match (minus, zero) {
+            (true, _) => NumberAlignment::Left,
+            (false, true) => NumberAlignment::RightZero,
+            (false, false) => NumberAlignment::RightSpace,
+        };
 
-        let precision = if let Some(b'.') = rest.get(0) {
-            *rest = &rest[1..];
-            Some(eat_asterisk_or_number(rest).unwrap_or(CanAsterisk::Fixed(0)))
+        let positive_sign = match (plus, space) {
+            (true, _) => PositiveSign::Plus,
+            (false, true) => PositiveSign::Space,
+            (false, false) => PositiveSign::None,
+        };
+
+        let width = eat_asterisk_or_number(rest, &mut index);
+
+        let precision = if let Some(b'.') = rest.get(index) {
+            index += 1;
+            Some(eat_asterisk_or_number(rest, &mut index).unwrap_or(CanAsterisk::Fixed(0)))
         } else {
             None
         };
 
-        // Parse 0..N length options, keep the last one
-        // Even though it is just ignored. We might want to use it later and we
-        // should parse those characters.
-        //
-        // TODO: This needs to be configurable: `seq` accepts only one length
-        //       param
-        let mut _length = None;
-        loop {
-            let new_length = rest.get(0).and_then(|c| {
-                Some(match c {
-                    b'h' => {
-                        if let Some(b'h') = rest.get(1) {
-                            *rest = &rest[1..];
-                            Length::Char
-                        } else {
-                            Length::Short
-                        }
-                    }
-                    b'l' => {
-                        if let Some(b'l') = rest.get(1) {
-                            *rest = &rest[1..];
-                            Length::Long
-                        } else {
-                            Length::LongLong
-                        }
-                    }
-                    b'j' => Length::IntMaxT,
-                    b'z' => Length::SizeT,
-                    b't' => Length::PtfDiffT,
-                    b'L' => Length::LongDouble,
-                    _ => return None,
-                })
-            });
-            if new_length.is_some() {
-                *rest = &rest[1..];
-                _length = new_length;
-            } else {
-                break;
-            }
-        }
+        // We ignore the length. It's not really relevant to printf
+        let _ = Self::parse_length(rest, &mut index);
 
-        let type_spec = rest.get(0)?;
-        *rest = &rest[1..];
-        Some(match type_spec {
-            b'c' => Spec::Char {
-                width,
-                align_left: minus,
-            },
-            b's' => Spec::String {
-                width,
-                precision,
-                parse_escape: false,
-                align_left: minus,
-            },
-            b'b' => Spec::String {
-                width,
-                precision,
-                parse_escape: true,
-                align_left: minus,
-            },
-            b'd' | b'i' => Spec::SignedInt {
-                width,
-                precision,
-                alignment: match (minus, zero) {
-                    (true, _) => NumberAlignment::Left,
-                    (false, true) => NumberAlignment::RightZero,
-                    (false, false) => NumberAlignment::RightSpace,
-                },
-                positive_sign: match (plus, space) {
-                    (true, _) => PositiveSign::Plus,
-                    (false, true) => PositiveSign::Space,
-                    (false, false) => PositiveSign::None,
-                },
-            },
+        let Some(type_spec) = rest.get(index) else {
+            return Err(&start[..index]);
+        };
+        index += 1;
+        *rest = &start[index..];
+
+        Ok(match type_spec {
+            // GNU accepts minus, plus and space even though they are not used
+            b'c' => {
+                if hash || precision.is_some() {
+                    return Err(&start[..index]);
+                }
+                Self::Char {
+                    width,
+                    align_left: minus,
+                }
+            }
+            b's' => {
+                if hash {
+                    return Err(&start[..index]);
+                }
+                Self::String {
+                    precision,
+                    width,
+                    align_left: minus,
+                }
+            }
+            b'b' => {
+                if hash || minus || plus || space || width.is_some() || precision.is_some() {
+                    return Err(&start[..index]);
+                }
+                Self::EscapedString
+            }
+            b'q' => {
+                if hash || minus || plus || space || width.is_some() || precision.is_some() {
+                    return Err(&start[..index]);
+                }
+                Self::QuotedString
+            }
+            b'd' | b'i' => {
+                if hash {
+                    return Err(&start[..index]);
+                }
+                Self::SignedInt {
+                    width,
+                    precision,
+                    alignment,
+                    positive_sign,
+                }
+            }
             c @ (b'u' | b'o' | b'x' | b'X') => {
+                // Normal unsigned integer cannot have a prefix
+                if *c == b'u' && hash {
+                    return Err(&start[..index]);
+                }
                 let prefix = match hash {
                     false => Prefix::No,
                     true => Prefix::Yes,
                 };
-                let alignment = match (minus, zero) {
-                    (true, _) => NumberAlignment::Left,
-                    (false, true) => NumberAlignment::RightZero,
-                    (false, false) => NumberAlignment::RightSpace,
-                };
                 let variant = match c {
                     b'u' => UnsignedIntVariant::Decimal,
                     b'o' => UnsignedIntVariant::Octal(prefix),
@@ -201,14 +196,14 @@ impl Spec {
                     b'X' => UnsignedIntVariant::Hexadecimal(Case::Uppercase, prefix),
                     _ => unreachable!(),
                 };
-                Spec::UnsignedInt {
+                Self::UnsignedInt {
                     variant,
                     precision,
                     width,
                     alignment,
                 }
             }
-            c @ (b'f' | b'F' | b'e' | b'E' | b'g' | b'G' | b'a' | b'A') => Spec::Float {
+            c @ (b'f' | b'F' | b'e' | b'E' | b'g' | b'G' | b'a' | b'A') => Self::Float {
                 width,
                 precision,
                 variant: match c {
@@ -226,115 +221,157 @@ impl Spec {
                     false => Case::Lowercase,
                     true => Case::Uppercase,
                 },
-                alignment: match (minus, zero) {
-                    (true, _) => NumberAlignment::Left,
-                    (false, true) => NumberAlignment::RightZero,
-                    (false, false) => NumberAlignment::RightSpace,
-                },
-                positive_sign: match (plus, space) {
-                    (true, _) => PositiveSign::Plus,
-                    (false, true) => PositiveSign::Space,
-                    (false, false) => PositiveSign::None,
-                },
+                alignment,
+                positive_sign,
             },
-            _ => return None,
+            _ => return Err(&start[..index]),
         })
     }
 
+    fn parse_length(rest: &mut &[u8], index: &mut usize) -> Option<Length> {
+        // Parse 0..N length options, keep the last one
+        // Even though it is just ignored. We might want to use it later and we
+        // should parse those characters.
+        //
+        // TODO: This needs to be configurable: `seq` accepts only one length
+        //       param
+        let mut length = None;
+        loop {
+            let new_length = rest.get(*index).and_then(|c| {
+                Some(match c {
+                    b'h' => {
+                        if let Some(b'h') = rest.get(*index + 1) {
+                            *index += 1;
+                            Length::Char
+                        } else {
+                            Length::Short
+                        }
+                    }
+                    b'l' => {
+                        if let Some(b'l') = rest.get(*index + 1) {
+                            *index += 1;
+                            Length::Long
+                        } else {
+                            Length::LongLong
+                        }
+                    }
+                    b'j' => Length::IntMaxT,
+                    b'z' => Length::SizeT,
+                    b't' => Length::PtfDiffT,
+                    b'L' => Length::LongDouble,
+                    _ => return None,
+                })
+            });
+            if new_length.is_some() {
+                *index += 1;
+                length = new_length;
+            } else {
+                break;
+            }
+        }
+        length
+    }
+
     pub fn write<'a>(
         &self,
-        writer: impl Write,
+        mut writer: impl Write,
         mut args: impl ArgumentIter<'a>,
     ) -> Result<(), FormatError> {
         match self {
-            &Spec::Char { width, align_left } => {
-                let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
-                write_padded(writer, args.get_char(), width, false, align_left)
+            Self::Char { width, align_left } => {
+                let width = resolve_asterisk(*width, &mut args)?.unwrap_or(0);
+                write_padded(writer, args.get_char(), width, false, *align_left)
             }
-            &Spec::String {
+            Self::String {
                 width,
-                precision,
-                parse_escape,
                 align_left,
+                precision,
             } => {
-                let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
-                let precision = resolve_asterisk(precision, &mut args)?;
+                let width = resolve_asterisk(*width, &mut args)?.unwrap_or(0);
+
+                // GNU does do this truncation on a byte level, see for instance:
+                //     printf "%.1s" 🙃
+                //     > �
+                // For now, we let printf panic when we truncate within a code point.
+                // TODO: We need to not use Rust's formatting for aligning the output,
+                // so that we can just write bytes to stdout without panicking.
+                let precision = resolve_asterisk(*precision, &mut args)?;
                 let s = args.get_str();
-                if parse_escape {
-                    let mut parsed = Vec::new();
-                    for c in parse_escape_only(s.as_bytes()) {
-                        match c.write(&mut parsed)? {
-                            ControlFlow::Continue(()) => {}
-                            ControlFlow::Break(()) => {
-                                // TODO: This should break the _entire execution_ of printf
-                                break;
-                            }
-                        };
-                    }
-                    // GNU does do this truncation on a byte level, see for instance:
-                    //     printf "%.1s" 🙃
-                    //     > �
-                    // For now, we let printf panic when we truncate within a code point.
-                    // TODO: We need to not use Rust's formatting for aligning the output,
-                    // so that we can just write bytes to stdout without panicking.
-                    let truncated = match precision {
-                        Some(p) if p < parsed.len() => &parsed[..p],
-                        _ => &parsed,
-                    };
-                    write_padded(
-                        writer,
-                        std::str::from_utf8(&truncated).expect("TODO: Accept invalid utf8"),
-                        width,
-                        false,
-                        align_left,
-                    )
-                } else {
-                    let truncated = match precision {
-                        Some(p) if p < s.len() => &s[..p],
-                        _ => s,
+                let truncated = match precision {
+                    Some(p) if p < s.len() => &s[..p],
+                    _ => s,
+                };
+                write_padded(writer, truncated, width, false, *align_left)
+            }
+            Self::EscapedString => {
+                let s = args.get_str();
+                let mut parsed = Vec::new();
+                for c in parse_escape_only(s.as_bytes()) {
+                    match c.write(&mut parsed)? {
+                        ControlFlow::Continue(()) => {}
+                        ControlFlow::Break(()) => {
+                            // TODO: This should break the _entire execution_ of printf
+                            break;
+                        }
                     };
-                    write_padded(writer, truncated, width, false, align_left)
                 }
+                writer.write_all(&parsed).map_err(FormatError::IoError)
+            }
+            Self::QuotedString => {
+                let s = args.get_str();
+                writer
+                    .write_all(
+                        escape_name(
+                            s.as_ref(),
+                            &QuotingStyle::Shell {
+                                escape: true,
+                                always_quote: false,
+                                show_control: false,
+                            },
+                        )
+                        .as_bytes(),
+                    )
+                    .map_err(FormatError::IoError)
             }
-            &Spec::SignedInt {
+            Self::SignedInt {
                 width,
                 precision,
                 positive_sign,
                 alignment,
             } => {
-                let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
-                let precision = resolve_asterisk(precision, &mut args)?.unwrap_or(0);
+                let width = resolve_asterisk(*width, &mut args)?.unwrap_or(0);
+                let precision = resolve_asterisk(*precision, &mut args)?.unwrap_or(0);
                 let i = args.get_i64();
 
                 num_format::SignedInt {
                     width,
                     precision,
-                    positive_sign,
-                    alignment,
+                    positive_sign: *positive_sign,
+                    alignment: *alignment,
                 }
                 .fmt(writer, i)
                 .map_err(FormatError::IoError)
             }
-            &Spec::UnsignedInt {
+            Self::UnsignedInt {
                 variant,
                 width,
                 precision,
                 alignment,
             } => {
-                let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
-                let precision = resolve_asterisk(precision, &mut args)?.unwrap_or(0);
+                let width = resolve_asterisk(*width, &mut args)?.unwrap_or(0);
+                let precision = resolve_asterisk(*precision, &mut args)?.unwrap_or(0);
                 let i = args.get_u64();
 
                 num_format::UnsignedInt {
-                    variant,
+                    variant: *variant,
                     precision,
                     width,
-                    alignment,
+                    alignment: *alignment,
                 }
                 .fmt(writer, i)
                 .map_err(FormatError::IoError)
             }
-            &Spec::Float {
+            Self::Float {
                 variant,
                 case,
                 force_decimal,
@@ -343,18 +380,18 @@ impl Spec {
                 alignment,
                 precision,
             } => {
-                let width = resolve_asterisk(width, &mut args)?.unwrap_or(0);
-                let precision = resolve_asterisk(precision, &mut args)?.unwrap_or(6);
+                let width = resolve_asterisk(*width, &mut args)?.unwrap_or(0);
+                let precision = resolve_asterisk(*precision, &mut args)?.unwrap_or(6);
                 let f = args.get_f64();
 
                 num_format::Float {
-                    variant,
-                    case,
-                    force_decimal,
                     width,
-                    positive_sign,
-                    alignment,
                     precision,
+                    variant: *variant,
+                    case: *case,
+                    force_decimal: *force_decimal,
+                    positive_sign: *positive_sign,
+                    alignment: *alignment,
                 }
                 .fmt(writer, f)
                 .map_err(FormatError::IoError)
@@ -390,23 +427,26 @@ fn write_padded(
     .map_err(FormatError::IoError)
 }
 
-fn eat_asterisk_or_number(rest: &mut &[u8]) -> Option<CanAsterisk<usize>> {
-    if let Some(b'*') = rest.get(0) {
-        *rest = &rest[1..];
+fn eat_asterisk_or_number(rest: &mut &[u8], index: &mut usize) -> Option<CanAsterisk<usize>> {
+    if let Some(b'*') = rest.get(*index) {
+        *index += 1;
         Some(CanAsterisk::Asterisk)
     } else {
-        eat_number(rest).map(CanAsterisk::Fixed)
+        eat_number(rest, index).map(CanAsterisk::Fixed)
     }
 }
 
-fn eat_number(rest: &mut &[u8]) -> Option<usize> {
-    match rest.iter().position(|b| !b.is_ascii_digit()) {
+fn eat_number(rest: &mut &[u8], index: &mut usize) -> Option<usize> {
+    match rest[*index..].iter().position(|b| !b.is_ascii_digit()) {
         None | Some(0) => None,
         Some(i) => {
             // TODO: This might need to handle errors better
             // For example in case of overflow.
-            let parsed = std::str::from_utf8(&rest[..i]).unwrap().parse().unwrap();
-            *rest = &rest[i..];
+            let parsed = std::str::from_utf8(&rest[*index..(*index + i)])
+                .unwrap()
+                .parse()
+                .unwrap();
+            *index += i;
             Some(parsed)
         }
     }

From 131c310bcbd0c437f55ca0b45677b3d66be8c4ce Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 21 Nov 2023 08:49:19 +0100
Subject: [PATCH 049/429] Cargo.toml: default_features -> default-features

---
 Cargo.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Cargo.toml b/Cargo.toml
index 2f3af2c83d1..ba701b2d5e5 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -330,7 +330,7 @@ walkdir = "2.4"
 winapi-util = "0.1.6"
 windows-sys = { version = "0.48.0", default-features = false }
 xattr = "1.0.1"
-zip = { version = "0.6.6", default_features = false, features = ["deflate"] }
+zip = { version = "0.6.6", default-features = false, features = ["deflate"] }
 
 hex = "0.4.3"
 md-5 = "0.10.6"

From d2ede927367d87a79901cf45e4fee2dfa1c8f7dc Mon Sep 17 00:00:00 2001
From: ALXD <github@alxd.org>
Date: Mon, 20 Nov 2023 14:19:20 +0100
Subject: [PATCH 050/429] expr: make error messages align with GNU expr

---
 src/uu/expr/src/syntax_tree.rs | 12 ++++++++----
 1 file changed, 8 insertions(+), 4 deletions(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index c55fb0bdc6a..b19c13c0adf 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -13,6 +13,7 @@
 use num_bigint::BigInt;
 use num_traits::Zero;
 use onig::{Regex, RegexOptions, Syntax};
+use uucore::display::Quotable;
 
 use crate::tokens::Token;
 
@@ -214,7 +215,7 @@ pub fn tokens_to_ast(
         assert!(op_stack.is_empty());
 
         maybe_dump_rpn(&out_stack);
-        let result = ast_from_rpn(&mut out_stack);
+        let result = ast_from_rpn(&mut out_stack, None);
         if out_stack.is_empty() {
             maybe_dump_ast(&result);
             result
@@ -253,9 +254,12 @@ fn maybe_dump_rpn(rpn: &TokenStack) {
     }
 }
 
-fn ast_from_rpn(rpn: &mut TokenStack) -> Result<Box<AstNode>, String> {
+fn ast_from_rpn(rpn: &mut TokenStack, op_type: Option<&str>) -> Result<Box<AstNode>, String> {
     match rpn.pop() {
-        None => Err("syntax error (premature end of expression)".to_owned()),
+        None => Err(match op_type {
+            Some(value) => format!("syntax error: unexpected argument {}", value.quote()),
+            None => "missing operand".to_owned(),
+        }),
 
         Some((token_idx, Token::Value { value })) => Ok(AstNode::new_leaf(token_idx, &value)),
 
@@ -281,7 +285,7 @@ fn maybe_ast_node(
 ) -> Result<Box<AstNode>, String> {
     let mut operands = Vec::with_capacity(arity);
     for _ in 0..arity {
-        let operand = ast_from_rpn(rpn)?;
+        let operand = ast_from_rpn(rpn, Some(op_type))?;
         operands.push(operand);
     }
     operands.reverse();

From 8b650a7a9b5c6356425c37fa0ef49c28c49aea76 Mon Sep 17 00:00:00 2001
From: ALXD <github@alxd.org>
Date: Mon, 20 Nov 2023 14:29:06 +0100
Subject: [PATCH 051/429] expr: add tests for precise error messages

---
 tests/by-util/test_expr.rs | 14 ++++++++++++++
 1 file changed, 14 insertions(+)

diff --git a/tests/by-util/test_expr.rs b/tests/by-util/test_expr.rs
index 28cfcf0ec90..18125fe99dd 100644
--- a/tests/by-util/test_expr.rs
+++ b/tests/by-util/test_expr.rs
@@ -6,6 +6,14 @@
 
 use crate::common::util::TestScenario;
 
+#[test]
+fn test_no_arguments() {
+    new_ucmd!()
+        .fails()
+        .code_is(2)
+        .stderr_only("expr: missing operand\n");
+}
+
 #[test]
 fn test_simple_values() {
     // null or 0 => EXIT_VALUE == 1
@@ -275,6 +283,12 @@ fn test_substr() {
 
 #[test]
 fn test_invalid_substr() {
+    new_ucmd!()
+        .args(&["56", "substr"])
+        .fails()
+        .code_is(2)
+        .stderr_only("expr: syntax error: unexpected argument 'substr'\n");
+
     new_ucmd!()
         .args(&["substr", "abc", "0", "1"])
         .fails()

From a0ac3dd22975ceadfb42498d62b216cc264f0a86 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Tue, 21 Nov 2023 12:38:12 +0100
Subject: [PATCH 052/429] fuzz printf (#5556)

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 .github/workflows/fuzzing.yml    |   1 +
 fuzz/Cargo.toml                  |   7 ++
 fuzz/fuzz_targets/fuzz_printf.rs | 110 +++++++++++++++++++++++++++++++
 3 files changed, 118 insertions(+)
 create mode 100644 fuzz/fuzz_targets/fuzz_printf.rs

diff --git a/.github/workflows/fuzzing.yml b/.github/workflows/fuzzing.yml
index cbb0574dee2..2274f6905c1 100644
--- a/.github/workflows/fuzzing.yml
+++ b/.github/workflows/fuzzing.yml
@@ -41,6 +41,7 @@ jobs:
           # https://github.com/uutils/coreutils/issues/5311
           - { name: fuzz_date, should_pass: false }
           - { name: fuzz_expr, should_pass: true }
+          - { name: fuzz_printf, should_pass: false }
           - { name: fuzz_parse_glob, should_pass: true }
           - { name: fuzz_parse_size, should_pass: true }
           - { name: fuzz_parse_time, should_pass: true }
diff --git a/fuzz/Cargo.toml b/fuzz/Cargo.toml
index 549f9a6b762..630af4650b6 100644
--- a/fuzz/Cargo.toml
+++ b/fuzz/Cargo.toml
@@ -16,6 +16,7 @@ uucore = { path = "../src/uucore/" }
 uu_date = { path = "../src/uu/date/" }
 uu_test = { path = "../src/uu/test/" }
 uu_expr = { path = "../src/uu/expr/" }
+uu_printf = { path = "../src/uu/printf/" }
 
 
 # Prevent this from interfering with workspaces
@@ -28,6 +29,12 @@ path = "fuzz_targets/fuzz_date.rs"
 test = false
 doc = false
 
+[[bin]]
+name = "fuzz_printf"
+path = "fuzz_targets/fuzz_printf.rs"
+test = false
+doc = false
+
 [[bin]]
 name = "fuzz_expr"
 path = "fuzz_targets/fuzz_expr.rs"
diff --git a/fuzz/fuzz_targets/fuzz_printf.rs b/fuzz/fuzz_targets/fuzz_printf.rs
new file mode 100644
index 00000000000..78bb3e3ce3b
--- /dev/null
+++ b/fuzz/fuzz_targets/fuzz_printf.rs
@@ -0,0 +1,110 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+// spell-checker:ignore parens
+
+#![no_main]
+use libfuzzer_sys::fuzz_target;
+use uu_printf::uumain;
+
+use rand::seq::SliceRandom;
+use rand::Rng;
+use std::ffi::OsString;
+
+mod fuzz_common;
+use crate::fuzz_common::CommandResult;
+use crate::fuzz_common::{
+    compare_result, generate_and_run_uumain, generate_random_string, run_gnu_cmd,
+};
+
+static CMD_PATH: &str = "printf";
+
+fn generate_escape_sequence(rng: &mut impl Rng) -> String {
+    let escape_sequences = [
+        "\\\"",
+        "\\\\",
+        "\\a",
+        "\\b",
+        "\\c",
+        "\\e",
+        "\\f",
+        "\\n",
+        "\\r",
+        "\\t",
+        "\\v",
+        "\\000",
+        "\\x00",
+        "\\u0000",
+        "\\U00000000",
+        "%%",
+    ];
+    escape_sequences.choose(rng).unwrap().to_string()
+}
+
+fn generate_printf() -> String {
+    let mut rng = rand::thread_rng();
+    let format_specifiers = ["%s", "%d", "%f", "%x", "%o", "%c", "%b", "%q"];
+    let mut printf_str = String::new();
+    // Add a 20% chance of generating an invalid format specifier
+    if rng.gen_bool(0.2) {
+        printf_str.push_str("%z"); // Invalid format specifier
+    } else {
+        let specifier = *format_specifiers.choose(&mut rng).unwrap();
+        printf_str.push_str(specifier);
+
+        // Add a 20% chance of introducing complex format strings
+        if rng.gen_bool(0.2) {
+            printf_str.push_str(&format!(" %{}", rng.gen_range(1..=1000)));
+        } else {
+            // Add a random string or number after the specifier
+            if specifier == "%s" {
+                printf_str.push_str(&format!(
+                    " {}",
+                    generate_random_string(rng.gen_range(1..=10))
+                ));
+            } else {
+                printf_str.push_str(&format!(" {}", rng.gen_range(1..=1000)));
+            }
+        }
+    }
+
+    // Add a 10% chance of including an escape sequence
+    if rng.gen_bool(0.1) {
+        printf_str.push_str(&generate_escape_sequence(&mut rng));
+    }
+    printf_str
+}
+
+fuzz_target!(|_data: &[u8]| {
+    let printf_input = generate_printf();
+    let mut args = vec![OsString::from("printf")];
+    args.extend(printf_input.split_whitespace().map(OsString::from));
+    let rust_result = generate_and_run_uumain(&args, uumain);
+
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false) {
+        Ok(result) => result,
+        Err(error_result) => {
+            eprintln!("Failed to run GNU command:");
+            eprintln!("Stderr: {}", error_result.stderr);
+            eprintln!("Exit Code: {}", error_result.exit_code);
+            CommandResult {
+                stdout: String::new(),
+                stderr: error_result.stderr,
+                exit_code: error_result.exit_code,
+            }
+        }
+    };
+
+    compare_result(
+        "printf",
+        &format!("{:?}", &args[1..]),
+        &rust_result.stdout,
+        &gnu_result.stdout,
+        &rust_result.stderr,
+        &gnu_result.stderr,
+        rust_result.exit_code,
+        gnu_result.exit_code,
+        false, // Set to true if you want to fail on stderr diff
+    );
+});

From da7c168f9d7c27e09c582a99e6dba9c68955c3ec Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 20 Nov 2023 17:46:47 +0100
Subject: [PATCH 053/429] all: reduce imports needed for show and show_if_err
 macros

---
 src/uu/cut/src/cut.rs           | 2 +-
 src/uu/dd/src/dd.rs             | 4 ++--
 src/uu/head/src/head.rs         | 2 +-
 src/uu/mkdir/src/mkdir.rs       | 2 +-
 src/uu/mv/src/mv.rs             | 2 +-
 src/uu/numfmt/src/numfmt.rs     | 2 +-
 src/uu/realpath/src/realpath.rs | 4 ++--
 src/uu/shred/src/shred.rs       | 2 +-
 src/uu/tail/src/tail.rs         | 2 +-
 src/uu/touch/src/touch.rs       | 2 +-
 src/uucore/src/lib/macros.rs    | 3 ++-
 11 files changed, 14 insertions(+), 13 deletions(-)

diff --git a/src/uu/cut/src/cut.rs b/src/uu/cut/src/cut.rs
index 05e8bc6e424..1a2a8ea01e9 100644
--- a/src/uu/cut/src/cut.rs
+++ b/src/uu/cut/src/cut.rs
@@ -17,7 +17,7 @@ use uucore::line_ending::LineEnding;
 use self::searcher::Searcher;
 use matcher::{ExactMatcher, Matcher, WhitespaceMatcher};
 use uucore::ranges::Range;
-use uucore::{format_usage, help_about, help_section, help_usage, show, show_error, show_if_err};
+use uucore::{format_usage, help_about, help_section, help_usage, show_error, show_if_err};
 
 mod matcher;
 mod searcher;
diff --git a/src/uu/dd/src/dd.rs b/src/uu/dd/src/dd.rs
index b79ae22da4e..2472fba9b0b 100644
--- a/src/uu/dd/src/dd.rs
+++ b/src/uu/dd/src/dd.rs
@@ -52,9 +52,9 @@ use uucore::display::Quotable;
 #[cfg(unix)]
 use uucore::error::set_exit_code;
 use uucore::error::{FromIo, UResult};
-use uucore::{format_usage, help_about, help_section, help_usage, show_error};
 #[cfg(target_os = "linux")]
-use uucore::{show, show_if_err};
+use uucore::show_if_err;
+use uucore::{format_usage, help_about, help_section, help_usage, show_error};
 
 const ABOUT: &str = help_about!("dd.md");
 const AFTER_HELP: &str = help_section!("after help", "dd.md");
diff --git a/src/uu/head/src/head.rs b/src/uu/head/src/head.rs
index 5d0d3beddc9..83bdd37390a 100644
--- a/src/uu/head/src/head.rs
+++ b/src/uu/head/src/head.rs
@@ -9,7 +9,7 @@ use clap::{crate_version, Arg, ArgAction, ArgMatches, Command};
 use std::ffi::OsString;
 use std::io::{self, BufWriter, ErrorKind, Read, Seek, SeekFrom, Write};
 use uucore::display::Quotable;
-use uucore::error::{FromIo, UError, UResult, USimpleError};
+use uucore::error::{FromIo, UResult, USimpleError};
 use uucore::line_ending::LineEnding;
 use uucore::lines::lines;
 use uucore::{format_usage, help_about, help_usage, show};
diff --git a/src/uu/mkdir/src/mkdir.rs b/src/uu/mkdir/src/mkdir.rs
index 4121278b69a..c29905ef4a7 100644
--- a/src/uu/mkdir/src/mkdir.rs
+++ b/src/uu/mkdir/src/mkdir.rs
@@ -16,7 +16,7 @@ use uucore::error::{UResult, USimpleError};
 #[cfg(not(windows))]
 use uucore::mode;
 use uucore::{display::Quotable, fs::dir_strip_dot_for_creation};
-use uucore::{format_usage, help_about, help_section, help_usage, show, show_if_err};
+use uucore::{format_usage, help_about, help_section, help_usage, show_if_err};
 
 static DEFAULT_PERM: u32 = 0o777;
 
diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index 036024f9907..60dabf34582 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -21,7 +21,7 @@ use std::os::windows;
 use std::path::{Path, PathBuf};
 use uucore::backup_control::{self, source_is_target_backup};
 use uucore::display::Quotable;
-use uucore::error::{set_exit_code, FromIo, UError, UResult, USimpleError, UUsageError};
+use uucore::error::{set_exit_code, FromIo, UResult, USimpleError, UUsageError};
 use uucore::fs::{are_hardlinks_or_one_way_symlink_to_same_file, are_hardlinks_to_same_file};
 use uucore::update_control;
 // These are exposed for projects (e.g. nushell) that want to create an `Options` value, which
diff --git a/src/uu/numfmt/src/numfmt.rs b/src/uu/numfmt/src/numfmt.rs
index d1785209d06..d158072fbb4 100644
--- a/src/uu/numfmt/src/numfmt.rs
+++ b/src/uu/numfmt/src/numfmt.rs
@@ -13,7 +13,7 @@ use std::str::FromStr;
 
 use units::{IEC_BASES, SI_BASES};
 use uucore::display::Quotable;
-use uucore::error::{UError, UResult};
+use uucore::error::UResult;
 use uucore::ranges::Range;
 use uucore::{format_usage, help_about, help_section, help_usage, show, show_error};
 
diff --git a/src/uu/realpath/src/realpath.rs b/src/uu/realpath/src/realpath.rs
index 64806fbabf6..b099a5f377c 100644
--- a/src/uu/realpath/src/realpath.rs
+++ b/src/uu/realpath/src/realpath.rs
@@ -15,13 +15,13 @@ use std::{
 use uucore::fs::make_path_relative_to;
 use uucore::{
     display::{print_verbatim, Quotable},
-    error::{FromIo, UResult},
+    error::{FromIo, UClapError, UResult},
     format_usage,
     fs::{canonicalize, MissingHandling, ResolveMode},
     help_about, help_usage,
     line_ending::LineEnding,
+    show_if_err,
 };
-use uucore::{error::UClapError, show, show_if_err};
 
 static ABOUT: &str = help_about!("realpath.md");
 const USAGE: &str = help_usage!("realpath.md");
diff --git a/src/uu/shred/src/shred.rs b/src/uu/shred/src/shred.rs
index eb63f0e5f2e..04f81bf23fd 100644
--- a/src/uu/shred/src/shred.rs
+++ b/src/uu/shred/src/shred.rs
@@ -17,7 +17,7 @@ use std::path::{Path, PathBuf};
 use uucore::display::Quotable;
 use uucore::error::{FromIo, UResult, USimpleError, UUsageError};
 use uucore::parse_size::parse_size_u64;
-use uucore::{format_usage, help_about, help_section, help_usage, show, show_error, show_if_err};
+use uucore::{format_usage, help_about, help_section, help_usage, show_error, show_if_err};
 
 const ABOUT: &str = help_about!("shred.md");
 const USAGE: &str = help_usage!("shred.md");
diff --git a/src/uu/tail/src/tail.rs b/src/uu/tail/src/tail.rs
index 0488e0808ed..edac4b151cb 100644
--- a/src/uu/tail/src/tail.rs
+++ b/src/uu/tail/src/tail.rs
@@ -31,7 +31,7 @@ use std::fs::File;
 use std::io::{self, stdin, stdout, BufRead, BufReader, BufWriter, Read, Seek, SeekFrom, Write};
 use std::path::{Path, PathBuf};
 use uucore::display::Quotable;
-use uucore::error::{get_exit_code, set_exit_code, FromIo, UError, UResult, USimpleError};
+use uucore::error::{get_exit_code, set_exit_code, FromIo, UResult, USimpleError};
 use uucore::{show, show_error};
 
 #[uucore::main]
diff --git a/src/uu/touch/src/touch.rs b/src/uu/touch/src/touch.rs
index d9399a051f6..51c09801b0a 100644
--- a/src/uu/touch/src/touch.rs
+++ b/src/uu/touch/src/touch.rs
@@ -17,7 +17,7 @@ use std::ffi::OsString;
 use std::fs::{self, File};
 use std::path::{Path, PathBuf};
 use uucore::display::Quotable;
-use uucore::error::{FromIo, UError, UResult, USimpleError};
+use uucore::error::{FromIo, UResult, USimpleError};
 use uucore::{format_usage, help_about, help_usage, show};
 
 const ABOUT: &str = help_about!("touch.md");
diff --git a/src/uucore/src/lib/macros.rs b/src/uucore/src/lib/macros.rs
index ad86d530828..d1a09c281ab 100644
--- a/src/uucore/src/lib/macros.rs
+++ b/src/uucore/src/lib/macros.rs
@@ -91,6 +91,7 @@ pub static UTILITY_IS_SECOND_ARG: AtomicBool = AtomicBool::new(false);
 #[macro_export]
 macro_rules! show(
     ($err:expr) => ({
+        use $crate::error::UError;
         let e = $err;
         $crate::error::set_exit_code(e.code());
         eprintln!("{}: {}", $crate::util_name(), e);
@@ -131,7 +132,7 @@ macro_rules! show(
 macro_rules! show_if_err(
     ($res:expr) => ({
         if let Err(e) = $res {
-            show!(e);
+            $crate::show!(e);
         }
     })
 );

From 17d21d2d9c7c421202cd692e427ab13bfd01bf60 Mon Sep 17 00:00:00 2001
From: Zhuoxun Yang <Zhuoxun.Yang777@outlook.com>
Date: Tue, 21 Nov 2023 22:05:41 +0800
Subject: [PATCH 054/429] expr: check prefix operation

---
 src/uu/expr/src/syntax_tree.rs | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index c55fb0bdc6a..119f325a3d1 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -332,8 +332,12 @@ fn push_token_to_either_stack(
         }
 
         Token::PrefixOp { .. } | Token::ParOpen => {
-            op_stack.push((token_idx, token.clone()));
-            Ok(())
+            if out_stack.is_empty() {
+                op_stack.push((token_idx, token.clone()));
+                Ok(())
+            } else {
+                Err(String::from("syntax error (operation should be prefix)"))
+            }
         }
 
         Token::ParClose => move_till_match_paren(out_stack, op_stack),

From 44702940d2437a4427638f94870f57cde5d5f8c0 Mon Sep 17 00:00:00 2001
From: Zhuoxun Yang <Zhuoxun.Yang777@outlook.com>
Date: Tue, 21 Nov 2023 22:06:20 +0800
Subject: [PATCH 055/429] tests/expr: check prefix operation

---
 tests/by-util/test_expr.rs | 20 ++++++++++++++++++++
 1 file changed, 20 insertions(+)

diff --git a/tests/by-util/test_expr.rs b/tests/by-util/test_expr.rs
index 28cfcf0ec90..8582082c483 100644
--- a/tests/by-util/test_expr.rs
+++ b/tests/by-util/test_expr.rs
@@ -100,6 +100,11 @@ fn test_parenthesis() {
         .args(&["(", "1", "+", "1", ")", "*", "2"])
         .succeeds()
         .stdout_only("4\n");
+
+    new_ucmd!()
+        .args(&["1", "(", ")"])
+        .fails()
+        .stderr_only("expr: syntax error (operation should be prefix)\n");
 }
 
 #[test]
@@ -221,6 +226,11 @@ fn test_index() {
         .args(&["index", "αbcdef_f", "f"])
         .succeeds()
         .stdout_only("6\n");
+
+    new_ucmd!()
+        .args(&["αbcdef", "index", "α"])
+        .fails()
+        .stderr_only("expr: syntax error (operation should be prefix)\n");
 }
 
 #[test]
@@ -234,6 +244,11 @@ fn test_length() {
         .args(&["length", "abcdef"])
         .succeeds()
         .stdout_only("6\n");
+
+    new_ucmd!()
+        .args(&["abcdef", "length"])
+        .fails()
+        .stderr_only("expr: syntax error (operation should be prefix)\n");
 }
 
 #[test]
@@ -271,6 +286,11 @@ fn test_substr() {
         .args(&["substr", "abc", "1", "1"])
         .succeeds()
         .stdout_only("a\n");
+
+    new_ucmd!()
+        .args(&["abc", "substr", "1", "1"])
+        .fails()
+        .stderr_only("expr: syntax error (operation should be prefix)\n");
 }
 
 #[test]

From 0822511fdcd00d95554601983c2d2e72becaa2ce Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Tue, 21 Nov 2023 16:49:20 +0100
Subject: [PATCH 056/429] test/printf: ignoring rounding up to 2

This is a limitation of the current implementation, which should ultimately use "long double" precision instead of f64.
---
 tests/by-util/test_printf.rs | 13 +++++++++++--
 1 file changed, 11 insertions(+), 2 deletions(-)

diff --git a/tests/by-util/test_printf.rs b/tests/by-util/test_printf.rs
index 875896a9f02..dfd13159043 100644
--- a/tests/by-util/test_printf.rs
+++ b/tests/by-util/test_printf.rs
@@ -296,9 +296,18 @@ fn sub_num_float_e_no_round() {
 }
 
 #[test]
-fn sub_num_float_round() {
+fn sub_num_float_round_to_one() {
     new_ucmd!()
-        .args(&["two is %f", "1.9999996"])
+        .args(&["one is %f", "0.9999995"])
+        .succeeds()
+        .stdout_only("one is 1.000000");
+}
+
+#[test]
+#[ignore = "Requires 'long double' precision floats to be used internally"]
+fn sub_num_float_round_to_two() {
+    new_ucmd!()
+        .args(&["two is %f", "1.9999995"])
         .succeeds()
         .stdout_only("two is 2.000000");
 }

From 18b5c22567f76fdafd138d31bf1dcaf3c3cce7c2 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Tue, 21 Nov 2023 22:24:11 +0000
Subject: [PATCH 057/429] fix(deps): update rust crate data-encoding to 2.5

---
 Cargo.lock            | 4 ++--
 src/uucore/Cargo.toml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index c89c87df41c..3cf5dbcc551 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -690,9 +690,9 @@ checksum = "ef8ae57c4978a2acd8b869ce6b9ca1dfe817bff704c220209fdef2c0b75a01b9"
 
 [[package]]
 name = "data-encoding"
-version = "2.4.0"
+version = "2.5.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "c2e66c9d817f1720209181c316d28635c050fa304f9c79e47a520882661b7308"
+checksum = "7e962a19be5cfc3f3bf6dd8f61eb50107f356ad6270fbb3ed41476571db78be5"
 
 [[package]]
 name = "data-encoding-macro"
diff --git a/src/uucore/Cargo.toml b/src/uucore/Cargo.toml
index 370c8a3864c..cbe34d5f7c8 100644
--- a/src/uucore/Cargo.toml
+++ b/src/uucore/Cargo.toml
@@ -33,7 +33,7 @@ time = { workspace = true, optional = true, features = [
   "macros",
 ] }
 # * "problem" dependencies (pinned)
-data-encoding = { version = "2.4", optional = true }
+data-encoding = { version = "2.5", optional = true }
 data-encoding-macro = { version = "0.1.13", optional = true }
 z85 = { version = "3.0.5", optional = true }
 libc = { workspace = true, optional = true }

From 3425ee8d5957e0ad75d9b7fad873ca56ac3d2721 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Wed, 22 Nov 2023 06:09:44 +0000
Subject: [PATCH 058/429] fix(deps): update rust crate data-encoding-macro to
 0.1.14

---
 Cargo.lock            | 8 ++++----
 src/uucore/Cargo.toml | 2 +-
 2 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 3cf5dbcc551..d7682f839e4 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -696,9 +696,9 @@ checksum = "7e962a19be5cfc3f3bf6dd8f61eb50107f356ad6270fbb3ed41476571db78be5"
 
 [[package]]
 name = "data-encoding-macro"
-version = "0.1.13"
+version = "0.1.14"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "c904b33cc60130e1aeea4956ab803d08a3f4a0ca82d64ed757afac3891f2bb99"
+checksum = "20c01c06f5f429efdf2bae21eb67c28b3df3cf85b7dd2d8ef09c0838dac5d33e"
 dependencies = [
  "data-encoding",
  "data-encoding-macro-internal",
@@ -706,9 +706,9 @@ dependencies = [
 
 [[package]]
 name = "data-encoding-macro-internal"
-version = "0.1.11"
+version = "0.1.12"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "8fdf3fce3ce863539ec1d7fd1b6dcc3c645663376b43ed376bbf887733e4f772"
+checksum = "0047d07f2c89b17dd631c80450d69841a6b5d7fb17278cbc43d7e4cfcf2576f3"
 dependencies = [
  "data-encoding",
  "syn 1.0.109",
diff --git a/src/uucore/Cargo.toml b/src/uucore/Cargo.toml
index cbe34d5f7c8..fabf068bb4d 100644
--- a/src/uucore/Cargo.toml
+++ b/src/uucore/Cargo.toml
@@ -34,7 +34,7 @@ time = { workspace = true, optional = true, features = [
 ] }
 # * "problem" dependencies (pinned)
 data-encoding = { version = "2.5", optional = true }
-data-encoding-macro = { version = "0.1.13", optional = true }
+data-encoding-macro = { version = "0.1.14", optional = true }
 z85 = { version = "3.0.5", optional = true }
 libc = { workspace = true, optional = true }
 once_cell = { workspace = true }

From e95add794066612aa007f2c7e49855ec30693c4d Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Wed, 22 Nov 2023 12:38:10 +0100
Subject: [PATCH 059/429] uucore/format: fix license headers and improve docs

---
 .../src/lib/features/format/argument.rs       | 12 +++++
 src/uucore/src/lib/features/format/escape.rs  | 11 +++++
 src/uucore/src/lib/features/format/mod.rs     | 46 +++++++++++++------
 .../src/lib/features/format/num_format.rs     |  7 +++
 src/uucore/src/lib/features/format/spec.rs    | 11 ++++-
 5 files changed, 71 insertions(+), 16 deletions(-)

diff --git a/src/uucore/src/lib/features/format/argument.rs b/src/uucore/src/lib/features/format/argument.rs
index 6370c4177e8..db18cf51890 100644
--- a/src/uucore/src/lib/features/format/argument.rs
+++ b/src/uucore/src/lib/features/format/argument.rs
@@ -1,7 +1,19 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
 use os_display::Quotable;
 
 use crate::{error::set_exit_code, show_warning};
 
+/// An argument for formatting
+///
+/// Each of these variants is only accepted by their respective directives. For
+/// example, [`FormatArgument::Char`] requires a `%c` directive.
+///
+/// The [`FormatArgument::Unparsed`] variant contains a string that can be
+/// parsed into other types. This is used by the `printf` utility.
 #[derive(Clone, Debug)]
 pub enum FormatArgument {
     Char(char),
diff --git a/src/uucore/src/lib/features/format/escape.rs b/src/uucore/src/lib/features/format/escape.rs
index 188dd1892b5..d20da3e7e38 100644
--- a/src/uucore/src/lib/features/format/escape.rs
+++ b/src/uucore/src/lib/features/format/escape.rs
@@ -1,8 +1,19 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+//! Parsing of escape sequences
+
 #[derive(Debug)]
 pub enum EscapedChar {
+    /// A single byte
     Byte(u8),
+    /// A unicode character
     Char(char),
+    /// A character prefixed with a backslash (i.e. an invalid escape sequence)
     Backslash(u8),
+    /// Specifies that the string should stop (`\c`)
     End,
 }
 
diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index 9045b8b90c3..d213d0359cf 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -1,23 +1,34 @@
-//! Main entry point for our implementation of printf.
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+//! `printf`-style formatting
+//!
+//! Rust has excellent formatting capabilities, but the coreutils require very
+//! specific formatting that needs to work exactly like the GNU utilities.
+//! Naturally, the GNU behavior is based on the C `printf` functionality.
 //!
-//! The [`printf`] and [`sprintf`] closely match the behavior of the
+//! Additionally, we need support for escape sequences for the `printf` utility.
+//!
+//! The [`printf`] and [`sprintf`] functions closely match the behavior of the
 //! corresponding C functions: the former renders a formatted string
 //! to stdout, the latter renders to a new [`String`] object.
 //!
-//! In addition to the [`printf`] and [`sprintf`] functions, we expose the
-//! [`Format`] struct, which represents a parsed format string. This reduces
-//! the need for parsing a format string multiple times and assures that no
-//! parsing errors occur during writing.
-//!
 //! There are three kinds of parsing that we might want to do:
 //!
-//!  1. Only `printf` specifiers (for e.g. `seq`, `dd`)
-//!  2. Only escape sequences (for e.g. `echo`)
-//!  3. Both `printf` specifiers and escape sequences (for e.g. `printf`)
+//!  1. Parse only `printf` directives (for e.g. `seq`, `dd`)
+//!  2. Parse only escape sequences (for e.g. `echo`)
+//!  3. Parse both `printf` specifiers and escape sequences (for e.g. `printf`)
 //!
-//! This module aims to combine all three use cases.
-
-// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety
+//! This module aims to combine all three use cases. An iterator parsing each
+//! of these cases is provided by [`parse_escape_only`], [`parse_spec_only`]
+//! and [`parse_spec_and_escape`], respectively.
+//!
+//! There is a special [`Format`] type, which can be used to parse a format
+//! string containing exactly one directive and does not use any `*` in that
+//! directive. This format can be printed in a type-safe manner without failing
+//! (modulo IO errors).
 
 mod argument;
 mod escape;
@@ -131,6 +142,7 @@ impl<C: FormatChar> FormatItem<C> {
     }
 }
 
+/// Parse a format string containing % directives and escape sequences
 pub fn parse_spec_and_escape(
     fmt: &[u8],
 ) -> impl Iterator<Item = Result<FormatItem<EscapedChar>, FormatError>> + '_ {
@@ -160,7 +172,10 @@ pub fn parse_spec_and_escape(
     })
 }
 
-fn parse_spec_only(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem<u8>, FormatError>> + '_ {
+/// Parse a format string containing % directives
+pub fn parse_spec_only(
+    fmt: &[u8],
+) -> impl Iterator<Item = Result<FormatItem<u8>, FormatError>> + '_ {
     let mut current = fmt;
     std::iter::from_fn(move || match current {
         [] => None,
@@ -183,7 +198,8 @@ fn parse_spec_only(fmt: &[u8]) -> impl Iterator<Item = Result<FormatItem<u8>, Fo
     })
 }
 
-fn parse_escape_only(fmt: &[u8]) -> impl Iterator<Item = EscapedChar> + '_ {
+/// Parse a format string containing escape sequences
+pub fn parse_escape_only(fmt: &[u8]) -> impl Iterator<Item = EscapedChar> + '_ {
     let mut current = fmt;
     std::iter::from_fn(move || match current {
         [] => None,
diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index c9a2b8c166f..6fd177d1325 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -1,3 +1,10 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+//! Utilities for formatting numbers in various formats
+
 use std::io::Write;
 
 use super::{
diff --git a/src/uucore/src/lib/features/format/spec.rs b/src/uucore/src/lib/features/format/spec.rs
index e74b6f8660f..7c0d0236764 100644
--- a/src/uucore/src/lib/features/format/spec.rs
+++ b/src/uucore/src/lib/features/format/spec.rs
@@ -1,4 +1,9 @@
-// spell-checker:ignore (vars) charf decf floatf intf scif strf Cninety intmax ptrdiff
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+// spell-checker:ignore (vars) intmax ptrdiff
 
 use crate::quoting_style::{escape_name, QuotingStyle};
 
@@ -11,6 +16,10 @@ use super::{
 };
 use std::{fmt::Display, io::Write, ops::ControlFlow};
 
+/// A parsed specification for formatting a value
+///
+/// This might require more than one argument to resolve width or precision
+/// values that are given as `*`.
 #[derive(Debug)]
 pub enum Spec {
     Char {

From 2e77d99dd4258a853e172a96ed5349d6bd2e169b Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Thu, 23 Nov 2023 14:35:02 +0100
Subject: [PATCH 060/429] expr: fail fast if there are no operands

---
 src/uu/expr/src/expr.rs    | 6 +++++-
 tests/by-util/test_expr.rs | 2 +-
 2 files changed, 6 insertions(+), 2 deletions(-)

diff --git a/src/uu/expr/src/expr.rs b/src/uu/expr/src/expr.rs
index ea559090c92..909c4c37653 100644
--- a/src/uu/expr/src/expr.rs
+++ b/src/uu/expr/src/expr.rs
@@ -5,7 +5,7 @@
 
 use clap::{crate_version, Arg, ArgAction, Command};
 use uucore::{
-    error::{UResult, USimpleError},
+    error::{UResult, USimpleError, UUsageError},
     format_usage, help_about, help_section, help_usage,
 };
 
@@ -58,6 +58,10 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         .map(|v| v.into_iter().map(|s| s.as_ref()).collect::<Vec<_>>())
         .unwrap_or_default();
 
+    if token_strings.is_empty() {
+        return Err(UUsageError::new(2, "missing operand"));
+    }
+
     match process_expr(&token_strings[..]) {
         Ok(expr_result) => print_expr_ok(&expr_result),
         Err(expr_error) => Err(USimpleError::new(2, &expr_error)),
diff --git a/tests/by-util/test_expr.rs b/tests/by-util/test_expr.rs
index 72d7687b7d1..41fc8d4540b 100644
--- a/tests/by-util/test_expr.rs
+++ b/tests/by-util/test_expr.rs
@@ -11,7 +11,7 @@ fn test_no_arguments() {
     new_ucmd!()
         .fails()
         .code_is(2)
-        .stderr_only("expr: missing operand\n");
+        .usage_error("missing operand");
 }
 
 #[test]

From c2bfb6a465aac1dce51cc04510820893fad0c1dd Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Thu, 23 Nov 2023 15:03:53 +0100
Subject: [PATCH 061/429] expr: adapt error messages, revert most of #5559

---
 src/uu/expr/src/syntax_tree.rs | 28 ++++++++++++++++++----------
 tests/by-util/test_expr.rs     | 18 ++++++++----------
 2 files changed, 26 insertions(+), 20 deletions(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 89c23e41249..0654f2ac331 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -215,7 +215,7 @@ pub fn tokens_to_ast(
         assert!(op_stack.is_empty());
 
         maybe_dump_rpn(&out_stack);
-        let result = ast_from_rpn(&mut out_stack, None);
+        let result = ast_from_rpn(&mut out_stack);
         if out_stack.is_empty() {
             maybe_dump_ast(&result);
             result
@@ -254,13 +254,9 @@ fn maybe_dump_rpn(rpn: &TokenStack) {
     }
 }
 
-fn ast_from_rpn(rpn: &mut TokenStack, op_type: Option<&str>) -> Result<Box<AstNode>, String> {
+fn ast_from_rpn(rpn: &mut TokenStack) -> Result<Box<AstNode>, String> {
     match rpn.pop() {
-        None => Err(match op_type {
-            Some(value) => format!("syntax error: unexpected argument {}", value.quote()),
-            None => "missing operand".to_owned(),
-        }),
-
+        None => Err("syntax error (premature end of expression)".to_owned()),
         Some((token_idx, Token::Value { value })) => Ok(AstNode::new_leaf(token_idx, &value)),
 
         Some((token_idx, Token::InfixOp { value, .. })) => {
@@ -285,7 +281,7 @@ fn maybe_ast_node(
 ) -> Result<Box<AstNode>, String> {
     let mut operands = Vec::with_capacity(arity);
     for _ in 0..arity {
-        let operand = ast_from_rpn(rpn, Some(op_type))?;
+        let operand = ast_from_rpn(rpn)?;
         operands.push(operand);
     }
     operands.reverse();
@@ -335,12 +331,24 @@ fn push_token_to_either_stack(
             }
         }
 
-        Token::PrefixOp { .. } | Token::ParOpen => {
+        Token::ParOpen => {
             if out_stack.is_empty() {
                 op_stack.push((token_idx, token.clone()));
                 Ok(())
             } else {
-                Err(String::from("syntax error (operation should be prefix)"))
+                Err("syntax error: unexpected argument '('".to_string())
+            }
+        }
+
+        Token::PrefixOp { value, .. } => {
+            if out_stack.is_empty() {
+                op_stack.push((token_idx, token.clone()));
+                Ok(())
+            } else {
+                Err(format!(
+                    "syntax error: unexpected argument {}",
+                    value.quote()
+                ))
             }
         }
 
diff --git a/tests/by-util/test_expr.rs b/tests/by-util/test_expr.rs
index 41fc8d4540b..f29752f66c9 100644
--- a/tests/by-util/test_expr.rs
+++ b/tests/by-util/test_expr.rs
@@ -112,7 +112,8 @@ fn test_parenthesis() {
     new_ucmd!()
         .args(&["1", "(", ")"])
         .fails()
-        .stderr_only("expr: syntax error (operation should be prefix)\n");
+        .code_is(2)
+        .stderr_only("expr: syntax error: unexpected argument '('\n");
 }
 
 #[test]
@@ -238,7 +239,8 @@ fn test_index() {
     new_ucmd!()
         .args(&["αbcdef", "index", "α"])
         .fails()
-        .stderr_only("expr: syntax error (operation should be prefix)\n");
+        .code_is(2)
+        .stderr_only("expr: syntax error: unexpected argument 'index'\n");
 }
 
 #[test]
@@ -256,7 +258,8 @@ fn test_length() {
     new_ucmd!()
         .args(&["abcdef", "length"])
         .fails()
-        .stderr_only("expr: syntax error (operation should be prefix)\n");
+        .code_is(2)
+        .stderr_only("expr: syntax error: unexpected argument 'length'\n");
 }
 
 #[test]
@@ -298,17 +301,12 @@ fn test_substr() {
     new_ucmd!()
         .args(&["abc", "substr", "1", "1"])
         .fails()
-        .stderr_only("expr: syntax error (operation should be prefix)\n");
+        .code_is(2)
+        .stderr_only("expr: syntax error: unexpected argument 'substr'\n");
 }
 
 #[test]
 fn test_invalid_substr() {
-    new_ucmd!()
-        .args(&["56", "substr"])
-        .fails()
-        .code_is(2)
-        .stderr_only("expr: syntax error: unexpected argument 'substr'\n");
-
     new_ucmd!()
         .args(&["substr", "abc", "0", "1"])
         .fails()

From 7efe33108a8bebada31e962cfb8c0d5a70b07efe Mon Sep 17 00:00:00 2001
From: Coba Weel <122735+cobaweel@users.noreply.github.com>
Date: Wed, 22 Nov 2023 16:15:59 -0800
Subject: [PATCH 062/429] Fix issue 5576 (regex matching bug in expr)

Issue 5576 reported a bug in expr, found by the fuzzer. The problem
turns out to be with the regex match operator `:`, which is defined in
POSIX and the GNU manual to match the pattern only when it occurs at
the beginning of the string, i.e., the regex has an implicit `^`
prepended to it. We hadn't been doing that.
---
 src/uu/expr/src/syntax_tree.rs | 3 ++-
 tests/by-util/test_expr.rs     | 4 ++++
 2 files changed, 6 insertions(+), 1 deletion(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 0654f2ac331..2260b2e2186 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -498,7 +498,8 @@ fn infix_operator_and(values: &[String]) -> String {
 
 fn operator_match(values: &[String]) -> Result<String, String> {
     assert!(values.len() == 2);
-    let re = Regex::with_options(&values[1], RegexOptions::REGEX_OPTION_NONE, Syntax::grep())
+    let re_string = format!("^{}", &values[1]);
+    let re = Regex::with_options(&re_string, RegexOptions::REGEX_OPTION_NONE, Syntax::grep())
         .map_err(|err| err.description().to_string())?;
     Ok(if re.captures_len() > 0 {
         re.captures(&values[0])
diff --git a/tests/by-util/test_expr.rs b/tests/by-util/test_expr.rs
index f29752f66c9..ebc2c832feb 100644
--- a/tests/by-util/test_expr.rs
+++ b/tests/by-util/test_expr.rs
@@ -289,6 +289,10 @@ fn test_regex() {
         .args(&["-5", ":", "-\\{0,1\\}[0-9]*$"])
         .succeeds()
         .stdout_only("2\n");
+    new_ucmd!()
+        .args(&["abc", ":", "bc"])
+        .fails()
+        .stdout_only("0\n");
 }
 
 #[test]

From 550f3b0c488451bbe9f930e0520d558f01e3c891 Mon Sep 17 00:00:00 2001
From: zoze0 <licardoooo@gmail.com>
Date: Fri, 24 Nov 2023 00:41:11 +0800
Subject: [PATCH 063/429] uucore: add support for loongarch64 (#5574)

* uucore: add support for loongarch64

* add loongarch

---------

Co-authored-by: Sylvestre Ledru <sylvestre@debian.org>
---
 .vscode/cspell.dictionaries/acronyms+names.wordlist.txt | 1 +
 src/uucore/src/lib/features/fs.rs                       | 2 ++
 2 files changed, 3 insertions(+)

diff --git a/.vscode/cspell.dictionaries/acronyms+names.wordlist.txt b/.vscode/cspell.dictionaries/acronyms+names.wordlist.txt
index c004ea2f822..4a59ed094bd 100644
--- a/.vscode/cspell.dictionaries/acronyms+names.wordlist.txt
+++ b/.vscode/cspell.dictionaries/acronyms+names.wordlist.txt
@@ -37,6 +37,7 @@ aarch
 flac
 impls
 lzma
+loongarch
 
 # * names
 BusyBox
diff --git a/src/uucore/src/lib/features/fs.rs b/src/uucore/src/lib/features/fs.rs
index f8593dfede5..de4c0b08dbe 100644
--- a/src/uucore/src/lib/features/fs.rs
+++ b/src/uucore/src/lib/features/fs.rs
@@ -119,6 +119,7 @@ impl FileInformation {
             not(target_os = "solaris"),
             not(target_arch = "aarch64"),
             not(target_arch = "riscv64"),
+            not(target_arch = "loongarch64"),
             target_pointer_width = "64"
         ))]
         return self.0.st_nlink;
@@ -133,6 +134,7 @@ impl FileInformation {
                 target_os = "solaris",
                 target_arch = "aarch64",
                 target_arch = "riscv64",
+                target_arch = "loongarch64",
                 not(target_pointer_width = "64")
             )
         ))]

From 4dc46f10e9f3636ad8ac68b579b73461b8035bee Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Tue, 21 Nov 2023 11:04:38 -0500
Subject: [PATCH 064/429] split: pass GNU test l-chunk

---
 src/uu/split/src/split.rs    | 188 ++++++++++++++++++----------
 src/uu/split/src/strategy.rs |   9 +-
 tests/by-util/test_split.rs  | 233 +++++++++++++++++++----------------
 3 files changed, 259 insertions(+), 171 deletions(-)

diff --git a/src/uu/split/src/split.rs b/src/uu/split/src/split.rs
index 592e4eedde9..4e2af0be4d8 100644
--- a/src/uu/split/src/split.rs
+++ b/src/uu/split/src/split.rs
@@ -1130,14 +1130,68 @@ impl<'a> Write for LineBytesChunkWriter<'a> {
     }
 }
 
+/// Output file parameters
+struct OutFile {
+    filename: String,
+    maybe_writer: Option<BufWriter<Box<dyn Write>>>,
+}
+
+impl OutFile {
+    /// Get the writer for the output file
+    /// Instantiate the writer if it has not been instantiated upfront
+    fn get_writer(&mut self, settings: &Settings) -> UResult<&mut BufWriter<Box<dyn Write>>> {
+        if self.maybe_writer.is_some() {
+            Ok(self.maybe_writer.as_mut().unwrap())
+        } else {
+            // Writer was not instantiated upfront
+            // Instantiate it and record for future use
+            self.maybe_writer = Some(settings.instantiate_current_writer(self.filename.as_str())?);
+            Ok(self.maybe_writer.as_mut().unwrap())
+        }
+    }
+}
+
+/// Generate a set of Output Files
+/// This is a helper function to [`n_chunks_by_byte`], [`n_chunks_by_line`]
+/// and [`n_chunks_by_line_round_robin`].
+/// Each OutFile is generated with filename, while the writer for it could be
+/// optional, to be instantiated later by the calling function as needed.
+/// Optional writers could happen in [`n_chunks_by_line`]
+/// if `elide_empty_files` parameter is set to `true`.
+fn get_out_files(
+    num_files: u64,
+    settings: &Settings,
+    is_writer_optional: bool,
+) -> UResult<Vec<OutFile>> {
+    // This object is responsible for creating the filename for each chunk
+    let mut filename_iterator: FilenameIterator<'_> =
+        FilenameIterator::new(&settings.prefix, &settings.suffix)
+            .map_err(|e| io::Error::new(ErrorKind::Other, format!("{e}")))?;
+    let mut out_files: Vec<OutFile> = Vec::new();
+    for _ in 0..num_files {
+        let filename = filename_iterator
+            .next()
+            .ok_or_else(|| USimpleError::new(1, "output file suffixes exhausted"))?;
+        let maybe_writer = if is_writer_optional {
+            None
+        } else {
+            Some(settings.instantiate_current_writer(filename.as_str())?)
+        };
+        out_files.push(OutFile {
+            filename,
+            maybe_writer,
+        });
+    }
+    Ok(out_files)
+}
+
 /// Split a file or STDIN into a specific number of chunks by byte.
-/// If in Kth chunk of N mode - print the k-th chunk to STDOUT.
 ///
 /// When file size cannot be evenly divided into the number of chunks of the same size,
 /// the first X chunks are 1 byte longer than the rest,
 /// where X is a modulus reminder of (file size % number of chunks)
 ///
-/// In Kth chunk of N mode - writes to stdout the contents of the chunk identified by `kth_chunk`
+/// In Kth chunk of N mode - writes to STDOUT the contents of the chunk identified by `kth_chunk`
 ///
 /// In N chunks mode - this function always creates one output file for each chunk, even
 /// if there is an error reading or writing one of the chunks or if
@@ -1207,7 +1261,7 @@ where
     // In Kth chunk of N mode - we will write to stdout instead of to a file.
     let mut stdout_writer = std::io::stdout().lock();
     // In N chunks mode - we will write to `num_chunks` files
-    let mut writers = vec![];
+    let mut out_files: Vec<OutFile> = Vec::new();
 
     // Calculate chunk size base and modulo reminder
     // to be used in calculating chunk_size later on
@@ -1219,16 +1273,7 @@ where
     // This will create each of the underlying files
     // or stdin pipes to child shell/command processes if in `--filter` mode
     if kth_chunk.is_none() {
-        // This object is responsible for creating the filename for each chunk.
-        let mut filename_iterator = FilenameIterator::new(&settings.prefix, &settings.suffix)
-            .map_err(|e| io::Error::new(ErrorKind::Other, format!("{e}")))?;
-        for _ in 0..num_chunks {
-            let filename = filename_iterator
-                .next()
-                .ok_or_else(|| USimpleError::new(1, "output file suffixes exhausted"))?;
-            let writer = settings.instantiate_current_writer(filename.as_str())?;
-            writers.push(writer);
-        }
+        out_files = get_out_files(num_chunks, settings, false)?;
     }
 
     for i in 1_u64..=num_chunks {
@@ -1272,7 +1317,7 @@ where
                 }
                 None => {
                     let idx = (i - 1) as usize;
-                    let writer = writers.get_mut(idx).unwrap();
+                    let writer = out_files[idx].get_writer(settings)?;
                     writer.write_all(buf)?;
                 }
             }
@@ -1284,9 +1329,14 @@ where
 }
 
 /// Split a file or STDIN into a specific number of chunks by line.
-/// If in Kth chunk of N mode - print the k-th chunk to STDOUT.
 ///
-/// In Kth chunk of N mode - writes to stdout the contents of the chunk identified by `kth_chunk`
+/// It is most likely that input cannot be evenly divided into the number of chunks
+/// of the same size in bytes or number of lines, since we cannot break lines.
+/// It is also likely that there could be empty files (having `elide_empty_files` is disabled)
+/// when a long line overlaps one or more chunks.
+///
+/// In Kth chunk of N mode - writes to STDOUT the contents of the chunk identified by `kth_chunk`
+/// Note: the `elide_empty_files` flag is ignored in this mode
 ///
 /// In N chunks mode - this function always creates one output file for each chunk, even
 /// if there is an error reading or writing one of the chunks or if
@@ -1322,76 +1372,97 @@ where
     let initial_buf = &mut Vec::new();
     let num_bytes = get_input_size(&settings.input, reader, initial_buf, &settings.io_blksize)?;
     let reader = initial_buf.chain(reader);
-    let chunk_size = (num_bytes / num_chunks) as usize;
 
     // If input file is empty and we would not have determined the Kth chunk
     // in the Kth chunk of N chunk mode, then terminate immediately.
     // This happens on `split -n l/3/10 /dev/null`, for example.
-    if kth_chunk.is_some() && num_bytes == 0 {
+    // Similarly, if input file is empty and `elide_empty_files` parameter is enabled,
+    // then we would have written zero chunks of output,
+    // so terminate immediately as well.
+    // This happens on `split -e -n l/3 /dev/null`, for example.
+    if num_bytes == 0 && (kth_chunk.is_some() || settings.elide_empty_files) {
         return Ok(());
     }
 
     // In Kth chunk of N mode - we will write to stdout instead of to a file.
     let mut stdout_writer = std::io::stdout().lock();
     // In N chunks mode - we will write to `num_chunks` files
-    let mut writers = vec![];
+    let mut out_files: Vec<OutFile> = Vec::new();
+
+    // Calculate chunk size base and modulo reminder
+    // to be used in calculating `num_bytes_should_be_written` later on
+    let chunk_size_base = num_bytes / num_chunks;
+    let chunk_size_reminder = num_bytes % num_chunks;
 
     // If in N chunks mode
-    // Create one writer for each chunk.
-    // This will create each of the underlying files
-    // or stdin pipes to child shell/command processes if in `--filter` mode
+    // Generate filenames for each file and
+    // if `elide_empty_files` parameter is NOT enabled - instantiate the writer
+    // which will create each of the underlying files or stdin pipes
+    // to child shell/command processes if in `--filter` mode.
+    // Otherwise keep writer optional, to be instantiated later if there is data
+    // to write for the associated chunk.
     if kth_chunk.is_none() {
-        // This object is responsible for creating the filename for each chunk.
-        let mut filename_iterator = FilenameIterator::new(&settings.prefix, &settings.suffix)
-            .map_err(|e| io::Error::new(ErrorKind::Other, format!("{e}")))?;
-        for _ in 0..num_chunks {
-            let filename = filename_iterator
-                .next()
-                .ok_or_else(|| USimpleError::new(1, "output file suffixes exhausted"))?;
-            let writer = settings.instantiate_current_writer(filename.as_str())?;
-            writers.push(writer);
-        }
+        out_files = get_out_files(num_chunks, settings, settings.elide_empty_files)?;
     }
 
-    let mut num_bytes_remaining_in_current_chunk = chunk_size;
-    let mut i = 1;
+    let mut chunk_number = 1;
     let sep = settings.separator;
+    let mut num_bytes_should_be_written = chunk_size_base + (chunk_size_reminder > 0) as u64;
+    let mut num_bytes_written = 0;
 
     for line_result in reader.split(sep) {
-        // add separator back in at the end of the line
         let mut line = line_result?;
-        line.push(sep);
+        // add separator back in at the end of the line,
+        // since `reader.split(sep)` removes it,
+        // except if the last line did not end with separator character
+        if (num_bytes_written + line.len() as u64) < num_bytes {
+            line.push(sep);
+        }
         let bytes = line.as_slice();
 
         match kth_chunk {
-            Some(chunk_number) => {
-                if i == chunk_number {
+            Some(kth) => {
+                if chunk_number == kth {
                     stdout_writer.write_all(bytes)?;
                 }
             }
             None => {
-                let idx = (i - 1) as usize;
-                let maybe_writer = writers.get_mut(idx);
-                let writer = maybe_writer.unwrap();
+                // Should write into a file
+                let idx = (chunk_number - 1) as usize;
+                let writer = out_files[idx].get_writer(settings)?;
                 custom_write_all(bytes, writer, settings)?;
             }
         }
 
-        let num_bytes = bytes.len();
-        if num_bytes >= num_bytes_remaining_in_current_chunk {
-            num_bytes_remaining_in_current_chunk = chunk_size;
-            i += 1;
-        } else {
-            num_bytes_remaining_in_current_chunk -= num_bytes;
+        // Advance to the next chunk if the current one is filled.
+        // There could be a situation when a long line, which started in current chunk,
+        // would overlap the next chunk (or even several next chunks),
+        // and since we cannot break lines for this split strategy, we could end up with
+        // empty files in place(s) of skipped chunk(s)
+        let num_line_bytes = bytes.len() as u64;
+        num_bytes_written += num_line_bytes;
+        let mut skipped = -1;
+        while num_bytes_should_be_written <= num_bytes_written {
+            num_bytes_should_be_written +=
+                chunk_size_base + (chunk_size_reminder > chunk_number) as u64;
+            chunk_number += 1;
+            skipped += 1;
         }
 
-        if let Some(chunk_number) = kth_chunk {
-            if i > chunk_number {
+        // If a chunk was skipped and `elide_empty_files` flag is set,
+        // roll chunk_number back to preserve sequential continuity
+        // of file names for files written to,
+        // except for Kth chunk of N mode
+        if settings.elide_empty_files && skipped > 0 && kth_chunk.is_none() {
+            chunk_number -= skipped as u64;
+        }
+
+        if let Some(kth) = kth_chunk {
+            if chunk_number > kth {
                 break;
             }
         }
     }
-
     Ok(())
 }
 
@@ -1432,23 +1503,14 @@ where
     // In Kth chunk of N mode - we will write to stdout instead of to a file.
     let mut stdout_writer = std::io::stdout().lock();
     // In N chunks mode - we will write to `num_chunks` files
-    let mut writers = vec![];
+    let mut out_files: Vec<OutFile> = Vec::new();
 
     // If in N chunks mode
     // Create one writer for each chunk.
     // This will create each of the underlying files
     // or stdin pipes to child shell/command processes if in `--filter` mode
     if kth_chunk.is_none() {
-        // This object is responsible for creating the filename for each chunk.
-        let mut filename_iterator = FilenameIterator::new(&settings.prefix, &settings.suffix)
-            .map_err(|e| io::Error::new(ErrorKind::Other, format!("{e}")))?;
-        for _ in 0..num_chunks {
-            let filename = filename_iterator
-                .next()
-                .ok_or_else(|| USimpleError::new(1, "output file suffixes exhausted"))?;
-            let writer = settings.instantiate_current_writer(filename.as_str())?;
-            writers.push(writer);
-        }
+        out_files = get_out_files(num_chunks, settings, false)?;
     }
 
     let num_chunks: usize = num_chunks.try_into().unwrap();
@@ -1470,9 +1532,7 @@ where
                 }
             }
             None => {
-                let maybe_writer = writers.get_mut(i % num_chunks);
-                let writer = maybe_writer.unwrap();
-
+                let writer = out_files[i % num_chunks].get_writer(settings)?;
                 let writer_stdin_open = custom_write_all(bytes, writer, settings)?;
                 if !writer_stdin_open {
                     closed_writers += 1;
diff --git a/src/uu/split/src/strategy.rs b/src/uu/split/src/strategy.rs
index e85abcee58b..7b934f72047 100644
--- a/src/uu/split/src/strategy.rs
+++ b/src/uu/split/src/strategy.rs
@@ -8,7 +8,10 @@
 use crate::{OPT_BYTES, OPT_LINES, OPT_LINE_BYTES, OPT_NUMBER};
 use clap::{parser::ValueSource, ArgMatches};
 use std::fmt;
-use uucore::parse_size::{parse_size_u64, parse_size_u64_max, ParseSizeError};
+use uucore::{
+    display::Quotable,
+    parse_size::{parse_size_u64, parse_size_u64_max, ParseSizeError},
+};
 
 /// Sub-strategy of the [`Strategy::Number`]
 /// Splitting a file into a specific number of chunks.
@@ -208,10 +211,10 @@ impl fmt::Display for StrategyError {
             Self::Lines(e) => write!(f, "invalid number of lines: {e}"),
             Self::Bytes(e) => write!(f, "invalid number of bytes: {e}"),
             Self::NumberType(NumberTypeError::NumberOfChunks(s)) => {
-                write!(f, "invalid number of chunks: {s}")
+                write!(f, "invalid number of chunks: {}", s.quote())
             }
             Self::NumberType(NumberTypeError::ChunkNumber(s)) => {
-                write!(f, "invalid chunk number: {s}")
+                write!(f, "invalid chunk number: {}", s.quote())
             }
             Self::MultipleWays => write!(f, "cannot split in more than one way"),
         }
diff --git a/tests/by-util/test_split.rs b/tests/by-util/test_split.rs
index 0ae2af5cb92..2c9a56bddee 100644
--- a/tests/by-util/test_split.rs
+++ b/tests/by-util/test_split.rs
@@ -606,13 +606,13 @@ fn test_split_obs_lines_as_other_option_value() {
         .args(&["-n", "-200", "file"])
         .fails()
         .code_is(1)
-        .stderr_contains("split: invalid number of chunks: -200\n");
+        .stderr_contains("split: invalid number of chunks: '-200'\n");
     scene
         .ucmd()
         .args(&["--number", "-e200", "file"])
         .fails()
         .code_is(1)
-        .stderr_contains("split: invalid number of chunks: -e200\n");
+        .stderr_contains("split: invalid number of chunks: '-e200'\n");
 }
 
 /// Test for using more than one obsolete lines option (standalone)
@@ -708,7 +708,7 @@ fn test_split_overflow_bytes_size() {
 fn test_split_stdin_num_chunks() {
     let (at, mut ucmd) = at_and_ucmd!();
     ucmd.args(&["--number=1"]).pipe_in("").succeeds();
-    assert_eq!(file_read(&at, "xaa"), "");
+    assert_eq!(at.read("xaa"), "");
     assert!(!at.plus("xab").exists());
 }
 
@@ -727,8 +727,8 @@ fn test_split_stdin_num_line_chunks() {
     ucmd.args(&["--number=l/2"])
         .pipe_in("1\n2\n3\n4\n5\n")
         .succeeds();
-    assert_eq!(file_read(&at, "xaa"), "1\n2\n3\n");
-    assert_eq!(file_read(&at, "xab"), "4\n5\n");
+    assert_eq!(at.read("xaa"), "1\n2\n3\n");
+    assert_eq!(at.read("xab"), "4\n5\n");
     assert!(!at.plus("xac").exists());
 }
 
@@ -741,12 +741,6 @@ fn test_split_stdin_num_kth_line_chunk() {
         .stdout_only("2\n");
 }
 
-fn file_read(at: &AtPath, filename: &str) -> String {
-    let mut s = String::new();
-    at.open(filename).read_to_string(&mut s).unwrap();
-    s
-}
-
 /// Test for the default suffix length behavior: dynamically increasing size.
 #[test]
 fn test_alphabetic_dynamic_suffix_length() {
@@ -766,11 +760,11 @@ fn test_alphabetic_dynamic_suffix_length() {
     for i in b'a'..=b'y' {
         for j in b'a'..=b'z' {
             let filename = format!("x{}{}", i as char, j as char);
-            let contents = file_read(&at, &filename);
+            let contents = at.read(&filename);
             assert_eq!(contents, "a");
         }
     }
-    assert_eq!(file_read(&at, "xzaaa"), "a");
+    assert_eq!(at.read("xzaaa"), "a");
 }
 
 /// Test for the default suffix length behavior: dynamically increasing size.
@@ -790,10 +784,10 @@ fn test_numeric_dynamic_suffix_length() {
         .succeeds();
     for i in 0..90 {
         let filename = format!("x{i:02}");
-        let contents = file_read(&at, &filename);
+        let contents = at.read(&filename);
         assert_eq!(contents, "a");
     }
-    assert_eq!(file_read(&at, "x9000"), "a");
+    assert_eq!(at.read("x9000"), "a");
 }
 
 #[test]
@@ -812,10 +806,10 @@ fn test_hex_dynamic_suffix_length() {
         .succeeds();
     for i in 0..240 {
         let filename = format!("x{i:02x}");
-        let contents = file_read(&at, &filename);
+        let contents = at.read(&filename);
         assert_eq!(contents, "a");
     }
-    assert_eq!(file_read(&at, "xf000"), "a");
+    assert_eq!(at.read("xf000"), "a");
 }
 
 /// Test for dynamic suffix length (auto-widening) disabled when suffix start number is specified
@@ -833,7 +827,7 @@ fn test_dynamic_suffix_length_on_with_suffix_start_no_value() {
     let (at, mut ucmd) = at_and_ucmd!();
     ucmd.args(&["-b", "1", "--numeric-suffixes", "ninetyonebytes.txt"])
         .succeeds();
-    assert_eq!(file_read(&at, "x9000"), "a");
+    assert_eq!(at.read("x9000"), "a");
 }
 
 /// Test for suffix auto-width with --number strategy and suffix start number
@@ -845,8 +839,8 @@ fn test_suffix_auto_width_with_number() {
     let glob = Glob::new(&at, ".", r"x\d\d\d$");
     assert_eq!(glob.count(), 100);
     assert_eq!(glob.collate(), at.read_bytes("fivelines.txt"));
-    assert_eq!(file_read(&at, "x001"), "1\n");
-    assert_eq!(file_read(&at, "x100"), "");
+    assert_eq!(at.read("x001"), "1\n");
+    assert_eq!(at.read("x100"), "");
 
     new_ucmd!()
         .args(&["--numeric-suffixes=100", "--number=r/100", "fivelines.txt"])
@@ -926,17 +920,12 @@ creating file 'xaf'
 #[test]
 fn test_number_n() {
     let (at, mut ucmd) = at_and_ucmd!();
-    let file_read = |f| {
-        let mut s = String::new();
-        at.open(f).read_to_string(&mut s).unwrap();
-        s
-    };
     ucmd.args(&["-n", "5", "asciilowercase.txt"]).succeeds();
-    assert_eq!(file_read("xaa"), "abcdef");
-    assert_eq!(file_read("xab"), "ghijkl");
-    assert_eq!(file_read("xac"), "mnopq");
-    assert_eq!(file_read("xad"), "rstuv");
-    assert_eq!(file_read("xae"), "wxyz\n");
+    assert_eq!(at.read("xaa"), "abcdef");
+    assert_eq!(at.read("xab"), "ghijkl");
+    assert_eq!(at.read("xac"), "mnopq");
+    assert_eq!(at.read("xad"), "rstuv");
+    assert_eq!(at.read("xae"), "wxyz\n");
     #[cfg(unix)]
     new_ucmd!()
         .args(&["--number=100", "/dev/null"])
@@ -974,11 +963,11 @@ fn test_number_kth_of_n() {
     new_ucmd!()
         .args(&["--number=0/5", "asciilowercase.txt"])
         .fails()
-        .stderr_contains("split: invalid chunk number: 0");
+        .stderr_contains("split: invalid chunk number: '0'");
     new_ucmd!()
         .args(&["--number=10/5", "asciilowercase.txt"])
         .fails()
-        .stderr_contains("split: invalid chunk number: 10");
+        .stderr_contains("split: invalid chunk number: '10'");
     #[cfg(target_pointer_width = "64")]
     new_ucmd!()
         .args(&[
@@ -986,7 +975,7 @@ fn test_number_kth_of_n() {
             "asciilowercase.txt",
         ])
         .fails()
-        .stderr_contains("split: invalid number of chunks: 18446744073709551616");
+        .stderr_contains("split: invalid number of chunks: '18446744073709551616'");
 }
 
 #[test]
@@ -1020,32 +1009,27 @@ fn test_number_kth_of_n_round_robin() {
             "fivelines.txt",
         ])
         .fails()
-        .stderr_contains("split: invalid number of chunks: 18446744073709551616");
+        .stderr_contains("split: invalid number of chunks: '18446744073709551616'");
     new_ucmd!()
         .args(&["--number", "r/0/3", "fivelines.txt"])
         .fails()
-        .stderr_contains("split: invalid chunk number: 0");
+        .stderr_contains("split: invalid chunk number: '0'");
     new_ucmd!()
         .args(&["--number", "r/10/3", "fivelines.txt"])
         .fails()
-        .stderr_contains("split: invalid chunk number: 10");
+        .stderr_contains("split: invalid chunk number: '10'");
 }
 
 #[test]
 fn test_split_number_with_io_blksize() {
     let (at, mut ucmd) = at_and_ucmd!();
-    let file_read = |f| {
-        let mut s = String::new();
-        at.open(f).read_to_string(&mut s).unwrap();
-        s
-    };
     ucmd.args(&["-n", "5", "asciilowercase.txt", "---io-blksize", "1024"])
         .succeeds();
-    assert_eq!(file_read("xaa"), "abcdef");
-    assert_eq!(file_read("xab"), "ghijkl");
-    assert_eq!(file_read("xac"), "mnopq");
-    assert_eq!(file_read("xad"), "rstuv");
-    assert_eq!(file_read("xae"), "wxyz\n");
+    assert_eq!(at.read("xaa"), "abcdef");
+    assert_eq!(at.read("xab"), "ghijkl");
+    assert_eq!(at.read("xac"), "mnopq");
+    assert_eq!(at.read("xad"), "rstuv");
+    assert_eq!(at.read("xae"), "wxyz\n");
 }
 
 #[test]
@@ -1153,7 +1137,7 @@ fn test_allow_empty_files() {
 }
 
 #[test]
-fn test_elide_empty_files() {
+fn test_elide_empty_files_n_chunks() {
     let (at, mut ucmd) = at_and_ucmd!();
     ucmd.args(&["-e", "-n", "4", "threebytes.txt"])
         .succeeds()
@@ -1167,7 +1151,7 @@ fn test_elide_empty_files() {
 
 #[test]
 #[cfg(unix)]
-fn test_elide_dev_null() {
+fn test_elide_dev_null_n_chunks() {
     let (at, mut ucmd) = at_and_ucmd!();
     ucmd.args(&["-e", "-n", "3", "/dev/null"])
         .succeeds()
@@ -1191,24 +1175,58 @@ fn test_dev_zero() {
 }
 
 #[test]
-fn test_lines() {
+fn test_elide_empty_files_l_chunks() {
     let (at, mut ucmd) = at_and_ucmd!();
+    ucmd.args(&["-e", "-n", "l/7", "fivelines.txt"])
+        .succeeds()
+        .no_stdout()
+        .no_stderr();
+    assert_eq!(at.read("xaa"), "1\n");
+    assert_eq!(at.read("xab"), "2\n");
+    assert_eq!(at.read("xac"), "3\n");
+    assert_eq!(at.read("xad"), "4\n");
+    assert_eq!(at.read("xae"), "5\n");
+    assert!(!at.plus("xaf").exists());
+    assert!(!at.plus("xag").exists());
+}
 
-    let file_read = |f| {
-        let mut s = String::new();
-        at.open(f).read_to_string(&mut s).unwrap();
-        s
-    };
+#[test]
+#[cfg(unix)]
+fn test_elide_dev_null_l_chunks() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    ucmd.args(&["-e", "-n", "l/3", "/dev/null"])
+        .succeeds()
+        .no_stdout()
+        .no_stderr();
+    assert!(!at.plus("xaa").exists());
+    assert!(!at.plus("xab").exists());
+    assert!(!at.plus("xac").exists());
+}
 
+#[test]
+#[cfg(unix)]
+fn test_number_by_bytes_dev_zero() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    ucmd.args(&["-n", "3", "/dev/zero"])
+        .fails()
+        .stderr_only("split: /dev/zero: cannot determine file size\n");
+    assert!(!at.plus("xaa").exists());
+    assert!(!at.plus("xab").exists());
+    assert!(!at.plus("xac").exists());
+}
+
+#[test]
+fn test_number_by_lines() {
+    let (at, mut ucmd) = at_and_ucmd!();
     // Split into two files without splitting up lines.
     ucmd.args(&["-n", "l/2", "fivelines.txt"]).succeeds();
 
-    assert_eq!(file_read("xaa"), "1\n2\n3\n");
-    assert_eq!(file_read("xab"), "4\n5\n");
+    assert_eq!(at.read("xaa"), "1\n2\n3\n");
+    assert_eq!(at.read("xab"), "4\n5\n");
 }
 
 #[test]
-fn test_lines_kth() {
+fn test_number_by_lines_kth() {
     new_ucmd!()
         .args(&["-n", "l/3/10", "onehundredlines.txt"])
         .succeeds()
@@ -1217,13 +1235,27 @@ fn test_lines_kth() {
 
 #[test]
 #[cfg(unix)]
-fn test_lines_kth_dev_null() {
+fn test_number_by_lines_kth_dev_null() {
     new_ucmd!()
         .args(&["-n", "l/3/10", "/dev/null"])
         .succeeds()
         .stdout_only("");
 }
 
+#[test]
+fn test_number_by_lines_kth_no_end_sep() {
+    new_ucmd!()
+        .args(&["-n", "l/3/10"])
+        .pipe_in("1\n2222\n3\n4")
+        .succeeds()
+        .stdout_only("2222\n");
+    new_ucmd!()
+        .args(&["-e", "-n", "l/8/10"])
+        .pipe_in("1\n2222\n3\n4")
+        .succeeds()
+        .stdout_only("3\n");
+}
+
 #[test]
 fn test_line_bytes() {
     let (at, mut ucmd) = at_and_ucmd!();
@@ -1588,17 +1620,10 @@ fn test_effective_suffix_hex_last() {
 #[test]
 fn test_round_robin() {
     let (at, mut ucmd) = at_and_ucmd!();
-
-    let file_read = |f| {
-        let mut s = String::new();
-        at.open(f).read_to_string(&mut s).unwrap();
-        s
-    };
-
     ucmd.args(&["-n", "r/2", "fivelines.txt"]).succeeds();
 
-    assert_eq!(file_read("xaa"), "1\n3\n5\n");
-    assert_eq!(file_read("xab"), "2\n4\n");
+    assert_eq!(at.read("xaa"), "1\n3\n5\n");
+    assert_eq!(at.read("xab"), "2\n4\n");
 }
 
 #[test]
@@ -1631,7 +1656,7 @@ fn test_split_invalid_input() {
         .args(&["-n", "0", "file"])
         .fails()
         .no_stdout()
-        .stderr_contains("split: invalid number of chunks: 0");
+        .stderr_contains("split: invalid number of chunks: '0'");
 }
 
 /// Test if there are invalid (non UTF-8) in the arguments - unix
@@ -1690,9 +1715,9 @@ fn test_split_separator_nl_lines() {
         .pipe_in("1\n2\n3\n4\n5\n")
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1\n2\n");
-    assert_eq!(file_read(&at, "xab"), "3\n4\n");
-    assert_eq!(file_read(&at, "xac"), "5\n");
+    assert_eq!(at.read("xaa"), "1\n2\n");
+    assert_eq!(at.read("xab"), "3\n4\n");
+    assert_eq!(at.read("xac"), "5\n");
     assert!(!at.plus("xad").exists());
 }
 
@@ -1703,9 +1728,9 @@ fn test_split_separator_nl_line_bytes() {
         .pipe_in("1\n2\n3\n4\n5\n")
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1\n2\n");
-    assert_eq!(file_read(&at, "xab"), "3\n4\n");
-    assert_eq!(file_read(&at, "xac"), "5\n");
+    assert_eq!(at.read("xaa"), "1\n2\n");
+    assert_eq!(at.read("xab"), "3\n4\n");
+    assert_eq!(at.read("xac"), "5\n");
     assert!(!at.plus("xad").exists());
 }
 
@@ -1715,9 +1740,9 @@ fn test_split_separator_nl_number_l() {
     ucmd.args(&["--number=l/3", "--separator=\n", "fivelines.txt"])
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1\n2\n");
-    assert_eq!(file_read(&at, "xab"), "3\n4\n");
-    assert_eq!(file_read(&at, "xac"), "5\n");
+    assert_eq!(at.read("xaa"), "1\n2\n");
+    assert_eq!(at.read("xab"), "3\n4\n");
+    assert_eq!(at.read("xac"), "5\n");
     assert!(!at.plus("xad").exists());
 }
 
@@ -1727,9 +1752,9 @@ fn test_split_separator_nl_number_r() {
     ucmd.args(&["--number=r/3", "--separator", "\n", "fivelines.txt"])
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1\n4\n");
-    assert_eq!(file_read(&at, "xab"), "2\n5\n");
-    assert_eq!(file_read(&at, "xac"), "3\n");
+    assert_eq!(at.read("xaa"), "1\n4\n");
+    assert_eq!(at.read("xab"), "2\n5\n");
+    assert_eq!(at.read("xac"), "3\n");
     assert!(!at.plus("xad").exists());
 }
 
@@ -1739,9 +1764,9 @@ fn test_split_separator_nul_lines() {
     ucmd.args(&["--lines=2", "-t", "\\0", "separator_nul.txt"])
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1\x002\0");
-    assert_eq!(file_read(&at, "xab"), "3\x004\0");
-    assert_eq!(file_read(&at, "xac"), "5\0");
+    assert_eq!(at.read("xaa"), "1\x002\0");
+    assert_eq!(at.read("xab"), "3\x004\0");
+    assert_eq!(at.read("xac"), "5\0");
     assert!(!at.plus("xad").exists());
 }
 
@@ -1751,9 +1776,9 @@ fn test_split_separator_nul_line_bytes() {
     ucmd.args(&["--line-bytes=4", "-t", "\\0", "separator_nul.txt"])
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1\x002\0");
-    assert_eq!(file_read(&at, "xab"), "3\x004\0");
-    assert_eq!(file_read(&at, "xac"), "5\0");
+    assert_eq!(at.read("xaa"), "1\x002\0");
+    assert_eq!(at.read("xab"), "3\x004\0");
+    assert_eq!(at.read("xac"), "5\0");
     assert!(!at.plus("xad").exists());
 }
 
@@ -1763,9 +1788,9 @@ fn test_split_separator_nul_number_l() {
     ucmd.args(&["--number=l/3", "--separator=\\0", "separator_nul.txt"])
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1\x002\0");
-    assert_eq!(file_read(&at, "xab"), "3\x004\0");
-    assert_eq!(file_read(&at, "xac"), "5\0");
+    assert_eq!(at.read("xaa"), "1\x002\0");
+    assert_eq!(at.read("xab"), "3\x004\0");
+    assert_eq!(at.read("xac"), "5\0");
     assert!(!at.plus("xad").exists());
 }
 
@@ -1775,9 +1800,9 @@ fn test_split_separator_nul_number_r() {
     ucmd.args(&["--number=r/3", "--separator=\\0", "separator_nul.txt"])
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1\x004\0");
-    assert_eq!(file_read(&at, "xab"), "2\x005\0");
-    assert_eq!(file_read(&at, "xac"), "3\0");
+    assert_eq!(at.read("xaa"), "1\x004\0");
+    assert_eq!(at.read("xab"), "2\x005\0");
+    assert_eq!(at.read("xac"), "3\0");
     assert!(!at.plus("xad").exists());
 }
 
@@ -1787,9 +1812,9 @@ fn test_split_separator_semicolon_lines() {
     ucmd.args(&["--lines=2", "-t", ";", "separator_semicolon.txt"])
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1;2;");
-    assert_eq!(file_read(&at, "xab"), "3;4;");
-    assert_eq!(file_read(&at, "xac"), "5;");
+    assert_eq!(at.read("xaa"), "1;2;");
+    assert_eq!(at.read("xab"), "3;4;");
+    assert_eq!(at.read("xac"), "5;");
     assert!(!at.plus("xad").exists());
 }
 
@@ -1799,9 +1824,9 @@ fn test_split_separator_semicolon_line_bytes() {
     ucmd.args(&["--line-bytes=4", "-t", ";", "separator_semicolon.txt"])
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1;2;");
-    assert_eq!(file_read(&at, "xab"), "3;4;");
-    assert_eq!(file_read(&at, "xac"), "5;");
+    assert_eq!(at.read("xaa"), "1;2;");
+    assert_eq!(at.read("xab"), "3;4;");
+    assert_eq!(at.read("xac"), "5;");
     assert!(!at.plus("xad").exists());
 }
 
@@ -1811,9 +1836,9 @@ fn test_split_separator_semicolon_number_l() {
     ucmd.args(&["--number=l/3", "--separator=;", "separator_semicolon.txt"])
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1;2;");
-    assert_eq!(file_read(&at, "xab"), "3;4;");
-    assert_eq!(file_read(&at, "xac"), "5;");
+    assert_eq!(at.read("xaa"), "1;2;");
+    assert_eq!(at.read("xab"), "3;4;");
+    assert_eq!(at.read("xac"), "5;");
     assert!(!at.plus("xad").exists());
 }
 
@@ -1823,9 +1848,9 @@ fn test_split_separator_semicolon_number_r() {
     ucmd.args(&["--number=r/3", "--separator=;", "separator_semicolon.txt"])
         .succeeds();
 
-    assert_eq!(file_read(&at, "xaa"), "1;4;");
-    assert_eq!(file_read(&at, "xab"), "2;5;");
-    assert_eq!(file_read(&at, "xac"), "3;");
+    assert_eq!(at.read("xaa"), "1;4;");
+    assert_eq!(at.read("xab"), "2;5;");
+    assert_eq!(at.read("xac"), "3;");
     assert!(!at.plus("xad").exists());
 }
 

From 84b5e6f0a1275ffd6816d4478284ed2ef27e5f1e Mon Sep 17 00:00:00 2001
From: Clint Teece <ceteece@gmail.com>
Date: Sat, 25 Nov 2023 09:13:12 -0500
Subject: [PATCH 065/429] du: start printing output immediately (#5552)

* du: very rough draft of continuously printing output

* du: clean up printing logic, still needs some polishing

* du: gracefully handle case where `du` returns no `Stat`s

* du: print output using separate thread

* du: clean up print thread implementation

* du: send ownership of `Stat`s to printing thread as soon as `du` is done with them

* du: add basic error handling for communication between threads, use `StatPrinter` to handle printing thread logic

* du: move printing grand total into `StatPrinter`, and move initialization of printing-related variables into `StatPrinter::new`

* du: clean up calculation of `convert_size` function, and separate printing a single stat our into its own method in `StatPrinter`

* du: have printing thread handle printing IO-related errors, to ensure error messages and regular output message are written one at a time

* du: add comment explaining print thread, remove outdated comments and clippy allows

* du: restore clippy allows for cognitive complexity

---------

Co-authored-by: clint <cteece3@gatech.edu>
---
 src/uu/du/src/du.rs | 317 +++++++++++++++++++++++++++-----------------
 1 file changed, 193 insertions(+), 124 deletions(-)

diff --git a/src/uu/du/src/du.rs b/src/uu/du/src/du.rs
index 148b197df33..dc03a64f218 100644
--- a/src/uu/du/src/du.rs
+++ b/src/uu/du/src/du.rs
@@ -16,8 +16,6 @@ use std::fs::File;
 use std::fs::Metadata;
 use std::io::BufRead;
 use std::io::BufReader;
-use std::io::Result;
-use std::iter;
 #[cfg(not(windows))]
 use std::os::unix::fs::MetadataExt;
 #[cfg(windows)]
@@ -27,15 +25,17 @@ use std::os::windows::io::AsRawHandle;
 use std::path::Path;
 use std::path::PathBuf;
 use std::str::FromStr;
+use std::sync::mpsc;
+use std::thread;
 use std::time::{Duration, UNIX_EPOCH};
 use std::{error::Error, fmt::Display};
 use uucore::display::{print_verbatim, Quotable};
 use uucore::error::FromIo;
-use uucore::error::{set_exit_code, UError, UResult, USimpleError};
+use uucore::error::{UError, UResult, USimpleError};
 use uucore::line_ending::LineEnding;
 use uucore::parse_glob;
 use uucore::parse_size::{parse_size_u64, ParseSizeError};
-use uucore::{format_usage, help_about, help_section, help_usage, show, show_error, show_warning};
+use uucore::{format_usage, help_about, help_section, help_usage, show, show_warning};
 #[cfg(windows)]
 use windows_sys::Win32::Foundation::HANDLE;
 #[cfg(windows)]
@@ -81,6 +81,7 @@ const USAGE: &str = help_usage!("du.md");
 // TODO: Support Z & Y (currently limited by size of u64)
 const UNITS: [(char, u32); 6] = [('E', 6), ('P', 5), ('T', 4), ('G', 3), ('M', 2), ('K', 1)];
 
+#[derive(Clone)]
 struct Options {
     all: bool,
     max_depth: Option<usize>,
@@ -93,7 +94,7 @@ struct Options {
     verbose: bool,
 }
 
-#[derive(PartialEq)]
+#[derive(PartialEq, Clone)]
 enum Deref {
     All,
     Args(Vec<PathBuf>),
@@ -119,7 +120,7 @@ struct Stat {
 }
 
 impl Stat {
-    fn new(path: &Path, options: &Options) -> Result<Self> {
+    fn new(path: &Path, options: &Options) -> std::io::Result<Self> {
         // Determine whether to dereference (follow) the symbolic link
         let should_dereference = match &options.dereference {
             Deref::All => true,
@@ -290,7 +291,6 @@ fn choose_size(matches: &ArgMatches, stat: &Stat) -> u64 {
 }
 
 // this takes `my_stat` to avoid having to stat files multiple times.
-// XXX: this should use the impl Trait return type when it is stabilized
 #[allow(clippy::cognitive_complexity)]
 fn du(
     mut my_stat: Stat,
@@ -298,18 +298,16 @@ fn du(
     depth: usize,
     seen_inodes: &mut HashSet<FileInfo>,
     exclude: &[Pattern],
-) -> Box<dyn DoubleEndedIterator<Item = Stat>> {
-    let mut stats = vec![];
-    let mut futures = vec![];
-
+    print_tx: &mpsc::Sender<UResult<StatPrintInfo>>,
+) -> Result<Stat, Box<mpsc::SendError<UResult<StatPrintInfo>>>> {
     if my_stat.is_dir {
         let read = match fs::read_dir(&my_stat.path) {
             Ok(read) => read,
             Err(e) => {
-                show!(
-                    e.map_err_context(|| format!("cannot read directory {}", my_stat.path.quote()))
-                );
-                return Box::new(iter::once(my_stat));
+                print_tx.send(Err(e.map_err_context(|| {
+                    format!("cannot read directory {}", my_stat.path.quote())
+                })))?;
+                return Ok(my_stat);
             }
         };
 
@@ -354,44 +352,48 @@ fn du(
                                         }
                                     }
                                 }
-                                futures.push(du(
+
+                                let this_stat = du(
                                     this_stat,
                                     options,
                                     depth + 1,
                                     seen_inodes,
                                     exclude,
-                                ));
+                                    print_tx,
+                                )?;
+
+                                if !options.separate_dirs {
+                                    my_stat.size += this_stat.size;
+                                    my_stat.blocks += this_stat.blocks;
+                                    my_stat.inodes += this_stat.inodes;
+                                }
+                                print_tx.send(Ok(StatPrintInfo {
+                                    stat: this_stat,
+                                    depth: depth + 1,
+                                }))?;
                             } else {
                                 my_stat.size += this_stat.size;
                                 my_stat.blocks += this_stat.blocks;
                                 my_stat.inodes += 1;
                                 if options.all {
-                                    stats.push(this_stat);
+                                    print_tx.send(Ok(StatPrintInfo {
+                                        stat: this_stat,
+                                        depth: depth + 1,
+                                    }))?;
                                 }
                             }
                         }
-                        Err(e) => show!(
-                            e.map_err_context(|| format!("cannot access {}", entry.path().quote()))
-                        ),
+                        Err(e) => print_tx.send(Err(e.map_err_context(|| {
+                            format!("cannot access {}", entry.path().quote())
+                        })))?,
                     }
                 }
-                Err(error) => show_error!("{}", error),
+                Err(error) => print_tx.send(Err(error.into()))?,
             }
         }
     }
 
-    stats.extend(futures.into_iter().flatten().filter(|stat| {
-        if !options.separate_dirs && stat.path.parent().unwrap() == my_stat.path {
-            my_stat.size += stat.size;
-            my_stat.blocks += stat.blocks;
-            my_stat.inodes += stat.inodes;
-        }
-        options
-            .max_depth
-            .map_or(true, |max_depth| depth < max_depth)
-    }));
-    stats.push(my_stat);
-    Box::new(stats.into_iter())
+    Ok(my_stat)
 }
 
 fn convert_size_human(size: u64, multiplier: u64, _block_size: u64) -> String {
@@ -426,7 +428,7 @@ fn convert_size_other(size: u64, _multiplier: u64, block_size: u64) -> String {
     format!("{}", ((size as f64) / (block_size as f64)).ceil())
 }
 
-fn get_convert_size_fn(matches: &ArgMatches) -> Box<dyn Fn(u64, u64, u64) -> String> {
+fn get_convert_size_fn(matches: &ArgMatches) -> Box<dyn Fn(u64, u64, u64) -> String + Send> {
     if matches.get_flag(options::HUMAN_READABLE) || matches.get_flag(options::SI) {
         Box::new(convert_size_human)
     } else if matches.get_flag(options::BYTES) {
@@ -532,6 +534,137 @@ fn build_exclude_patterns(matches: &ArgMatches) -> UResult<Vec<Pattern>> {
     Ok(exclude_patterns)
 }
 
+struct StatPrintInfo {
+    stat: Stat,
+    depth: usize,
+}
+
+struct StatPrinter {
+    matches: ArgMatches,
+    threshold: Option<Threshold>,
+    summarize: bool,
+    time_format_str: String,
+    line_ending: LineEnding,
+    options: Options,
+    convert_size: Box<dyn Fn(u64) -> String + Send>,
+}
+
+impl StatPrinter {
+    fn new(matches: ArgMatches, options: Options, summarize: bool) -> UResult<Self> {
+        let block_size = read_block_size(
+            matches
+                .get_one::<String>(options::BLOCK_SIZE)
+                .map(|s| s.as_str()),
+        )?;
+
+        let multiplier: u64 = if matches.get_flag(options::SI) {
+            1000
+        } else {
+            1024
+        };
+
+        let convert_size_fn = get_convert_size_fn(&matches);
+
+        let convert_size: Box<dyn Fn(u64) -> String + Send> = if options.inodes {
+            Box::new(|size: u64| size.to_string())
+        } else {
+            Box::new(move |size: u64| convert_size_fn(size, multiplier, block_size))
+        };
+
+        let threshold = match matches.get_one::<String>(options::THRESHOLD) {
+            Some(s) => match Threshold::from_str(s) {
+                Ok(t) => Some(t),
+                Err(e) => {
+                    return Err(USimpleError::new(
+                        1,
+                        format_error_message(&e, s, options::THRESHOLD),
+                    ))
+                }
+            },
+            None => None,
+        };
+
+        let time_format_str =
+            parse_time_style(matches.get_one::<String>("time-style").map(|s| s.as_str()))?
+                .to_string();
+
+        let line_ending = LineEnding::from_zero_flag(matches.get_flag(options::NULL));
+
+        Ok(Self {
+            matches,
+            threshold,
+            summarize,
+            time_format_str,
+            line_ending,
+            options,
+            convert_size,
+        })
+    }
+
+    fn print_stats(&self, rx: &mpsc::Receiver<UResult<StatPrintInfo>>) -> UResult<()> {
+        let mut grand_total = 0;
+        loop {
+            let received = rx.recv();
+
+            match received {
+                Ok(message) => match message {
+                    Ok(stat_info) => {
+                        let size = choose_size(&self.matches, &stat_info.stat);
+
+                        if stat_info.depth == 0 {
+                            grand_total += size;
+                        }
+
+                        if !self
+                            .threshold
+                            .map_or(false, |threshold| threshold.should_exclude(size))
+                            && self
+                                .options
+                                .max_depth
+                                .map_or(true, |max_depth| stat_info.depth <= max_depth)
+                            && (!self.summarize || stat_info.depth == 0)
+                        {
+                            self.print_stat(&stat_info.stat, size)?;
+                        }
+                    }
+                    Err(e) => show!(e),
+                },
+                Err(_) => break,
+            }
+        }
+
+        if self.options.total {
+            print!("{}\ttotal", (self.convert_size)(grand_total));
+            print!("{}", self.line_ending);
+        }
+
+        Ok(())
+    }
+
+    fn print_stat(&self, stat: &Stat, size: u64) -> UResult<()> {
+        if self.matches.contains_id(options::TIME) {
+            let tm = {
+                let secs = self
+                    .matches
+                    .get_one::<String>(options::TIME)
+                    .map(|s| get_time_secs(s, stat))
+                    .transpose()?
+                    .unwrap_or(stat.modified);
+                DateTime::<Local>::from(UNIX_EPOCH + Duration::from_secs(secs))
+            };
+            let time_str = tm.format(&self.time_format_str).to_string();
+            print!("{}\t{}\t", (self.convert_size)(size), time_str);
+        } else {
+            print!("{}\t", (self.convert_size)(size));
+        }
+
+        print_verbatim(&stat.path).unwrap();
+        print!("{}", self.line_ending);
+
+        Ok(())
+    }
+}
+
 #[uucore::main]
 #[allow(clippy::cognitive_complexity)]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
@@ -582,49 +715,13 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         show_warning!("options --apparent-size and -b are ineffective with --inodes");
     }
 
-    let block_size = read_block_size(
-        matches
-            .get_one::<String>(options::BLOCK_SIZE)
-            .map(|s| s.as_str()),
-    )?;
-
-    let threshold = match matches.get_one::<String>(options::THRESHOLD) {
-        Some(s) => match Threshold::from_str(s) {
-            Ok(t) => Some(t),
-            Err(e) => {
-                return Err(USimpleError::new(
-                    1,
-                    format_error_message(&e, s, options::THRESHOLD),
-                ))
-            }
-        },
-        None => None,
-    };
-
-    let multiplier: u64 = if matches.get_flag(options::SI) {
-        1000
-    } else {
-        1024
-    };
-
-    let convert_size_fn = get_convert_size_fn(&matches);
-
-    let convert_size = |size: u64| {
-        if options.inodes {
-            size.to_string()
-        } else {
-            convert_size_fn(size, multiplier, block_size)
-        }
-    };
-
-    let time_format_str =
-        parse_time_style(matches.get_one::<String>("time-style").map(|s| s.as_str()))?;
-
-    let line_ending = LineEnding::from_zero_flag(matches.get_flag(options::NULL));
+    // Use separate thread to print output, so we can print finished results while computation is still running
+    let stat_printer = StatPrinter::new(matches.clone(), options.clone(), summarize)?;
+    let (print_tx, rx) = mpsc::channel::<UResult<StatPrintInfo>>();
+    let printing_thread = thread::spawn(move || stat_printer.print_stats(&rx));
 
     let excludes = build_exclude_patterns(&matches)?;
 
-    let mut grand_total = 0;
     'loop_file: for path in files {
         // Skip if we don't want to ignore anything
         if !&excludes.is_empty() {
@@ -647,63 +744,35 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
             if let Some(inode) = stat.inode {
                 seen_inodes.insert(inode);
             }
-            let iter = du(stat, &options, 0, &mut seen_inodes, &excludes);
-
-            // Sum up all the returned `Stat`s and display results
-            let (_, len) = iter.size_hint();
-            let len = len.unwrap();
-            for (index, stat) in iter.enumerate() {
-                let size = choose_size(&matches, &stat);
+            let stat = du(stat, &options, 0, &mut seen_inodes, &excludes, &print_tx)
+                .map_err(|e| USimpleError::new(1, e.to_string()))?;
 
-                if threshold.map_or(false, |threshold| threshold.should_exclude(size)) {
-                    continue;
-                }
-
-                if matches.contains_id(options::TIME) {
-                    let tm = {
-                        let secs = matches
-                            .get_one::<String>(options::TIME)
-                            .map(|s| get_time_secs(s, &stat))
-                            .transpose()?
-                            .unwrap_or(stat.modified);
-                        DateTime::<Local>::from(UNIX_EPOCH + Duration::from_secs(secs))
-                    };
-                    if !summarize || index == len - 1 {
-                        let time_str = tm.format(time_format_str).to_string();
-                        print!("{}\t{}\t", convert_size(size), time_str);
-                        print_verbatim(stat.path).unwrap();
-                        print!("{line_ending}");
-                    }
-                } else if !summarize || index == len - 1 {
-                    print!("{}\t", convert_size(size));
-                    print_verbatim(stat.path).unwrap();
-                    print!("{line_ending}");
-                }
-                if options.total && index == (len - 1) {
-                    // The last element will be the total size of the the path under
-                    // path_string.  We add it to the grand total.
-                    grand_total += size;
-                }
-            }
+            print_tx
+                .send(Ok(StatPrintInfo { stat, depth: 0 }))
+                .map_err(|e| USimpleError::new(1, e.to_string()))?;
         } else {
-            show_error!(
-                "{}: {}",
-                path.to_string_lossy().maybe_quote(),
-                "No such file or directory"
-            );
-            set_exit_code(1);
+            print_tx
+                .send(Err(USimpleError::new(
+                    1,
+                    format!(
+                        "{}: No such file or directory",
+                        path.to_string_lossy().maybe_quote()
+                    ),
+                )))
+                .map_err(|e| USimpleError::new(1, e.to_string()))?;
         }
     }
 
-    if options.total {
-        print!("{}\ttotal", convert_size(grand_total));
-        print!("{line_ending}");
-    }
+    drop(print_tx);
+
+    printing_thread
+        .join()
+        .map_err(|_| USimpleError::new(1, "Printing thread panicked."))??;
 
     Ok(())
 }
 
-fn get_time_secs(s: &str, stat: &Stat) -> std::result::Result<u64, DuError> {
+fn get_time_secs(s: &str, stat: &Stat) -> Result<u64, DuError> {
     let secs = match s {
         "ctime" | "status" => stat.modified,
         "access" | "atime" | "use" => stat.accessed,
@@ -966,7 +1035,7 @@ enum Threshold {
 impl FromStr for Threshold {
     type Err = ParseSizeError;
 
-    fn from_str(s: &str) -> std::result::Result<Self, Self::Err> {
+    fn from_str(s: &str) -> Result<Self, Self::Err> {
         let offset = usize::from(s.starts_with(&['-', '+'][..]));
 
         let size = parse_size_u64(&s[offset..])?;

From dc92a434ef0f64a833d8b657268068eb3a25ab22 Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Fri, 24 Nov 2023 17:25:16 -0500
Subject: [PATCH 066/429] split: handling system limit on open files

---
 src/uu/split/src/platform/unix.rs    |  43 ++++--
 src/uu/split/src/platform/windows.rs |  23 ++-
 src/uu/split/src/split.rs            | 204 +++++++++++++++++++--------
 3 files changed, 191 insertions(+), 79 deletions(-)

diff --git a/src/uu/split/src/platform/unix.rs b/src/uu/split/src/platform/unix.rs
index c2bf7216b57..1fd990e0a91 100644
--- a/src/uu/split/src/platform/unix.rs
+++ b/src/uu/split/src/platform/unix.rs
@@ -117,22 +117,37 @@ impl Drop for FilterWriter {
 pub fn instantiate_current_writer(
     filter: &Option<String>,
     filename: &str,
+    is_new: bool,
 ) -> Result<BufWriter<Box<dyn Write>>> {
     match filter {
-        None => Ok(BufWriter::new(Box::new(
-            // write to the next file
-            std::fs::OpenOptions::new()
-                .write(true)
-                .create(true)
-                .truncate(true)
-                .open(std::path::Path::new(&filename))
-                .map_err(|_| {
-                    Error::new(
-                        ErrorKind::Other,
-                        format!("unable to open '{filename}'; aborting"),
-                    )
-                })?,
-        ) as Box<dyn Write>)),
+        None => {
+            let file = if is_new {
+                // create new file
+                std::fs::OpenOptions::new()
+                    .write(true)
+                    .create(true)
+                    .truncate(true)
+                    .open(std::path::Path::new(&filename))
+                    .map_err(|_| {
+                        Error::new(
+                            ErrorKind::Other,
+                            format!("unable to open '{filename}'; aborting"),
+                        )
+                    })?
+            } else {
+                // re-open file that we previously created to append to it
+                std::fs::OpenOptions::new()
+                    .append(true)
+                    .open(std::path::Path::new(&filename))
+                    .map_err(|_| {
+                        Error::new(
+                            ErrorKind::Other,
+                            format!("unable to re-open '{filename}'; aborting"),
+                        )
+                    })?
+            };
+            Ok(BufWriter::new(Box::new(file) as Box<dyn Write>))
+        }
         Some(ref filter_command) => Ok(BufWriter::new(Box::new(
             // spawn a shell command and write to it
             FilterWriter::new(filter_command, filename)?,
diff --git a/src/uu/split/src/platform/windows.rs b/src/uu/split/src/platform/windows.rs
index 8b90789896f..a531d6abc1f 100644
--- a/src/uu/split/src/platform/windows.rs
+++ b/src/uu/split/src/platform/windows.rs
@@ -14,9 +14,10 @@ use uucore::fs;
 pub fn instantiate_current_writer(
     _filter: &Option<String>,
     filename: &str,
+    is_new: bool,
 ) -> Result<BufWriter<Box<dyn Write>>> {
-    Ok(BufWriter::new(Box::new(
-        // write to the next file
+    let file = if is_new {
+        // create new file
         std::fs::OpenOptions::new()
             .write(true)
             .create(true)
@@ -25,10 +26,22 @@ pub fn instantiate_current_writer(
             .map_err(|_| {
                 Error::new(
                     ErrorKind::Other,
-                    format!("'{filename}' would overwrite input; aborting"),
+                    format!("unable to open '{filename}'; aborting"),
                 )
-            })?,
-    ) as Box<dyn Write>))
+            })?
+    } else {
+        // re-open file that we previously created to append to it
+        std::fs::OpenOptions::new()
+            .append(true)
+            .open(std::path::Path::new(&filename))
+            .map_err(|_| {
+                Error::new(
+                    ErrorKind::Other,
+                    format!("unable to re-open '{filename}'; aborting"),
+                )
+            })?
+    };
+    Ok(BufWriter::new(Box::new(file) as Box<dyn Write>))
 }
 
 pub fn paths_refer_to_same_file(p1: &str, p2: &str) -> bool {
diff --git a/src/uu/split/src/split.rs b/src/uu/split/src/split.rs
index 4e2af0be4d8..e5f9032c947 100644
--- a/src/uu/split/src/split.rs
+++ b/src/uu/split/src/split.rs
@@ -3,7 +3,7 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-// spell-checker:ignore nbbbb ncccc hexdigit
+// spell-checker:ignore nbbbb ncccc hexdigit getmaxstdio
 
 mod filenames;
 mod number;
@@ -563,7 +563,11 @@ impl Settings {
         Ok(result)
     }
 
-    fn instantiate_current_writer(&self, filename: &str) -> io::Result<BufWriter<Box<dyn Write>>> {
+    fn instantiate_current_writer(
+        &self,
+        filename: &str,
+        is_new: bool,
+    ) -> io::Result<BufWriter<Box<dyn Write>>> {
         if platform::paths_refer_to_same_file(&self.input, filename) {
             return Err(io::Error::new(
                 ErrorKind::Other,
@@ -571,7 +575,7 @@ impl Settings {
             ));
         }
 
-        platform::instantiate_current_writer(&self.filter, filename)
+        platform::instantiate_current_writer(&self.filter, filename, is_new)
     }
 }
 
@@ -748,7 +752,7 @@ impl<'a> ByteChunkWriter<'a> {
         if settings.verbose {
             println!("creating file {}", filename.quote());
         }
-        let inner = settings.instantiate_current_writer(&filename)?;
+        let inner = settings.instantiate_current_writer(&filename, true)?;
         Ok(ByteChunkWriter {
             settings,
             chunk_size,
@@ -786,7 +790,7 @@ impl<'a> Write for ByteChunkWriter<'a> {
                 if self.settings.verbose {
                     println!("creating file {}", filename.quote());
                 }
-                self.inner = self.settings.instantiate_current_writer(&filename)?;
+                self.inner = self.settings.instantiate_current_writer(&filename, true)?;
             }
 
             // If the capacity of this chunk is greater than the number of
@@ -872,7 +876,7 @@ impl<'a> LineChunkWriter<'a> {
         if settings.verbose {
             println!("creating file {}", filename.quote());
         }
-        let inner = settings.instantiate_current_writer(&filename)?;
+        let inner = settings.instantiate_current_writer(&filename, true)?;
         Ok(LineChunkWriter {
             settings,
             chunk_size,
@@ -907,7 +911,7 @@ impl<'a> Write for LineChunkWriter<'a> {
                 if self.settings.verbose {
                     println!("creating file {}", filename.quote());
                 }
-                self.inner = self.settings.instantiate_current_writer(&filename)?;
+                self.inner = self.settings.instantiate_current_writer(&filename, true)?;
                 self.num_lines_remaining_in_current_chunk = self.chunk_size;
             }
 
@@ -979,7 +983,7 @@ impl<'a> LineBytesChunkWriter<'a> {
         if settings.verbose {
             println!("creating file {}", filename.quote());
         }
-        let inner = settings.instantiate_current_writer(&filename)?;
+        let inner = settings.instantiate_current_writer(&filename, true)?;
         Ok(LineBytesChunkWriter {
             settings,
             chunk_size,
@@ -1045,7 +1049,7 @@ impl<'a> Write for LineBytesChunkWriter<'a> {
                 if self.settings.verbose {
                     println!("creating file {}", filename.quote());
                 }
-                self.inner = self.settings.instantiate_current_writer(&filename)?;
+                self.inner = self.settings.instantiate_current_writer(&filename, true)?;
                 self.num_bytes_remaining_in_current_chunk = self.chunk_size.try_into().unwrap();
             }
 
@@ -1134,55 +1138,135 @@ impl<'a> Write for LineBytesChunkWriter<'a> {
 struct OutFile {
     filename: String,
     maybe_writer: Option<BufWriter<Box<dyn Write>>>,
+    is_new: bool,
 }
 
-impl OutFile {
-    /// Get the writer for the output file
-    /// Instantiate the writer if it has not been instantiated upfront
-    fn get_writer(&mut self, settings: &Settings) -> UResult<&mut BufWriter<Box<dyn Write>>> {
-        if self.maybe_writer.is_some() {
-            Ok(self.maybe_writer.as_mut().unwrap())
-        } else {
-            // Writer was not instantiated upfront
-            // Instantiate it and record for future use
-            self.maybe_writer = Some(settings.instantiate_current_writer(self.filename.as_str())?);
-            Ok(self.maybe_writer.as_mut().unwrap())
+// impl OutFile {
+//     /// Get the writer for the output file.
+//     /// Instantiate the writer if it has not been instantiated upfront
+//     /// or temporarily closed to free up system resources
+//     fn get_writer(&mut self, settings: &Settings) -> UResult<&mut BufWriter<Box<dyn Write>>> {
+//         if self.maybe_writer.is_some() {
+//             Ok(self.maybe_writer.as_mut().unwrap())
+//         } else {
+//             // Writer was not instantiated upfront or was temporarily closed due to system resources constraints.
+//             // Instantiate it and record for future use.
+//             self.maybe_writer =
+//                 Some(settings.instantiate_current_writer(self.filename.as_str(), self.is_new)?);
+//             Ok(self.maybe_writer.as_mut().unwrap())
+//         }
+//     }
+// }
+
+/// A set of output files
+/// Used in [`n_chunks_by_byte`], [`n_chunks_by_line`]
+/// and [`n_chunks_by_line_round_robin`] functions.
+type OutFiles = Vec<OutFile>;
+trait ManageOutFiles {
+    /// Initialize a new set of output files
+    /// Each OutFile is generated with filename, while the writer for it could be
+    /// optional, to be instantiated later by the calling function as needed.
+    /// Optional writers could happen in the following situations:
+    /// * in [`n_chunks_by_line`] if `elide_empty_files` parameter is set to `true`
+    /// * if the number of files is greater than system limit for open files
+    fn init(num_files: u64, settings: &Settings, is_writer_optional: bool) -> UResult<Self>
+    where
+        Self: Sized;
+    /// Get the writer for the output file by index.
+    /// If system limit of open files has been reached
+    /// it will try to close one of previously instantiated writers
+    /// to free up resources and re-try instantiating current writer,
+    /// except for `--filter` mode.
+    /// The writers that get closed to free up resources for the current writer
+    /// are flagged as `is_new=false`, so they can be re-opened for appending
+    /// instead of created anew if we need to keep writing into them later,
+    /// i.e. in case of round robin distribution as in [`n_chunks_by_line_round_robin`]
+    fn get_writer(
+        &mut self,
+        idx: usize,
+        settings: &Settings,
+    ) -> UResult<&mut BufWriter<Box<dyn Write>>>;
+}
+
+impl ManageOutFiles for OutFiles {
+    fn init(num_files: u64, settings: &Settings, is_writer_optional: bool) -> UResult<Self> {
+        // This object is responsible for creating the filename for each chunk
+        let mut filename_iterator: FilenameIterator<'_> =
+            FilenameIterator::new(&settings.prefix, &settings.suffix)
+                .map_err(|e| io::Error::new(ErrorKind::Other, format!("{e}")))?;
+        let mut out_files: Self = Self::new();
+        for _ in 0..num_files {
+            let filename = filename_iterator
+                .next()
+                .ok_or_else(|| USimpleError::new(1, "output file suffixes exhausted"))?;
+            let maybe_writer = if is_writer_optional {
+                None
+            } else {
+                let instantiated = settings.instantiate_current_writer(filename.as_str(), true);
+                // If there was an error instantiating the writer for a file,
+                // it could be due to hitting the system limit of open files,
+                // so record it as None and let [`get_writer`] function handle closing/re-opening
+                // of writers as needed within system limits.
+                // However, for `--filter` child process writers - propagate the error,
+                // as working around system limits of open files for child shell processes
+                // is currently not supported (same as in GNU)
+                match instantiated {
+                    Ok(writer) => Some(writer),
+                    Err(e) if settings.filter.is_some() => {
+                        return Err(e.into());
+                    }
+                    Err(_) => None,
+                }
+            };
+            out_files.push(OutFile {
+                filename,
+                maybe_writer,
+                is_new: true,
+            });
         }
+        Ok(out_files)
     }
-}
 
-/// Generate a set of Output Files
-/// This is a helper function to [`n_chunks_by_byte`], [`n_chunks_by_line`]
-/// and [`n_chunks_by_line_round_robin`].
-/// Each OutFile is generated with filename, while the writer for it could be
-/// optional, to be instantiated later by the calling function as needed.
-/// Optional writers could happen in [`n_chunks_by_line`]
-/// if `elide_empty_files` parameter is set to `true`.
-fn get_out_files(
-    num_files: u64,
-    settings: &Settings,
-    is_writer_optional: bool,
-) -> UResult<Vec<OutFile>> {
-    // This object is responsible for creating the filename for each chunk
-    let mut filename_iterator: FilenameIterator<'_> =
-        FilenameIterator::new(&settings.prefix, &settings.suffix)
-            .map_err(|e| io::Error::new(ErrorKind::Other, format!("{e}")))?;
-    let mut out_files: Vec<OutFile> = Vec::new();
-    for _ in 0..num_files {
-        let filename = filename_iterator
-            .next()
-            .ok_or_else(|| USimpleError::new(1, "output file suffixes exhausted"))?;
-        let maybe_writer = if is_writer_optional {
-            None
+    fn get_writer(
+        &mut self,
+        idx: usize,
+        settings: &Settings,
+    ) -> UResult<&mut BufWriter<Box<dyn Write>>> {
+        if self[idx].maybe_writer.is_some() {
+            Ok(self[idx].maybe_writer.as_mut().unwrap())
         } else {
-            Some(settings.instantiate_current_writer(filename.as_str())?)
-        };
-        out_files.push(OutFile {
-            filename,
-            maybe_writer,
-        });
+            // Writer was not instantiated upfront or was temporarily closed due to system resources constraints.
+            // Instantiate it and record for future use.
+            let maybe_writer =
+                settings.instantiate_current_writer(self[idx].filename.as_str(), self[idx].is_new);
+            if let Ok(writer) = maybe_writer {
+                self[idx].maybe_writer = Some(writer);
+                Ok(self[idx].maybe_writer.as_mut().unwrap())
+            } else if settings.filter.is_some() {
+                // Propagate error if in `--filter` mode
+                Err(maybe_writer.err().unwrap().into())
+            } else {
+                // Could have hit system limit for open files.
+                // Try to close one previously instantiated writer first
+                for (i, out_file) in self.iter_mut().enumerate() {
+                    if i != idx && out_file.maybe_writer.is_some() {
+                        out_file.maybe_writer.as_mut().unwrap().flush()?;
+                        out_file.maybe_writer = None;
+                        out_file.is_new = false;
+                        break;
+                    }
+                }
+                // And then try to instantiate the writer again
+                // If this fails - give up and propagate the error
+                self[idx].maybe_writer =
+                    Some(settings.instantiate_current_writer(
+                        self[idx].filename.as_str(),
+                        self[idx].is_new,
+                    )?);
+                Ok(self[idx].maybe_writer.as_mut().unwrap())
+            }
+        }
     }
-    Ok(out_files)
 }
 
 /// Split a file or STDIN into a specific number of chunks by byte.
@@ -1261,7 +1345,7 @@ where
     // In Kth chunk of N mode - we will write to stdout instead of to a file.
     let mut stdout_writer = std::io::stdout().lock();
     // In N chunks mode - we will write to `num_chunks` files
-    let mut out_files: Vec<OutFile> = Vec::new();
+    let mut out_files: OutFiles = OutFiles::new();
 
     // Calculate chunk size base and modulo reminder
     // to be used in calculating chunk_size later on
@@ -1273,7 +1357,7 @@ where
     // This will create each of the underlying files
     // or stdin pipes to child shell/command processes if in `--filter` mode
     if kth_chunk.is_none() {
-        out_files = get_out_files(num_chunks, settings, false)?;
+        out_files = OutFiles::init(num_chunks, settings, false)?;
     }
 
     for i in 1_u64..=num_chunks {
@@ -1317,7 +1401,7 @@ where
                 }
                 None => {
                     let idx = (i - 1) as usize;
-                    let writer = out_files[idx].get_writer(settings)?;
+                    let writer = out_files.get_writer(idx, settings)?;
                     writer.write_all(buf)?;
                 }
             }
@@ -1387,7 +1471,7 @@ where
     // In Kth chunk of N mode - we will write to stdout instead of to a file.
     let mut stdout_writer = std::io::stdout().lock();
     // In N chunks mode - we will write to `num_chunks` files
-    let mut out_files: Vec<OutFile> = Vec::new();
+    let mut out_files: OutFiles = OutFiles::new();
 
     // Calculate chunk size base and modulo reminder
     // to be used in calculating `num_bytes_should_be_written` later on
@@ -1402,7 +1486,7 @@ where
     // Otherwise keep writer optional, to be instantiated later if there is data
     // to write for the associated chunk.
     if kth_chunk.is_none() {
-        out_files = get_out_files(num_chunks, settings, settings.elide_empty_files)?;
+        out_files = OutFiles::init(num_chunks, settings, settings.elide_empty_files)?;
     }
 
     let mut chunk_number = 1;
@@ -1429,7 +1513,7 @@ where
             None => {
                 // Should write into a file
                 let idx = (chunk_number - 1) as usize;
-                let writer = out_files[idx].get_writer(settings)?;
+                let writer = out_files.get_writer(idx, settings)?;
                 custom_write_all(bytes, writer, settings)?;
             }
         }
@@ -1503,14 +1587,14 @@ where
     // In Kth chunk of N mode - we will write to stdout instead of to a file.
     let mut stdout_writer = std::io::stdout().lock();
     // In N chunks mode - we will write to `num_chunks` files
-    let mut out_files: Vec<OutFile> = Vec::new();
+    let mut out_files: OutFiles = OutFiles::new();
 
     // If in N chunks mode
     // Create one writer for each chunk.
     // This will create each of the underlying files
     // or stdin pipes to child shell/command processes if in `--filter` mode
     if kth_chunk.is_none() {
-        out_files = get_out_files(num_chunks, settings, false)?;
+        out_files = OutFiles::init(num_chunks, settings, false)?;
     }
 
     let num_chunks: usize = num_chunks.try_into().unwrap();
@@ -1532,7 +1616,7 @@ where
                 }
             }
             None => {
-                let writer = out_files[i % num_chunks].get_writer(settings)?;
+                let writer = out_files.get_writer(i % num_chunks, settings)?;
                 let writer_stdin_open = custom_write_all(bytes, writer, settings)?;
                 if !writer_stdin_open {
                     closed_writers += 1;

From 440e7b1a597091b5b0e3d81007f55ea6fbe96ee3 Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Fri, 24 Nov 2023 19:10:47 -0500
Subject: [PATCH 067/429] split: r-chunk test compliance

---
 src/uu/split/src/split.rs | 22 ++++++++++++++++++----
 1 file changed, 18 insertions(+), 4 deletions(-)

diff --git a/src/uu/split/src/split.rs b/src/uu/split/src/split.rs
index e5f9032c947..932013ad9b3 100644
--- a/src/uu/split/src/split.rs
+++ b/src/uu/split/src/split.rs
@@ -1167,7 +1167,7 @@ trait ManageOutFiles {
     /// Each OutFile is generated with filename, while the writer for it could be
     /// optional, to be instantiated later by the calling function as needed.
     /// Optional writers could happen in the following situations:
-    /// * in [`n_chunks_by_line`] if `elide_empty_files` parameter is set to `true`
+    /// * in [`n_chunks_by_line`] and [`n_chunks_by_line_round_robin`] if `elide_empty_files` parameter is set to `true`
     /// * if the number of files is greater than system limit for open files
     fn init(num_files: u64, settings: &Settings, is_writer_optional: bool) -> UResult<Self>
     where
@@ -1584,6 +1584,12 @@ fn n_chunks_by_line_round_robin<R>(
 where
     R: BufRead,
 {
+    // Get the size of the input in bytes and compute the number
+    // of bytes per chunk.
+    let initial_buf = &mut Vec::new();
+    let num_bytes = get_input_size(&settings.input, reader, initial_buf, &settings.io_blksize)?;
+    let reader = initial_buf.chain(reader);
+
     // In Kth chunk of N mode - we will write to stdout instead of to a file.
     let mut stdout_writer = std::io::stdout().lock();
     // In N chunks mode - we will write to `num_chunks` files
@@ -1594,16 +1600,22 @@ where
     // This will create each of the underlying files
     // or stdin pipes to child shell/command processes if in `--filter` mode
     if kth_chunk.is_none() {
-        out_files = OutFiles::init(num_chunks, settings, false)?;
+        out_files = OutFiles::init(num_chunks, settings, settings.elide_empty_files)?;
     }
 
     let num_chunks: usize = num_chunks.try_into().unwrap();
     let sep = settings.separator;
     let mut closed_writers = 0;
+    let mut num_bytes_written = 0;
+
     for (i, line_result) in reader.split(sep).enumerate() {
-        // add separator back in at the end of the line
         let mut line = line_result?;
-        line.push(sep);
+        // add separator back in at the end of the line,
+        // since `reader.split(sep)` removes it,
+        // except if the last line did not end with separator character
+        if (num_bytes_written + line.len() as u64) < num_bytes {
+            line.push(sep);
+        }
         let bytes = line.as_slice();
 
         match kth_chunk {
@@ -1627,6 +1639,8 @@ where
                 }
             }
         }
+        let num_line_bytes = bytes.len() as u64;
+        num_bytes_written += num_line_bytes;
     }
 
     Ok(())

From 7b2a3e236e86786f35e3c9314cb1e8916ad37247 Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Fri, 24 Nov 2023 20:56:05 -0500
Subject: [PATCH 068/429] split: r-chunk tests and infinite input

---
 src/uu/split/src/split.rs   | 66 ++++++++++++-------------------------
 tests/by-util/test_split.rs | 26 +++++++++++++--
 2 files changed, 44 insertions(+), 48 deletions(-)

diff --git a/src/uu/split/src/split.rs b/src/uu/split/src/split.rs
index 932013ad9b3..a837bcb21ec 100644
--- a/src/uu/split/src/split.rs
+++ b/src/uu/split/src/split.rs
@@ -622,7 +622,7 @@ fn custom_write_all<T: Write>(
 
 /// Get the size of the input file in bytes
 /// Used only for subset of `--number=CHUNKS` strategy, as there is a need
-/// to determine input file size upfront in order to know chunk size
+/// to determine input file size upfront in order to estimate the chunk size
 /// to be written into each of N files/chunks:
 /// * N       split into N files based on size of input
 /// * K/N     output Kth of N to stdout
@@ -1141,23 +1141,6 @@ struct OutFile {
     is_new: bool,
 }
 
-// impl OutFile {
-//     /// Get the writer for the output file.
-//     /// Instantiate the writer if it has not been instantiated upfront
-//     /// or temporarily closed to free up system resources
-//     fn get_writer(&mut self, settings: &Settings) -> UResult<&mut BufWriter<Box<dyn Write>>> {
-//         if self.maybe_writer.is_some() {
-//             Ok(self.maybe_writer.as_mut().unwrap())
-//         } else {
-//             // Writer was not instantiated upfront or was temporarily closed due to system resources constraints.
-//             // Instantiate it and record for future use.
-//             self.maybe_writer =
-//                 Some(settings.instantiate_current_writer(self.filename.as_str(), self.is_new)?);
-//             Ok(self.maybe_writer.as_mut().unwrap())
-//         }
-//     }
-// }
-
 /// A set of output files
 /// Used in [`n_chunks_by_byte`], [`n_chunks_by_line`]
 /// and [`n_chunks_by_line_round_robin`] functions.
@@ -1551,7 +1534,11 @@ where
 }
 
 /// Split a file or STDIN into a specific number of chunks by line, but
-/// assign lines via round-robin
+/// assign lines via round-robin.
+/// Note: There is no need to know the size of the input upfront for this method,
+/// since the lines are assigned to chunks randomly and the size of each chunk
+/// does not need to be estimated. As a result, "infinite" inputs are supported
+/// for this method, i.e. `yes | split -n r/10` or `yes | split -n r/3/11`
 ///
 /// In Kth chunk of N mode - writes to stdout the contents of the chunk identified by `kth_chunk`
 ///
@@ -1584,12 +1571,6 @@ fn n_chunks_by_line_round_robin<R>(
 where
     R: BufRead,
 {
-    // Get the size of the input in bytes and compute the number
-    // of bytes per chunk.
-    let initial_buf = &mut Vec::new();
-    let num_bytes = get_input_size(&settings.input, reader, initial_buf, &settings.io_blksize)?;
-    let reader = initial_buf.chain(reader);
-
     // In Kth chunk of N mode - we will write to stdout instead of to a file.
     let mut stdout_writer = std::io::stdout().lock();
     // In N chunks mode - we will write to `num_chunks` files
@@ -1606,23 +1587,20 @@ where
     let num_chunks: usize = num_chunks.try_into().unwrap();
     let sep = settings.separator;
     let mut closed_writers = 0;
-    let mut num_bytes_written = 0;
 
-    for (i, line_result) in reader.split(sep).enumerate() {
-        let mut line = line_result?;
-        // add separator back in at the end of the line,
-        // since `reader.split(sep)` removes it,
-        // except if the last line did not end with separator character
-        if (num_bytes_written + line.len() as u64) < num_bytes {
-            line.push(sep);
-        }
-        let bytes = line.as_slice();
+    let mut i = 0;
+    loop {
+        let line = &mut Vec::new();
+        let num_bytes_read = reader.by_ref().read_until(sep, line)?;
 
+        // if there is nothing else to read - exit the loop
+        if num_bytes_read == 0 {
+            break;
+        };
+
+        let bytes = line.as_slice();
         match kth_chunk {
             Some(chunk_number) => {
-                // The `.enumerate()` method returns index `i` starting with 0,
-                // but chunk number is given as a 1-indexed number,
-                // so compare to `chunk_number - 1`
                 if (i % num_chunks) == (chunk_number - 1) as usize {
                     stdout_writer.write_all(bytes)?;
                 }
@@ -1632,17 +1610,15 @@ where
                 let writer_stdin_open = custom_write_all(bytes, writer, settings)?;
                 if !writer_stdin_open {
                     closed_writers += 1;
-                    if closed_writers == num_chunks {
-                        // all writers are closed - stop reading
-                        break;
-                    }
                 }
             }
         }
-        let num_line_bytes = bytes.len() as u64;
-        num_bytes_written += num_line_bytes;
+        i += 1;
+        if closed_writers == num_chunks {
+            // all writers are closed - stop reading
+            break;
+        }
     }
-
     Ok(())
 }
 
diff --git a/tests/by-util/test_split.rs b/tests/by-util/test_split.rs
index 2c9a56bddee..acb8ab56140 100644
--- a/tests/by-util/test_split.rs
+++ b/tests/by-util/test_split.rs
@@ -2,11 +2,13 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
-// spell-checker:ignore xzaaa sixhundredfiftyonebytes ninetyonebytes threebytes asciilowercase ghijkl mnopq rstuv wxyz fivelines twohundredfortyonebytes onehundredlines nbbbb dxen ncccc
+// spell-checker:ignore xzaaa sixhundredfiftyonebytes ninetyonebytes threebytes asciilowercase ghijkl mnopq rstuv wxyz fivelines twohundredfortyonebytes onehundredlines nbbbb dxen ncccc rlimit NOFILE
 
 use crate::common::util::{AtPath, TestScenario};
 use rand::{thread_rng, Rng, SeedableRng};
 use regex::Regex;
+#[cfg(any(target_os = "linux", target_os = "android"))]
+use rlimit::Resource;
 #[cfg(not(windows))]
 use std::env;
 use std::path::Path;
@@ -1250,10 +1252,19 @@ fn test_number_by_lines_kth_no_end_sep() {
         .succeeds()
         .stdout_only("2222\n");
     new_ucmd!()
-        .args(&["-e", "-n", "l/8/10"])
+        .args(&["-e", "-n", "l/2/2"])
         .pipe_in("1\n2222\n3\n4")
         .succeeds()
-        .stdout_only("3\n");
+        .stdout_only("3\n4");
+}
+
+#[test]
+fn test_number_by_lines_rr_kth_no_end_sep() {
+    new_ucmd!()
+        .args(&["-n", "r/2/3"])
+        .pipe_in("1\n2\n3\n4\n5")
+        .succeeds()
+        .stdout_only("2\n5");
 }
 
 #[test]
@@ -1626,6 +1637,15 @@ fn test_round_robin() {
     assert_eq!(at.read("xab"), "2\n4\n");
 }
 
+#[test]
+#[cfg(any(target_os = "linux", target_os = "android"))]
+fn test_round_robin_limited_file_descriptors() {
+    new_ucmd!()
+        .args(&["-n", "r/40", "onehundredlines.txt"])
+        .limit(Resource::NOFILE, 9, 9)
+        .succeeds();
+}
+
 #[test]
 fn test_split_invalid_input() {
     // Test if stdout/stderr for '--lines' option is correct

From f8f63461264208ccd26842ec02f61f120c751072 Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Sat, 25 Nov 2023 18:16:34 -0500
Subject: [PATCH 069/429] wc: fix FilesDisabled error message

---
 src/uu/wc/src/wc.rs      | 12 ++++++++----
 tests/by-util/test_wc.rs |  3 ++-
 2 files changed, 10 insertions(+), 5 deletions(-)

diff --git a/src/uu/wc/src/wc.rs b/src/uu/wc/src/wc.rs
index 663bbda151b..ae9b24f5d84 100644
--- a/src/uu/wc/src/wc.rs
+++ b/src/uu/wc/src/wc.rs
@@ -167,7 +167,7 @@ impl<'a> Inputs<'a> {
                     None => Ok(Self::Files0From(input)),
                 }
             }
-            (Some(_), Some(_)) => Err(WcError::FilesDisabled.into()),
+            (Some(mut files), Some(_)) => Err(WcError::files_disabled(files.next()).into()),
         }
     }
 
@@ -342,8 +342,8 @@ impl TotalWhen {
 
 #[derive(Debug, Error)]
 enum WcError {
-    #[error("file operands cannot be combined with --files0-from")]
-    FilesDisabled,
+    #[error("extra operand '{extra}'\nfile operands cannot be combined with --files0-from")]
+    FilesDisabled { extra: Cow<'static, str> },
     #[error("when reading file names from stdin, no file name of '-' allowed")]
     StdinReprNotAllowed,
     #[error("invalid zero-length file name")]
@@ -365,11 +365,15 @@ impl WcError {
             None => Self::ZeroLengthFileName,
         }
     }
+    fn files_disabled(first_extra: Option<&OsString>) -> Self {
+        let extra = first_extra.unwrap().to_string_lossy().into_owned().into();
+        Self::FilesDisabled { extra }
+    }
 }
 
 impl UError for WcError {
     fn usage(&self) -> bool {
-        matches!(self, Self::FilesDisabled)
+        matches!(self, Self::FilesDisabled { .. })
     }
 }
 
diff --git a/tests/by-util/test_wc.rs b/tests/by-util/test_wc.rs
index 6417470c57f..8358a542a23 100644
--- a/tests/by-util/test_wc.rs
+++ b/tests/by-util/test_wc.rs
@@ -423,7 +423,8 @@ fn test_files_from_pseudo_filesystem() {
 
 #[test]
 fn test_files0_disabled_files_argument() {
-    const MSG: &str = "file operands cannot be combined with --files0-from";
+    const MSG: &str =
+        "extra operand 'lorem_ipsum.txt'\nfile operands cannot be combined with --files0-from";
     new_ucmd!()
         .args(&["--files0-from=files0_list.txt"])
         .arg("lorem_ipsum.txt")

From 04e568db7354347a103f88e6a1a0c34c74d54128 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Sun, 26 Nov 2023 00:47:15 +0000
Subject: [PATCH 070/429] chore(deps): update
 davidanson/markdownlint-cli2-action action to v14

---
 .github/workflows/CICD.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index 66ee23168b8..8dfa0b1d103 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -133,7 +133,7 @@ jobs:
       shell: bash
       run: |
         RUSTDOCFLAGS="-Dwarnings" cargo doc  ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }} --no-deps --workspace --document-private-items
-    - uses: DavidAnson/markdownlint-cli2-action@v13
+    - uses: DavidAnson/markdownlint-cli2-action@v14
       with:
         fix: "true"
         globs: |

From b6553edfb7ecefe54aecc21bc130e878852c9ba5 Mon Sep 17 00:00:00 2001
From: Gary Yendell <gary.yendell@diamond.ac.uk>
Date: Sat, 25 Nov 2023 17:35:48 +0000
Subject: [PATCH 071/429] hashsum: Remove usage of crash! macro

---
 src/uu/hashsum/src/hashsum.rs | 204 +++++++++++++++++-----------------
 1 file changed, 105 insertions(+), 99 deletions(-)

diff --git a/src/uu/hashsum/src/hashsum.rs b/src/uu/hashsum/src/hashsum.rs
index d27b09b98ed..22ef4152070 100644
--- a/src/uu/hashsum/src/hashsum.rs
+++ b/src/uu/hashsum/src/hashsum.rs
@@ -20,12 +20,13 @@ use std::io::{self, stdin, BufRead, BufReader, Read};
 use std::iter;
 use std::num::ParseIntError;
 use std::path::Path;
+use uucore::error::USimpleError;
 use uucore::error::{FromIo, UError, UResult};
 use uucore::sum::{
     Blake2b, Blake3, Digest, DigestWriter, Md5, Sha1, Sha224, Sha256, Sha384, Sha3_224, Sha3_256,
     Sha3_384, Sha3_512, Sha512, Shake128, Shake256,
 };
-use uucore::{crash, display::Quotable, show_warning};
+use uucore::{display::Quotable, show_warning};
 use uucore::{format_usage, help_about, help_usage};
 
 const NAME: &str = "hashsum";
@@ -51,28 +52,32 @@ struct Options {
 ///
 /// # Returns
 ///
-/// Returns a tuple containing the algorithm name, the hasher instance, and the output length in bits.
-///
-/// # Panics
-///
-/// Panics if the length is not a multiple of 8 or if it is greater than 512.
-fn create_blake2b(matches: &ArgMatches) -> (&'static str, Box<dyn Digest>, usize) {
+/// Returns a UResult of a tuple containing the algorithm name, the hasher instance, and
+/// the output length in bits or an Err if the length is not a multiple of 8 or if it is
+/// greater than 512.
+fn create_blake2b(matches: &ArgMatches) -> UResult<(&'static str, Box<dyn Digest>, usize)> {
     match matches.get_one::<usize>("length") {
-        Some(0) | None => ("BLAKE2", Box::new(Blake2b::new()) as Box<dyn Digest>, 512),
+        Some(0) | None => Ok(("BLAKE2", Box::new(Blake2b::new()) as Box<dyn Digest>, 512)),
         Some(length_in_bits) => {
             if *length_in_bits > 512 {
-                crash!(1, "Invalid length (maximum digest length is 512 bits)")
+                return Err(USimpleError::new(
+                    1,
+                    "Invalid length (maximum digest length is 512 bits)",
+                ));
             }
 
             if length_in_bits % 8 == 0 {
                 let length_in_bytes = length_in_bits / 8;
-                (
+                Ok((
                     "BLAKE2",
                     Box::new(Blake2b::with_output_bytes(length_in_bytes)),
                     *length_in_bits,
-                )
+                ))
             } else {
-                crash!(1, "Invalid length (expected a multiple of 8)")
+                Err(USimpleError::new(
+                    1,
+                    "Invalid length (expected a multiple of 8)",
+                ))
             }
         }
     }
@@ -82,38 +87,36 @@ fn create_blake2b(matches: &ArgMatches) -> (&'static str, Box<dyn Digest>, usize
 ///
 /// # Returns
 ///
-/// Returns a tuple containing the algorithm name, the hasher instance, and the output length in bits.
-///
-/// # Panics
-///
-/// Panics if an unsupported output size is provided, or if the `--bits` flag is missing.
-fn create_sha3(matches: &ArgMatches) -> (&'static str, Box<dyn Digest>, usize) {
+/// Returns a UResult of a tuple containing the algorithm name, the hasher instance, and
+/// the output length in bits or an Err if an unsupported output size is provided, or if
+/// the `--bits` flag is missing.
+fn create_sha3(matches: &ArgMatches) -> UResult<(&'static str, Box<dyn Digest>, usize)> {
     match matches.get_one::<usize>("bits") {
-        Some(224) => (
+        Some(224) => Ok((
             "SHA3-224",
             Box::new(Sha3_224::new()) as Box<dyn Digest>,
             224,
-        ),
-        Some(256) => (
+        )),
+        Some(256) => Ok((
             "SHA3-256",
             Box::new(Sha3_256::new()) as Box<dyn Digest>,
             256,
-        ),
-        Some(384) => (
+        )),
+        Some(384) => Ok((
             "SHA3-384",
             Box::new(Sha3_384::new()) as Box<dyn Digest>,
             384,
-        ),
-        Some(512) => (
+        )),
+        Some(512) => Ok((
             "SHA3-512",
             Box::new(Sha3_512::new()) as Box<dyn Digest>,
             512,
-        ),
-        Some(_) => crash!(
+        )),
+        Some(_) => Err(USimpleError::new(
             1,
-            "Invalid output size for SHA3 (expected 224, 256, 384, or 512)"
-        ),
-        None => crash!(1, "--bits required for SHA3"),
+            "Invalid output size for SHA3 (expected 224, 256, 384, or 512)",
+        )),
+        None => Err(USimpleError::new(1, "--bits required for SHA3")),
     }
 }
 
@@ -121,19 +124,16 @@ fn create_sha3(matches: &ArgMatches) -> (&'static str, Box<dyn Digest>, usize) {
 ///
 /// # Returns
 ///
-/// Returns a tuple containing the algorithm name, the hasher instance, and the output length in bits.
-///
-/// # Panics
-///
-/// Panics if the `--bits` flag is missing.
-fn create_shake128(matches: &ArgMatches) -> (&'static str, Box<dyn Digest>, usize) {
+/// Returns a UResult of a tuple containing the algorithm name, the hasher instance, and
+/// the output length in bits, or an Err if `--bits` flag is missing.
+fn create_shake128(matches: &ArgMatches) -> UResult<(&'static str, Box<dyn Digest>, usize)> {
     match matches.get_one::<usize>("bits") {
-        Some(bits) => (
+        Some(bits) => Ok((
             "SHAKE128",
             Box::new(Shake128::new()) as Box<dyn Digest>,
             *bits,
-        ),
-        None => crash!(1, "--bits required for SHAKE-128"),
+        )),
+        None => Err(USimpleError::new(1, "--bits required for SHAKE-128")),
     }
 }
 
@@ -141,19 +141,16 @@ fn create_shake128(matches: &ArgMatches) -> (&'static str, Box<dyn Digest>, usiz
 ///
 /// # Returns
 ///
-/// Returns a tuple containing the algorithm name, the hasher instance, and the output length in bits.
-///
-/// # Panics
-///
-/// Panics if the `--bits` flag is missing.
-fn create_shake256(matches: &ArgMatches) -> (&'static str, Box<dyn Digest>, usize) {
+/// Returns a UResult of a tuple containing the algorithm name, the hasher instance, and
+/// the output length in bits, or an Err if the `--bits` flag is missing.
+fn create_shake256(matches: &ArgMatches) -> UResult<(&'static str, Box<dyn Digest>, usize)> {
     match matches.get_one::<usize>("bits") {
-        Some(bits) => (
+        Some(bits) => Ok((
             "SHAKE256",
             Box::new(Shake256::new()) as Box<dyn Digest>,
             *bits,
-        ),
-        None => crash!(1, "--bits required for SHAKE-256"),
+        )),
+        None => Err(USimpleError::new(1, "--bits required for SHAKE-256")),
     }
 }
 
@@ -166,46 +163,46 @@ fn create_shake256(matches: &ArgMatches) -> (&'static str, Box<dyn Digest>, usiz
 ///
 /// # Returns
 ///
-/// Returns a tuple containing the algorithm name, the hasher instance, and the output length in bits.
+/// Returns a UResult of a tuple containing the algorithm name, the hasher instance, and
+/// the output length in bits, or an Err if a matching algorithm is not found.
 fn detect_algo(
     program: &str,
     matches: &ArgMatches,
-) -> (&'static str, Box<dyn Digest + 'static>, usize) {
-    let (name, alg, output_bits) = match program {
-        "md5sum" => ("MD5", Box::new(Md5::new()) as Box<dyn Digest>, 128),
-        "sha1sum" => ("SHA1", Box::new(Sha1::new()) as Box<dyn Digest>, 160),
-        "sha224sum" => ("SHA224", Box::new(Sha224::new()) as Box<dyn Digest>, 224),
-        "sha256sum" => ("SHA256", Box::new(Sha256::new()) as Box<dyn Digest>, 256),
-        "sha384sum" => ("SHA384", Box::new(Sha384::new()) as Box<dyn Digest>, 384),
-        "sha512sum" => ("SHA512", Box::new(Sha512::new()) as Box<dyn Digest>, 512),
+) -> UResult<(&'static str, Box<dyn Digest + 'static>, usize)> {
+    match program {
+        "md5sum" => Ok(("MD5", Box::new(Md5::new()) as Box<dyn Digest>, 128)),
+        "sha1sum" => Ok(("SHA1", Box::new(Sha1::new()) as Box<dyn Digest>, 160)),
+        "sha224sum" => Ok(("SHA224", Box::new(Sha224::new()) as Box<dyn Digest>, 224)),
+        "sha256sum" => Ok(("SHA256", Box::new(Sha256::new()) as Box<dyn Digest>, 256)),
+        "sha384sum" => Ok(("SHA384", Box::new(Sha384::new()) as Box<dyn Digest>, 384)),
+        "sha512sum" => Ok(("SHA512", Box::new(Sha512::new()) as Box<dyn Digest>, 512)),
         "b2sum" => create_blake2b(matches),
-        "b3sum" => ("BLAKE3", Box::new(Blake3::new()) as Box<dyn Digest>, 256),
+        "b3sum" => Ok(("BLAKE3", Box::new(Blake3::new()) as Box<dyn Digest>, 256)),
         "sha3sum" => create_sha3(matches),
-        "sha3-224sum" => (
+        "sha3-224sum" => Ok((
             "SHA3-224",
             Box::new(Sha3_224::new()) as Box<dyn Digest>,
             224,
-        ),
-        "sha3-256sum" => (
+        )),
+        "sha3-256sum" => Ok((
             "SHA3-256",
             Box::new(Sha3_256::new()) as Box<dyn Digest>,
             256,
-        ),
-        "sha3-384sum" => (
+        )),
+        "sha3-384sum" => Ok((
             "SHA3-384",
             Box::new(Sha3_384::new()) as Box<dyn Digest>,
             384,
-        ),
-        "sha3-512sum" => (
+        )),
+        "sha3-512sum" => Ok((
             "SHA3-512",
             Box::new(Sha3_512::new()) as Box<dyn Digest>,
             512,
-        ),
+        )),
         "shake128sum" => create_shake128(matches),
         "shake256sum" => create_shake256(matches),
         _ => create_algorithm_from_flags(matches),
-    };
-    (name, alg, output_bits)
+    }
 }
 
 /// Creates a hasher instance based on the command-line flags.
@@ -216,80 +213,89 @@ fn detect_algo(
 ///
 /// # Returns
 ///
-/// Returns a tuple containing the algorithm name, the hasher instance, and the output length in bits.
-///
-/// # Panics
-///
-/// Panics if multiple hash algorithms are specified or if a required flag is missing.
+/// Returns a UResult of a tuple containing the algorithm name, the hasher instance, and
+/// the output length in bits or an Err if multiple hash algorithms are specified or if a
+/// required flag is missing.
 #[allow(clippy::cognitive_complexity)]
-fn create_algorithm_from_flags(matches: &ArgMatches) -> (&'static str, Box<dyn Digest>, usize) {
+fn create_algorithm_from_flags(
+    matches: &ArgMatches,
+) -> UResult<(&'static str, Box<dyn Digest>, usize)> {
     let mut alg: Option<Box<dyn Digest>> = None;
     let mut name: &'static str = "";
     let mut output_bits = 0;
-    let mut set_or_crash = |n, val, bits| {
+    let mut set_or_err = |n, val, bits| {
         if alg.is_some() {
-            crash!(1, "You cannot combine multiple hash algorithms!");
+            return Err(USimpleError::new(
+                1,
+                "You cannot combine multiple hash algorithms!",
+            ));
         };
         name = n;
         alg = Some(val);
         output_bits = bits;
+
+        Ok(())
     };
 
     if matches.get_flag("md5") {
-        set_or_crash("MD5", Box::new(Md5::new()), 128);
+        set_or_err("MD5", Box::new(Md5::new()), 128)?;
     }
     if matches.get_flag("sha1") {
-        set_or_crash("SHA1", Box::new(Sha1::new()), 160);
+        set_or_err("SHA1", Box::new(Sha1::new()), 160)?;
     }
     if matches.get_flag("sha224") {
-        set_or_crash("SHA224", Box::new(Sha224::new()), 224);
+        set_or_err("SHA224", Box::new(Sha224::new()), 224)?;
     }
     if matches.get_flag("sha256") {
-        set_or_crash("SHA256", Box::new(Sha256::new()), 256);
+        set_or_err("SHA256", Box::new(Sha256::new()), 256)?;
     }
     if matches.get_flag("sha384") {
-        set_or_crash("SHA384", Box::new(Sha384::new()), 384);
+        set_or_err("SHA384", Box::new(Sha384::new()), 384)?;
     }
     if matches.get_flag("sha512") {
-        set_or_crash("SHA512", Box::new(Sha512::new()), 512);
+        set_or_err("SHA512", Box::new(Sha512::new()), 512)?;
     }
     if matches.get_flag("b2sum") {
-        set_or_crash("BLAKE2", Box::new(Blake2b::new()), 512);
+        set_or_err("BLAKE2", Box::new(Blake2b::new()), 512)?;
     }
     if matches.get_flag("b3sum") {
-        set_or_crash("BLAKE3", Box::new(Blake3::new()), 256);
+        set_or_err("BLAKE3", Box::new(Blake3::new()), 256)?;
     }
     if matches.get_flag("sha3") {
-        let (n, val, bits) = create_sha3(matches);
-        set_or_crash(n, val, bits);
+        let (n, val, bits) = create_sha3(matches)?;
+        set_or_err(n, val, bits)?;
     }
     if matches.get_flag("sha3-224") {
-        set_or_crash("SHA3-224", Box::new(Sha3_224::new()), 224);
+        set_or_err("SHA3-224", Box::new(Sha3_224::new()), 224)?;
     }
     if matches.get_flag("sha3-256") {
-        set_or_crash("SHA3-256", Box::new(Sha3_256::new()), 256);
+        set_or_err("SHA3-256", Box::new(Sha3_256::new()), 256)?;
     }
     if matches.get_flag("sha3-384") {
-        set_or_crash("SHA3-384", Box::new(Sha3_384::new()), 384);
+        set_or_err("SHA3-384", Box::new(Sha3_384::new()), 384)?;
     }
     if matches.get_flag("sha3-512") {
-        set_or_crash("SHA3-512", Box::new(Sha3_512::new()), 512);
+        set_or_err("SHA3-512", Box::new(Sha3_512::new()), 512)?;
     }
     if matches.get_flag("shake128") {
         match matches.get_one::<usize>("bits") {
-            Some(bits) => set_or_crash("SHAKE128", Box::new(Shake128::new()), *bits),
-            None => crash!(1, "--bits required for SHAKE-128"),
-        }
+            Some(bits) => set_or_err("SHAKE128", Box::new(Shake128::new()), *bits)?,
+            None => return Err(USimpleError::new(1, "--bits required for SHAKE-128")),
+        };
     }
     if matches.get_flag("shake256") {
         match matches.get_one::<usize>("bits") {
-            Some(bits) => set_or_crash("SHAKE256", Box::new(Shake256::new()), *bits),
-            None => crash!(1, "--bits required for SHAKE-256"),
-        }
+            Some(bits) => set_or_err("SHAKE256", Box::new(Shake256::new()), *bits)?,
+            None => return Err(USimpleError::new(1, "--bits required for SHAKE-256")),
+        };
     }
 
-    let alg = alg.unwrap_or_else(|| crash!(1, "You must specify hash algorithm!"));
-    (name, alg, output_bits)
+    let alg = match alg {
+        Some(a) => a,
+        None => return Err(USimpleError::new(1, "You must specify hash algorithm!")),
+    };
+
+    Ok((name, alg, output_bits))
 }
 
 // TODO: return custom error type
@@ -319,7 +325,7 @@ pub fn uumain(mut args: impl uucore::Args) -> UResult<()> {
     //        least somewhat better from a user's perspective.
     let matches = command.try_get_matches_from(args)?;
 
-    let (name, algo, bits) = detect_algo(&binary_name, &matches);
+    let (name, algo, bits) = detect_algo(&binary_name, &matches)?;
 
     let binary = if matches.get_flag("binary") {
         true

From 16f6a136971f79293cde5b615453eca237d9148c Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Sun, 26 Nov 2023 15:14:48 -0500
Subject: [PATCH 072/429] wc: change where to unwrap

---
 src/uu/wc/src/wc.rs | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/src/uu/wc/src/wc.rs b/src/uu/wc/src/wc.rs
index ae9b24f5d84..83081124d1b 100644
--- a/src/uu/wc/src/wc.rs
+++ b/src/uu/wc/src/wc.rs
@@ -167,7 +167,9 @@ impl<'a> Inputs<'a> {
                     None => Ok(Self::Files0From(input)),
                 }
             }
-            (Some(mut files), Some(_)) => Err(WcError::files_disabled(files.next()).into()),
+            (Some(mut files), Some(_)) => {
+                Err(WcError::files_disabled(files.next().unwrap()).into())
+            }
         }
     }
 
@@ -365,8 +367,8 @@ impl WcError {
             None => Self::ZeroLengthFileName,
         }
     }
-    fn files_disabled(first_extra: Option<&OsString>) -> Self {
-        let extra = first_extra.unwrap().to_string_lossy().into_owned().into();
+    fn files_disabled(first_extra: &OsString) -> Self {
+        let extra = first_extra.to_string_lossy().into_owned().into();
         Self::FilesDisabled { extra }
     }
 }

From 016ae34d50e2e6e5ec50fca6fc88ad257a4758a2 Mon Sep 17 00:00:00 2001
From: Jeffrey Finkelstein <jeffrey.finkelstein@protonmail.com>
Date: Sun, 12 Mar 2023 19:02:48 -0400
Subject: [PATCH 073/429] dd: add Settings.buffered field

Add the `Settings.buffered` field to indicate whether partial output
blocks should be buffered until they are complete.
---
 src/uu/dd/src/dd.rs                   |  8 +++
 src/uu/dd/src/parseargs.rs            | 74 +++++++++++++++------------
 src/uu/dd/src/parseargs/unit_tests.rs |  1 +
 3 files changed, 49 insertions(+), 34 deletions(-)

diff --git a/src/uu/dd/src/dd.rs b/src/uu/dd/src/dd.rs
index b79ae22da4e..7d9138791cf 100644
--- a/src/uu/dd/src/dd.rs
+++ b/src/uu/dd/src/dd.rs
@@ -76,6 +76,8 @@ struct Settings {
     oconv: OConvFlags,
     oflags: OFlags,
     status: Option<StatusLevel>,
+    /// Whether the output writer should buffer partial blocks until complete.
+    buffered: bool,
 }
 
 /// A timer which triggers on a given interval
@@ -128,6 +130,12 @@ enum Num {
     Bytes(u64),
 }
 
+impl Default for Num {
+    fn default() -> Self {
+        Self::Blocks(0)
+    }
+}
+
 impl Num {
     fn force_bytes_if(self, force: bool) -> Self {
         match self {
diff --git a/src/uu/dd/src/parseargs.rs b/src/uu/dd/src/parseargs.rs
index 0ff6e752c02..60ce9a6971f 100644
--- a/src/uu/dd/src/parseargs.rs
+++ b/src/uu/dd/src/parseargs.rs
@@ -35,41 +35,28 @@ pub enum ParseError {
 }
 
 /// Contains a temporary state during parsing of the arguments
-#[derive(Debug, PartialEq)]
+#[derive(Debug, PartialEq, Default)]
 pub struct Parser {
     infile: Option<String>,
     outfile: Option<String>,
-    ibs: usize,
-    obs: usize,
+    /// The block size option specified on the command-line, if any.
+    bs: Option<usize>,
+    /// The input block size option specified on the command-line, if any.
+    ibs: Option<usize>,
+    /// The output block size option specified on the command-line, if any.
+    obs: Option<usize>,
     cbs: Option<usize>,
     skip: Num,
     seek: Num,
     count: Option<Num>,
     conv: ConvFlags,
+    /// Whether a data-transforming `conv` option has been specified.
+    is_conv_specified: bool,
     iflag: IFlags,
     oflag: OFlags,
     status: Option<StatusLevel>,
 }
 
-impl Default for Parser {
-    fn default() -> Self {
-        Self {
-            ibs: 512,
-            obs: 512,
-            cbs: None,
-            infile: None,
-            outfile: None,
-            skip: Num::Blocks(0),
-            seek: Num::Blocks(0),
-            count: None,
-            conv: ConvFlags::default(),
-            iflag: IFlags::default(),
-            oflag: OFlags::default(),
-            status: None,
-        }
-    }
-}
-
 #[derive(Debug, Default, PartialEq, Eq)]
 pub struct ConvFlags {
     ascii: bool,
@@ -212,15 +199,34 @@ impl Parser {
             fsync: conv.fsync,
         };
 
+        // Input and output block sizes.
+        //
+        // The `bs` option takes precedence. If either is not
+        // provided, `ibs` and `obs` are each 512 bytes by default.
+        let (ibs, obs) = match self.bs {
+            None => (self.ibs.unwrap_or(512), self.obs.unwrap_or(512)),
+            Some(bs) => (bs, bs),
+        };
+
+        // Whether to buffer partial output blocks until they are completed.
+        //
+        // From the GNU `dd` documentation for the `bs=BYTES` option:
+        //
+        // > [...] if no data-transforming 'conv' option is specified,
+        // > input is copied to the output as soon as it's read, even if
+        // > it is smaller than the block size.
+        //
+        let buffered = self.bs.is_none() || self.is_conv_specified;
+
         let skip = self
             .skip
             .force_bytes_if(self.iflag.skip_bytes)
-            .to_bytes(self.ibs as u64);
+            .to_bytes(ibs as u64);
 
         let seek = self
             .seek
             .force_bytes_if(self.oflag.seek_bytes)
-            .to_bytes(self.obs as u64);
+            .to_bytes(obs as u64);
 
         let count = self.count.map(|c| c.force_bytes_if(self.iflag.count_bytes));
 
@@ -230,8 +236,9 @@ impl Parser {
             count,
             iconv,
             oconv,
-            ibs: self.ibs,
-            obs: self.obs,
+            ibs,
+            obs,
+            buffered,
             infile: self.infile,
             outfile: self.outfile,
             iflags: self.iflag,
@@ -244,18 +251,17 @@ impl Parser {
         match operand.split_once('=') {
             None => return Err(ParseError::UnrecognizedOperand(operand.to_string())),
             Some((k, v)) => match k {
-                "bs" => {
-                    let bs = Self::parse_bytes(k, v)?;
-                    self.ibs = bs;
-                    self.obs = bs;
-                }
+                "bs" => self.bs = Some(Self::parse_bytes(k, v)?),
                 "cbs" => self.cbs = Some(Self::parse_bytes(k, v)?),
-                "conv" => self.parse_conv_flags(v)?,
+                "conv" => {
+                    self.is_conv_specified = true;
+                    self.parse_conv_flags(v)?;
+                }
                 "count" => self.count = Some(Self::parse_n(v)?),
-                "ibs" => self.ibs = Self::parse_bytes(k, v)?,
+                "ibs" => self.ibs = Some(Self::parse_bytes(k, v)?),
                 "if" => self.infile = Some(v.to_string()),
                 "iflag" => self.parse_input_flags(v)?,
-                "obs" => self.obs = Self::parse_bytes(k, v)?,
+                "obs" => self.obs = Some(Self::parse_bytes(k, v)?),
                 "of" => self.outfile = Some(v.to_string()),
                 "oflag" => self.parse_output_flags(v)?,
                 "seek" | "oseek" => self.seek = Self::parse_n(v)?,
diff --git a/src/uu/dd/src/parseargs/unit_tests.rs b/src/uu/dd/src/parseargs/unit_tests.rs
index 142e49fd0ba..51b0933e926 100644
--- a/src/uu/dd/src/parseargs/unit_tests.rs
+++ b/src/uu/dd/src/parseargs/unit_tests.rs
@@ -358,6 +358,7 @@ fn parse_icf_tokens_remaining() {
                 fsync: true,
                 ..Default::default()
             },
+            is_conv_specified: true,
             ..Default::default()
         })
     );

From 5142f35f8395130dd331cc5756a0cd0466a1e74c Mon Sep 17 00:00:00 2001
From: Jeffrey Finkelstein <jeffrey.finkelstein@protonmail.com>
Date: Fri, 17 Mar 2023 20:55:49 -0400
Subject: [PATCH 074/429] dd: add BufferedOutput to buffer partial blocks

---
 src/uu/dd/src/bufferedoutput.rs | 201 ++++++++++++++++++++++++++++++++
 src/uu/dd/src/dd.rs             |  19 ++-
 2 files changed, 209 insertions(+), 11 deletions(-)
 create mode 100644 src/uu/dd/src/bufferedoutput.rs

diff --git a/src/uu/dd/src/bufferedoutput.rs b/src/uu/dd/src/bufferedoutput.rs
new file mode 100644
index 00000000000..1735ae10d80
--- /dev/null
+++ b/src/uu/dd/src/bufferedoutput.rs
@@ -0,0 +1,201 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+//
+// spell-checker:ignore wstat towrite cdefg bufferedoutput
+//! Buffer partial output blocks until they are completed.
+//!
+//! Use the [`BufferedOutput`] struct to create a buffered form of the
+//! [`Output`] writer.
+use crate::{Output, WriteStat};
+
+/// Buffer partial output blocks until they are completed.
+///
+/// Complete blocks are written immediately to the inner [`Output`],
+/// but partial blocks are stored in an internal buffer until they are
+/// completed.
+pub(crate) struct BufferedOutput<'a> {
+    /// The unbuffered inner block writer.
+    inner: Output<'a>,
+
+    /// The internal buffer that stores a partial block.
+    ///
+    /// The size of this buffer is always less than the output block
+    /// size (that is, the value of the `obs` command-line option).
+    buf: Vec<u8>,
+}
+
+impl<'a> BufferedOutput<'a> {
+    /// Add partial block buffering to the given block writer.
+    ///
+    /// The internal buffer size is at most the value of `obs` as
+    /// defined in `inner`.
+    pub(crate) fn new(inner: Output<'a>) -> Self {
+        let obs = inner.settings.obs;
+        Self {
+            inner,
+            buf: Vec::with_capacity(obs),
+        }
+    }
+
+    pub(crate) fn discard_cache(&self, offset: libc::off_t, len: libc::off_t) {
+        self.inner.discard_cache(offset, len);
+    }
+
+    /// Flush the partial block stored in the internal buffer.
+    pub(crate) fn flush(&mut self) -> std::io::Result<WriteStat> {
+        let wstat = self.inner.write_blocks(&self.buf)?;
+        let n = wstat.bytes_total;
+        for _ in 0..n {
+            self.buf.remove(0);
+        }
+        Ok(wstat)
+    }
+
+    /// Synchronize the inner block writer.
+    pub(crate) fn sync(&mut self) -> std::io::Result<()> {
+        self.inner.sync()
+    }
+
+    /// Truncate the underlying file to the current stream position, if possible.
+    pub(crate) fn truncate(&mut self) -> std::io::Result<()> {
+        self.inner.dst.truncate()
+    }
+
+    /// Write the given bytes one block at a time.
+    ///
+    /// Only complete blocks will be written. Partial blocks will be
+    /// buffered until enough bytes have been provided to complete a
+    /// block. The returned [`WriteStat`] object will include the
+    /// number of blocks written during execution of this function.
+    pub(crate) fn write_blocks(&mut self, buf: &[u8]) -> std::io::Result<WriteStat> {
+        // Concatenate the old partial block with the new incoming bytes.
+        let towrite = [&self.buf, buf].concat();
+
+        // Write all complete blocks to the inner block writer.
+        //
+        // For example, if the output block size were 3, the buffered
+        // partial block were `b"ab"` and the new incoming bytes were
+        // `b"cdefg"`, then we would write blocks `b"abc"` and
+        // b`"def"` to the inner block writer.
+        let n = towrite.len();
+        let rem = n % self.inner.settings.obs;
+        let wstat = self.inner.write_blocks(&towrite[..n - rem])?;
+        self.buf.clear();
+
+        // Buffer any remaining bytes as a partial block.
+        //
+        // Continuing the example above, the last byte `b"g"` would be
+        // buffered as a partial block until the next call to
+        // `write_blocks()`.
+        for byte in &towrite[n - rem..] {
+            self.buf.push(*byte);
+        }
+
+        Ok(wstat)
+    }
+}
+
+#[cfg(unix)]
+#[cfg(test)]
+mod tests {
+    use crate::bufferedoutput::BufferedOutput;
+    use crate::{Dest, Output, Settings};
+
+    #[test]
+    fn test_buffered_output_write_blocks_empty() {
+        let settings = Settings {
+            obs: 3,
+            ..Default::default()
+        };
+        let inner = Output {
+            dst: Dest::Sink,
+            settings: &settings,
+        };
+        let mut output = BufferedOutput::new(inner);
+        let wstat = output.write_blocks(&[]).unwrap();
+        assert_eq!(wstat.writes_complete, 0);
+        assert_eq!(wstat.writes_partial, 0);
+        assert_eq!(wstat.bytes_total, 0);
+        assert_eq!(output.buf, vec![]);
+    }
+
+    #[test]
+    fn test_buffered_output_write_blocks_partial() {
+        let settings = Settings {
+            obs: 3,
+            ..Default::default()
+        };
+        let inner = Output {
+            dst: Dest::Sink,
+            settings: &settings,
+        };
+        let mut output = BufferedOutput::new(inner);
+        let wstat = output.write_blocks(b"ab").unwrap();
+        assert_eq!(wstat.writes_complete, 0);
+        assert_eq!(wstat.writes_partial, 0);
+        assert_eq!(wstat.bytes_total, 0);
+        assert_eq!(output.buf, b"ab");
+    }
+
+    #[test]
+    fn test_buffered_output_write_blocks_complete() {
+        let settings = Settings {
+            obs: 3,
+            ..Default::default()
+        };
+        let inner = Output {
+            dst: Dest::Sink,
+            settings: &settings,
+        };
+        let mut output = BufferedOutput::new(inner);
+        let wstat = output.write_blocks(b"abcd").unwrap();
+        assert_eq!(wstat.writes_complete, 1);
+        assert_eq!(wstat.writes_partial, 0);
+        assert_eq!(wstat.bytes_total, 3);
+        assert_eq!(output.buf, b"d");
+    }
+
+    #[test]
+    fn test_buffered_output_write_blocks_append() {
+        let settings = Settings {
+            obs: 3,
+            ..Default::default()
+        };
+        let inner = Output {
+            dst: Dest::Sink,
+            settings: &settings,
+        };
+        let mut output = BufferedOutput {
+            inner,
+            buf: b"ab".to_vec(),
+        };
+        let wstat = output.write_blocks(b"cdefg").unwrap();
+        assert_eq!(wstat.writes_complete, 2);
+        assert_eq!(wstat.writes_partial, 0);
+        assert_eq!(wstat.bytes_total, 6);
+        assert_eq!(output.buf, b"g");
+    }
+
+    #[test]
+    fn test_buffered_output_flush() {
+        let settings = Settings {
+            obs: 10,
+            ..Default::default()
+        };
+        let inner = Output {
+            dst: Dest::Sink,
+            settings: &settings,
+        };
+        let mut output = BufferedOutput {
+            inner,
+            buf: b"abc".to_vec(),
+        };
+        let wstat = output.flush().unwrap();
+        assert_eq!(wstat.writes_complete, 0);
+        assert_eq!(wstat.writes_partial, 1);
+        assert_eq!(wstat.bytes_total, 3);
+        assert_eq!(output.buf, vec![]);
+    }
+}
diff --git a/src/uu/dd/src/dd.rs b/src/uu/dd/src/dd.rs
index 7d9138791cf..9374ca0cd37 100644
--- a/src/uu/dd/src/dd.rs
+++ b/src/uu/dd/src/dd.rs
@@ -3,23 +3,20 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-// spell-checker:ignore fname, ftype, tname, fpath, specfile, testfile, unspec, ifile, ofile, outfile, fullblock, urand, fileio, atoe, atoibm, behaviour, bmax, bremain, cflags, creat, ctable, ctty, datastructures, doesnt, etoa, fileout, fname, gnudd, iconvflags, iseek, nocache, noctty, noerror, nofollow, nolinks, nonblock, oconvflags, oseek, outfile, parseargs, rlen, rmax, rremain, rsofar, rstat, sigusr, wlen, wstat seekable oconv canonicalized fadvise Fadvise FADV DONTNEED ESPIPE
+// spell-checker:ignore fname, ftype, tname, fpath, specfile, testfile, unspec, ifile, ofile, outfile, fullblock, urand, fileio, atoe, atoibm, behaviour, bmax, bremain, cflags, creat, ctable, ctty, datastructures, doesnt, etoa, fileout, fname, gnudd, iconvflags, iseek, nocache, noctty, noerror, nofollow, nolinks, nonblock, oconvflags, oseek, outfile, parseargs, rlen, rmax, rremain, rsofar, rstat, sigusr, wlen, wstat seekable oconv canonicalized fadvise Fadvise FADV DONTNEED ESPIPE bufferedoutput
 
+mod blocks;
+mod bufferedoutput;
+mod conversion_tables;
 mod datastructures;
-use datastructures::*;
-
+mod numbers;
 mod parseargs;
-use parseargs::Parser;
-
-mod conversion_tables;
-
 mod progress;
-use progress::{gen_prog_updater, ProgUpdate, ReadStat, StatusLevel, WriteStat};
 
-mod blocks;
 use blocks::conv_block_unblock_helper;
-
-mod numbers;
+use datastructures::*;
+use parseargs::Parser;
+use progress::{gen_prog_updater, ProgUpdate, ReadStat, StatusLevel, WriteStat};
 
 use std::cmp;
 use std::env;

From b383e609988a7f171643a387a81c512cab1257be Mon Sep 17 00:00:00 2001
From: Jeffrey Finkelstein <jeffrey.finkelstein@protonmail.com>
Date: Fri, 17 Mar 2023 22:41:10 -0400
Subject: [PATCH 075/429] dd: implement Add for WriteStat

---
 src/uu/dd/src/progress.rs | 11 +++++++++++
 1 file changed, 11 insertions(+)

diff --git a/src/uu/dd/src/progress.rs b/src/uu/dd/src/progress.rs
index 4fe04cb0e67..ac7517c2c0c 100644
--- a/src/uu/dd/src/progress.rs
+++ b/src/uu/dd/src/progress.rs
@@ -379,6 +379,17 @@ impl std::ops::AddAssign for WriteStat {
     }
 }
 
+impl std::ops::Add for WriteStat {
+    type Output = Self;
+    fn add(self, other: Self) -> Self {
+        Self {
+            writes_complete: self.writes_complete + other.writes_complete,
+            writes_partial: self.writes_partial + other.writes_partial,
+            bytes_total: self.bytes_total + other.bytes_total,
+        }
+    }
+}
+
 /// How much detail to report when printing transfer statistics.
 ///
 /// This corresponds to the available settings of the `status`

From f343b7e964091507e9373c94da4619c962c8d23c Mon Sep 17 00:00:00 2001
From: Jeffrey Finkelstein <jeffrey.finkelstein@protonmail.com>
Date: Fri, 17 Mar 2023 22:41:56 -0400
Subject: [PATCH 076/429] dd: use read statistics for termination condition

Correct the behavior of `dd` so that the termination condition of the
main loop uses the number of bytes read, not the number of bytes
written, when the `count` command-line option is given in bytes
instead of blocks.
---
 src/uu/dd/src/dd.rs | 14 ++++----------
 1 file changed, 4 insertions(+), 10 deletions(-)

diff --git a/src/uu/dd/src/dd.rs b/src/uu/dd/src/dd.rs
index 9374ca0cd37..b760d98e022 100644
--- a/src/uu/dd/src/dd.rs
+++ b/src/uu/dd/src/dd.rs
@@ -901,7 +901,7 @@ fn dd_copy(mut i: Input, mut o: Output) -> std::io::Result<()> {
     // blocks to this output. Read/write statistics are updated on
     // each iteration and cumulative statistics are reported to
     // the progress reporting thread.
-    while below_count_limit(&i.settings.count, &rstat, &wstat) {
+    while below_count_limit(&i.settings.count, &rstat) {
         // Read a block from the input then write the block to the output.
         //
         // As an optimization, make an educated guess about the
@@ -1108,16 +1108,10 @@ fn calc_loop_bsize(
 
 // Decide if the current progress is below a count=N limit or return
 // true if no such limit is set.
-fn below_count_limit(count: &Option<Num>, rstat: &ReadStat, wstat: &WriteStat) -> bool {
+fn below_count_limit(count: &Option<Num>, rstat: &ReadStat) -> bool {
     match count {
-        Some(Num::Blocks(n)) => {
-            let n = *n;
-            rstat.reads_complete + rstat.reads_partial <= n
-        }
-        Some(Num::Bytes(n)) => {
-            let n = (*n).try_into().unwrap();
-            wstat.bytes_total <= n
-        }
+        Some(Num::Blocks(n)) => rstat.reads_complete + rstat.reads_partial < *n,
+        Some(Num::Bytes(n)) => rstat.bytes_total < *n,
         None => true,
     }
 }

From ceccd2ecc61ed83d9c66ac55f82913723ca4d96e Mon Sep 17 00:00:00 2001
From: Jeffrey Finkelstein <jeffrey.finkelstein@protonmail.com>
Date: Fri, 17 Mar 2023 22:42:24 -0400
Subject: [PATCH 077/429] dd: buffer partial blocks in the output writer

Add buffering of partial blocks in the output block writer until they
are completed.
---
 src/uu/dd/src/bufferedoutput.rs |  31 +++++----
 src/uu/dd/src/dd.rs             | 115 +++++++++++++++++++++++++++-----
 tests/by-util/test_dd.rs        |  78 +++++++++++++++++++++-
 3 files changed, 194 insertions(+), 30 deletions(-)

diff --git a/src/uu/dd/src/bufferedoutput.rs b/src/uu/dd/src/bufferedoutput.rs
index 1735ae10d80..6ac3b430046 100644
--- a/src/uu/dd/src/bufferedoutput.rs
+++ b/src/uu/dd/src/bufferedoutput.rs
@@ -46,10 +46,8 @@ impl<'a> BufferedOutput<'a> {
     /// Flush the partial block stored in the internal buffer.
     pub(crate) fn flush(&mut self) -> std::io::Result<WriteStat> {
         let wstat = self.inner.write_blocks(&self.buf)?;
-        let n = wstat.bytes_total;
-        for _ in 0..n {
-            self.buf.remove(0);
-        }
+        let n = wstat.bytes_total.try_into().unwrap();
+        self.buf.drain(0..n);
         Ok(wstat)
     }
 
@@ -70,8 +68,19 @@ impl<'a> BufferedOutput<'a> {
     /// block. The returned [`WriteStat`] object will include the
     /// number of blocks written during execution of this function.
     pub(crate) fn write_blocks(&mut self, buf: &[u8]) -> std::io::Result<WriteStat> {
-        // Concatenate the old partial block with the new incoming bytes.
-        let towrite = [&self.buf, buf].concat();
+        // Split the incoming buffer into two parts: the bytes to write
+        // and the bytes to buffer for next time.
+        //
+        // If `buf` does not include enough bytes to form a full block,
+        // just buffer the whole thing and write zero blocks.
+        let n = self.buf.len() + buf.len();
+        let rem = n % self.inner.settings.obs;
+        let i = buf.len().saturating_sub(rem);
+        let (to_write, to_buffer) = buf.split_at(i);
+
+        // Concatenate the old partial block with the new bytes to form
+        // some number of complete blocks.
+        self.buf.extend_from_slice(to_write);
 
         // Write all complete blocks to the inner block writer.
         //
@@ -79,19 +88,15 @@ impl<'a> BufferedOutput<'a> {
         // partial block were `b"ab"` and the new incoming bytes were
         // `b"cdefg"`, then we would write blocks `b"abc"` and
         // b`"def"` to the inner block writer.
-        let n = towrite.len();
-        let rem = n % self.inner.settings.obs;
-        let wstat = self.inner.write_blocks(&towrite[..n - rem])?;
-        self.buf.clear();
+        let wstat = self.inner.write_blocks(&self.buf)?;
 
         // Buffer any remaining bytes as a partial block.
         //
         // Continuing the example above, the last byte `b"g"` would be
         // buffered as a partial block until the next call to
         // `write_blocks()`.
-        for byte in &towrite[n - rem..] {
-            self.buf.push(*byte);
-        }
+        self.buf.clear();
+        self.buf.extend_from_slice(to_buffer);
 
         Ok(wstat)
     }
diff --git a/src/uu/dd/src/dd.rs b/src/uu/dd/src/dd.rs
index b760d98e022..645c2496766 100644
--- a/src/uu/dd/src/dd.rs
+++ b/src/uu/dd/src/dd.rs
@@ -13,6 +13,7 @@ mod numbers;
 mod parseargs;
 mod progress;
 
+use crate::bufferedoutput::BufferedOutput;
 use blocks::conv_block_unblock_helper;
 use datastructures::*;
 use parseargs::Parser;
@@ -801,6 +802,68 @@ impl<'a> Output<'a> {
             Ok(())
         }
     }
+
+    /// Truncate the underlying file to the current stream position, if possible.
+    fn truncate(&mut self) -> std::io::Result<()> {
+        self.dst.truncate()
+    }
+}
+
+/// The block writer either with or without partial block buffering.
+enum BlockWriter<'a> {
+    /// Block writer with partial block buffering.
+    ///
+    /// Partial blocks are buffered until completed.
+    Buffered(BufferedOutput<'a>),
+
+    /// Block writer without partial block buffering.
+    ///
+    /// Partial blocks are written immediately.
+    Unbuffered(Output<'a>),
+}
+
+impl<'a> BlockWriter<'a> {
+    fn discard_cache(&self, offset: libc::off_t, len: libc::off_t) {
+        match self {
+            Self::Unbuffered(o) => o.discard_cache(offset, len),
+            Self::Buffered(o) => o.discard_cache(offset, len),
+        }
+    }
+
+    fn flush(&mut self) -> io::Result<WriteStat> {
+        match self {
+            Self::Unbuffered(_) => Ok(WriteStat::default()),
+            Self::Buffered(o) => o.flush(),
+        }
+    }
+
+    fn sync(&mut self) -> io::Result<()> {
+        match self {
+            Self::Unbuffered(o) => o.sync(),
+            Self::Buffered(o) => o.sync(),
+        }
+    }
+
+    /// Truncate the file to the final cursor location.
+    fn truncate(&mut self) {
+        // Calling `set_len()` may result in an error (for example,
+        // when calling it on `/dev/null`), but we don't want to
+        // terminate the process when that happens. Instead, we
+        // suppress the error by calling `Result::ok()`. This matches
+        // the behavior of GNU `dd` when given the command-line
+        // argument `of=/dev/null`.
+        match self {
+            Self::Unbuffered(o) => o.truncate().ok(),
+            Self::Buffered(o) => o.truncate().ok(),
+        };
+    }
+
+    fn write_blocks(&mut self, buf: &[u8]) -> std::io::Result<WriteStat> {
+        match self {
+            Self::Unbuffered(o) => o.write_blocks(buf),
+            Self::Buffered(o) => o.write_blocks(buf),
+        }
+    }
 }
 
 /// Copy the given input data to this output, consuming both.
@@ -814,7 +877,7 @@ impl<'a> Output<'a> {
 ///
 /// If there is a problem reading from the input or writing to
 /// this output.
-fn dd_copy(mut i: Input, mut o: Output) -> std::io::Result<()> {
+fn dd_copy(mut i: Input, o: Output) -> std::io::Result<()> {
     // The read and write statistics.
     //
     // These objects are counters, initialized to zero. After each
@@ -851,6 +914,9 @@ fn dd_copy(mut i: Input, mut o: Output) -> std::io::Result<()> {
     let (prog_tx, rx) = mpsc::channel();
     let output_thread = thread::spawn(gen_prog_updater(rx, i.settings.status));
 
+    // Whether to truncate the output file after all blocks have been written.
+    let truncate = !o.settings.oconv.notrunc;
+
     // Optimization: if no blocks are to be written, then don't
     // bother allocating any buffers.
     if let Some(Num::Blocks(0) | Num::Bytes(0)) = i.settings.count {
@@ -875,7 +941,15 @@ fn dd_copy(mut i: Input, mut o: Output) -> std::io::Result<()> {
             let len = o.dst.len()?.try_into().unwrap();
             o.discard_cache(offset, len);
         }
-        return finalize(&mut o, rstat, wstat, start, &prog_tx, output_thread);
+        return finalize(
+            BlockWriter::Unbuffered(o),
+            rstat,
+            wstat,
+            start,
+            &prog_tx,
+            output_thread,
+            truncate,
+        );
     };
 
     // Create a common buffer with a capacity of the block size.
@@ -895,6 +969,16 @@ fn dd_copy(mut i: Input, mut o: Output) -> std::io::Result<()> {
     let mut read_offset = 0;
     let mut write_offset = 0;
 
+    let input_nocache = i.settings.iflags.nocache;
+    let output_nocache = o.settings.oflags.nocache;
+
+    // Add partial block buffering, if needed.
+    let mut o = if o.settings.buffered {
+        BlockWriter::Buffered(BufferedOutput::new(o))
+    } else {
+        BlockWriter::Unbuffered(o)
+    };
+
     // The main read/write loop.
     //
     // Each iteration reads blocks from the input and writes
@@ -919,7 +1003,7 @@ fn dd_copy(mut i: Input, mut o: Output) -> std::io::Result<()> {
         //
         // TODO Better error handling for overflowing `offset` and `len`.
         let read_len = rstat_update.bytes_total;
-        if i.settings.iflags.nocache {
+        if input_nocache {
             let offset = read_offset.try_into().unwrap();
             let len = read_len.try_into().unwrap();
             i.discard_cache(offset, len);
@@ -931,7 +1015,7 @@ fn dd_copy(mut i: Input, mut o: Output) -> std::io::Result<()> {
         //
         // TODO Better error handling for overflowing `offset` and `len`.
         let write_len = wstat_update.bytes_total;
-        if o.settings.oflags.nocache {
+        if output_nocache {
             let offset = write_offset.try_into().unwrap();
             let len = write_len.try_into().unwrap();
             o.discard_cache(offset, len);
@@ -951,34 +1035,33 @@ fn dd_copy(mut i: Input, mut o: Output) -> std::io::Result<()> {
             prog_tx.send(prog_update).unwrap_or(());
         }
     }
-    finalize(&mut o, rstat, wstat, start, &prog_tx, output_thread)
+    finalize(o, rstat, wstat, start, &prog_tx, output_thread, truncate)
 }
 
 /// Flush output, print final stats, and join with the progress thread.
 fn finalize<T>(
-    output: &mut Output,
+    mut output: BlockWriter,
     rstat: ReadStat,
     wstat: WriteStat,
     start: Instant,
     prog_tx: &mpsc::Sender<ProgUpdate>,
     output_thread: thread::JoinHandle<T>,
+    truncate: bool,
 ) -> std::io::Result<()> {
-    // Flush the output, if configured to do so.
+    // Flush the output in case a partial write has been buffered but
+    // not yet written.
+    let wstat_update = output.flush()?;
+
+    // Sync the output, if configured to do so.
     output.sync()?;
 
     // Truncate the file to the final cursor location.
-    //
-    // Calling `set_len()` may result in an error (for example,
-    // when calling it on `/dev/null`), but we don't want to
-    // terminate the process when that happens. Instead, we
-    // suppress the error by calling `Result::ok()`. This matches
-    // the behavior of GNU `dd` when given the command-line
-    // argument `of=/dev/null`.
-    if !output.settings.oconv.notrunc {
-        output.dst.truncate().ok();
+    if truncate {
+        output.truncate();
     }
 
     // Print the final read/write statistics.
+    let wstat = wstat + wstat_update;
     let prog_update = ProgUpdate::new(rstat, wstat, start.elapsed(), true);
     prog_tx.send(prog_update).unwrap_or(());
     // Wait for the output thread to finish
diff --git a/tests/by-util/test_dd.rs b/tests/by-util/test_dd.rs
index d5ac8dc801c..a4c70097c8b 100644
--- a/tests/by-util/test_dd.rs
+++ b/tests/by-util/test_dd.rs
@@ -2,7 +2,7 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
-// spell-checker:ignore fname, tname, fpath, specfile, testfile, unspec, ifile, ofile, outfile, fullblock, urand, fileio, atoe, atoibm, availible, behaviour, bmax, bremain, btotal, cflags, creat, ctable, ctty, datastructures, doesnt, etoa, fileout, fname, gnudd, iconvflags, iseek, nocache, noctty, noerror, nofollow, nolinks, nonblock, oconvflags, oseek, outfile, parseargs, rlen, rmax, rposition, rremain, rsofar, rstat, sigusr, sigval, wlen, wstat abcdefghijklm abcdefghi nabcde nabcdefg abcdefg
+// spell-checker:ignore fname, tname, fpath, specfile, testfile, unspec, ifile, ofile, outfile, fullblock, urand, fileio, atoe, atoibm, availible, behaviour, bmax, bremain, btotal, cflags, creat, ctable, ctty, datastructures, doesnt, etoa, fileout, fname, gnudd, iconvflags, iseek, nocache, noctty, noerror, nofollow, nolinks, nonblock, oconvflags, oseek, outfile, parseargs, rlen, rmax, rposition, rremain, rsofar, rstat, sigusr, sigval, wlen, wstat abcdefghijklm abcdefghi nabcde nabcdefg abcdefg fifoname
 
 #[cfg(unix)]
 use crate::common::util::run_ucmd_as_root_with_stdin_stdout;
@@ -15,6 +15,8 @@ use regex::Regex;
 use std::fs::{File, OpenOptions};
 use std::io::{BufReader, Read, Write};
 use std::path::PathBuf;
+#[cfg(all(unix, not(target_os = "macos"), not(target_os = "freebsd")))]
+use std::process::{Command, Stdio};
 #[cfg(not(windows))]
 use std::thread::sleep;
 #[cfg(not(windows))]
@@ -1582,3 +1584,77 @@ fn test_seek_past_dev() {
         print!("TEST SKIPPED");
     }
 }
+
+#[test]
+#[cfg(all(unix, not(target_os = "macos"), not(target_os = "freebsd")))]
+fn test_reading_partial_blocks_from_fifo() {
+    // Create the FIFO.
+    let ts = TestScenario::new(util_name!());
+    let at = ts.fixtures.clone();
+    at.mkfifo("fifo");
+    let fifoname = at.plus_as_string("fifo");
+
+    // Start a `dd` process that reads from the fifo (so it will wait
+    // until the writer process starts).
+    let mut reader_command = Command::new(TESTS_BINARY);
+    let child = reader_command
+        .args(["dd", "ibs=3", "obs=3", &format!("if={}", fifoname)])
+        .stdout(Stdio::piped())
+        .stderr(Stdio::piped())
+        .spawn()
+        .unwrap();
+
+    // Start different processes to write to the FIFO, with a small
+    // pause in between.
+    let mut writer_command = Command::new("sh");
+    writer_command
+        .args([
+            "-c",
+            &format!("(printf \"ab\"; sleep 0.1; printf \"cd\") > {}", fifoname),
+        ])
+        .spawn()
+        .unwrap();
+
+    let output = child.wait_with_output().unwrap();
+    assert_eq!(output.stdout, b"abcd");
+    let expected = b"0+2 records in\n1+1 records out\n4 bytes copied";
+    assert!(output.stderr.starts_with(expected));
+}
+
+#[test]
+#[cfg(all(unix, not(target_os = "macos"), not(target_os = "freebsd")))]
+fn test_reading_partial_blocks_from_fifo_unbuffered() {
+    // Create the FIFO.
+    let ts = TestScenario::new(util_name!());
+    let at = ts.fixtures.clone();
+    at.mkfifo("fifo");
+    let fifoname = at.plus_as_string("fifo");
+
+    // Start a `dd` process that reads from the fifo (so it will wait
+    // until the writer process starts).
+    //
+    // `bs=N` takes precedence over `ibs=N` and `obs=N`.
+    let mut reader_command = Command::new(TESTS_BINARY);
+    let child = reader_command
+        .args(["dd", "bs=3", "ibs=1", "obs=1", &format!("if={}", fifoname)])
+        .stdout(Stdio::piped())
+        .stderr(Stdio::piped())
+        .spawn()
+        .unwrap();
+
+    // Start different processes to write to the FIFO, with a small
+    // pause in between.
+    let mut writer_command = Command::new("sh");
+    writer_command
+        .args([
+            "-c",
+            &format!("(printf \"ab\"; sleep 0.1; printf \"cd\") > {}", fifoname),
+        ])
+        .spawn()
+        .unwrap();
+
+    let output = child.wait_with_output().unwrap();
+    assert_eq!(output.stdout, b"abcd");
+    let expected = b"0+2 records in\n0+2 records out\n4 bytes copied";
+    assert!(output.stderr.starts_with(expected));
+}

From 8eb66ab7ea93de366165f45127206da04cdb342d Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 27 Nov 2023 11:50:55 +0100
Subject: [PATCH 078/429] printf: remove whitespace, remove redundant spelling
 ignore and revert matching on result

---
 src/uu/printf/src/printf.rs                     | 17 ++++++-----------
 src/uu/seq/src/number.rs                        |  2 +-
 src/uu/seq/src/numberparse.rs                   |  2 +-
 src/uu/seq/src/seq.rs                           |  2 +-
 .../src/lib/features/format/num_format.rs       |  1 -
 5 files changed, 9 insertions(+), 15 deletions(-)

diff --git a/src/uu/printf/src/printf.rs b/src/uu/printf/src/printf.rs
index cfb0315cfb0..663411b8952 100644
--- a/src/uu/printf/src/printf.rs
+++ b/src/uu/printf/src/printf.rs
@@ -10,9 +10,9 @@ use std::io::stdout;
 use std::ops::ControlFlow;
 
 use clap::{crate_version, Arg, ArgAction, Command};
-use uucore::error::{UError, UResult, UUsageError};
+use uucore::error::{UResult, UUsageError};
 use uucore::format::{parse_spec_and_escape, FormatArgument};
-use uucore::{format_usage, help_about, help_section, help_usage, show};
+use uucore::{format_usage, help_about, help_section, help_usage};
 
 const VERSION: &str = "version";
 const HELP: &str = "help";
@@ -49,15 +49,10 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     while args.peek().is_some() {
         for item in parse_spec_and_escape(format_string.as_ref()) {
-            match item {
-                Ok(item) => {
-                    match item.write(stdout(), &mut args)? {
-                        ControlFlow::Continue(()) => {}
-                        ControlFlow::Break(()) => return Ok(()),
-                    };
-                }
-                Err(e) => show!(e),
-            }
+            match item?.write(stdout(), &mut args)? {
+                ControlFlow::Continue(()) => {}
+                ControlFlow::Break(()) => return Ok(()),
+            };
         }
     }
     Ok(())
diff --git a/src/uu/seq/src/number.rs b/src/uu/seq/src/number.rs
index 182431a9210..314c842ba15 100644
--- a/src/uu/seq/src/number.rs
+++ b/src/uu/seq/src/number.rs
@@ -2,7 +2,7 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
-// spell-checker:ignore extendedbigdecimal extendedbigint
+// spell-checker:ignore extendedbigdecimal
 use num_traits::Zero;
 
 use crate::extendedbigdecimal::ExtendedBigDecimal;
diff --git a/src/uu/seq/src/numberparse.rs b/src/uu/seq/src/numberparse.rs
index a82d1e88776..df7c1f7d1dd 100644
--- a/src/uu/seq/src/numberparse.rs
+++ b/src/uu/seq/src/numberparse.rs
@@ -2,7 +2,7 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
-// spell-checker:ignore extendedbigdecimal extendedbigint bigdecimal numberparse
+// spell-checker:ignore extendedbigdecimal bigdecimal numberparse
 //! Parsing numbers for use in `seq`.
 //!
 //! This module provides an implementation of [`FromStr`] for the
diff --git a/src/uu/seq/src/seq.rs b/src/uu/seq/src/seq.rs
index 05338864545..33b7636edbc 100644
--- a/src/uu/seq/src/seq.rs
+++ b/src/uu/seq/src/seq.rs
@@ -2,7 +2,7 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
-// spell-checker:ignore (ToDO) istr chiter argptr ilen extendedbigdecimal extendedbigint numberparse
+// spell-checker:ignore (ToDO) extendedbigdecimal numberparse
 use std::io::{stdout, ErrorKind, Write};
 
 use clap::{crate_version, Arg, ArgAction, Command};
diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index 6fd177d1325..51f3336cf61 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -28,7 +28,6 @@ pub enum UnsignedIntVariant {
 }
 
 #[derive(Clone, Copy, Debug)]
-
 pub enum FloatVariant {
     Decimal,
     Scientific,

From 83784b2d96bc4b68a67186ac57014822a14034d7 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 27 Nov 2023 11:37:39 +0100
Subject: [PATCH 079/429] expr: refactor AST and parsing

---
 src/uu/expr/src/expr.rs        |  87 ++--
 src/uu/expr/src/syntax_tree.rs | 924 ++++++++++++++++-----------------
 src/uu/expr/src/tokens.rs      | 147 ------
 3 files changed, 494 insertions(+), 664 deletions(-)
 delete mode 100644 src/uu/expr/src/tokens.rs

diff --git a/src/uu/expr/src/expr.rs b/src/uu/expr/src/expr.rs
index 909c4c37653..c271f0935fd 100644
--- a/src/uu/expr/src/expr.rs
+++ b/src/uu/expr/src/expr.rs
@@ -3,14 +3,19 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
+use std::fmt::Display;
+
 use clap::{crate_version, Arg, ArgAction, Command};
+use syntax_tree::AstNode;
 use uucore::{
-    error::{UResult, USimpleError, UUsageError},
+    display::Quotable,
+    error::{UError, UResult},
     format_usage, help_about, help_section, help_usage,
 };
 
+use crate::syntax_tree::is_truthy;
+
 mod syntax_tree;
-mod tokens;
 
 mod options {
     pub const VERSION: &str = "version";
@@ -18,6 +23,51 @@ mod options {
     pub const EXPRESSION: &str = "expression";
 }
 
+pub type ExprResult<T> = Result<T, ExprError>;
+
+#[derive(Debug, PartialEq, Eq)]
+pub enum ExprError {
+    UnexpectedArgument(String),
+    MissingArgument(String),
+    NonIntegerArgument,
+    MissingOperand,
+    DivisionByZero,
+    InvalidRegexExpression,
+    ExpectedClosingBraceAfter(String),
+}
+
+impl Display for ExprError {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        match self {
+            Self::UnexpectedArgument(s) => {
+                write!(f, "syntax error: unexpected argument {}", s.quote())
+            }
+            Self::MissingArgument(s) => {
+                write!(f, "syntax error: missing argument after {}", s.quote())
+            }
+            Self::NonIntegerArgument => write!(f, "non-integer argument"),
+            Self::MissingOperand => write!(f, "missing operand"),
+            Self::DivisionByZero => write!(f, "division by zero"),
+            Self::InvalidRegexExpression => write!(f, "Invalid regex expression"),
+            Self::ExpectedClosingBraceAfter(s) => {
+                write!(f, "expected ')' after {}", s.quote())
+            }
+        }
+    }
+}
+
+impl std::error::Error for ExprError {}
+
+impl UError for ExprError {
+    fn code(&self) -> i32 {
+        2
+    }
+
+    fn usage(&self) -> bool {
+        *self == Self::MissingOperand
+    }
+}
+
 pub fn uu_app() -> Command {
     Command::new(uucore::util_name())
         .version(crate_version!())
@@ -53,36 +103,15 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     // For expr utility we do not want getopts.
     // The following usage should work without escaping hyphens: `expr -15 = 1 +  2 \* \( 3 - -4 \)`
     let matches = uu_app().try_get_matches_from(args)?;
-    let token_strings = matches
+    let token_strings: Vec<&str> = matches
         .get_many::<String>(options::EXPRESSION)
         .map(|v| v.into_iter().map(|s| s.as_ref()).collect::<Vec<_>>())
         .unwrap_or_default();
 
-    if token_strings.is_empty() {
-        return Err(UUsageError::new(2, "missing operand"));
-    }
-
-    match process_expr(&token_strings[..]) {
-        Ok(expr_result) => print_expr_ok(&expr_result),
-        Err(expr_error) => Err(USimpleError::new(2, &expr_error)),
+    let res = AstNode::parse(&token_strings)?.eval()?;
+    println!("{res}");
+    if !is_truthy(&res) {
+        return Err(1.into());
     }
-}
-
-fn process_expr(token_strings: &[&str]) -> Result<String, String> {
-    let maybe_tokens = tokens::strings_to_tokens(token_strings);
-    let maybe_ast = syntax_tree::tokens_to_ast(maybe_tokens);
-    evaluate_ast(maybe_ast)
-}
-
-fn print_expr_ok(expr_result: &str) -> UResult<()> {
-    println!("{expr_result}");
-    if expr_result.parse::<i32>() == Ok(0) || expr_result.is_empty() {
-        Err(1.into())
-    } else {
-        Ok(())
-    }
-}
-
-fn evaluate_ast(maybe_ast: Result<Box<syntax_tree::AstNode>, String>) -> Result<String, String> {
-    maybe_ast.and_then(|ast| ast.evaluate())
+    Ok(())
 }
diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 2260b2e2186..f81f1da1ec4 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -3,574 +3,522 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-//!
-//! Here we employ shunting-yard algorithm for building AST from tokens according to operators' precedence and associative-ness.
-//! * `<https://en.wikipedia.org/wiki/Shunting-yard_algorithm>`
-//!
-
 // spell-checker:ignore (ToDO) ints paren prec multibytes
 
 use num_bigint::BigInt;
-use num_traits::Zero;
 use onig::{Regex, RegexOptions, Syntax};
-use uucore::display::Quotable;
 
-use crate::tokens::Token;
+use crate::{ExprError, ExprResult};
 
-type TokenStack = Vec<(usize, Token)>;
-pub type OperandsList = Vec<Box<AstNode>>;
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum BinOp {
+    Relation(RelationOp),
+    Numeric(NumericOp),
+    String(StringOp),
+}
 
-#[derive(Debug)]
-pub enum AstNode {
-    Leaf {
-        token_idx: usize,
-        value: String,
-    },
-    Node {
-        token_idx: usize,
-        op_type: String,
-        operands: OperandsList,
-    },
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum RelationOp {
+    Lt,
+    Leq,
+    Eq,
+    Neq,
+    Gt,
+    Geq,
 }
 
-impl AstNode {
-    fn debug_dump(&self) {
-        self.debug_dump_impl(1);
-    }
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum NumericOp {
+    Add,
+    Sub,
+    Mul,
+    Div,
+    Mod,
+}
 
-    fn debug_dump_impl(&self, depth: usize) {
-        for _ in 0..depth {
-            print!("\t",);
-        }
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum StringOp {
+    Match,
+    Index,
+    And,
+    Or,
+}
+
+impl BinOp {
+    fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<String> {
         match self {
-            Self::Leaf { token_idx, value } => println!(
-                "Leaf( {} ) at #{} ( evaluate -> {:?} )",
-                value,
-                token_idx,
-                self.evaluate()
-            ),
-            Self::Node {
-                token_idx,
-                op_type,
-                operands,
-            } => {
-                println!(
-                    "Node( {} ) at #{} ( evaluate -> {:?} )",
-                    op_type,
-                    token_idx,
-                    self.evaluate()
-                );
-                for operand in operands {
-                    operand.debug_dump_impl(depth + 1);
-                }
-            }
+            Self::Relation(op) => op.eval(left, right),
+            Self::Numeric(op) => op.eval(left, right),
+            Self::String(op) => op.eval(left, right),
         }
     }
+}
 
-    fn new_node(token_idx: usize, op_type: &str, operands: OperandsList) -> Box<Self> {
-        Box::new(Self::Node {
-            token_idx,
-            op_type: op_type.into(),
-            operands,
-        })
-    }
-
-    fn new_leaf(token_idx: usize, value: &str) -> Box<Self> {
-        Box::new(Self::Leaf {
-            token_idx,
-            value: value.into(),
-        })
+impl RelationOp {
+    fn eval(&self, a: &AstNode, b: &AstNode) -> ExprResult<String> {
+        let a = a.eval()?;
+        let b = b.eval()?;
+        let b = if let (Ok(a), Ok(b)) = (a.parse::<BigInt>(), b.parse::<BigInt>()) {
+            match self {
+                Self::Lt => a < b,
+                Self::Leq => a <= b,
+                Self::Eq => a == b,
+                Self::Neq => a != b,
+                Self::Gt => a > b,
+                Self::Geq => a >= b,
+            }
+        } else {
+            // These comparisons should be using locale settings
+            match self {
+                Self::Lt => a < b,
+                Self::Leq => a <= b,
+                Self::Eq => a == b,
+                Self::Neq => a != b,
+                Self::Gt => a > b,
+                Self::Geq => a >= b,
+            }
+        };
+        if b {
+            Ok("1".into())
+        } else {
+            Ok("0".into())
+        }
     }
+}
 
-    pub fn evaluate(&self) -> Result<String, String> {
-        match self {
-            Self::Leaf { value, .. } => Ok(value.clone()),
-            Self::Node { op_type, .. } => match self.operand_values() {
-                Err(reason) => Err(reason),
-                Ok(operand_values) => match op_type.as_ref() {
-                    "+" => {
-                        infix_operator_two_ints(|a: BigInt, b: BigInt| Ok(a + b), &operand_values)
-                    }
-                    "-" => {
-                        infix_operator_two_ints(|a: BigInt, b: BigInt| Ok(a - b), &operand_values)
-                    }
-                    "*" => {
-                        infix_operator_two_ints(|a: BigInt, b: BigInt| Ok(a * b), &operand_values)
-                    }
-                    "/" => infix_operator_two_ints(
-                        |a: BigInt, b: BigInt| {
-                            if b.is_zero() {
-                                Err("division by zero".to_owned())
-                            } else {
-                                Ok(a / b)
-                            }
-                        },
-                        &operand_values,
-                    ),
-                    "%" => infix_operator_two_ints(
-                        |a: BigInt, b: BigInt| {
-                            if b.is_zero() {
-                                Err("division by zero".to_owned())
-                            } else {
-                                Ok(a % b)
-                            }
-                        },
-                        &operand_values,
-                    ),
-                    "=" => infix_operator_two_ints_or_two_strings(
-                        |a: BigInt, b: BigInt| Ok(bool_as_int(a == b)),
-                        |a: &String, b: &String| Ok(bool_as_string(a == b)),
-                        &operand_values,
-                    ),
-                    "!=" => infix_operator_two_ints_or_two_strings(
-                        |a: BigInt, b: BigInt| Ok(bool_as_int(a != b)),
-                        |a: &String, b: &String| Ok(bool_as_string(a != b)),
-                        &operand_values,
-                    ),
-                    "<" => infix_operator_two_ints_or_two_strings(
-                        |a: BigInt, b: BigInt| Ok(bool_as_int(a < b)),
-                        |a: &String, b: &String| Ok(bool_as_string(a < b)),
-                        &operand_values,
-                    ),
-                    ">" => infix_operator_two_ints_or_two_strings(
-                        |a: BigInt, b: BigInt| Ok(bool_as_int(a > b)),
-                        |a: &String, b: &String| Ok(bool_as_string(a > b)),
-                        &operand_values,
-                    ),
-                    "<=" => infix_operator_two_ints_or_two_strings(
-                        |a: BigInt, b: BigInt| Ok(bool_as_int(a <= b)),
-                        |a: &String, b: &String| Ok(bool_as_string(a <= b)),
-                        &operand_values,
-                    ),
-                    ">=" => infix_operator_two_ints_or_two_strings(
-                        |a: BigInt, b: BigInt| Ok(bool_as_int(a >= b)),
-                        |a: &String, b: &String| Ok(bool_as_string(a >= b)),
-                        &operand_values,
-                    ),
-                    "|" => Ok(infix_operator_or(&operand_values)),
-                    "&" => Ok(infix_operator_and(&operand_values)),
-                    ":" | "match" => operator_match(&operand_values),
-                    "length" => Ok(prefix_operator_length(&operand_values)),
-                    "index" => Ok(prefix_operator_index(&operand_values)),
-                    "substr" => Ok(prefix_operator_substr(&operand_values)),
-
-                    _ => Err(format!("operation not implemented: {op_type}")),
-                },
+impl NumericOp {
+    fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<String> {
+        let a: BigInt = left
+            .eval()?
+            .parse()
+            .map_err(|_| ExprError::NonIntegerArgument)?;
+        let b: BigInt = right
+            .eval()?
+            .parse()
+            .map_err(|_| ExprError::NonIntegerArgument)?;
+        Ok(match self {
+            Self::Add => a + b,
+            Self::Sub => a - b,
+            Self::Mul => a * b,
+            Self::Div => match a.checked_div(&b) {
+                Some(x) => x,
+                None => return Err(ExprError::DivisionByZero),
             },
+            Self::Mod => {
+                if a.checked_div(&b).is_none() {
+                    return Err(ExprError::DivisionByZero);
+                };
+                a % b
+            }
         }
+        .to_string())
     }
+}
 
-    pub fn operand_values(&self) -> Result<Vec<String>, String> {
-        if let Self::Node {
-            operands, op_type, ..
-        } = self
-        {
-            let mut out = Vec::with_capacity(operands.len());
-            let mut operands = operands.iter();
-
-            if let Some(value) = operands.next() {
-                let value = value.evaluate()?;
-                out.push(value.clone());
-                // short-circuit evaluation for `|` and `&`
-                // push dummy to pass `assert!(values.len() == 2);`
-                match op_type.as_ref() {
-                    "|" => {
-                        if value_as_bool(&value) {
-                            out.push(String::from("dummy"));
-                            return Ok(out);
-                        }
-                    }
-                    "&" => {
-                        if !value_as_bool(&value) {
-                            out.push(String::from("dummy"));
-                            return Ok(out);
+impl StringOp {
+    fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<String> {
+        match self {
+            Self::Or => {
+                let left = left.eval()?;
+                if is_truthy(&left) {
+                    return Ok(left);
+                }
+                let right = right.eval()?;
+                if is_truthy(&right) {
+                    return Ok(right);
+                }
+                Ok("0".into())
+            }
+            Self::And => {
+                let left = left.eval()?;
+                if !is_truthy(&left) {
+                    return Ok("0".into());
+                }
+                let right = right.eval()?;
+                if !is_truthy(&right) {
+                    return Ok("0".into());
+                }
+                Ok(left)
+            }
+            Self::Match => {
+                let left = left.eval()?;
+                let right = right.eval()?;
+                let re_string = format!("^{}", &right);
+                let re = Regex::with_options(
+                    &re_string,
+                    RegexOptions::REGEX_OPTION_NONE,
+                    Syntax::grep(),
+                )
+                .map_err(|_| ExprError::InvalidRegexExpression)?;
+                Ok(if re.captures_len() > 0 {
+                    re.captures(&left)
+                        .map(|captures| captures.at(1).unwrap())
+                        .unwrap_or("")
+                        .to_string()
+                } else {
+                    re.find(&left)
+                        .map_or("0".to_string(), |(start, end)| (end - start).to_string())
+                })
+            }
+            Self::Index => {
+                let left = left.eval()?;
+                let right = right.eval()?;
+                for (current_idx, ch_h) in left.chars().enumerate() {
+                    for ch_n in right.chars() {
+                        if ch_n == ch_h {
+                            return Ok((current_idx + 1).to_string());
                         }
                     }
-                    _ => {}
                 }
+                Ok("0".to_string())
             }
-
-            for operand in operands {
-                let value = operand.evaluate()?;
-                out.push(value);
-            }
-            Ok(out)
-        } else {
-            panic!("Invoked .operand_values(&self) not with ASTNode::Node")
         }
     }
 }
 
-pub fn tokens_to_ast(
-    maybe_tokens: Result<Vec<(usize, Token)>, String>,
-) -> Result<Box<AstNode>, String> {
-    maybe_tokens.and_then(|tokens| {
-        let mut out_stack: TokenStack = Vec::new();
-        let mut op_stack: TokenStack = Vec::new();
-
-        for (token_idx, token) in tokens {
-            push_token_to_either_stack(token_idx, &token, &mut out_stack, &mut op_stack)?;
-        }
-        move_rest_of_ops_to_out(&mut out_stack, &mut op_stack)?;
-        assert!(op_stack.is_empty());
-
-        maybe_dump_rpn(&out_stack);
-        let result = ast_from_rpn(&mut out_stack);
-        if out_stack.is_empty() {
-            maybe_dump_ast(&result);
-            result
-        } else {
-            Err(
-                "syntax error (first RPN token does not represent the root of the expression AST)"
-                    .to_owned(),
-            )
-        }
-    })
+/// Precedence for infix binary operators
+const PRECEDENCE: &[&[(&str, BinOp)]] = &[
+    &[("|", BinOp::String(StringOp::Or))],
+    &[("&", BinOp::String(StringOp::And))],
+    &[
+        ("<", BinOp::Relation(RelationOp::Lt)),
+        ("<=", BinOp::Relation(RelationOp::Leq)),
+        ("=", BinOp::Relation(RelationOp::Eq)),
+        ("!=", BinOp::Relation(RelationOp::Neq)),
+        (">=", BinOp::Relation(RelationOp::Geq)),
+        (">", BinOp::Relation(RelationOp::Gt)),
+    ],
+    &[
+        ("+", BinOp::Numeric(NumericOp::Add)),
+        ("-", BinOp::Numeric(NumericOp::Sub)),
+    ],
+    &[
+        ("*", BinOp::Numeric(NumericOp::Mul)),
+        ("/", BinOp::Numeric(NumericOp::Div)),
+        ("%", BinOp::Numeric(NumericOp::Mod)),
+    ],
+    &[(":", BinOp::String(StringOp::Match))],
+];
+
+#[derive(Debug, PartialEq, Eq)]
+pub enum AstNode {
+    Leaf {
+        value: String,
+    },
+    BinOp {
+        op_type: BinOp,
+        left: Box<AstNode>,
+        right: Box<AstNode>,
+    },
+    Substr {
+        string: Box<AstNode>,
+        pos: Box<AstNode>,
+        length: Box<AstNode>,
+    },
+    Length {
+        string: Box<AstNode>,
+    },
 }
 
-fn maybe_dump_ast(result: &Result<Box<AstNode>, String>) {
-    use std::env;
-    if let Ok(debug_var) = env::var("EXPR_DEBUG_AST") {
-        if debug_var == "1" {
-            println!("EXPR_DEBUG_AST");
-            match result {
-                Ok(ast) => ast.debug_dump(),
-                Err(reason) => println!("\terr: {reason:?}"),
-            }
-        }
+impl AstNode {
+    pub fn parse(input: &[&str]) -> ExprResult<Self> {
+        Parser::new(input).parse()
     }
-}
 
-#[allow(clippy::ptr_arg)]
-fn maybe_dump_rpn(rpn: &TokenStack) {
-    use std::env;
-    if let Ok(debug_var) = env::var("EXPR_DEBUG_RPN") {
-        if debug_var == "1" {
-            println!("EXPR_DEBUG_RPN");
-            for token in rpn {
-                println!("\t{token:?}");
+    pub fn eval(&self) -> ExprResult<String> {
+        match self {
+            Self::Leaf { value } => Ok(value.into()),
+            Self::BinOp {
+                op_type,
+                left,
+                right,
+            } => op_type.eval(left, right),
+            Self::Substr {
+                string,
+                pos,
+                length,
+            } => {
+                let string = string.eval()?;
+
+                // The GNU docs say:
+                //
+                // > If either position or length is negative, zero, or
+                // > non-numeric, returns the null string.
+                //
+                // So we coerce errors into 0 to make that the only case we
+                // have to care about.
+                let pos: usize = pos.eval()?.parse().unwrap_or(0);
+                let length: usize = length.eval()?.parse().unwrap_or(0);
+
+                let (Some(pos), Some(_)) = (pos.checked_sub(1), length.checked_sub(1)) else {
+                    return Ok(String::new());
+                };
+
+                Ok(string.chars().skip(pos).take(length).collect())
             }
+            Self::Length { string } => Ok(string.eval()?.chars().count().to_string()),
         }
     }
 }
 
-fn ast_from_rpn(rpn: &mut TokenStack) -> Result<Box<AstNode>, String> {
-    match rpn.pop() {
-        None => Err("syntax error (premature end of expression)".to_owned()),
-        Some((token_idx, Token::Value { value })) => Ok(AstNode::new_leaf(token_idx, &value)),
+struct Parser<'a> {
+    input: &'a [&'a str],
+    index: usize,
+}
+
+impl<'a> Parser<'a> {
+    fn new(input: &'a [&'a str]) -> Self {
+        Self { input, index: 0 }
+    }
 
-        Some((token_idx, Token::InfixOp { value, .. })) => {
-            maybe_ast_node(token_idx, &value, 2, rpn)
+    fn next(&mut self) -> ExprResult<&'a str> {
+        let next = self.input.get(self.index);
+        if let Some(next) = next {
+            self.index += 1;
+            Ok(next)
+        } else {
+            // The indexing won't panic, because we know that the input size
+            // is greater than zero.
+            Err(ExprError::MissingArgument(
+                self.input[self.index - 1].into(),
+            ))
         }
+    }
 
-        Some((token_idx, Token::PrefixOp { value, arity })) => {
-            maybe_ast_node(token_idx, &value, arity, rpn)
+    fn accept<T>(&mut self, f: impl Fn(&str) -> Option<T>) -> Option<T> {
+        let next = self.input.get(self.index)?;
+        let tok = f(next);
+        if let Some(tok) = tok {
+            self.index += 1;
+            Some(tok)
+        } else {
+            None
         }
+    }
 
-        Some((token_idx, unexpected_token)) => {
-            panic!("unexpected token at #{token_idx} {unexpected_token:?}")
+    fn parse(&mut self) -> ExprResult<AstNode> {
+        if self.input.is_empty() {
+            return Err(ExprError::MissingOperand);
+        }
+        let res = self.parse_expression()?;
+        if let Some(arg) = self.input.get(self.index) {
+            return Err(ExprError::UnexpectedArgument(arg.to_string()));
         }
+        Ok(res)
     }
-}
 
-fn maybe_ast_node(
-    token_idx: usize,
-    op_type: &str,
-    arity: usize,
-    rpn: &mut TokenStack,
-) -> Result<Box<AstNode>, String> {
-    let mut operands = Vec::with_capacity(arity);
-    for _ in 0..arity {
-        let operand = ast_from_rpn(rpn)?;
-        operands.push(operand);
+    fn parse_expression(&mut self) -> ExprResult<AstNode> {
+        self.parse_precedence(0)
     }
-    operands.reverse();
-    Ok(AstNode::new_node(token_idx, op_type, operands))
-}
 
-fn move_rest_of_ops_to_out(
-    out_stack: &mut TokenStack,
-    op_stack: &mut TokenStack,
-) -> Result<(), String> {
-    loop {
-        match op_stack.pop() {
-            None => return Ok(()),
-            Some((token_idx, Token::ParOpen)) => {
-                return Err(format!(
-                    "syntax error (Mismatched open-parenthesis at #{token_idx})"
-                ))
-            }
-            Some((token_idx, Token::ParClose)) => {
-                return Err(format!(
-                    "syntax error (Mismatched close-parenthesis at #{token_idx})"
-                ))
+    fn parse_op(&mut self, precedence: usize) -> Option<BinOp> {
+        self.accept(|s| {
+            for (op_string, op) in PRECEDENCE[precedence] {
+                if s == *op_string {
+                    return Some(*op);
+                }
             }
-            Some(other) => out_stack.push(other),
-        }
+            None
+        })
     }
-}
 
-fn push_token_to_either_stack(
-    token_idx: usize,
-    token: &Token,
-    out_stack: &mut TokenStack,
-    op_stack: &mut TokenStack,
-) -> Result<(), String> {
-    let result = match token {
-        Token::Value { .. } => {
-            out_stack.push((token_idx, token.clone()));
-            Ok(())
+    fn parse_precedence(&mut self, precedence: usize) -> ExprResult<AstNode> {
+        if precedence >= PRECEDENCE.len() {
+            return self.parse_simple_expression();
         }
 
-        Token::InfixOp { .. } => {
-            if op_stack.is_empty() {
-                op_stack.push((token_idx, token.clone()));
-                Ok(())
-            } else {
-                push_op_to_stack(token_idx, token, out_stack, op_stack)
-            }
+        let mut left = self.parse_precedence(precedence + 1)?;
+        while let Some(op) = self.parse_op(precedence) {
+            let right = self.parse_precedence(precedence + 1)?;
+            left = AstNode::BinOp {
+                op_type: op,
+                left: Box::new(left),
+                right: Box::new(right),
+            };
         }
+        Ok(left)
+    }
 
-        Token::ParOpen => {
-            if out_stack.is_empty() {
-                op_stack.push((token_idx, token.clone()));
-                Ok(())
-            } else {
-                Err("syntax error: unexpected argument '('".to_string())
+    fn parse_simple_expression(&mut self) -> ExprResult<AstNode> {
+        let first = self.next()?;
+        Ok(match first {
+            "match" => {
+                let left = self.parse_expression()?;
+                let right = self.parse_expression()?;
+                AstNode::BinOp {
+                    op_type: BinOp::String(StringOp::Match),
+                    left: Box::new(left),
+                    right: Box::new(right),
+                }
             }
-        }
-
-        Token::PrefixOp { value, .. } => {
-            if out_stack.is_empty() {
-                op_stack.push((token_idx, token.clone()));
-                Ok(())
-            } else {
-                Err(format!(
-                    "syntax error: unexpected argument {}",
-                    value.quote()
-                ))
+            "substr" => {
+                let string = self.parse_expression()?;
+                let pos = self.parse_expression()?;
+                let length = self.parse_expression()?;
+                AstNode::Substr {
+                    string: Box::new(string),
+                    pos: Box::new(pos),
+                    length: Box::new(length),
+                }
             }
-        }
-
-        Token::ParClose => move_till_match_paren(out_stack, op_stack),
-    };
-    maybe_dump_shunting_yard_step(token_idx, token, out_stack, op_stack, &result);
-    result
-}
-
-#[allow(clippy::ptr_arg)]
-fn maybe_dump_shunting_yard_step(
-    token_idx: usize,
-    token: &Token,
-    out_stack: &TokenStack,
-    op_stack: &TokenStack,
-    result: &Result<(), String>,
-) {
-    use std::env;
-    if let Ok(debug_var) = env::var("EXPR_DEBUG_SYA_STEP") {
-        if debug_var == "1" {
-            println!("EXPR_DEBUG_SYA_STEP");
-            println!("\t{token_idx} => {token:?}");
-            println!("\t\tout: {out_stack:?}");
-            println!("\t\top : {op_stack:?}");
-            println!("\t\tresult: {result:?}");
-        }
-    }
-}
-
-fn push_op_to_stack(
-    token_idx: usize,
-    token: &Token,
-    out_stack: &mut TokenStack,
-    op_stack: &mut TokenStack,
-) -> Result<(), String> {
-    if let Token::InfixOp {
-        precedence: prec,
-        left_assoc: la,
-        ..
-    } = *token
-    {
-        loop {
-            match op_stack.last() {
-                None | Some(&(_, Token::ParOpen)) => {
-                    op_stack.push((token_idx, token.clone()));
-                    return Ok(());
+            "index" => {
+                let left = self.parse_expression()?;
+                let right = self.parse_expression()?;
+                AstNode::BinOp {
+                    op_type: BinOp::String(StringOp::Index),
+                    left: Box::new(left),
+                    right: Box::new(right),
                 }
-
-                Some(&(
-                    _,
-                    Token::InfixOp {
-                        precedence: prev_prec,
-                        ..
-                    },
-                )) => {
-                    if la && prev_prec >= prec || !la && prev_prec > prec {
-                        out_stack.push(op_stack.pop().unwrap());
-                    } else {
-                        op_stack.push((token_idx, token.clone()));
-                        return Ok(());
-                    }
+            }
+            "length" => {
+                let string = self.parse_expression()?;
+                AstNode::Length {
+                    string: Box::new(string),
                 }
-
-                Some(&(_, Token::PrefixOp { .. })) => {
-                    op_stack.push((token_idx, token.clone()));
-                    return Ok(());
+            }
+            "+" => AstNode::Leaf {
+                value: self.next()?.into(),
+            },
+            "(" => {
+                let s = self.parse_expression()?;
+                let close_paren = self.next()?;
+                if close_paren != ")" {
+                    // Since we have parsed at least a '(', there will be a token
+                    // at `self.index - 1`. So this indexing won't panic.
+                    return Err(ExprError::ExpectedClosingBraceAfter(
+                        self.input[self.index - 1].into(),
+                    ));
                 }
-
-                Some(_) => panic!("Non-operator on op_stack"),
+                s
             }
-        }
-    } else {
-        panic!("Expected infix-op")
+            s => AstNode::Leaf { value: s.into() },
+        })
     }
 }
 
-fn move_till_match_paren(
-    out_stack: &mut TokenStack,
-    op_stack: &mut TokenStack,
-) -> Result<(), String> {
-    loop {
-        let op = op_stack
-            .pop()
-            .ok_or_else(|| "syntax error (Mismatched close-parenthesis)".to_string())?;
-        match op {
-            (_, Token::ParOpen) => return Ok(()),
-            other => out_stack.push(other),
-        }
+/// Determine whether `expr` should evaluate the string as "truthy"
+///
+/// Truthy strings are either empty or match the regex "-?0+".
+pub fn is_truthy(s: &str) -> bool {
+    // Edge case: `-` followed by nothing is truthy
+    if s == "-" {
+        return true;
     }
+
+    let mut bytes = s.bytes();
+
+    // Empty string is falsy
+    let Some(first) = bytes.next() else {
+        return false;
+    };
+
+    let is_zero = (first == b'-' || first == b'0') && bytes.all(|b| b == b'0');
+    !is_zero
 }
 
-fn infix_operator_two_ints<F>(f: F, values: &[String]) -> Result<String, String>
-where
-    F: Fn(BigInt, BigInt) -> Result<BigInt, String>,
-{
-    assert!(values.len() == 2);
-    if let Ok(left) = values[0].parse::<BigInt>() {
-        if let Ok(right) = values[1].parse::<BigInt>() {
-            return f(left, right).map(|big_int| big_int.to_string());
+#[cfg(test)]
+mod test {
+    use super::{AstNode, BinOp, NumericOp, RelationOp, StringOp};
+
+    impl From<&str> for AstNode {
+        fn from(value: &str) -> Self {
+            Self::Leaf {
+                value: value.into(),
+            }
         }
     }
-    Err("Expected an integer operand".to_string())
-}
 
-fn infix_operator_two_ints_or_two_strings<FI, FS>(
-    fi: FI,
-    fs: FS,
-    values: &[String],
-) -> Result<String, String>
-where
-    FI: Fn(BigInt, BigInt) -> Result<u8, String>,
-    FS: Fn(&String, &String) -> Result<String, String>,
-{
-    assert!(values.len() == 2);
-    if let (Some(a_int), Some(b_int)) = (
-        values[0].parse::<BigInt>().ok(),
-        values[1].parse::<BigInt>().ok(),
-    ) {
-        match fi(a_int, b_int) {
-            Ok(result) => Ok(result.to_string()),
-            Err(reason) => Err(reason),
+    fn op(op_type: BinOp, left: impl Into<AstNode>, right: impl Into<AstNode>) -> AstNode {
+        AstNode::BinOp {
+            op_type,
+            left: Box::new(left.into()),
+            right: Box::new(right.into()),
         }
-    } else {
-        fs(&values[0], &values[1])
     }
-}
 
-fn infix_operator_or(values: &[String]) -> String {
-    assert!(values.len() == 2);
-    if value_as_bool(&values[0]) {
-        values[0].clone()
-    } else if value_as_bool(&values[1]) {
-        values[1].clone()
-    } else {
-        0.to_string()
+    fn length(string: impl Into<AstNode>) -> AstNode {
+        AstNode::Length {
+            string: Box::new(string.into()),
+        }
     }
-}
 
-fn infix_operator_and(values: &[String]) -> String {
-    assert!(values.len() == 2);
-    if value_as_bool(&values[0]) && value_as_bool(&values[1]) {
-        values[0].clone()
-    } else {
-        0.to_string()
+    fn substr(
+        string: impl Into<AstNode>,
+        pos: impl Into<AstNode>,
+        length: impl Into<AstNode>,
+    ) -> AstNode {
+        AstNode::Substr {
+            string: Box::new(string.into()),
+            pos: Box::new(pos.into()),
+            length: Box::new(length.into()),
+        }
     }
-}
 
-fn operator_match(values: &[String]) -> Result<String, String> {
-    assert!(values.len() == 2);
-    let re_string = format!("^{}", &values[1]);
-    let re = Regex::with_options(&re_string, RegexOptions::REGEX_OPTION_NONE, Syntax::grep())
-        .map_err(|err| err.description().to_string())?;
-    Ok(if re.captures_len() > 0 {
-        re.captures(&values[0])
-            .map(|captures| captures.at(1).unwrap())
-            .unwrap_or("")
-            .to_string()
-    } else {
-        re.find(&values[0])
-            .map_or("0".to_string(), |(start, end)| (end - start).to_string())
-    })
-}
-
-fn prefix_operator_length(values: &[String]) -> String {
-    assert!(values.len() == 1);
-    // Use chars().count() as we can have some multibytes chars
-    // See https://github.com/uutils/coreutils/issues/3132
-    values[0].chars().count().to_string()
-}
-
-fn prefix_operator_index(values: &[String]) -> String {
-    assert!(values.len() == 2);
-    let haystack = &values[0];
-    let needles = &values[1];
-
-    for (current_idx, ch_h) in haystack.chars().enumerate() {
-        for ch_n in needles.chars() {
-            if ch_n == ch_h {
-                return (current_idx + 1).to_string();
-            }
+    #[test]
+    fn infix_operators() {
+        let cases = [
+            ("|", BinOp::String(StringOp::Or)),
+            ("&", BinOp::String(StringOp::And)),
+            ("<", BinOp::Relation(RelationOp::Lt)),
+            ("<=", BinOp::Relation(RelationOp::Leq)),
+            ("=", BinOp::Relation(RelationOp::Eq)),
+            ("!=", BinOp::Relation(RelationOp::Neq)),
+            (">=", BinOp::Relation(RelationOp::Geq)),
+            (">", BinOp::Relation(RelationOp::Gt)),
+            ("+", BinOp::Numeric(NumericOp::Add)),
+            ("-", BinOp::Numeric(NumericOp::Sub)),
+            ("*", BinOp::Numeric(NumericOp::Mul)),
+            ("/", BinOp::Numeric(NumericOp::Div)),
+            ("%", BinOp::Numeric(NumericOp::Mod)),
+            (":", BinOp::String(StringOp::Match)),
+        ];
+        for (string, value) in cases {
+            assert_eq!(AstNode::parse(&["1", string, "2"]), Ok(op(value, "1", "2")));
         }
     }
-    "0".to_string()
-}
-
-fn prefix_operator_substr(values: &[String]) -> String {
-    assert!(values.len() == 3);
-    let subj = &values[0];
-    let idx = match values[1]
-        .parse::<usize>()
-        .ok()
-        .and_then(|v| v.checked_sub(1))
-    {
-        Some(i) => i,
-        None => return String::new(),
-    };
-    let len = match values[2].parse::<usize>() {
-        Ok(i) => i,
-        Err(_) => return String::new(),
-    };
-
-    subj.chars().skip(idx).take(len).collect()
-}
-
-fn bool_as_int(b: bool) -> u8 {
-    u8::from(b)
-}
 
-fn bool_as_string(b: bool) -> String {
-    if b {
-        "1".to_string()
-    } else {
-        "0".to_string()
+    #[test]
+    fn other_operators() {
+        assert_eq!(
+            AstNode::parse(&["match", "1", "2"]),
+            Ok(op(BinOp::String(StringOp::Match), "1", "2")),
+        );
+        assert_eq!(
+            AstNode::parse(&["index", "1", "2"]),
+            Ok(op(BinOp::String(StringOp::Index), "1", "2")),
+        );
+        assert_eq!(AstNode::parse(&["length", "1"]), Ok(length("1")),);
+        assert_eq!(
+            AstNode::parse(&["substr", "1", "2", "3"]),
+            Ok(substr("1", "2", "3")),
+        );
     }
-}
 
-fn value_as_bool(s: &str) -> bool {
-    if s.is_empty() {
-        return false;
-    }
-    match s.parse::<BigInt>() {
-        Ok(n) => n != Zero::zero(),
-        Err(_) => true,
+    #[test]
+    fn precedence() {
+        assert_eq!(
+            AstNode::parse(&["1", "+", "2", "*", "3"]),
+            Ok(op(
+                BinOp::Numeric(NumericOp::Add),
+                "1",
+                op(BinOp::Numeric(NumericOp::Mul), "2", "3")
+            ))
+        );
+        assert_eq!(
+            AstNode::parse(&["(", "1", "+", "2", ")", "*", "3"]),
+            Ok(op(
+                BinOp::Numeric(NumericOp::Mul),
+                op(BinOp::Numeric(NumericOp::Add), "1", "2"),
+                "3"
+            ))
+        );
+        assert_eq!(
+            AstNode::parse(&["1", "*", "2", "+", "3"]),
+            Ok(op(
+                BinOp::Numeric(NumericOp::Add),
+                op(BinOp::Numeric(NumericOp::Mul), "1", "2"),
+                "3"
+            )),
+        );
     }
 }
diff --git a/src/uu/expr/src/tokens.rs b/src/uu/expr/src/tokens.rs
deleted file mode 100644
index f499881c138..00000000000
--- a/src/uu/expr/src/tokens.rs
+++ /dev/null
@@ -1,147 +0,0 @@
-// This file is part of the uutils coreutils package.
-//
-// For the full copyright and license information, please view the LICENSE
-// file that was distributed with this source code.
-
-//!
-//! The following tokens are present in the expr grammar:
-//! * integer literal;
-//! * string literal;
-//! * infix binary operators;
-//! * prefix operators.
-//!
-//! According to the man-page of expr we have expression split into tokens (each token -- separate CLI-argument).
-//! Hence all we need is to map the strings into the Token structures, except for some ugly fiddling with +-escaping.
-//!
-
-// spell-checker:ignore (ToDO) paren
-
-#[derive(Debug, Clone)]
-pub enum Token {
-    Value {
-        value: String,
-    },
-
-    ParOpen,
-    ParClose,
-
-    InfixOp {
-        precedence: u8,
-        left_assoc: bool,
-        value: String,
-    },
-
-    PrefixOp {
-        arity: usize,
-        value: String,
-    },
-}
-
-impl Token {
-    fn new_infix_op(v: &str, left_assoc: bool, precedence: u8) -> Self {
-        Self::InfixOp {
-            left_assoc,
-            precedence,
-            value: v.into(),
-        }
-    }
-
-    fn new_value(v: &str) -> Self {
-        Self::Value { value: v.into() }
-    }
-
-    fn is_infix_plus(&self) -> bool {
-        match self {
-            Self::InfixOp { value, .. } => value == "+",
-            _ => false,
-        }
-    }
-
-    fn is_a_value(&self) -> bool {
-        matches!(*self, Self::Value { .. })
-    }
-
-    fn is_a_close_paren(&self) -> bool {
-        matches!(*self, Self::ParClose)
-    }
-}
-
-pub fn strings_to_tokens(strings: &[&str]) -> Result<Vec<(usize, Token)>, String> {
-    let mut tokens_acc = Vec::with_capacity(strings.len());
-    let mut tok_idx = 1;
-
-    for s in strings {
-        let token_if_not_escaped = match *s {
-            "(" => Token::ParOpen,
-            ")" => Token::ParClose,
-
-            "^" => Token::new_infix_op(s, false, 7),
-
-            ":" => Token::new_infix_op(s, true, 6),
-
-            "*" | "/" | "%" => Token::new_infix_op(s, true, 5),
-
-            "+" | "-" => Token::new_infix_op(s, true, 4),
-
-            "=" | "!=" | "<" | ">" | "<=" | ">=" => Token::new_infix_op(s, true, 3),
-
-            "&" => Token::new_infix_op(s, true, 2),
-
-            "|" => Token::new_infix_op(s, true, 1),
-
-            "match" | "index" => Token::PrefixOp {
-                arity: 2,
-                value: s.to_string(),
-            },
-            "substr" => Token::PrefixOp {
-                arity: 3,
-                value: s.to_string(),
-            },
-            "length" => Token::PrefixOp {
-                arity: 1,
-                value: s.to_string(),
-            },
-
-            _ => Token::new_value(s),
-        };
-        push_token_if_not_escaped(&mut tokens_acc, tok_idx, token_if_not_escaped, s);
-        tok_idx += 1;
-    }
-    maybe_dump_tokens_acc(&tokens_acc);
-
-    Ok(tokens_acc)
-}
-
-fn maybe_dump_tokens_acc(tokens_acc: &[(usize, Token)]) {
-    use std::env;
-
-    if let Ok(debug_var) = env::var("EXPR_DEBUG_TOKENS") {
-        if debug_var == "1" {
-            println!("EXPR_DEBUG_TOKENS");
-            for token in tokens_acc {
-                println!("\t{token:?}");
-            }
-        }
-    }
-}
-
-fn push_token_if_not_escaped(acc: &mut Vec<(usize, Token)>, tok_idx: usize, token: Token, s: &str) {
-    // `+` may be escaped such as `expr + 1` and `expr 1 + + 1`
-    let prev_is_plus = match acc.last() {
-        None => false,
-        Some(t) => t.1.is_infix_plus(),
-    };
-    let should_use_as_escaped = if prev_is_plus && acc.len() >= 2 {
-        let pre_prev = &acc[acc.len() - 2];
-        !(pre_prev.1.is_a_value() || pre_prev.1.is_a_close_paren())
-    } else {
-        prev_is_plus
-    };
-
-    if should_use_as_escaped {
-        acc.pop();
-        acc.push((tok_idx, Token::new_value(s)));
-    } else {
-        acc.push((tok_idx, token));
-    }
-}

From 01c32a5220ef036bdc1d9bae8928336a815db619 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Tue, 28 Nov 2023 11:40:33 +0100
Subject: [PATCH 080/429] fmt: clean up some small bits

---
 src/uu/fmt/src/linebreak.rs |  37 +++---
 src/uu/fmt/src/parasplit.rs | 232 ++++++++++++++++++------------------
 2 files changed, 132 insertions(+), 137 deletions(-)

diff --git a/src/uu/fmt/src/linebreak.rs b/src/uu/fmt/src/linebreak.rs
index fbd990fff1e..7cd65d86149 100644
--- a/src/uu/fmt/src/linebreak.rs
+++ b/src/uu/fmt/src/linebreak.rs
@@ -46,7 +46,7 @@ pub fn break_lines(
     ostream: &mut BufWriter<Stdout>,
 ) -> std::io::Result<()> {
     // indent
-    let p_indent = &para.indent_str[..];
+    let p_indent = &para.indent_str;
     let p_indent_len = para.indent_len;
 
     // words
@@ -55,14 +55,12 @@ pub fn break_lines(
 
     // the first word will *always* appear on the first line
     // make sure of this here
-    let (w, w_len) = match p_words_words.next() {
-        Some(winfo) => (winfo.word, winfo.word_nchars),
-        None => {
-            return ostream.write_all(b"\n");
-        }
+    let Some(winfo) = p_words_words.next() else {
+        return ostream.write_all(b"\n");
     };
+
     // print the init, if it exists, and get its length
-    let p_init_len = w_len
+    let p_init_len = winfo.word_nchars
         + if opts.crown || opts.tagged {
             // handle "init" portion
             ostream.write_all(para.init_str.as_bytes())?;
@@ -75,8 +73,9 @@ pub fn break_lines(
             // except that mail headers get no indent at all
             0
         };
+
     // write first word after writing init
-    ostream.write_all(w.as_bytes())?;
+    ostream.write_all(winfo.word.as_bytes())?;
 
     // does this paragraph require uniform spacing?
     let uniform = para.mail_header || opts.uniform;
@@ -103,15 +102,16 @@ fn break_simple<'a, T: Iterator<Item = &'a WordInfo<'a>>>(
     mut iter: T,
     args: &mut BreakArgs<'a>,
 ) -> std::io::Result<()> {
-    iter.try_fold((args.init_len, false), |l, winfo| {
-        accum_words_simple(args, l, winfo)
+    iter.try_fold((args.init_len, false), |(l, prev_punct), winfo| {
+        accum_words_simple(args, l, prev_punct, winfo)
     })?;
     args.ostream.write_all(b"\n")
 }
 
 fn accum_words_simple<'a>(
     args: &mut BreakArgs<'a>,
-    (l, prev_punct): (usize, bool),
+    l: usize,
+    prev_punct: bool,
     winfo: &'a WordInfo<'a>,
 ) -> std::io::Result<(usize, bool)> {
     // compute the length of this word, considering how tabs will expand at this position on the line
@@ -233,14 +233,14 @@ fn find_kp_breakpoints<'a, T: Iterator<Item = &'a WordInfo<'a>>>(
         linebreak: None,
         break_before: false,
         demerits: 0,
-        prev_rat: 0.0f32,
+        prev_rat: 0.0,
         length: args.init_len,
         fresh: false,
     }];
     // this vec holds the current active linebreaks; next_ holds the breaks that will be active for
     // the next word
-    let active_breaks = &mut vec![0];
-    let next_active_breaks = &mut vec![];
+    let mut active_breaks = vec![0];
+    let mut next_active_breaks = vec![];
 
     let stretch = (args.opts.width - args.opts.goal) as isize;
     let minlength = args.opts.goal - stretch as usize;
@@ -248,10 +248,7 @@ fn find_kp_breakpoints<'a, T: Iterator<Item = &'a WordInfo<'a>>>(
     let mut is_sentence_start = false;
     let mut least_demerits = 0;
     loop {
-        let w = match iter.next() {
-            None => break,
-            Some(w) => w,
-        };
+        let Some(w) = iter.next() else { break };
 
         // if this is the last word, we don't add additional demerits for this break
         let (is_last_word, is_sentence_end) = match iter.peek() {
@@ -358,13 +355,13 @@ fn find_kp_breakpoints<'a, T: Iterator<Item = &'a WordInfo<'a>>>(
             least_demerits = cmp::max(ld_next, 0);
         }
         // swap in new list of active breaks
-        mem::swap(active_breaks, next_active_breaks);
+        mem::swap(&mut active_breaks, &mut next_active_breaks);
         // If this was the last word in a sentence, the next one must be the first in the next.
         is_sentence_start = is_sentence_end;
     }
 
     // return the best path
-    build_best_path(&linebreaks, active_breaks)
+    build_best_path(&linebreaks, &active_breaks)
 }
 
 fn build_best_path<'a>(paths: &[LineBreak<'a>], active: &[usize]) -> Vec<(&'a WordInfo<'a>, bool)> {
diff --git a/src/uu/fmt/src/parasplit.rs b/src/uu/fmt/src/parasplit.rs
index 68c8f78fa89..311ddbc9b83 100644
--- a/src/uu/fmt/src/parasplit.rs
+++ b/src/uu/fmt/src/parasplit.rs
@@ -52,18 +52,22 @@ impl Line {
     }
 }
 
-// each line's prefix has to be considered to know whether to merge it with
-// the next line or not
+/// Each line's prefix has to be considered to know whether to merge it with
+/// the next line or not
 #[derive(Debug)]
 pub struct FileLine {
     line: String,
-    indent_end: usize, // the end of the indent, always the start of the text
-    pfxind_end: usize, // the end of the PREFIX's indent, that is, the spaces before the prefix
-    indent_len: usize, // display length of indent taking into account tabs
-    prefix_len: usize, // PREFIX indent length taking into account tabs
+    /// The end of the indent, always the start of the text
+    indent_end: usize,
+    /// The end of the PREFIX's indent, that is, the spaces before the prefix
+    pfxind_end: usize,
+    /// Display length of indent taking into account tabs
+    indent_len: usize,
+    /// PREFIX indent length taking into account tabs
+    prefix_len: usize,
 }
 
-// iterator that produces a stream of Lines from a file
+/// Iterator that produces a stream of Lines from a file
 pub struct FileLines<'a> {
     opts: &'a FmtOptions,
     lines: Lines<&'a mut FileOrStdReader>,
@@ -74,7 +78,7 @@ impl<'a> FileLines<'a> {
         FileLines { opts, lines }
     }
 
-    // returns true if this line should be formatted
+    /// returns true if this line should be formatted
     fn match_prefix(&self, line: &str) -> (bool, usize) {
         if !self.opts.use_prefix {
             return (true, 0);
@@ -83,7 +87,7 @@ impl<'a> FileLines<'a> {
         FileLines::match_prefix_generic(&self.opts.prefix[..], line, self.opts.xprefix)
     }
 
-    // returns true if this line should be formatted
+    /// returns true if this line should be formatted
     fn match_anti_prefix(&self, line: &str) -> bool {
         if !self.opts.use_anti_prefix {
             return true;
@@ -148,13 +152,7 @@ impl<'a> Iterator for FileLines<'a> {
     type Item = Line;
 
     fn next(&mut self) -> Option<Line> {
-        let n = match self.lines.next() {
-            Some(t) => match t {
-                Ok(tt) => tt,
-                Err(_) => return None,
-            },
-            None => return None,
-        };
+        let n = self.lines.next()?.ok()?;
 
         // if this line is entirely whitespace,
         // emit a blank line
@@ -205,24 +203,33 @@ impl<'a> Iterator for FileLines<'a> {
     }
 }
 
-// a paragraph : a collection of FileLines that are to be formatted
-// plus info about the paragraph's indentation
-// (but we only retain the String from the FileLine; the other info
-// is only there to help us in deciding how to merge lines into Paragraphs
+/// A paragraph : a collection of FileLines that are to be formatted
+/// plus info about the paragraph's indentation
+///
+/// We only retain the String from the FileLine; the other info
+/// is only there to help us in deciding how to merge lines into Paragraphs
 #[derive(Debug)]
 pub struct Paragraph {
-    lines: Vec<String>,     // the lines of the file
-    pub init_str: String,   // string representing the init, that is, the first line's indent
-    pub init_len: usize,    // printable length of the init string considering TABWIDTH
-    init_end: usize,        // byte location of end of init in first line String
-    pub indent_str: String, // string representing indent
-    pub indent_len: usize,  // length of above
-    indent_end: usize, // byte location of end of indent (in crown and tagged mode, only applies to 2nd line and onward)
-    pub mail_header: bool, // we need to know if this is a mail header because we do word splitting differently in that case
+    /// the lines of the file
+    lines: Vec<String>,
+    /// string representing the init, that is, the first line's indent
+    pub init_str: String,
+    /// printable length of the init string considering TABWIDTH    
+    pub init_len: usize,
+    /// byte location of end of init in first line String
+    init_end: usize,
+    /// string representing indent
+    pub indent_str: String,
+    /// length of above
+    pub indent_len: usize,
+    /// byte location of end of indent (in crown and tagged mode, only applies to 2nd line and onward)
+    indent_end: usize,
+    /// we need to know if this is a mail header because we do word splitting differently in that case
+    pub mail_header: bool,
 }
 
-// an iterator producing a stream of paragraphs from a stream of lines
-// given a set of options.
+/// An iterator producing a stream of paragraphs from a stream of lines
+/// given a set of options.
 pub struct ParagraphStream<'a> {
     lines: Peekable<FileLines<'a>>,
     next_mail: bool,
@@ -240,7 +247,7 @@ impl<'a> ParagraphStream<'a> {
         }
     }
 
-    // detect RFC822 mail header
+    /// Detect RFC822 mail header
     fn is_mail_header(line: &FileLine) -> bool {
         // a mail header begins with either "From " (envelope sender line)
         // or with a sequence of printable ASCII chars (33 to 126, inclusive,
@@ -276,12 +283,9 @@ impl<'a> Iterator for ParagraphStream<'a> {
     #[allow(clippy::cognitive_complexity)]
     fn next(&mut self) -> Option<Result<Paragraph, String>> {
         // return a NoFormatLine in an Err; it should immediately be output
-        let noformat = match self.lines.peek() {
-            None => return None,
-            Some(l) => match *l {
-                Line::FormatLine(_) => false,
-                Line::NoFormatLine(_, _) => true,
-            },
+        let noformat = match self.lines.peek()? {
+            Line::FormatLine(_) => false,
+            Line::NoFormatLine(_, _) => true,
         };
 
         // found a NoFormatLine, immediately dump it out
@@ -305,95 +309,89 @@ impl<'a> Iterator for ParagraphStream<'a> {
         let mut in_mail = false;
         let mut second_done = false; // for when we use crown or tagged mode
         loop {
-            {
-                // peek ahead
-                // need to explicitly force fl out of scope before we can call self.lines.next()
-                let fl = match self.lines.peek() {
-                    None => break,
-                    Some(l) => match *l {
-                        Line::FormatLine(ref x) => x,
-                        Line::NoFormatLine(..) => break,
-                    },
-                };
+            // peek ahead
+            // need to explicitly force fl out of scope before we can call self.lines.next()
+            let Some(Line::FormatLine(fl)) = self.lines.peek() else {
+                break;
+            };
 
-                if p_lines.is_empty() {
-                    // first time through the loop, get things set up
-                    // detect mail header
-                    if self.opts.mail && self.next_mail && ParagraphStream::is_mail_header(fl) {
-                        in_mail = true;
-                        // there can't be any indent or pfxind because otherwise is_mail_header
-                        // would fail since there cannot be any whitespace before the colon in a
-                        // valid header field
-                        indent_str.push_str("  ");
-                        indent_len = 2;
+            if p_lines.is_empty() {
+                // first time through the loop, get things set up
+                // detect mail header
+                if self.opts.mail && self.next_mail && ParagraphStream::is_mail_header(fl) {
+                    in_mail = true;
+                    // there can't be any indent or pfxind because otherwise is_mail_header
+                    // would fail since there cannot be any whitespace before the colon in a
+                    // valid header field
+                    indent_str.push_str("  ");
+                    indent_len = 2;
+                } else {
+                    if self.opts.crown || self.opts.tagged {
+                        init_str.push_str(&fl.line[..fl.indent_end]);
+                        init_len = fl.indent_len;
+                        init_end = fl.indent_end;
                     } else {
-                        if self.opts.crown || self.opts.tagged {
-                            init_str.push_str(&fl.line[..fl.indent_end]);
-                            init_len = fl.indent_len;
-                            init_end = fl.indent_end;
-                        } else {
-                            second_done = true;
-                        }
-
-                        // these will be overwritten in the 2nd line of crown or tagged mode, but
-                        // we are not guaranteed to get to the 2nd line, e.g., if the next line
-                        // is a NoFormatLine or None. Thus, we set sane defaults the 1st time around
-                        indent_str.push_str(&fl.line[..fl.indent_end]);
-                        indent_len = fl.indent_len;
-                        indent_end = fl.indent_end;
-
-                        // save these to check for matching lines
-                        prefix_len = fl.prefix_len;
-                        pfxind_end = fl.pfxind_end;
-
-                        // in tagged mode, add 4 spaces of additional indenting by default
-                        // (gnu fmt's behavior is different: it seems to find the closest column to
-                        // indent_end that is divisible by 3. But honestly that behavior seems
-                        // pretty arbitrary.
-                        // Perhaps a better default would be 1 TABWIDTH? But ugh that's so big.
-                        if self.opts.tagged {
-                            indent_str.push_str("    ");
-                            indent_len += 4;
-                        }
-                    }
-                } else if in_mail {
-                    // lines following mail headers must begin with spaces
-                    if fl.indent_end == 0 || (self.opts.use_prefix && fl.pfxind_end == 0) {
-                        break; // this line does not begin with spaces
+                        second_done = true;
                     }
-                } else if !second_done {
-                    // now we have enough info to handle crown margin and tagged mode
 
-                    // in both crown and tagged modes we require that prefix_len is the same
-                    if prefix_len != fl.prefix_len || pfxind_end != fl.pfxind_end {
-                        break;
-                    }
-
-                    // in tagged mode, indent has to be *different* on following lines
-                    if self.opts.tagged
-                        && indent_len - 4 == fl.indent_len
-                        && indent_end == fl.indent_end
-                    {
-                        break;
-                    }
-
-                    // this is part of the same paragraph, get the indent info from this line
-                    indent_str.clear();
+                    // these will be overwritten in the 2nd line of crown or tagged mode, but
+                    // we are not guaranteed to get to the 2nd line, e.g., if the next line
+                    // is a NoFormatLine or None. Thus, we set sane defaults the 1st time around
                     indent_str.push_str(&fl.line[..fl.indent_end]);
                     indent_len = fl.indent_len;
                     indent_end = fl.indent_end;
 
-                    second_done = true;
-                } else {
-                    // detect mismatch
-                    if indent_end != fl.indent_end
-                        || pfxind_end != fl.pfxind_end
-                        || indent_len != fl.indent_len
-                        || prefix_len != fl.prefix_len
-                    {
-                        break;
+                    // save these to check for matching lines
+                    prefix_len = fl.prefix_len;
+                    pfxind_end = fl.pfxind_end;
+
+                    // in tagged mode, add 4 spaces of additional indenting by default
+                    // (gnu fmt's behavior is different: it seems to find the closest column to
+                    // indent_end that is divisible by 3. But honestly that behavior seems
+                    // pretty arbitrary.
+                    // Perhaps a better default would be 1 TABWIDTH? But ugh that's so big.
+                    if self.opts.tagged {
+                        indent_str.push_str("    ");
+                        indent_len += 4;
                     }
                 }
+            } else if in_mail {
+                // lines following mail headers must begin with spaces
+                if fl.indent_end == 0 || (self.opts.use_prefix && fl.pfxind_end == 0) {
+                    break; // this line does not begin with spaces
+                }
+            } else if !second_done {
+                // now we have enough info to handle crown margin and tagged mode
+
+                // in both crown and tagged modes we require that prefix_len is the same
+                if prefix_len != fl.prefix_len || pfxind_end != fl.pfxind_end {
+                    break;
+                }
+
+                // in tagged mode, indent has to be *different* on following lines
+                if self.opts.tagged
+                    && indent_len - 4 == fl.indent_len
+                    && indent_end == fl.indent_end
+                {
+                    break;
+                }
+
+                // this is part of the same paragraph, get the indent info from this line
+                indent_str.clear();
+                indent_str.push_str(&fl.line[..fl.indent_end]);
+                indent_len = fl.indent_len;
+                indent_end = fl.indent_end;
+
+                second_done = true;
+            } else {
+                // detect mismatch
+                if indent_end != fl.indent_end
+                    || pfxind_end != fl.pfxind_end
+                    || indent_len != fl.indent_len
+                    || prefix_len != fl.prefix_len
+                {
+                    break;
+                }
             }
 
             p_lines.push(self.lines.next().unwrap().get_formatline().line);
@@ -429,7 +427,7 @@ pub struct ParaWords<'a> {
 }
 
 impl<'a> ParaWords<'a> {
-    pub fn new<'b>(opts: &'b FmtOptions, para: &'b Paragraph) -> ParaWords<'b> {
+    pub fn new(opts: &'a FmtOptions, para: &'a Paragraph) -> Self {
         let mut pw = ParaWords {
             opts,
             para,

From d78923e4ccda95db136c358913a09642f4ee9729 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Tue, 28 Nov 2023 11:54:43 +0100
Subject: [PATCH 081/429] fmt: extract determining options to separate function

---
 src/uu/fmt/src/fmt.rs | 194 +++++++++++++++++++++---------------------
 1 file changed, 95 insertions(+), 99 deletions(-)

diff --git a/src/uu/fmt/src/fmt.rs b/src/uu/fmt/src/fmt.rs
index c30d923b76b..3a494c868e5 100644
--- a/src/uu/fmt/src/fmt.rs
+++ b/src/uu/fmt/src/fmt.rs
@@ -5,7 +5,7 @@
 
 // spell-checker:ignore (ToDO) PSKIP linebreak ostream parasplit tabwidth xanti xprefix
 
-use clap::{crate_version, Arg, ArgAction, Command};
+use clap::{crate_version, Arg, ArgAction, ArgMatches, Command};
 use std::cmp;
 use std::fs::File;
 use std::io::{stdin, stdout, Write};
@@ -40,6 +40,9 @@ static OPT_TAB_WIDTH: &str = "tab-width";
 
 static ARG_FILES: &str = "files";
 
+// by default, goal is 93% of width
+const DEFAULT_GOAL_TO_WIDTH_RATIO: usize = 93;
+
 pub type FileOrStdReader = BufReader<Box<dyn Read + 'static>>;
 pub struct FmtOptions {
     crown: bool,
@@ -59,25 +62,97 @@ pub struct FmtOptions {
     tabwidth: usize,
 }
 
-impl Default for FmtOptions {
-    fn default() -> Self {
-        Self {
-            crown: false,
-            tagged: false,
-            mail: false,
-            uniform: false,
-            quick: false,
-            split_only: false,
-            use_prefix: false,
-            prefix: String::new(),
-            xprefix: false,
-            use_anti_prefix: false,
-            anti_prefix: String::new(),
-            xanti_prefix: false,
-            width: 75,
-            goal: 70,
-            tabwidth: 8,
+impl FmtOptions {
+    fn from_matches(matches: &ArgMatches) -> UResult<Self> {
+        let mut tagged = matches.get_flag(OPT_TAGGED_PARAGRAPH);
+        let mut crown = matches.get_flag(OPT_CROWN_MARGIN);
+
+        let mail = matches.get_flag(OPT_PRESERVE_HEADERS);
+        let uniform = matches.get_flag(OPT_UNIFORM_SPACING);
+        let quick = matches.get_flag(OPT_QUICK);
+        let split_only = matches.get_flag(OPT_SPLIT_ONLY);
+
+        if crown {
+            tagged = false;
+        }
+        if split_only {
+            crown = false;
+            tagged = false;
+        }
+
+        let xprefix = matches.contains_id(OPT_EXACT_PREFIX);
+        let xanti_prefix = matches.contains_id(OPT_SKIP_PREFIX);
+
+        let mut prefix = String::new();
+        let mut use_prefix = false;
+        if let Some(s) = matches.get_one::<String>(OPT_PREFIX).map(String::from) {
+            prefix = s;
+            use_prefix = true;
+        };
+
+        let mut anti_prefix = String::new();
+        let mut use_anti_prefix = false;
+        if let Some(s) = matches.get_one::<String>(OPT_SKIP_PREFIX).map(String::from) {
+            anti_prefix = s;
+            use_anti_prefix = true;
+        };
+
+        let mut width = 75;
+        let mut goal = 70;
+        if let Some(w) = matches.get_one::<usize>(OPT_WIDTH) {
+            width = *w;
+            if width > MAX_WIDTH {
+                return Err(USimpleError::new(
+                    1,
+                    format!("invalid width: '{}': Numerical result out of range", width),
+                ));
+            }
+            goal = cmp::min(width * DEFAULT_GOAL_TO_WIDTH_RATIO / 100, width - 3);
+        };
+
+        if let Some(g) = matches.get_one::<usize>(OPT_GOAL) {
+            goal = *g;
+            if !matches.contains_id(OPT_WIDTH) {
+                width = cmp::max(goal * 100 / DEFAULT_GOAL_TO_WIDTH_RATIO, goal + 3);
+            } else if goal > width {
+                return Err(USimpleError::new(1, "GOAL cannot be greater than WIDTH."));
+            }
+        };
+
+        let mut tabwidth = 8;
+        if let Some(s) = matches.get_one::<String>(OPT_TAB_WIDTH) {
+            tabwidth = match s.parse::<usize>() {
+                Ok(t) => t,
+                Err(e) => {
+                    return Err(USimpleError::new(
+                        1,
+                        format!("Invalid TABWIDTH specification: {}: {}", s.quote(), e),
+                    ));
+                }
+            };
+        };
+
+        if tabwidth < 1 {
+            tabwidth = 1;
         }
+
+        Ok(Self {
+            crown,
+            tagged,
+            mail,
+            uniform,
+            quick,
+            split_only,
+            use_prefix,
+            prefix,
+            xprefix,
+            use_anti_prefix,
+            anti_prefix,
+            xanti_prefix,
+            width,
+            goal,
+            tabwidth,
+        })
     }
 }
 
@@ -90,12 +165,7 @@ impl Default for FmtOptions {
 /// # Returns
 ///
 /// A tuple containing a vector of file names and a `FmtOptions` struct.
-#[allow(clippy::cognitive_complexity)]
-#[allow(clippy::field_reassign_with_default)]
 fn parse_arguments(args: impl uucore::Args) -> UResult<(Vec<String>, FmtOptions)> {
-    // by default, goal is 93% of width
-    const DEFAULT_GOAL_TO_WIDTH_RATIO: usize = 93;
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let mut files: Vec<String> = matches
@@ -103,81 +173,7 @@ fn parse_arguments(args: impl uucore::Args) -> UResult<(Vec<String>, FmtOptions)
         .map(|v| v.map(ToString::to_string).collect())
         .unwrap_or_default();
 
-    let mut fmt_opts = FmtOptions::default();
-
-    fmt_opts.tagged = matches.get_flag(OPT_TAGGED_PARAGRAPH);
-    if matches.get_flag(OPT_CROWN_MARGIN) {
-        fmt_opts.crown = true;
-        fmt_opts.tagged = false;
-    }
-    fmt_opts.mail = matches.get_flag(OPT_PRESERVE_HEADERS);
-    fmt_opts.uniform = matches.get_flag(OPT_UNIFORM_SPACING);
-    fmt_opts.quick = matches.get_flag(OPT_QUICK);
-    if matches.get_flag(OPT_SPLIT_ONLY) {
-        fmt_opts.split_only = true;
-        fmt_opts.crown = false;
-        fmt_opts.tagged = false;
-    }
-    fmt_opts.xprefix = matches.contains_id(OPT_EXACT_PREFIX);
-    fmt_opts.xanti_prefix = matches.contains_id(OPT_SKIP_PREFIX);
-
-    if let Some(s) = matches.get_one::<String>(OPT_PREFIX).map(String::from) {
-        fmt_opts.prefix = s;
-        fmt_opts.use_prefix = true;
-    };
-
-    if let Some(s) = matches.get_one::<String>(OPT_SKIP_PREFIX).map(String::from) {
-        fmt_opts.anti_prefix = s;
-        fmt_opts.use_anti_prefix = true;
-    };
-
-    if let Some(width) = matches.get_one::<usize>(OPT_WIDTH) {
-        fmt_opts.width = *width;
-        if fmt_opts.width > MAX_WIDTH {
-            return Err(USimpleError::new(
-                1,
-                format!(
-                    "invalid width: '{}': Numerical result out of range",
-                    fmt_opts.width,
-                ),
-            ));
-        }
-        fmt_opts.goal = cmp::min(
-            fmt_opts.width * DEFAULT_GOAL_TO_WIDTH_RATIO / 100,
-            fmt_opts.width - 3,
-        );
-    };
-
-    if let Some(goal) = matches.get_one::<usize>(OPT_GOAL) {
-        fmt_opts.goal = *goal;
-        if !matches.contains_id(OPT_WIDTH) {
-            fmt_opts.width = cmp::max(
-                fmt_opts.goal * 100 / DEFAULT_GOAL_TO_WIDTH_RATIO,
-                fmt_opts.goal + 3,
-            );
-        } else if fmt_opts.goal > fmt_opts.width {
-            return Err(USimpleError::new(1, "GOAL cannot be greater than WIDTH."));
-        }
-    };
-
-    if let Some(s) = matches.get_one::<String>(OPT_TAB_WIDTH) {
-        fmt_opts.tabwidth = match s.parse::<usize>() {
-            Ok(t) => t,
-            Err(e) => {
-                return Err(USimpleError::new(
-                    1,
-                    format!("Invalid TABWIDTH specification: {}: {}", s.quote(), e),
-                ));
-            }
-        };
-    };
-
-    if fmt_opts.tabwidth < 1 {
-        fmt_opts.tabwidth = 1;
-    }
-
-    // immutable now
-    let fmt_opts = fmt_opts;
+    let fmt_opts = FmtOptions::from_matches(&matches)?;
 
     if files.is_empty() {
         files.push("-".to_owned());

From f5206ce783d1606432c20f67d8ab027fcab06e7c Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Tue, 28 Nov 2023 12:05:35 +0100
Subject: [PATCH 082/429] fmt: merge prefix and use_prefix options (same for
 anti_prefix)

---
 src/uu/fmt/src/fmt.rs       | 23 ++++-------------------
 src/uu/fmt/src/parasplit.rs | 22 +++++++++-------------
 2 files changed, 13 insertions(+), 32 deletions(-)

diff --git a/src/uu/fmt/src/fmt.rs b/src/uu/fmt/src/fmt.rs
index 3a494c868e5..3a02c642902 100644
--- a/src/uu/fmt/src/fmt.rs
+++ b/src/uu/fmt/src/fmt.rs
@@ -49,11 +49,9 @@ pub struct FmtOptions {
     tagged: bool,
     mail: bool,
     split_only: bool,
-    use_prefix: bool,
-    prefix: String,
+    prefix: Option<String>,
     xprefix: bool,
-    use_anti_prefix: bool,
-    anti_prefix: String,
+    anti_prefix: Option<String>,
     xanti_prefix: bool,
     uniform: bool,
     quick: bool,
@@ -83,19 +81,8 @@ impl FmtOptions {
         let xprefix = matches.contains_id(OPT_EXACT_PREFIX);
         let xanti_prefix = matches.contains_id(OPT_SKIP_PREFIX);
 
-        let mut prefix = String::new();
-        let mut use_prefix = false;
-        if let Some(s) = matches.get_one::<String>(OPT_PREFIX).map(String::from) {
-            prefix = s;
-            use_prefix = true;
-        };
-
-        let mut anti_prefix = String::new();
-        let mut use_anti_prefix = false;
-        if let Some(s) = matches.get_one::<String>(OPT_SKIP_PREFIX).map(String::from) {
-            anti_prefix = s;
-            use_anti_prefix = true;
-        };
+        let prefix = matches.get_one::<String>(OPT_PREFIX).map(String::from);
+        let anti_prefix = matches.get_one::<String>(OPT_SKIP_PREFIX).map(String::from);
 
         let mut width = 75;
         let mut goal = 70;
@@ -143,10 +130,8 @@ impl FmtOptions {
             uniform,
             quick,
             split_only,
-            use_prefix,
             prefix,
             xprefix,
-            use_anti_prefix,
             anti_prefix,
             xanti_prefix,
             width,
diff --git a/src/uu/fmt/src/parasplit.rs b/src/uu/fmt/src/parasplit.rs
index 311ddbc9b83..f22400dff20 100644
--- a/src/uu/fmt/src/parasplit.rs
+++ b/src/uu/fmt/src/parasplit.rs
@@ -80,24 +80,20 @@ impl<'a> FileLines<'a> {
 
     /// returns true if this line should be formatted
     fn match_prefix(&self, line: &str) -> (bool, usize) {
-        if !self.opts.use_prefix {
+        let Some(prefix) = &self.opts.prefix else {
             return (true, 0);
-        }
+        };
 
-        FileLines::match_prefix_generic(&self.opts.prefix[..], line, self.opts.xprefix)
+        FileLines::match_prefix_generic(prefix, line, self.opts.xprefix)
     }
 
     /// returns true if this line should be formatted
     fn match_anti_prefix(&self, line: &str) -> bool {
-        if !self.opts.use_anti_prefix {
+        let Some(anti_prefix) = &self.opts.anti_prefix else {
             return true;
-        }
+        };
 
-        match FileLines::match_prefix_generic(
-            &self.opts.anti_prefix[..],
-            line,
-            self.opts.xanti_prefix,
-        ) {
+        match FileLines::match_prefix_generic(anti_prefix, line, self.opts.xanti_prefix) {
             (true, _) => false,
             (_, _) => true,
         }
@@ -176,7 +172,7 @@ impl<'a> Iterator for FileLines<'a> {
         // not truly blank we will not allow mail headers on the
         // following line)
         if pmatch
-            && n[poffset + self.opts.prefix.len()..]
+            && n[poffset + self.opts.prefix.as_ref().map_or(0, |s| s.len())..]
                 .chars()
                 .all(char::is_whitespace)
         {
@@ -190,7 +186,7 @@ impl<'a> Iterator for FileLines<'a> {
         }
 
         // figure out the indent, prefix, and prefixindent ending points
-        let prefix_end = poffset + self.opts.prefix.len();
+        let prefix_end = poffset + self.opts.prefix.as_ref().map_or(0, |s| s.len());
         let (indent_end, prefix_len, indent_len) = self.compute_indent(&n[..], prefix_end);
 
         Some(Line::FormatLine(FileLine {
@@ -357,7 +353,7 @@ impl<'a> Iterator for ParagraphStream<'a> {
                 }
             } else if in_mail {
                 // lines following mail headers must begin with spaces
-                if fl.indent_end == 0 || (self.opts.use_prefix && fl.pfxind_end == 0) {
+                if fl.indent_end == 0 || (self.opts.prefix.is_some() && fl.pfxind_end == 0) {
                     break; // this line does not begin with spaces
                 }
             } else if !second_done {

From 96ca5e609eacf4fd09316da2c4bbd165ff052273 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Tue, 28 Nov 2023 12:22:46 +0100
Subject: [PATCH 083/429] fmt: refactor width and goal calculation

---
 src/uu/fmt/src/fmt.rs | 42 +++++++++++++++++++++++-------------------
 1 file changed, 23 insertions(+), 19 deletions(-)

diff --git a/src/uu/fmt/src/fmt.rs b/src/uu/fmt/src/fmt.rs
index 3a02c642902..0ed32641fbb 100644
--- a/src/uu/fmt/src/fmt.rs
+++ b/src/uu/fmt/src/fmt.rs
@@ -6,7 +6,6 @@
 // spell-checker:ignore (ToDO) PSKIP linebreak ostream parasplit tabwidth xanti xprefix
 
 use clap::{crate_version, Arg, ArgAction, ArgMatches, Command};
-use std::cmp;
 use std::fs::File;
 use std::io::{stdin, stdout, Write};
 use std::io::{BufReader, BufWriter, Read, Stdout};
@@ -84,28 +83,33 @@ impl FmtOptions {
         let prefix = matches.get_one::<String>(OPT_PREFIX).map(String::from);
         let anti_prefix = matches.get_one::<String>(OPT_SKIP_PREFIX).map(String::from);
 
-        let mut width = 75;
-        let mut goal = 70;
-        if let Some(w) = matches.get_one::<usize>(OPT_WIDTH) {
-            width = *w;
-            if width > MAX_WIDTH {
-                return Err(USimpleError::new(
-                    1,
-                    format!("invalid width: '{}': Numerical result out of range", width),
-                ));
+        let width_opt = matches.get_one::<usize>(OPT_WIDTH);
+        let goal_opt = matches.get_one::<usize>(OPT_GOAL);
+        let (width, goal) = match (width_opt, goal_opt) {
+            (Some(&w), Some(&g)) => {
+                if g > w {
+                    return Err(USimpleError::new(1, "GOAL cannot be greater than WIDTH."));
+                }
+                (w, g)
             }
-            goal = cmp::min(width * DEFAULT_GOAL_TO_WIDTH_RATIO / 100, width - 3);
-        };
-
-        if let Some(g) = matches.get_one::<usize>(OPT_GOAL) {
-            goal = *g;
-            if !matches.contains_id(OPT_WIDTH) {
-                width = cmp::max(goal * 100 / DEFAULT_GOAL_TO_WIDTH_RATIO, goal + 3);
-            } else if goal > width {
-                return Err(USimpleError::new(1, "GOAL cannot be greater than WIDTH."));
+            (Some(&w), None) => {
+                let g = (w * DEFAULT_GOAL_TO_WIDTH_RATIO / 100).min(w - 3);
+                (w, g)
             }
+            (None, Some(&g)) => {
+                let w = (g * 100 / DEFAULT_GOAL_TO_WIDTH_RATIO).max(g + 3);
+                (w, g)
+            }
+            (None, None) => (75, 70),
         };
 
+        if width > MAX_WIDTH {
+            return Err(USimpleError::new(
+                1,
+                format!("invalid width: '{}': Numerical result out of range", width),
+            ));
+        }
+
         let mut tabwidth = 8;
         if let Some(s) = matches.get_one::<String>(OPT_TAB_WIDTH) {
             tabwidth = match s.parse::<usize>() {

From 8a494530572ca1a2221416a284144a9e44177f8e Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Tue, 28 Nov 2023 12:24:18 +0100
Subject: [PATCH 084/429] fmt: clean up imports

---
 src/uu/fmt/src/fmt.rs       | 4 ++--
 src/uu/fmt/src/linebreak.rs | 4 +---
 2 files changed, 3 insertions(+), 5 deletions(-)

diff --git a/src/uu/fmt/src/fmt.rs b/src/uu/fmt/src/fmt.rs
index 0ed32641fbb..3461a79ba7f 100644
--- a/src/uu/fmt/src/fmt.rs
+++ b/src/uu/fmt/src/fmt.rs
@@ -13,8 +13,8 @@ use uucore::display::Quotable;
 use uucore::error::{FromIo, UResult, USimpleError};
 use uucore::{format_usage, help_about, help_usage, show_warning};
 
-use self::linebreak::break_lines;
-use self::parasplit::ParagraphStream;
+use linebreak::break_lines;
+use parasplit::ParagraphStream;
 
 mod linebreak;
 mod parasplit;
diff --git a/src/uu/fmt/src/linebreak.rs b/src/uu/fmt/src/linebreak.rs
index 7cd65d86149..306c15f3614 100644
--- a/src/uu/fmt/src/linebreak.rs
+++ b/src/uu/fmt/src/linebreak.rs
@@ -5,10 +5,8 @@
 
 // spell-checker:ignore (ToDO) INFTY MULT accum breakwords linebreak linebreaking linebreaks linelen maxlength minlength nchars ostream overlen parasplit plass posn powf punct signum slen sstart tabwidth tlen underlen winfo wlen wordlen
 
-use std::cmp;
-use std::i64;
 use std::io::{BufWriter, Stdout, Write};
-use std::mem;
+use std::{cmp, i64, mem};
 
 use uucore::crash;
 

From 0b4d4b610cc510a7aff4095447ddf8195cf27072 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Tue, 28 Nov 2023 12:30:01 +0100
Subject: [PATCH 085/429] fmt: put options into module and change static to
 const

---
 src/uu/fmt/src/fmt.rs | 100 +++++++++++++++++++++---------------------
 1 file changed, 51 insertions(+), 49 deletions(-)

diff --git a/src/uu/fmt/src/fmt.rs b/src/uu/fmt/src/fmt.rs
index 3461a79ba7f..e44b7e0e5be 100644
--- a/src/uu/fmt/src/fmt.rs
+++ b/src/uu/fmt/src/fmt.rs
@@ -7,8 +7,7 @@
 
 use clap::{crate_version, Arg, ArgAction, ArgMatches, Command};
 use std::fs::File;
-use std::io::{stdin, stdout, Write};
-use std::io::{BufReader, BufWriter, Read, Stdout};
+use std::io::{stdin, stdout, BufReader, BufWriter, Read, Stdout, Write};
 use uucore::display::Quotable;
 use uucore::error::{FromIo, UResult, USimpleError};
 use uucore::{format_usage, help_about, help_usage, show_warning};
@@ -19,25 +18,26 @@ use parasplit::ParagraphStream;
 mod linebreak;
 mod parasplit;
 
-static ABOUT: &str = help_about!("fmt.md");
+const ABOUT: &str = help_about!("fmt.md");
 const USAGE: &str = help_usage!("fmt.md");
-static MAX_WIDTH: usize = 2500;
-
-static OPT_CROWN_MARGIN: &str = "crown-margin";
-static OPT_TAGGED_PARAGRAPH: &str = "tagged-paragraph";
-static OPT_PRESERVE_HEADERS: &str = "preserve-headers";
-static OPT_SPLIT_ONLY: &str = "split-only";
-static OPT_UNIFORM_SPACING: &str = "uniform-spacing";
-static OPT_PREFIX: &str = "prefix";
-static OPT_SKIP_PREFIX: &str = "skip-prefix";
-static OPT_EXACT_PREFIX: &str = "exact-prefix";
-static OPT_EXACT_SKIP_PREFIX: &str = "exact-skip-prefix";
-static OPT_WIDTH: &str = "width";
-static OPT_GOAL: &str = "goal";
-static OPT_QUICK: &str = "quick";
-static OPT_TAB_WIDTH: &str = "tab-width";
-
-static ARG_FILES: &str = "files";
+const MAX_WIDTH: usize = 2500;
+
+mod options {
+    pub const CROWN_MARGIN: &str = "crown-margin";
+    pub const TAGGED_PARAGRAPH: &str = "tagged-paragraph";
+    pub const PRESERVE_HEADERS: &str = "preserve-headers";
+    pub const SPLIT_ONLY: &str = "split-only";
+    pub const UNIFORM_SPACING: &str = "uniform-spacing";
+    pub const PREFIX: &str = "prefix";
+    pub const SKIP_PREFIX: &str = "skip-prefix";
+    pub const EXACT_PREFIX: &str = "exact-prefix";
+    pub const EXACT_SKIP_PREFIX: &str = "exact-skip-prefix";
+    pub const WIDTH: &str = "width";
+    pub const GOAL: &str = "goal";
+    pub const QUICK: &str = "quick";
+    pub const TAB_WIDTH: &str = "tab-width";
+    pub const FILES: &str = "files";
+}
 
 // by default, goal is 93% of width
 const DEFAULT_GOAL_TO_WIDTH_RATIO: usize = 93;
@@ -61,13 +61,13 @@ pub struct FmtOptions {
 
 impl FmtOptions {
     fn from_matches(matches: &ArgMatches) -> UResult<Self> {
-        let mut tagged = matches.get_flag(OPT_TAGGED_PARAGRAPH);
-        let mut crown = matches.get_flag(OPT_CROWN_MARGIN);
+        let mut tagged = matches.get_flag(options::TAGGED_PARAGRAPH);
+        let mut crown = matches.get_flag(options::CROWN_MARGIN);
 
-        let mail = matches.get_flag(OPT_PRESERVE_HEADERS);
-        let uniform = matches.get_flag(OPT_UNIFORM_SPACING);
-        let quick = matches.get_flag(OPT_QUICK);
-        let split_only = matches.get_flag(OPT_SPLIT_ONLY);
+        let mail = matches.get_flag(options::PRESERVE_HEADERS);
+        let uniform = matches.get_flag(options::UNIFORM_SPACING);
+        let quick = matches.get_flag(options::QUICK);
+        let split_only = matches.get_flag(options::SPLIT_ONLY);
 
         if crown {
             tagged = false;
@@ -77,14 +77,16 @@ impl FmtOptions {
             tagged = false;
         }
 
-        let xprefix = matches.contains_id(OPT_EXACT_PREFIX);
-        let xanti_prefix = matches.contains_id(OPT_SKIP_PREFIX);
+        let xprefix = matches.contains_id(options::EXACT_PREFIX);
+        let xanti_prefix = matches.contains_id(options::SKIP_PREFIX);
 
-        let prefix = matches.get_one::<String>(OPT_PREFIX).map(String::from);
-        let anti_prefix = matches.get_one::<String>(OPT_SKIP_PREFIX).map(String::from);
+        let prefix = matches.get_one::<String>(options::PREFIX).map(String::from);
+        let anti_prefix = matches
+            .get_one::<String>(options::SKIP_PREFIX)
+            .map(String::from);
 
-        let width_opt = matches.get_one::<usize>(OPT_WIDTH);
-        let goal_opt = matches.get_one::<usize>(OPT_GOAL);
+        let width_opt = matches.get_one::<usize>(options::WIDTH);
+        let goal_opt = matches.get_one::<usize>(options::GOAL);
         let (width, goal) = match (width_opt, goal_opt) {
             (Some(&w), Some(&g)) => {
                 if g > w {
@@ -111,7 +113,7 @@ impl FmtOptions {
         }
 
         let mut tabwidth = 8;
-        if let Some(s) = matches.get_one::<String>(OPT_TAB_WIDTH) {
+        if let Some(s) = matches.get_one::<String>(options::TAB_WIDTH) {
             tabwidth = match s.parse::<usize>() {
                 Ok(t) => t,
                 Err(e) => {
@@ -158,7 +160,7 @@ fn parse_arguments(args: impl uucore::Args) -> UResult<(Vec<String>, FmtOptions)
     let matches = uu_app().try_get_matches_from(args)?;
 
     let mut files: Vec<String> = matches
-        .get_many::<String>(ARG_FILES)
+        .get_many::<String>(options::FILES)
         .map(|v| v.map(ToString::to_string).collect())
         .unwrap_or_default();
 
@@ -242,9 +244,9 @@ pub fn uu_app() -> Command {
         .override_usage(format_usage(USAGE))
         .infer_long_args(true)
         .arg(
-            Arg::new(OPT_CROWN_MARGIN)
+            Arg::new(options::CROWN_MARGIN)
                 .short('c')
-                .long(OPT_CROWN_MARGIN)
+                .long(options::CROWN_MARGIN)
                 .help(
                     "First and second line of paragraph \
                     may have different indentations, in which \
@@ -254,7 +256,7 @@ pub fn uu_app() -> Command {
                 .action(ArgAction::SetTrue),
         )
         .arg(
-            Arg::new(OPT_TAGGED_PARAGRAPH)
+            Arg::new(options::TAGGED_PARAGRAPH)
                 .short('t')
                 .long("tagged-paragraph")
                 .help(
@@ -264,7 +266,7 @@ pub fn uu_app() -> Command {
                 .action(ArgAction::SetTrue),
         )
         .arg(
-            Arg::new(OPT_PRESERVE_HEADERS)
+            Arg::new(options::PRESERVE_HEADERS)
                 .short('m')
                 .long("preserve-headers")
                 .help(
@@ -274,14 +276,14 @@ pub fn uu_app() -> Command {
                 .action(ArgAction::SetTrue),
         )
         .arg(
-            Arg::new(OPT_SPLIT_ONLY)
+            Arg::new(options::SPLIT_ONLY)
                 .short('s')
                 .long("split-only")
                 .help("Split lines only, do not reflow.")
                 .action(ArgAction::SetTrue),
         )
         .arg(
-            Arg::new(OPT_UNIFORM_SPACING)
+            Arg::new(options::UNIFORM_SPACING)
                 .short('u')
                 .long("uniform-spacing")
                 .help(
@@ -294,7 +296,7 @@ pub fn uu_app() -> Command {
                 .action(ArgAction::SetTrue),
         )
         .arg(
-            Arg::new(OPT_PREFIX)
+            Arg::new(options::PREFIX)
                 .short('p')
                 .long("prefix")
                 .help(
@@ -306,7 +308,7 @@ pub fn uu_app() -> Command {
                 .value_name("PREFIX"),
         )
         .arg(
-            Arg::new(OPT_SKIP_PREFIX)
+            Arg::new(options::SKIP_PREFIX)
                 .short('P')
                 .long("skip-prefix")
                 .help(
@@ -317,7 +319,7 @@ pub fn uu_app() -> Command {
                 .value_name("PSKIP"),
         )
         .arg(
-            Arg::new(OPT_EXACT_PREFIX)
+            Arg::new(options::EXACT_PREFIX)
                 .short('x')
                 .long("exact-prefix")
                 .help(
@@ -327,7 +329,7 @@ pub fn uu_app() -> Command {
                 .action(ArgAction::SetTrue),
         )
         .arg(
-            Arg::new(OPT_EXACT_SKIP_PREFIX)
+            Arg::new(options::EXACT_SKIP_PREFIX)
                 .short('X')
                 .long("exact-skip-prefix")
                 .help(
@@ -337,7 +339,7 @@ pub fn uu_app() -> Command {
                 .action(ArgAction::SetTrue),
         )
         .arg(
-            Arg::new(OPT_WIDTH)
+            Arg::new(options::WIDTH)
                 .short('w')
                 .long("width")
                 .help("Fill output lines up to a maximum of WIDTH columns, default 75.")
@@ -345,7 +347,7 @@ pub fn uu_app() -> Command {
                 .value_parser(clap::value_parser!(usize)),
         )
         .arg(
-            Arg::new(OPT_GOAL)
+            Arg::new(options::GOAL)
                 .short('g')
                 .long("goal")
                 .help("Goal width, default of 93% of WIDTH. Must be less than WIDTH.")
@@ -353,7 +355,7 @@ pub fn uu_app() -> Command {
                 .value_parser(clap::value_parser!(usize)),
         )
         .arg(
-            Arg::new(OPT_QUICK)
+            Arg::new(options::QUICK)
                 .short('q')
                 .long("quick")
                 .help(
@@ -363,7 +365,7 @@ pub fn uu_app() -> Command {
                 .action(ArgAction::SetTrue),
         )
         .arg(
-            Arg::new(OPT_TAB_WIDTH)
+            Arg::new(options::TAB_WIDTH)
                 .short('T')
                 .long("tab-width")
                 .help(
@@ -374,7 +376,7 @@ pub fn uu_app() -> Command {
                 .value_name("TABWIDTH"),
         )
         .arg(
-            Arg::new(ARG_FILES)
+            Arg::new(options::FILES)
                 .action(ArgAction::Append)
                 .value_hint(clap::ValueHint::FilePath),
         )

From 2a8f4ec294369c228bc8063676879a9ac9e436e5 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Tue, 28 Nov 2023 12:34:04 +0100
Subject: [PATCH 086/429] fmt: inline parse_arguments function

---
 src/uu/fmt/src/fmt.rs | 35 ++++++++---------------------------
 1 file changed, 8 insertions(+), 27 deletions(-)

diff --git a/src/uu/fmt/src/fmt.rs b/src/uu/fmt/src/fmt.rs
index e44b7e0e5be..4380487814b 100644
--- a/src/uu/fmt/src/fmt.rs
+++ b/src/uu/fmt/src/fmt.rs
@@ -147,32 +147,6 @@ impl FmtOptions {
     }
 }
 
-/// Parse the command line arguments and return the list of files and formatting options.
-///
-/// # Arguments
-///
-/// * `args` - Command line arguments.
-///
-/// # Returns
-///
-/// A tuple containing a vector of file names and a `FmtOptions` struct.
-fn parse_arguments(args: impl uucore::Args) -> UResult<(Vec<String>, FmtOptions)> {
-    let matches = uu_app().try_get_matches_from(args)?;
-
-    let mut files: Vec<String> = matches
-        .get_many::<String>(options::FILES)
-        .map(|v| v.map(ToString::to_string).collect())
-        .unwrap_or_default();
-
-    let fmt_opts = FmtOptions::from_matches(&matches)?;
-
-    if files.is_empty() {
-        files.push("-".to_owned());
-    }
-
-    Ok((files, fmt_opts))
-}
-
 /// Process the content of a file and format it according to the provided options.
 ///
 /// # Arguments
@@ -226,7 +200,14 @@ fn process_file(
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let (files, fmt_opts) = parse_arguments(args)?;
+    let matches = uu_app().try_get_matches_from(args)?;
+
+    let files: Vec<String> = matches
+        .get_many::<String>(options::FILES)
+        .map(|v| v.map(ToString::to_string).collect())
+        .unwrap_or(vec!["-".into()]);
+
+    let fmt_opts = FmtOptions::from_matches(&matches)?;
 
     let mut ostream = BufWriter::new(stdout());
 

From 2d5ea264106b26caea8133f8d3d1c31ade2ac3ba Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 28 Nov 2023 14:33:19 +0100
Subject: [PATCH 087/429] fmt: rename pfxind_end -> prefix_indent_end

---
 src/uu/fmt/src/parasplit.rs | 20 ++++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/src/uu/fmt/src/parasplit.rs b/src/uu/fmt/src/parasplit.rs
index f22400dff20..1ae8ea34f42 100644
--- a/src/uu/fmt/src/parasplit.rs
+++ b/src/uu/fmt/src/parasplit.rs
@@ -3,7 +3,7 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-// spell-checker:ignore (ToDO) INFTY MULT PSKIP accum aftertab beforetab breakwords fmt's formatline linebreak linebreaking linebreaks linelen maxlength minlength nchars noformat noformatline ostream overlen parasplit pfxind plass pmatch poffset posn powf prefixindent punct signum slen sstart tabwidth tlen underlen winfo wlen wordlen wordsplits xanti xprefix
+// spell-checker:ignore (ToDO) INFTY MULT PSKIP accum aftertab beforetab breakwords fmt's formatline linebreak linebreaking linebreaks linelen maxlength minlength nchars noformat noformatline ostream overlen parasplit plass pmatch poffset posn powf prefixindent punct signum slen sstart tabwidth tlen underlen winfo wlen wordlen wordsplits xanti xprefix
 
 use std::io::{BufRead, Lines};
 use std::iter::Peekable;
@@ -60,7 +60,7 @@ pub struct FileLine {
     /// The end of the indent, always the start of the text
     indent_end: usize,
     /// The end of the PREFIX's indent, that is, the spaces before the prefix
-    pfxind_end: usize,
+    prefix_indent_end: usize,
     /// Display length of indent taking into account tabs
     indent_len: usize,
     /// PREFIX indent length taking into account tabs
@@ -192,7 +192,7 @@ impl<'a> Iterator for FileLines<'a> {
         Some(Line::FormatLine(FileLine {
             line: n,
             indent_end,
-            pfxind_end: poffset,
+            prefix_indent_end: poffset,
             indent_len,
             prefix_len,
         }))
@@ -210,7 +210,7 @@ pub struct Paragraph {
     lines: Vec<String>,
     /// string representing the init, that is, the first line's indent
     pub init_str: String,
-    /// printable length of the init string considering TABWIDTH    
+    /// printable length of the init string considering TABWIDTH
     pub init_len: usize,
     /// byte location of end of init in first line String
     init_end: usize,
@@ -299,7 +299,7 @@ impl<'a> Iterator for ParagraphStream<'a> {
         let mut indent_end = 0;
         let mut indent_len = 0;
         let mut prefix_len = 0;
-        let mut pfxind_end = 0;
+        let mut prefix_indent_end = 0;
         let mut p_lines = Vec::new();
 
         let mut in_mail = false;
@@ -316,7 +316,7 @@ impl<'a> Iterator for ParagraphStream<'a> {
                 // detect mail header
                 if self.opts.mail && self.next_mail && ParagraphStream::is_mail_header(fl) {
                     in_mail = true;
-                    // there can't be any indent or pfxind because otherwise is_mail_header
+                    // there can't be any indent or prefixindent because otherwise is_mail_header
                     // would fail since there cannot be any whitespace before the colon in a
                     // valid header field
                     indent_str.push_str("  ");
@@ -339,7 +339,7 @@ impl<'a> Iterator for ParagraphStream<'a> {
 
                     // save these to check for matching lines
                     prefix_len = fl.prefix_len;
-                    pfxind_end = fl.pfxind_end;
+                    prefix_indent_end = fl.prefix_indent_end;
 
                     // in tagged mode, add 4 spaces of additional indenting by default
                     // (gnu fmt's behavior is different: it seems to find the closest column to
@@ -353,14 +353,14 @@ impl<'a> Iterator for ParagraphStream<'a> {
                 }
             } else if in_mail {
                 // lines following mail headers must begin with spaces
-                if fl.indent_end == 0 || (self.opts.prefix.is_some() && fl.pfxind_end == 0) {
+                if fl.indent_end == 0 || (self.opts.prefix.is_some() && fl.prefix_indent_end == 0) {
                     break; // this line does not begin with spaces
                 }
             } else if !second_done {
                 // now we have enough info to handle crown margin and tagged mode
 
                 // in both crown and tagged modes we require that prefix_len is the same
-                if prefix_len != fl.prefix_len || pfxind_end != fl.pfxind_end {
+                if prefix_len != fl.prefix_len || prefix_indent_end != fl.prefix_indent_end {
                     break;
                 }
 
@@ -382,7 +382,7 @@ impl<'a> Iterator for ParagraphStream<'a> {
             } else {
                 // detect mismatch
                 if indent_end != fl.indent_end
-                    || pfxind_end != fl.pfxind_end
+                    || prefix_indent_end != fl.prefix_indent_end
                     || indent_len != fl.indent_len
                     || prefix_len != fl.prefix_len
                 {

From 7383820354d497b647bd721f3b147d9700676847 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Dylan=20A=C3=AFssi?= <dylan.aissi@collabora.com>
Date: Tue, 28 Nov 2023 16:51:20 +0100
Subject: [PATCH 088/429] uuhelp_parser: include missing LICENSE
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Signed-off-by: Dylan Aïssi <dylan.aissi@collabora.com>
---
 src/uuhelp_parser/LICENSE | 1 +
 1 file changed, 1 insertion(+)
 create mode 120000 src/uuhelp_parser/LICENSE

diff --git a/src/uuhelp_parser/LICENSE b/src/uuhelp_parser/LICENSE
new file mode 120000
index 00000000000..30cff7403da
--- /dev/null
+++ b/src/uuhelp_parser/LICENSE
@@ -0,0 +1 @@
+../../LICENSE
\ No newline at end of file

From 6eec4fe8f9ce40e95199de2fc67170d2cd11bfae Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Wed, 29 Nov 2023 09:35:22 +0100
Subject: [PATCH 089/429] cut: add test & improve error message

---
 src/uu/cut/src/cut.rs     |  2 +-
 tests/by-util/test_cut.rs | 11 ++++++++++-
 2 files changed, 11 insertions(+), 2 deletions(-)

diff --git a/src/uu/cut/src/cut.rs b/src/uu/cut/src/cut.rs
index 05e8bc6e424..0555be14f73 100644
--- a/src/uu/cut/src/cut.rs
+++ b/src/uu/cut/src/cut.rs
@@ -426,7 +426,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
                             delim = "";
                         }
                         if delim.chars().count() > 1 {
-                            Err("invalid input: The '--delimiter' ('-d') option expects empty or 1 character long, but was provided a value 2 characters or longer".into())
+                            Err("the delimiter must be a single character".into())
                         } else {
                             let delim = if delim.is_empty() {
                                 "\0".to_owned()
diff --git a/tests/by-util/test_cut.rs b/tests/by-util/test_cut.rs
index 184e413a867..112dc0fd3e5 100644
--- a/tests/by-util/test_cut.rs
+++ b/tests/by-util/test_cut.rs
@@ -126,7 +126,7 @@ fn test_too_large() {
 }
 
 #[test]
-fn test_specify_delimiter() {
+fn test_delimiter() {
     for param in ["-d", "--delimiter", "--del"] {
         new_ucmd!()
             .args(&[param, ":", "-f", COMPLEX_SEQUENCE.sequence, INPUT])
@@ -135,6 +135,15 @@ fn test_specify_delimiter() {
     }
 }
 
+#[test]
+fn test_delimiter_with_more_than_one_char() {
+    new_ucmd!()
+        .args(&["-d", "ab", "-f1"])
+        .fails()
+        .stderr_contains("cut: the delimiter must be a single character")
+        .no_stdout();
+}
+
 #[test]
 fn test_output_delimiter() {
     // we use -d here to ensure output delimiter

From 66e0835e72a72d8ff0a97213b5320fc45973ecbc Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 29 Nov 2023 09:55:55 +0100
Subject: [PATCH 090/429] fuzz the echo command

---
 fuzz/Cargo.toml                |  7 +++
 fuzz/fuzz_targets/fuzz_echo.rs | 93 ++++++++++++++++++++++++++++++++++
 2 files changed, 100 insertions(+)
 create mode 100644 fuzz/fuzz_targets/fuzz_echo.rs

diff --git a/fuzz/Cargo.toml b/fuzz/Cargo.toml
index 630af4650b6..b27f5b58677 100644
--- a/fuzz/Cargo.toml
+++ b/fuzz/Cargo.toml
@@ -17,6 +17,7 @@ uu_date = { path = "../src/uu/date/" }
 uu_test = { path = "../src/uu/test/" }
 uu_expr = { path = "../src/uu/expr/" }
 uu_printf = { path = "../src/uu/printf/" }
+uu_echo = { path = "../src/uu/echo/" }
 
 
 # Prevent this from interfering with workspaces
@@ -35,6 +36,12 @@ path = "fuzz_targets/fuzz_printf.rs"
 test = false
 doc = false
 
+[[bin]]
+name = "fuzz_echo"
+path = "fuzz_targets/fuzz_echo.rs"
+test = false
+doc = false
+
 [[bin]]
 name = "fuzz_expr"
 path = "fuzz_targets/fuzz_expr.rs"
diff --git a/fuzz/fuzz_targets/fuzz_echo.rs b/fuzz/fuzz_targets/fuzz_echo.rs
new file mode 100644
index 00000000000..3d810085301
--- /dev/null
+++ b/fuzz/fuzz_targets/fuzz_echo.rs
@@ -0,0 +1,93 @@
+#![no_main]
+use libfuzzer_sys::fuzz_target;
+use uu_echo::uumain; // Changed from uu_printf to uu_echo
+
+use rand::prelude::SliceRandom;
+use rand::Rng;
+use std::ffi::OsString;
+
+mod fuzz_common;
+use crate::fuzz_common::CommandResult;
+use crate::fuzz_common::{
+    compare_result, generate_and_run_uumain, generate_random_string, run_gnu_cmd,
+};
+
+static CMD_PATH: &str = "/usr/bin/echo"; // Changed from "printf" to "echo"
+
+fn generate_echo() -> String {
+    let mut rng = rand::thread_rng();
+    let mut echo_str = String::new();
+
+    // Randomly decide whether to include options
+    let include_n = rng.gen_bool(0.1); // 10% chance
+    let include_e = rng.gen_bool(0.1); // 10% chance
+    let include_E = rng.gen_bool(0.1); // 10% chance
+                                       // --help and --version are typically not included in fuzzing as they don't change output format
+
+    if include_n {
+        echo_str.push_str("-n ");
+    }
+    if include_e {
+        echo_str.push_str("-e ");
+    }
+    if include_E {
+        echo_str.push_str("-E ");
+    }
+
+    // Add a random string
+    echo_str.push_str(&generate_random_string(rng.gen_range(1..=10)));
+
+    // Include escape sequences if -e is enabled
+    if include_e {
+        // Add a 10% chance of including an escape sequence
+        if rng.gen_bool(0.1) {
+            echo_str.push_str(&generate_escape_sequence(&mut rng)); // This function should handle echo-specific sequences
+        }
+    }
+
+    echo_str
+}
+
+// You should also modify the generate_escape_sequence function to include echo-specific sequences
+fn generate_escape_sequence(rng: &mut impl Rng) -> String {
+    let escape_sequences = [
+        "\\\\", "\\a", "\\b", "\\c", "\\e", "\\f", "\\n", "\\r", "\\t", "\\v",
+        "\\0NNN", // You can randomly generate NNN
+        "\\xHH",  // You can randomly generate HH
+                  // ... other sequences
+    ];
+    escape_sequences.choose(rng).unwrap().to_string()
+}
+
+fuzz_target!(|_data: &[u8]| {
+    let echo_input = generate_echo(); // Changed from generate_printf to generate_echo
+    let mut args = vec![OsString::from("echo")]; // Changed from "printf" to "echo"
+    args.extend(echo_input.split_whitespace().map(OsString::from));
+    let rust_result = generate_and_run_uumain(&args, uumain); // uumain function from uu_echo
+
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false) {
+        Ok(result) => result,
+        Err(error_result) => {
+            eprintln!("Failed to run GNU command:");
+            eprintln!("Stderr: {}", error_result.stderr);
+            eprintln!("Exit Code: {}", error_result.exit_code);
+            CommandResult {
+                stdout: String::new(),
+                stderr: error_result.stderr,
+                exit_code: error_result.exit_code,
+            }
+        }
+    };
+
+    compare_result(
+        "echo",
+        &format!("{:?}", &args[1..]),
+        &rust_result.stdout,
+        &gnu_result.stdout,
+        &rust_result.stderr,
+        &gnu_result.stderr,
+        rust_result.exit_code,
+        gnu_result.exit_code,
+        false, // Set to true if you want to fail on stderr diff
+    );
+});

From 203e79d74b406a02ab7202f36c66ed148f11411c Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 29 Nov 2023 14:09:13 +0100
Subject: [PATCH 091/429] Fix unused import: `UError`

---
 src/uu/kill/src/kill.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/kill/src/kill.rs b/src/uu/kill/src/kill.rs
index b0e18a79820..f353fd7cab3 100644
--- a/src/uu/kill/src/kill.rs
+++ b/src/uu/kill/src/kill.rs
@@ -10,7 +10,7 @@ use nix::sys::signal::{self, Signal};
 use nix::unistd::Pid;
 use std::io::Error;
 use uucore::display::Quotable;
-use uucore::error::{FromIo, UError, UResult, USimpleError};
+use uucore::error::{FromIo, UResult, USimpleError};
 use uucore::signals::{signal_by_name_or_value, ALL_SIGNALS};
 use uucore::{format_usage, help_about, help_usage, show};
 

From 420df3db3d14f89c1b11278fc485aac7fd1d9745 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Wed, 29 Nov 2023 17:44:50 +0100
Subject: [PATCH 092/429] Add support in uucore for OpenBSD

  - uucore/src/lib/features/fs.rs: add target_os = OpenBSD when needed
  - uucore/src/lib/features/fsext.rs: implement FsUsage::new for OpenBSD

  - fixes uutils/coreutils#5448

  - initial code by n1000 https://github.com/n1000/coreutils/tree/openbsd_compile_fixes

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 src/uucore/src/lib/features/fs.rs    |  5 +++-
 src/uucore/src/lib/features/fsext.rs | 39 ++++++++++++++++++++++++----
 2 files changed, 38 insertions(+), 6 deletions(-)

diff --git a/src/uucore/src/lib/features/fs.rs b/src/uucore/src/lib/features/fs.rs
index de4c0b08dbe..94ca82c8098 100644
--- a/src/uucore/src/lib/features/fs.rs
+++ b/src/uucore/src/lib/features/fs.rs
@@ -115,6 +115,7 @@ impl FileInformation {
             not(target_os = "android"),
             not(target_os = "freebsd"),
             not(target_os = "netbsd"),
+            not(target_os = "openbsd"),
             not(target_os = "illumos"),
             not(target_os = "solaris"),
             not(target_arch = "aarch64"),
@@ -130,6 +131,7 @@ impl FileInformation {
                 target_os = "android",
                 target_os = "freebsd",
                 target_os = "netbsd",
+                target_os = "openbsd",
                 target_os = "illumos",
                 target_os = "solaris",
                 target_arch = "aarch64",
@@ -146,13 +148,14 @@ impl FileInformation {
     #[cfg(unix)]
     pub fn inode(&self) -> u64 {
         #[cfg(all(
-            not(any(target_os = "freebsd", target_os = "netbsd")),
+            not(any(target_os = "freebsd", target_os = "netbsd", target_os = "openbsd")),
             target_pointer_width = "64"
         ))]
         return self.0.st_ino;
         #[cfg(any(
             target_os = "freebsd",
             target_os = "netbsd",
+            target_os = "openbsd",
             not(target_pointer_width = "64")
         ))]
         return self.0.st_ino.into();
diff --git a/src/uucore/src/lib/features/fsext.rs b/src/uucore/src/lib/features/fsext.rs
index 8b1c42de6d1..93fedb44b7c 100644
--- a/src/uucore/src/lib/features/fsext.rs
+++ b/src/uucore/src/lib/features/fsext.rs
@@ -497,7 +497,10 @@ impl FsUsage {
     #[cfg(unix)]
     pub fn new(statvfs: StatFs) -> Self {
         {
-            #[cfg(all(not(target_os = "freebsd"), target_pointer_width = "64"))]
+            #[cfg(all(
+                not(any(target_os = "freebsd", target_os = "openbsd")),
+                target_pointer_width = "64"
+            ))]
             return Self {
                 blocksize: statvfs.f_bsize as u64, // or `statvfs.f_frsize` ?
                 blocks: statvfs.f_blocks,
@@ -507,7 +510,10 @@ impl FsUsage {
                 files: statvfs.f_files,
                 ffree: statvfs.f_ffree,
             };
-            #[cfg(all(not(target_os = "freebsd"), not(target_pointer_width = "64")))]
+            #[cfg(all(
+                not(any(target_os = "freebsd", target_os = "openbsd")),
+                not(target_pointer_width = "64")
+            ))]
             return Self {
                 blocksize: statvfs.f_bsize as u64, // or `statvfs.f_frsize` ?
                 blocks: statvfs.f_blocks.into(),
@@ -530,6 +536,19 @@ impl FsUsage {
                 files: statvfs.f_files,
                 ffree: statvfs.f_ffree.try_into().unwrap(),
             };
+            #[cfg(target_os = "openbsd")]
+            return Self {
+                blocksize: statvfs.f_bsize.into(),
+                blocks: statvfs.f_blocks,
+                bfree: statvfs.f_bfree,
+                bavail: statvfs.f_bavail.try_into().unwrap(),
+                bavail_top_bit_set: ((std::convert::TryInto::<u64>::try_into(statvfs.f_bavail)
+                    .unwrap())
+                    & (1u64.rotate_right(1)))
+                    != 0,
+                files: statvfs.f_files,
+                ffree: statvfs.f_ffree,
+            };
         }
     }
     #[cfg(not(unix))]
@@ -617,6 +636,7 @@ impl FsMeta for StatFs {
             not(target_vendor = "apple"),
             not(target_os = "android"),
             not(target_os = "freebsd"),
+            not(target_os = "openbsd"),
             not(target_os = "illumos"),
             not(target_os = "solaris"),
             not(target_arch = "s390x"),
@@ -630,6 +650,7 @@ impl FsMeta for StatFs {
                 target_arch = "s390x",
                 target_vendor = "apple",
                 target_os = "android",
+                target_os = "openbsd",
                 not(target_pointer_width = "64")
             )
         ))]
@@ -655,11 +676,19 @@ impl FsMeta for StatFs {
         return self.f_bfree.into();
     }
     fn avail_blocks(&self) -> u64 {
-        #[cfg(all(not(target_os = "freebsd"), target_pointer_width = "64"))]
+        #[cfg(all(
+            not(target_os = "freebsd"),
+            not(target_os = "openbsd"),
+            target_pointer_width = "64"
+        ))]
         return self.f_bavail;
-        #[cfg(all(not(target_os = "freebsd"), not(target_pointer_width = "64")))]
+        #[cfg(all(
+            not(target_os = "freebsd"),
+            not(target_os = "openbsd"),
+            not(target_pointer_width = "64")
+        ))]
         return self.f_bavail.into();
-        #[cfg(target_os = "freebsd")]
+        #[cfg(any(target_os = "freebsd", target_os = "openbsd"))]
         return self.f_bavail.try_into().unwrap();
     }
     fn total_file_nodes(&self) -> u64 {

From 173153122b255bb57afbbad1872a26ebe9050c16 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Wed, 29 Nov 2023 21:49:08 +0000
Subject: [PATCH 093/429] chore(deps): update rust crate lscolors to 0.16.0

---
 Cargo.lock | 4 ++--
 Cargo.toml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index d7682f839e4..3f5e4280964 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1240,9 +1240,9 @@ dependencies = [
 
 [[package]]
 name = "lscolors"
-version = "0.15.0"
+version = "0.16.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "bf7015a04103ad78abb77e4b79ed151e767922d1cfde5f62640471c629a2320d"
+checksum = "ab0b209ec3976527806024406fe765474b9a1750a0ed4b8f0372364741f50e7b"
 dependencies = [
  "nu-ansi-term",
 ]
diff --git a/Cargo.toml b/Cargo.toml
index ba701b2d5e5..14e700ee0a6 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -287,7 +287,7 @@ half = "2.3"
 indicatif = "0.17"
 itertools = "0.12.0"
 libc = "0.2.150"
-lscolors = { version = "0.15.0", default-features = false, features = [
+lscolors = { version = "0.16.0", default-features = false, features = [
   "nu-ansi-term",
 ] }
 memchr = "2"

From 4d5c034eb10d0a07098abb75ddd5771b6d444c05 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 29 Nov 2023 14:11:43 +0100
Subject: [PATCH 094/429] Run the echo fuzzer in the CI

---
 .github/workflows/fuzzing.yml  |  1 +
 fuzz/fuzz_targets/fuzz_echo.rs | 21 ++++++++-------------
 2 files changed, 9 insertions(+), 13 deletions(-)

diff --git a/.github/workflows/fuzzing.yml b/.github/workflows/fuzzing.yml
index 2274f6905c1..cc1547c87a6 100644
--- a/.github/workflows/fuzzing.yml
+++ b/.github/workflows/fuzzing.yml
@@ -42,6 +42,7 @@ jobs:
           - { name: fuzz_date, should_pass: false }
           - { name: fuzz_expr, should_pass: true }
           - { name: fuzz_printf, should_pass: false }
+          - { name: fuzz_echo, should_pass: false }
           - { name: fuzz_parse_glob, should_pass: true }
           - { name: fuzz_parse_size, should_pass: true }
           - { name: fuzz_parse_time, should_pass: true }
diff --git a/fuzz/fuzz_targets/fuzz_echo.rs b/fuzz/fuzz_targets/fuzz_echo.rs
index 3d810085301..826fd6da3eb 100644
--- a/fuzz/fuzz_targets/fuzz_echo.rs
+++ b/fuzz/fuzz_targets/fuzz_echo.rs
@@ -1,6 +1,6 @@
 #![no_main]
 use libfuzzer_sys::fuzz_target;
-use uu_echo::uumain; // Changed from uu_printf to uu_echo
+use uu_echo::uumain;
 
 use rand::prelude::SliceRandom;
 use rand::Rng;
@@ -12,7 +12,7 @@ use crate::fuzz_common::{
     compare_result, generate_and_run_uumain, generate_random_string, run_gnu_cmd,
 };
 
-static CMD_PATH: &str = "/usr/bin/echo"; // Changed from "printf" to "echo"
+static CMD_PATH: &str = "echo";
 
 fn generate_echo() -> String {
     let mut rng = rand::thread_rng();
@@ -22,7 +22,6 @@ fn generate_echo() -> String {
     let include_n = rng.gen_bool(0.1); // 10% chance
     let include_e = rng.gen_bool(0.1); // 10% chance
     let include_E = rng.gen_bool(0.1); // 10% chance
-                                       // --help and --version are typically not included in fuzzing as they don't change output format
 
     if include_n {
         echo_str.push_str("-n ");
@@ -41,29 +40,25 @@ fn generate_echo() -> String {
     if include_e {
         // Add a 10% chance of including an escape sequence
         if rng.gen_bool(0.1) {
-            echo_str.push_str(&generate_escape_sequence(&mut rng)); // This function should handle echo-specific sequences
+            echo_str.push_str(&generate_escape_sequence(&mut rng));
         }
     }
 
     echo_str
 }
 
-// You should also modify the generate_escape_sequence function to include echo-specific sequences
 fn generate_escape_sequence(rng: &mut impl Rng) -> String {
     let escape_sequences = [
-        "\\\\", "\\a", "\\b", "\\c", "\\e", "\\f", "\\n", "\\r", "\\t", "\\v",
-        "\\0NNN", // You can randomly generate NNN
-        "\\xHH",  // You can randomly generate HH
-                  // ... other sequences
+        "\\\\", "\\a", "\\b", "\\c", "\\e", "\\f", "\\n", "\\r", "\\t", "\\v", "\\0NNN", "\\xHH",
     ];
     escape_sequences.choose(rng).unwrap().to_string()
 }
 
 fuzz_target!(|_data: &[u8]| {
-    let echo_input = generate_echo(); // Changed from generate_printf to generate_echo
-    let mut args = vec![OsString::from("echo")]; // Changed from "printf" to "echo"
+    let echo_input = generate_echo();
+    let mut args = vec![OsString::from("echo")];
     args.extend(echo_input.split_whitespace().map(OsString::from));
-    let rust_result = generate_and_run_uumain(&args, uumain); // uumain function from uu_echo
+    let rust_result = generate_and_run_uumain(&args, uumain);
 
     let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false) {
         Ok(result) => result,
@@ -88,6 +83,6 @@ fuzz_target!(|_data: &[u8]| {
         &gnu_result.stderr,
         rust_result.exit_code,
         gnu_result.exit_code,
-        false, // Set to true if you want to fail on stderr diff
+        true,
     );
 });

From 9061b2ba7e1267cd6c8466108ecb197614ce29ea Mon Sep 17 00:00:00 2001
From: clara swanson <69856940+cswn@users.noreply.github.com>
Date: Thu, 30 Nov 2023 11:01:31 +0100
Subject: [PATCH 095/429] libstdbuf: remove crash macro (#5565)

* libstdbuf: remove crash macro

* libstdbuf: remove uucore macro/struct and use gnu messages

* libstdbuf: remove crash macro

* libstdbuf: remove uucore macro/struct and use gnu messages

* libstdbuf: remove :? from print by printing file descriptor instead of file

* merge main into libstdbuf-remove-crash-macro

* libstdbuf: remove uucore from dependencies
---
 Cargo.lock                                   |  1 -
 src/uu/stdbuf/src/libstdbuf/Cargo.toml       |  1 -
 src/uu/stdbuf/src/libstdbuf/src/libstdbuf.rs | 14 ++++++++++----
 3 files changed, 10 insertions(+), 6 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 3f5e4280964..bf638b421a1 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -2952,7 +2952,6 @@ dependencies = [
  "cpp",
  "cpp_build",
  "libc",
- "uucore",
 ]
 
 [[package]]
diff --git a/src/uu/stdbuf/src/libstdbuf/Cargo.toml b/src/uu/stdbuf/src/libstdbuf/Cargo.toml
index be97c47aeaf..eaa82e6e73d 100644
--- a/src/uu/stdbuf/src/libstdbuf/Cargo.toml
+++ b/src/uu/stdbuf/src/libstdbuf/Cargo.toml
@@ -22,7 +22,6 @@ crate-type = [
 [dependencies]
 cpp = "0.5"
 libc = { workspace = true }
-uucore = { version = ">=0.0.19", package = "uucore", path = "../../../../uucore" }
 
 [build-dependencies]
 cpp_build = "0.5"
diff --git a/src/uu/stdbuf/src/libstdbuf/src/libstdbuf.rs b/src/uu/stdbuf/src/libstdbuf/src/libstdbuf.rs
index a29d01b78f3..d744ca4c545 100644
--- a/src/uu/stdbuf/src/libstdbuf/src/libstdbuf.rs
+++ b/src/uu/stdbuf/src/libstdbuf/src/libstdbuf.rs
@@ -5,10 +5,9 @@
 // spell-checker:ignore (ToDO) IOFBF IOLBF IONBF cstdio setvbuf
 
 use cpp::cpp;
-use libc::{c_char, c_int, size_t, FILE, _IOFBF, _IOLBF, _IONBF};
+use libc::{c_char, c_int, fileno, size_t, FILE, _IOFBF, _IOLBF, _IONBF};
 use std::env;
 use std::ptr;
-use uucore::crash;
 
 cpp! {{
     #include <cstdio>
@@ -40,7 +39,10 @@ fn set_buffer(stream: *mut FILE, value: &str) {
         input => {
             let buff_size: usize = match input.parse() {
                 Ok(num) => num,
-                Err(e) => crash!(1, "incorrect size of buffer!: {}", e),
+                Err(_) => {
+                    eprintln!("failed to allocate a {} byte stdio buffer", value);
+                    std::process::exit(1);
+                }
             };
             (_IOFBF, buff_size as size_t)
         }
@@ -52,7 +54,11 @@ fn set_buffer(stream: *mut FILE, value: &str) {
         res = libc::setvbuf(stream, buffer, mode, size);
     }
     if res != 0 {
-        crash!(res, "error while calling setvbuf!");
+        eprintln!(
+            "could not set buffering of {} to mode {}",
+            unsafe { fileno(stream) },
+            mode
+        );
     }
 }
 

From 0ec6802459bf79d6f36c0289aa1cb262c40537ba Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Thu, 30 Nov 2023 16:13:54 +0100
Subject: [PATCH 096/429] ls: fix padding of size column when using -l

---
 src/uu/ls/src/ls.rs      |  2 +-
 tests/by-util/test_ls.rs | 15 +++++++++++++++
 2 files changed, 16 insertions(+), 1 deletion(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 88af56bb186..cba9cdf5375 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3228,7 +3228,7 @@ fn calculate_padding_collection(
                 padding_collections.minor = minor_len.max(padding_collections.minor);
                 padding_collections.size = size_len
                     .max(padding_collections.size)
-                    .max(padding_collections.major + padding_collections.minor + 2usize);
+                    .max(padding_collections.major);
             }
         }
     }
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 07ea8c9cd63..19a3f5578fa 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -1023,6 +1023,21 @@ fn test_ls_long_format() {
     ).unwrap());
 }
 
+#[test]
+fn test_ls_long_padding_of_size_column_with_multiple_files() {
+    let (at, mut ucmd) = at_and_ucmd!();
+
+    at.mkdir("dir");
+    at.touch("dir/a");
+    at.touch("dir/b");
+
+    ucmd.arg("-l")
+        .arg("dir")
+        .succeeds()
+        .stdout_contains(" 0 ")
+        .stdout_does_not_contain("  0 ");
+}
+
 /// This test tests `ls -laR --color`.
 /// This test is mainly about coloring, but, the recursion, symlink `->` processing,
 /// and `.` and `..` being present in `-a` all need to work for the test to pass.

From 8d591a7acce618ab3a9290f50487e9c0de22c5ed Mon Sep 17 00:00:00 2001
From: Piotr Kwiecinski <piotr.kwiecinski@codemanufacture.com>
Date: Thu, 30 Nov 2023 17:59:48 +0100
Subject: [PATCH 097/429] Bump freebsd-vm action to v1.0.2 & use ubuntu

---
 .github/workflows/freebsd.yml | 21 ++++++++++++---------
 1 file changed, 12 insertions(+), 9 deletions(-)

diff --git a/.github/workflows/freebsd.yml b/.github/workflows/freebsd.yml
index 5af3da320a7..b932f9aa8f5 100644
--- a/.github/workflows/freebsd.yml
+++ b/.github/workflows/freebsd.yml
@@ -25,7 +25,7 @@ jobs:
       fail-fast: false
       matrix:
         job:
-          - { os: macos-12 , features: unix } ## GHA MacOS-11.0 VM won't have VirtualBox; refs: <https://github.com/actions/virtual-environments/issues/4060> , <https://github.com/actions/virtual-environments/pull/4010>
+          - { os: ubuntu-22.04 , features: unix }
     env:
       SCCACHE_GHA_ENABLED: "true"
       RUSTC_WRAPPER: "sccache"
@@ -35,9 +35,11 @@ jobs:
     - name: Run sccache-cache
       uses: mozilla-actions/sccache-action@v0.0.3
     - name: Prepare, build and test
-      uses: vmactions/freebsd-vm@v0.3.1
+      uses: vmactions/freebsd-vm@v1.0.2
       with:
         usesh: true
+        sync: rsync
+        copyback: false
         # We need jq to run show-utils.sh and bash to use inline shell string replacement
         prepare: pkg install -y curl sudo jq bash
         run: |
@@ -48,11 +50,11 @@ jobs:
           #
           TEST_USER=tester
           REPO_NAME=${GITHUB_WORKSPACE##*/}
-          WORKSPACE_PARENT="/Users/runner/work/${REPO_NAME}"
+          WORKSPACE_PARENT="/home/runner/work/${REPO_NAME}"
           WORKSPACE="${WORKSPACE_PARENT}/${REPO_NAME}"
           #
           pw adduser -n ${TEST_USER} -d /root/ -g wheel -c "Coreutils user to build" -w random
-          chown -R ${TEST_USER}:wheel /root/ "/Users/runner/work/${REPO_NAME}"/
+          chown -R ${TEST_USER}:wheel /root/ "${WORKSPACE_PARENT}"/
           whoami
           #
           # Further work needs to be done in a sudo as we are changing users
@@ -114,7 +116,7 @@ jobs:
       fail-fast: false
       matrix:
         job:
-          - { os: macos-12 , features: unix } ## GHA MacOS-11.0 VM won't have VirtualBox; refs: <https://github.com/actions/virtual-environments/issues/4060> , <https://github.com/actions/virtual-environments/pull/4010>
+          - { os: ubuntu-22.04 , features: unix }
     env:
       mem: 4096
       SCCACHE_GHA_ENABLED: "true"
@@ -125,10 +127,11 @@ jobs:
     - name: Run sccache-cache
       uses: mozilla-actions/sccache-action@v0.0.3
     - name: Prepare, build and test
-      uses: vmactions/freebsd-vm@v0.3.1
+      uses: vmactions/freebsd-vm@v1.0.2
       with:
         usesh: true
-        # sync: sshfs
+        sync: rsync
+        copyback: false
         prepare: pkg install -y curl gmake sudo
         run: |
           ## Prepare, build, and test
@@ -141,12 +144,12 @@ jobs:
           #
           TEST_USER=tester
           REPO_NAME=${GITHUB_WORKSPACE##*/}
-          WORKSPACE_PARENT="/Users/runner/work/${REPO_NAME}"
+          WORKSPACE_PARENT="/home/runner/work/${REPO_NAME}"
           WORKSPACE="${WORKSPACE_PARENT}/${REPO_NAME}"
           #
           pw adduser -n ${TEST_USER} -d /root/ -g wheel -c "Coreutils user to build" -w random
           # chown -R ${TEST_USER}:wheel /root/ "${WORKSPACE_PARENT}"/
-          chown -R ${TEST_USER}:wheel /root/ "/Users/runner/work/${REPO_NAME}"/
+          chown -R ${TEST_USER}:wheel /root/ "${WORKSPACE_PARENT}"/
           whoami
           #
           # Further work needs to be done in a sudo as we are changing users

From c6e7fdcabe46e9bcd903567900c11d7e230f9c1f Mon Sep 17 00:00:00 2001
From: Piotr Kwiecinski <piotr.kwiecinski@codemanufacture.com>
Date: Thu, 30 Nov 2023 18:45:06 +0100
Subject: [PATCH 098/429] skip test_cp_arg_update_interactive on FreeBSD

---
 tests/by-util/test_cp.rs | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index 14b68da3718..36bca68b0d0 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -257,6 +257,8 @@ fn test_cp_target_directory_is_file() {
 }
 
 #[test]
+// FixMe: for FreeBSD, flaky test; track repair progress at GH:uutils/coreutils/issue/4725
+#[cfg(not(target_os = "freebsd"))]
 fn test_cp_arg_update_interactive() {
     new_ucmd!()
         .arg(TEST_HELLO_WORLD_SOURCE)

From 6b3f00cc3192624f2e0f763fef668de3cc9ab25d Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 1 Dec 2023 10:03:44 +0100
Subject: [PATCH 099/429] dd: skip two tests without "printf" feature

---
 tests/by-util/test_dd.rs | 21 ++++++++++++++++++---
 1 file changed, 18 insertions(+), 3 deletions(-)

diff --git a/tests/by-util/test_dd.rs b/tests/by-util/test_dd.rs
index a4c70097c8b..bd43ad077d3 100644
--- a/tests/by-util/test_dd.rs
+++ b/tests/by-util/test_dd.rs
@@ -15,7 +15,12 @@ use regex::Regex;
 use std::fs::{File, OpenOptions};
 use std::io::{BufReader, Read, Write};
 use std::path::PathBuf;
-#[cfg(all(unix, not(target_os = "macos"), not(target_os = "freebsd")))]
+#[cfg(all(
+    unix,
+    not(target_os = "macos"),
+    not(target_os = "freebsd"),
+    feature = "printf"
+))]
 use std::process::{Command, Stdio};
 #[cfg(not(windows))]
 use std::thread::sleep;
@@ -1586,7 +1591,12 @@ fn test_seek_past_dev() {
 }
 
 #[test]
-#[cfg(all(unix, not(target_os = "macos"), not(target_os = "freebsd")))]
+#[cfg(all(
+    unix,
+    not(target_os = "macos"),
+    not(target_os = "freebsd"),
+    feature = "printf"
+))]
 fn test_reading_partial_blocks_from_fifo() {
     // Create the FIFO.
     let ts = TestScenario::new(util_name!());
@@ -1622,7 +1632,12 @@ fn test_reading_partial_blocks_from_fifo() {
 }
 
 #[test]
-#[cfg(all(unix, not(target_os = "macos"), not(target_os = "freebsd")))]
+#[cfg(all(
+    unix,
+    not(target_os = "macos"),
+    not(target_os = "freebsd"),
+    feature = "printf"
+))]
 fn test_reading_partial_blocks_from_fifo_unbuffered() {
     // Create the FIFO.
     let ts = TestScenario::new(util_name!());

From 4d2bdf497ab030871a7a84191010637a355ffd7e Mon Sep 17 00:00:00 2001
From: Piotr Kwiecinski <piotr.kwiecinski@codemanufacture.com>
Date: Fri, 1 Dec 2023 11:52:23 +0100
Subject: [PATCH 100/429] prevent CI creating 2 events on each pull request
 push

---
 .github/workflows/CICD.yml         | 6 +++++-
 .github/workflows/GnuTests.yml     | 6 +++++-
 .github/workflows/android.yml      | 7 ++++++-
 .github/workflows/code-quality.yml | 6 +++++-
 .github/workflows/freebsd.yml      | 6 +++++-
 .github/workflows/fuzzing.yml      | 6 +++++-
 6 files changed, 31 insertions(+), 6 deletions(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index 8dfa0b1d103..8c96ce693ee 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -15,7 +15,11 @@ env:
   # * style job configuration
   STYLE_FAIL_ON_FAULT: true ## (bool) fail the build if a style job contains a fault (error or warning); may be overridden on a per-job basis
 
-on: [push, pull_request]
+on:
+  pull_request:
+  push:
+    branches:
+      - main
 
 permissions:
   contents: read # to fetch code (actions/checkout)
diff --git a/.github/workflows/GnuTests.yml b/.github/workflows/GnuTests.yml
index 61f30eba4c1..87e4373eddc 100644
--- a/.github/workflows/GnuTests.yml
+++ b/.github/workflows/GnuTests.yml
@@ -9,7 +9,11 @@ name: GnuTests
 
 # * note: to run a single test => `REPO/util/run-gnu-test.sh PATH/TO/TEST/SCRIPT`
 
-on: [push, pull_request]
+on:
+  pull_request:
+  push:
+    branches:
+      - main
 
 permissions:
   contents: read
diff --git a/.github/workflows/android.yml b/.github/workflows/android.yml
index 5834aceffe8..69ca970c0fa 100644
--- a/.github/workflows/android.yml
+++ b/.github/workflows/android.yml
@@ -2,7 +2,12 @@ name: Android
 
 # spell-checker:ignore TERMUX reactivecircus Swatinem  noaudio pkill swiftshader dtolnay juliangruber
 
-on: [push, pull_request]
+on:
+  pull_request:
+  push:
+    branches:
+      - main
+
 
 permissions:
   contents: read # to fetch code (actions/checkout)
diff --git a/.github/workflows/code-quality.yml b/.github/workflows/code-quality.yml
index 98691f34bc8..289830f8171 100644
--- a/.github/workflows/code-quality.yml
+++ b/.github/workflows/code-quality.yml
@@ -2,7 +2,11 @@ name: Code Quality
 
 # spell-checker:ignore TERMUX reactivecircus Swatinem  noaudio pkill swiftshader dtolnay juliangruber
 
-on: [push, pull_request]
+on:
+  pull_request:
+  push:
+    branches:
+      - main
 
 env:
   # * style job configuration
diff --git a/.github/workflows/freebsd.yml b/.github/workflows/freebsd.yml
index b932f9aa8f5..02c0137e7b2 100644
--- a/.github/workflows/freebsd.yml
+++ b/.github/workflows/freebsd.yml
@@ -6,7 +6,11 @@ env:
   # * style job configuration
   STYLE_FAIL_ON_FAULT: true ## (bool) fail the build if a style job contains a fault (error or warning); may be overridden on a per-job basis
 
-on: [push, pull_request]
+on:
+  pull_request:
+  push:
+    branches:
+      - main
 
 permissions:
   contents: read # to fetch code (actions/checkout)
diff --git a/.github/workflows/fuzzing.yml b/.github/workflows/fuzzing.yml
index 2274f6905c1..4e47ea0e281 100644
--- a/.github/workflows/fuzzing.yml
+++ b/.github/workflows/fuzzing.yml
@@ -2,7 +2,11 @@ name: Fuzzing
 
 # spell-checker:ignore fuzzer
 
-on: [push, pull_request]
+on:
+  pull_request:
+  push:
+    branches:
+      - main
 
 permissions:
   contents: read # to fetch code (actions/checkout)

From 13a4c9114c4574ee8d14ffe0bb6b326ad203375d Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 2 Dec 2023 10:28:45 +0100
Subject: [PATCH 101/429] create datastructures for colors

---
 src/uucore/src/lib/features.rs        |   2 +
 src/uucore/src/lib/features/colors.rs | 225 ++++++++++++++++++++++++++
 2 files changed, 227 insertions(+)
 create mode 100644 src/uucore/src/lib/features/colors.rs

diff --git a/src/uucore/src/lib/features.rs b/src/uucore/src/lib/features.rs
index 1d0d437824d..a28e8a7bfc9 100644
--- a/src/uucore/src/lib/features.rs
+++ b/src/uucore/src/lib/features.rs
@@ -6,6 +6,8 @@
 
 #[cfg(feature = "backup-control")]
 pub mod backup_control;
+#[cfg(feature = "colors")]
+pub mod colors;
 #[cfg(feature = "encoding")]
 pub mod encoding;
 #[cfg(feature = "format")]
diff --git a/src/uucore/src/lib/features/colors.rs b/src/uucore/src/lib/features/colors.rs
new file mode 100644
index 00000000000..58b0b757084
--- /dev/null
+++ b/src/uucore/src/lib/features/colors.rs
@@ -0,0 +1,225 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+/* The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the
+ * slackware version of dircolors) are recognized but ignored.
+ * Global config options can be specified before TERM or COLORTERM entries
+ * below are TERM or COLORTERM entries, which can be glob patterns, which
+ * restrict following config to systems with matching environment variables.
+ * COLORTERM ?*
+*/
+
+static TERMS: &[&str] = &[
+    "Eterm",
+    "ansi",
+    "*color*",
+    "con[0-9]*x[0-9]*",
+    "cons25",
+    "console",
+    "cygwin",
+    "*direct*",
+    "dtterm",
+    "gnome",
+    "hurd",
+    "jfbterm",
+    "konsole",
+    "kterm",
+    "linux",
+    "linux-c",
+    "mlterm",
+    "putty",
+    "rxvt*",
+    "screen*",
+    "st",
+    "terminator",
+    "tmux*",
+    "vt100",
+    "xterm*",
+];
+
+/*
+# Below are the color init strings for the basic file types.
+# One can use codes for 256 or more colors supported by modern terminals.
+# The default color codes use the capabilities of an 8 color terminal
+# with some additional attributes as per the following codes:
+# Attribute codes:
+# 00=none 01=bold 04=underscore 05=blink 07=reverse 08=concealed
+# Text color codes:
+# 30=black 31=red 32=green 33=yellow 34=blue 35=magenta 36=cyan 37=white
+# Background color codes:
+# 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white
+#NORMAL 00 # no color code at all
+#FILE 00 # regular file: use no color at all
+*/
+static FILE_TYPES: &[(&str, &str)] = &[
+    ("RESET", "0"),                     // reset to "normal" color
+    ("DIR", "01;34"),                   // directory
+    ("LINK", "01;36"),                  // symbolic link
+    ("MULTIHARDLINK", "00"),            // regular file with more than one link
+    ("FIFO", "40;33"),                  // pipe
+    ("SOCK", "01;35"),                  // socket
+    ("DOOR", "01;35"),                  // door
+    ("BLK", "40;33;01"),                // block device driver
+    ("CHR", "40;33;01"),                // character device driver
+    ("ORPHAN", "40;31;01"),             // symlink to nonexistent file, or non-stat'able file
+    ("MISSING", "00"),                  // ... and the files they point to
+    ("SETUID", "37;41"),                // file that is setuid (u+s)
+    ("SETGID", "30;43"),                // file that is setgid (g+s)
+    ("CAPABILITY", "00"),               // file with capability
+    ("STICKY_OTHER_WRITABLE", "30;42"), // dir that is sticky and other-writable (+t,o+w)
+    ("OTHER_WRITABLE", "34;42"),        // dir that is other-writable (o+w) and not sticky
+    ("STICKY", "37;44"),                // dir with the sticky bit set (+t) and not other-writable
+    ("EXEC", "01;32"),                  // files with execute permission
+];
+
+/*
+# List any file extensions like '.gz' or '.tar' that you would like ls
+# to color below. Put the extension, a space, and the color init string.
+# (and any comments you want to add after a '#')
+*/
+static FILE_COLORS: &[(&str, &str)] = &[
+    // Executables (Windows)
+    (".cmd", "01;32"),
+    (".exe", "01;32"),
+    (".com", "01;32"),
+    (".btm", "01;32"),
+    (".bat", "01;32"),
+    (".sh", "01;32"),
+    (".csh", "01;32"),
+    // Archives or compressed
+    (".tar", "01;31"),
+    (".tgz", "01;31"),
+    (".arc", "01;31"),
+    (".arj", "01;31"),
+    (".taz", "01;31"),
+    (".lha", "01;31"),
+    (".lz4", "01;31"),
+    (".lzh", "01;31"),
+    (".lzma", "01;31"),
+    (".tlz", "01;31"),
+    (".txz", "01;31"),
+    (".tzo", "01;31"),
+    (".t7z", "01;31"),
+    (".zip", "01;31"),
+    (".z", "01;31"),
+    (".dz", "01;31"),
+    (".gz", "01;31"),
+    (".lrz", "01;31"),
+    (".lz", "01;31"),
+    (".lzo", "01;31"),
+    (".xz", "01;31"),
+    (".zst", "01;31"),
+    (".tzst", "01;31"),
+    (".bz2", "01;31"),
+    (".bz", "01;31"),
+    (".tbz", "01;31"),
+    (".tbz2", "01;31"),
+    (".tz", "01;31"),
+    (".deb", "01;31"),
+    (".rpm", "01;31"),
+    (".jar", "01;31"),
+    (".war", "01;31"),
+    (".ear", "01;31"),
+    (".sar", "01;31"),
+    (".rar", "01;31"),
+    (".alz", "01;31"),
+    (".ace", "01;31"),
+    (".zoo", "01;31"),
+    (".cpio", "01;31"),
+    (".7z", "01;31"),
+    (".rz", "01;31"),
+    (".cab", "01;31"),
+    (".wim", "01;31"),
+    (".swm", "01;31"),
+    (".dwm", "01;31"),
+    (".esd", "01;31"),
+    // Image formats
+    (".avif", "01;35"),
+    (".jpg", "01;35"),
+    (".jpeg", "01;35"),
+    (".mjpg", "01;35"),
+    (".mjpeg", "01;35"),
+    (".gif", "01;35"),
+    (".bmp", "01;35"),
+    (".pbm", "01;35"),
+    (".pgm", "01;35"),
+    (".ppm", "01;35"),
+    (".tga", "01;35"),
+    (".xbm", "01;35"),
+    (".xpm", "01;35"),
+    (".tif", "01;35"),
+    (".tiff", "01;35"),
+    (".png", "01;35"),
+    (".svg", "01;35"),
+    (".svgz", "01;35"),
+    (".mng", "01;35"),
+    (".pcx", "01;35"),
+    (".mov", "01;35"),
+    (".mpg", "01;35"),
+    (".mpeg", "01;35"),
+    (".m2v", "01;35"),
+    (".mkv", "01;35"),
+    (".webm", "01;35"),
+    (".webp", "01;35"),
+    (".ogm", "01;35"),
+    (".mp4", "01;35"),
+    (".m4v", "01;35"),
+    (".mp4v", "01;35"),
+    (".vob", "01;35"),
+    (".qt", "01;35"),
+    (".nuv", "01;35"),
+    (".wmv", "01;35"),
+    (".asf", "01;35"),
+    (".rm", "01;35"),
+    (".rmvb", "01;35"),
+    (".flc", "01;35"),
+    (".avi", "01;35"),
+    (".fli", "01;35"),
+    (".flv", "01;35"),
+    (".gl", "01;35"),
+    (".dl", "01;35"),
+    (".xcf", "01;35"),
+    (".xwd", "01;35"),
+    (".yuv", "01;35"),
+    (".cgm", "01;35"),
+    (".emf", "01;35"),
+    (".ogv", "01;35"),
+    (".ogx", "01;35"),
+    // Audio formats
+    (".aac", "00;36"),
+    (".au", "00;36"),
+    (".flac", "00;36"),
+    (".m4a", "00;36"),
+    (".mid", "00;36"),
+    (".midi", "00;36"),
+    (".mka", "00;36"),
+    (".mp3", "00;36"),
+    (".mpc", "00;36"),
+    (".ogg", "00;36"),
+    (".ra", "00;36"),
+    (".wav", "00;36"),
+    (".oga", "00;36"),
+    (".opus", "00;36"),
+    (".spx", "00;36"),
+    (".xspf", "00;36"),
+    // Backup files
+    ("*~", "00;90"),
+    ("*#", "00;90"),
+    (".bak", "00;90"),
+    (".old", "00;90"),
+    (".orig", "00;90"),
+    (".part", "00;90"),
+    (".rej", "00;90"),
+    (".swp", "00;90"),
+    (".tmp", "00;90"),
+    (".dpkg-dist", "00;90"),
+    (".dpkg-old", "00;90"),
+    (".ucf-dist", "00;90"),
+    (".ucf-new", "00;90"),
+    (".ucf-old", "00;90"),
+    (".rpmnew", "00;90"),
+    (".rpmorig", "00;90"),
+    (".rpmsave", "00;90"),
+];

From 0e8c171c80ab35f4d16a2613700648ec059ebaa5 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 2 Dec 2023 11:00:55 +0100
Subject: [PATCH 102/429] dircolors: move the FILE_ATTRIBUTE_CODES
 datastructures and use it

---
 src/uu/dircolors/Cargo.toml           |   2 +-
 src/uu/dircolors/src/dircolors.rs     |  43 +--
 src/uucore/Cargo.toml                 |   1 +
 src/uucore/src/lib/features/colors.rs | 458 +++++++++++++++-----------
 src/uucore/src/lib/lib.rs             |   2 +
 5 files changed, 273 insertions(+), 233 deletions(-)

diff --git a/src/uu/dircolors/Cargo.toml b/src/uu/dircolors/Cargo.toml
index 6099b5a8428..66ee792f839 100644
--- a/src/uu/dircolors/Cargo.toml
+++ b/src/uu/dircolors/Cargo.toml
@@ -16,7 +16,7 @@ path = "src/dircolors.rs"
 
 [dependencies]
 clap = { workspace = true }
-uucore = { workspace = true }
+uucore = { workspace = true, features = ["colors"] }
 
 [[bin]]
 name = "dircolors"
diff --git a/src/uu/dircolors/src/dircolors.rs b/src/uu/dircolors/src/dircolors.rs
index 2e3087d810b..58228ddeb57 100644
--- a/src/uu/dircolors/src/dircolors.rs
+++ b/src/uu/dircolors/src/dircolors.rs
@@ -12,6 +12,7 @@ use std::io::{BufRead, BufReader};
 use std::path::Path;
 
 use clap::{crate_version, Arg, ArgAction, Command};
+use uucore::colors::FILE_ATTRIBUTE_CODES;
 use uucore::display::Quotable;
 use uucore::error::{UResult, USimpleError, UUsageError};
 use uucore::{help_about, help_section, help_usage};
@@ -276,7 +277,6 @@ enum ParseState {
     Pass,
 }
 
-use std::collections::HashMap;
 use uucore::{format_usage, parse_glob};
 
 #[allow(clippy::cognitive_complexity)]
@@ -294,45 +294,6 @@ where
         OutputFmt::Unknown => unreachable!(),
     }
 
-    let mut table: HashMap<&str, &str> = HashMap::with_capacity(48);
-    table.insert("normal", "no");
-    table.insert("norm", "no");
-    table.insert("file", "fi");
-    table.insert("reset", "rs");
-    table.insert("dir", "di");
-    table.insert("lnk", "ln");
-    table.insert("link", "ln");
-    table.insert("symlink", "ln");
-    table.insert("orphan", "or");
-    table.insert("missing", "mi");
-    table.insert("fifo", "pi");
-    table.insert("pipe", "pi");
-    table.insert("sock", "so");
-    table.insert("blk", "bd");
-    table.insert("block", "bd");
-    table.insert("chr", "cd");
-    table.insert("char", "cd");
-    table.insert("door", "do");
-    table.insert("exec", "ex");
-    table.insert("left", "lc");
-    table.insert("leftcode", "lc");
-    table.insert("right", "rc");
-    table.insert("rightcode", "rc");
-    table.insert("end", "ec");
-    table.insert("endcode", "ec");
-    table.insert("suid", "su");
-    table.insert("setuid", "su");
-    table.insert("sgid", "sg");
-    table.insert("setgid", "sg");
-    table.insert("sticky", "st");
-    table.insert("other_writable", "ow");
-    table.insert("owr", "ow");
-    table.insert("sticky_other_writable", "tw");
-    table.insert("owt", "tw");
-    table.insert("capability", "ca");
-    table.insert("multihardlink", "mh");
-    table.insert("clrtoeol", "cl");
-
     let term = env::var("TERM").unwrap_or_else(|_| "none".to_owned());
     let term = term.as_str();
 
@@ -384,7 +345,7 @@ where
                     }
                 } else if lower == "options" || lower == "color" || lower == "eightbit" {
                     // Slackware only. Ignore
-                } else if let Some(s) = table.get(lower.as_str()) {
+                } else if let Some(s) = FILE_ATTRIBUTE_CODES.get(lower.as_str()) {
                     if *fmt == OutputFmt::Display {
                         result.push_str(format!("\x1b[{val}m{s}\t{val}\x1b[0m\n").as_str());
                     } else {
diff --git a/src/uucore/Cargo.toml b/src/uucore/Cargo.toml
index b43445b4a92..44f8bb2d13f 100644
--- a/src/uucore/Cargo.toml
+++ b/src/uucore/Cargo.toml
@@ -72,6 +72,7 @@ windows-sys = { workspace = true, optional = true, default-features = false, fea
 default = []
 # * non-default features
 backup-control = []
+colors = []
 encoding = ["data-encoding", "data-encoding-macro", "z85", "thiserror"]
 entries = ["libc"]
 fs = ["dunce", "libc", "winapi-util", "windows-sys"]
diff --git a/src/uucore/src/lib/features/colors.rs b/src/uucore/src/lib/features/colors.rs
index 58b0b757084..69be16ba291 100644
--- a/src/uucore/src/lib/features/colors.rs
+++ b/src/uucore/src/lib/features/colors.rs
@@ -3,6 +3,9 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
+use once_cell::sync::Lazy;
+use std::collections::HashMap;
+
 /* The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the
  * slackware version of dircolors) are recognized but ignored.
  * Global config options can be specified before TERM or COLORTERM entries
@@ -11,33 +14,41 @@
  * COLORTERM ?*
 */
 
-static TERMS: &[&str] = &[
-    "Eterm",
-    "ansi",
-    "*color*",
-    "con[0-9]*x[0-9]*",
-    "cons25",
-    "console",
-    "cygwin",
-    "*direct*",
-    "dtterm",
-    "gnome",
-    "hurd",
-    "jfbterm",
-    "konsole",
-    "kterm",
-    "linux",
-    "linux-c",
-    "mlterm",
-    "putty",
-    "rxvt*",
-    "screen*",
-    "st",
-    "terminator",
-    "tmux*",
-    "vt100",
-    "xterm*",
-];
+pub static TERMS: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
+    let mut m = HashMap::new();
+    [
+        "Eterm",
+        "ansi",
+        "*color*",
+        "con[0-9]*x[0-9]*",
+        "cons25",
+        "console",
+        "cygwin",
+        "*direct*",
+        "dtterm",
+        "gnome",
+        "hurd",
+        "jfbterm",
+        "konsole",
+        "kterm",
+        "linux",
+        "linux-c",
+        "mlterm",
+        "putty",
+        "rxvt*",
+        "screen*",
+        "st",
+        "terminator",
+        "tmux*",
+        "vt100",
+        "xterm*",
+    ]
+    .iter()
+    .for_each(|&term| {
+        m.insert(term, "");
+    });
+    m
+});
 
 /*
 # Below are the color init strings for the basic file types.
@@ -53,173 +64,238 @@ static TERMS: &[&str] = &[
 #NORMAL 00 # no color code at all
 #FILE 00 # regular file: use no color at all
 */
-static FILE_TYPES: &[(&str, &str)] = &[
-    ("RESET", "0"),                     // reset to "normal" color
-    ("DIR", "01;34"),                   // directory
-    ("LINK", "01;36"),                  // symbolic link
-    ("MULTIHARDLINK", "00"),            // regular file with more than one link
-    ("FIFO", "40;33"),                  // pipe
-    ("SOCK", "01;35"),                  // socket
-    ("DOOR", "01;35"),                  // door
-    ("BLK", "40;33;01"),                // block device driver
-    ("CHR", "40;33;01"),                // character device driver
-    ("ORPHAN", "40;31;01"),             // symlink to nonexistent file, or non-stat'able file
-    ("MISSING", "00"),                  // ... and the files they point to
-    ("SETUID", "37;41"),                // file that is setuid (u+s)
-    ("SETGID", "30;43"),                // file that is setgid (g+s)
-    ("CAPABILITY", "00"),               // file with capability
-    ("STICKY_OTHER_WRITABLE", "30;42"), // dir that is sticky and other-writable (+t,o+w)
-    ("OTHER_WRITABLE", "34;42"),        // dir that is other-writable (o+w) and not sticky
-    ("STICKY", "37;44"),                // dir with the sticky bit set (+t) and not other-writable
-    ("EXEC", "01;32"),                  // files with execute permission
-];
+// FILE_TYPES with Lazy initialization
+pub static FILE_TYPES: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
+    let mut m = HashMap::new();
+    [
+        ("RESET", "0"),                     // reset to "normal" color
+        ("DIR", "01;34"),                   // directory
+        ("LINK", "01;36"),                  // symbolic link
+        ("MULTIHARDLINK", "00"),            // regular file with more than one link
+        ("FIFO", "40;33"),                  // pipe
+        ("SOCK", "01;35"),                  // socket
+        ("DOOR", "01;35"),                  // door
+        ("BLK", "40;33;01"),                // block device driver
+        ("CHR", "40;33;01"),                // character device driver
+        ("ORPHAN", "40;31;01"),             // symlink to nonexistent file, or non-stat'able file
+        ("MISSING", "00"),                  // ... and the files they point to
+        ("SETUID", "37;41"),                // file that is setuid (u+s)
+        ("SETGID", "30;43"),                // file that is setgid (g+s)
+        ("CAPABILITY", "00"),               // file with capability
+        ("STICKY_OTHER_WRITABLE", "30;42"), // dir that is sticky and other-writable (+t,o+w)
+        ("OTHER_WRITABLE", "34;42"),        // dir that is other-writable (o+w) and not sticky
+        ("STICKY", "37;44"), // dir with the sticky bit set (+t) and not other-writable
+        ("EXEC", "01;32"),   // files with execute permission
+    ]
+    .iter()
+    .for_each(|&(k, v)| {
+        m.insert(k, v);
+    });
+    m
+});
 
 /*
 # List any file extensions like '.gz' or '.tar' that you would like ls
 # to color below. Put the extension, a space, and the color init string.
 # (and any comments you want to add after a '#')
 */
-static FILE_COLORS: &[(&str, &str)] = &[
-    // Executables (Windows)
-    (".cmd", "01;32"),
-    (".exe", "01;32"),
-    (".com", "01;32"),
-    (".btm", "01;32"),
-    (".bat", "01;32"),
-    (".sh", "01;32"),
-    (".csh", "01;32"),
-    // Archives or compressed
-    (".tar", "01;31"),
-    (".tgz", "01;31"),
-    (".arc", "01;31"),
-    (".arj", "01;31"),
-    (".taz", "01;31"),
-    (".lha", "01;31"),
-    (".lz4", "01;31"),
-    (".lzh", "01;31"),
-    (".lzma", "01;31"),
-    (".tlz", "01;31"),
-    (".txz", "01;31"),
-    (".tzo", "01;31"),
-    (".t7z", "01;31"),
-    (".zip", "01;31"),
-    (".z", "01;31"),
-    (".dz", "01;31"),
-    (".gz", "01;31"),
-    (".lrz", "01;31"),
-    (".lz", "01;31"),
-    (".lzo", "01;31"),
-    (".xz", "01;31"),
-    (".zst", "01;31"),
-    (".tzst", "01;31"),
-    (".bz2", "01;31"),
-    (".bz", "01;31"),
-    (".tbz", "01;31"),
-    (".tbz2", "01;31"),
-    (".tz", "01;31"),
-    (".deb", "01;31"),
-    (".rpm", "01;31"),
-    (".jar", "01;31"),
-    (".war", "01;31"),
-    (".ear", "01;31"),
-    (".sar", "01;31"),
-    (".rar", "01;31"),
-    (".alz", "01;31"),
-    (".ace", "01;31"),
-    (".zoo", "01;31"),
-    (".cpio", "01;31"),
-    (".7z", "01;31"),
-    (".rz", "01;31"),
-    (".cab", "01;31"),
-    (".wim", "01;31"),
-    (".swm", "01;31"),
-    (".dwm", "01;31"),
-    (".esd", "01;31"),
-    // Image formats
-    (".avif", "01;35"),
-    (".jpg", "01;35"),
-    (".jpeg", "01;35"),
-    (".mjpg", "01;35"),
-    (".mjpeg", "01;35"),
-    (".gif", "01;35"),
-    (".bmp", "01;35"),
-    (".pbm", "01;35"),
-    (".pgm", "01;35"),
-    (".ppm", "01;35"),
-    (".tga", "01;35"),
-    (".xbm", "01;35"),
-    (".xpm", "01;35"),
-    (".tif", "01;35"),
-    (".tiff", "01;35"),
-    (".png", "01;35"),
-    (".svg", "01;35"),
-    (".svgz", "01;35"),
-    (".mng", "01;35"),
-    (".pcx", "01;35"),
-    (".mov", "01;35"),
-    (".mpg", "01;35"),
-    (".mpeg", "01;35"),
-    (".m2v", "01;35"),
-    (".mkv", "01;35"),
-    (".webm", "01;35"),
-    (".webp", "01;35"),
-    (".ogm", "01;35"),
-    (".mp4", "01;35"),
-    (".m4v", "01;35"),
-    (".mp4v", "01;35"),
-    (".vob", "01;35"),
-    (".qt", "01;35"),
-    (".nuv", "01;35"),
-    (".wmv", "01;35"),
-    (".asf", "01;35"),
-    (".rm", "01;35"),
-    (".rmvb", "01;35"),
-    (".flc", "01;35"),
-    (".avi", "01;35"),
-    (".fli", "01;35"),
-    (".flv", "01;35"),
-    (".gl", "01;35"),
-    (".dl", "01;35"),
-    (".xcf", "01;35"),
-    (".xwd", "01;35"),
-    (".yuv", "01;35"),
-    (".cgm", "01;35"),
-    (".emf", "01;35"),
-    (".ogv", "01;35"),
-    (".ogx", "01;35"),
-    // Audio formats
-    (".aac", "00;36"),
-    (".au", "00;36"),
-    (".flac", "00;36"),
-    (".m4a", "00;36"),
-    (".mid", "00;36"),
-    (".midi", "00;36"),
-    (".mka", "00;36"),
-    (".mp3", "00;36"),
-    (".mpc", "00;36"),
-    (".ogg", "00;36"),
-    (".ra", "00;36"),
-    (".wav", "00;36"),
-    (".oga", "00;36"),
-    (".opus", "00;36"),
-    (".spx", "00;36"),
-    (".xspf", "00;36"),
-    // Backup files
-    ("*~", "00;90"),
-    ("*#", "00;90"),
-    (".bak", "00;90"),
-    (".old", "00;90"),
-    (".orig", "00;90"),
-    (".part", "00;90"),
-    (".rej", "00;90"),
-    (".swp", "00;90"),
-    (".tmp", "00;90"),
-    (".dpkg-dist", "00;90"),
-    (".dpkg-old", "00;90"),
-    (".ucf-dist", "00;90"),
-    (".ucf-new", "00;90"),
-    (".ucf-old", "00;90"),
-    (".rpmnew", "00;90"),
-    (".rpmorig", "00;90"),
-    (".rpmsave", "00;90"),
-];
+pub static FILE_COLORS: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
+    let mut m = HashMap::new();
+    [
+        // Executables (Windows)
+        (".cmd", "01;32"),
+        (".exe", "01;32"),
+        (".com", "01;32"),
+        (".btm", "01;32"),
+        (".bat", "01;32"),
+        (".sh", "01;32"),
+        (".csh", "01;32"),
+        // Archives or compressed
+        (".tar", "01;31"),
+        (".tgz", "01;31"),
+        (".arc", "01;31"),
+        (".arj", "01;31"),
+        (".taz", "01;31"),
+        (".lha", "01;31"),
+        (".lz4", "01;31"),
+        (".lzh", "01;31"),
+        (".lzma", "01;31"),
+        (".tlz", "01;31"),
+        (".txz", "01;31"),
+        (".tzo", "01;31"),
+        (".t7z", "01;31"),
+        (".zip", "01;31"),
+        (".z", "01;31"),
+        (".dz", "01;31"),
+        (".gz", "01;31"),
+        (".lrz", "01;31"),
+        (".lz", "01;31"),
+        (".lzo", "01;31"),
+        (".xz", "01;31"),
+        (".zst", "01;31"),
+        (".tzst", "01;31"),
+        (".bz2", "01;31"),
+        (".bz", "01;31"),
+        (".tbz", "01;31"),
+        (".tbz2", "01;31"),
+        (".tz", "01;31"),
+        (".deb", "01;31"),
+        (".rpm", "01;31"),
+        (".jar", "01;31"),
+        (".war", "01;31"),
+        (".ear", "01;31"),
+        (".sar", "01;31"),
+        (".rar", "01;31"),
+        (".alz", "01;31"),
+        (".ace", "01;31"),
+        (".zoo", "01;31"),
+        (".cpio", "01;31"),
+        (".7z", "01;31"),
+        (".rz", "01;31"),
+        (".cab", "01;31"),
+        (".wim", "01;31"),
+        (".swm", "01;31"),
+        (".dwm", "01;31"),
+        (".esd", "01;31"),
+        // Image formats
+        (".avif", "01;35"),
+        (".jpg", "01;35"),
+        (".jpeg", "01;35"),
+        (".mjpg", "01;35"),
+        (".mjpeg", "01;35"),
+        (".gif", "01;35"),
+        (".bmp", "01;35"),
+        (".pbm", "01;35"),
+        (".pgm", "01;35"),
+        (".ppm", "01;35"),
+        (".tga", "01;35"),
+        (".xbm", "01;35"),
+        (".xpm", "01;35"),
+        (".tif", "01;35"),
+        (".tiff", "01;35"),
+        (".png", "01;35"),
+        (".svg", "01;35"),
+        (".svgz", "01;35"),
+        (".mng", "01;35"),
+        (".pcx", "01;35"),
+        (".mov", "01;35"),
+        (".mpg", "01;35"),
+        (".mpeg", "01;35"),
+        (".m2v", "01;35"),
+        (".mkv", "01;35"),
+        (".webm", "01;35"),
+        (".webp", "01;35"),
+        (".ogm", "01;35"),
+        (".mp4", "01;35"),
+        (".m4v", "01;35"),
+        (".mp4v", "01;35"),
+        (".vob", "01;35"),
+        (".qt", "01;35"),
+        (".nuv", "01;35"),
+        (".wmv", "01;35"),
+        (".asf", "01;35"),
+        (".rm", "01;35"),
+        (".rmvb", "01;35"),
+        (".flc", "01;35"),
+        (".avi", "01;35"),
+        (".fli", "01;35"),
+        (".flv", "01;35"),
+        (".gl", "01;35"),
+        (".dl", "01;35"),
+        (".xcf", "01;35"),
+        (".xwd", "01;35"),
+        (".yuv", "01;35"),
+        (".cgm", "01;35"),
+        (".emf", "01;35"),
+        (".ogv", "01;35"),
+        (".ogx", "01;35"),
+        // Audio formats
+        (".aac", "00;36"),
+        (".au", "00;36"),
+        (".flac", "00;36"),
+        (".m4a", "00;36"),
+        (".mid", "00;36"),
+        (".midi", "00;36"),
+        (".mka", "00;36"),
+        (".mp3", "00;36"),
+        (".mpc", "00;36"),
+        (".ogg", "00;36"),
+        (".ra", "00;36"),
+        (".wav", "00;36"),
+        (".oga", "00;36"),
+        (".opus", "00;36"),
+        (".spx", "00;36"),
+        (".xspf", "00;36"),
+        // Backup files
+        ("*~", "00;90"),
+        ("*#", "00;90"),
+        (".bak", "00;90"),
+        (".old", "00;90"),
+        (".orig", "00;90"),
+        (".part", "00;90"),
+        (".rej", "00;90"),
+        (".swp", "00;90"),
+        (".tmp", "00;90"),
+        (".dpkg-dist", "00;90"),
+        (".dpkg-old", "00;90"),
+        (".ucf-dist", "00;90"),
+        (".ucf-new", "00;90"),
+        (".ucf-old", "00;90"),
+        (".rpmnew", "00;90"),
+        (".rpmorig", "00;90"),
+        (".rpmsave", "00;90"),
+    ]
+    .iter()
+    .for_each(|&(k, v)| {
+        m.insert(k, v);
+    });
+    m
+});
+
+pub static FILE_ATTRIBUTE_CODES: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
+    let mut m = HashMap::new();
+    [
+        ("normal", "no"),
+        ("norm", "no"),
+        ("file", "fi"),
+        ("reset", "rs"),
+        ("dir", "di"),
+        ("lnk", "ln"),
+        ("link", "ln"),
+        ("symlink", "ln"),
+        ("orphan", "or"),
+        ("missing", "mi"),
+        ("fifo", "pi"),
+        ("pipe", "pi"),
+        ("sock", "so"),
+        ("blk", "bd"),
+        ("block", "bd"),
+        ("chr", "cd"),
+        ("char", "cd"),
+        ("door", "do"),
+        ("exec", "ex"),
+        ("left", "lc"),
+        ("leftcode", "lc"),
+        ("right", "rc"),
+        ("rightcode", "rc"),
+        ("end", "ec"),
+        ("endcode", "ec"),
+        ("suid", "su"),
+        ("setuid", "su"),
+        ("sgid", "sg"),
+        ("setgid", "sg"),
+        ("sticky", "st"),
+        ("other_writable", "ow"),
+        ("owr", "ow"),
+        ("sticky_other_writable", "tw"),
+        ("owt", "tw"),
+        ("capability", "ca"),
+        ("multihardlink", "mh"),
+        ("clrtoeol", "cl"),
+    ]
+    .iter()
+    .for_each(|&(k, v)| {
+        m.insert(k, v);
+    });
+    m
+});
diff --git a/src/uucore/src/lib/lib.rs b/src/uucore/src/lib/lib.rs
index af8668ef02f..426b4216ca2 100644
--- a/src/uucore/src/lib/lib.rs
+++ b/src/uucore/src/lib/lib.rs
@@ -35,6 +35,8 @@ pub use crate::parser::shortcut_value_parser;
 // * feature-gated modules
 #[cfg(feature = "backup-control")]
 pub use crate::features::backup_control;
+#[cfg(feature = "colors")]
+pub use crate::features::colors;
 #[cfg(feature = "encoding")]
 pub use crate::features::encoding;
 #[cfg(feature = "format")]

From 5d19f79cd0b791bf28c9c8d9d8f4fd61817f6026 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 2 Dec 2023 12:57:38 +0100
Subject: [PATCH 103/429] dircolors should use the datastructures when printing

---
 src/uu/dircolors/src/dircolors.rs     | 119 ++++++++++++++++++++++----
 src/uucore/src/lib/features/colors.rs |  89 +++++++------------
 2 files changed, 134 insertions(+), 74 deletions(-)

diff --git a/src/uu/dircolors/src/dircolors.rs b/src/uu/dircolors/src/dircolors.rs
index 58228ddeb57..43e35c3d2a9 100644
--- a/src/uu/dircolors/src/dircolors.rs
+++ b/src/uu/dircolors/src/dircolors.rs
@@ -12,7 +12,7 @@ use std::io::{BufRead, BufReader};
 use std::path::Path;
 
 use clap::{crate_version, Arg, ArgAction, Command};
-use uucore::colors::FILE_ATTRIBUTE_CODES;
+use uucore::colors::{FILE_ATTRIBUTE_CODES, FILE_COLORS, FILE_TYPES};
 use uucore::display::Quotable;
 use uucore::error::{UResult, USimpleError, UUsageError};
 use uucore::{help_about, help_section, help_usage};
@@ -58,6 +58,89 @@ pub fn guess_syntax() -> OutputFmt {
     }
 }
 
+fn get_colors_format_strings(fmt: &OutputFmt) -> (String, String) {
+    let prefix = match fmt {
+        OutputFmt::Shell => "LS_COLORS='".to_string(),
+        OutputFmt::CShell => "setenv LS_COLORS '".to_string(),
+        OutputFmt::Display => String::new(),
+        OutputFmt::Unknown => unreachable!(),
+    };
+
+    let suffix = match fmt {
+        OutputFmt::Shell => "';\nexport LS_COLORS".to_string(),
+        OutputFmt::CShell => "'".to_string(),
+        OutputFmt::Display => String::new(),
+        OutputFmt::Unknown => unreachable!(),
+    };
+
+    (prefix, suffix)
+}
+
+pub fn generate_type_output(fmt: &OutputFmt) -> String {
+    match fmt {
+        OutputFmt::Display => FILE_TYPES
+            .iter()
+            .map(|&(_, key, val)| format!("\x1b[{}m{}\t{}\x1b[0m", val, key, val))
+            .collect::<Vec<String>>()
+            .join("\n"),
+        _ => {
+            // Existing logic for other formats
+            FILE_TYPES
+                .iter()
+                .map(|&(_, v1, v2)| format!("{}={}", v1, v2))
+                .collect::<Vec<String>>()
+                .join(":")
+        }
+    }
+}
+
+enum ExtensionFormat {
+    StarDot, // Format as ".*ext"
+    Dot,     // Format as ".ext"
+    NoDot,   // Format as "ext"
+}
+
+fn generate_ls_colors(fmt: &OutputFmt, format: ExtensionFormat, sep: &str) -> String {
+    match fmt {
+        OutputFmt::Display => {
+            let mut display_parts = vec![];
+            let type_output = generate_type_output(fmt);
+            display_parts.push(type_output);
+            for &(extension, code) in FILE_COLORS.iter() {
+                display_parts.push(format!("\x1b[{}m*{}\t{}\x1b[0m", code, extension, code));
+            }
+            display_parts.join("\n")
+        }
+        _ => {
+            // existing logic for other formats
+            let mut parts = vec![];
+            for &(extension, code) in FILE_COLORS.iter() {
+                let formatted_extension = match format {
+                    ExtensionFormat::StarDot => format!("*{}", extension),
+                    ExtensionFormat::Dot => extension.to_string(),
+                    ExtensionFormat::NoDot => {
+                        if extension.starts_with('.') {
+                            extension[1..].to_string()
+                        } else {
+                            extension.to_string()
+                        }
+                    }
+                };
+                parts.push(format!("{}={}", formatted_extension, code));
+            }
+            let (prefix, suffix) = get_colors_format_strings(&fmt);
+            let ls_colors = parts.join(sep);
+            format!(
+                "{}{}:{}:{}",
+                prefix,
+                generate_type_output(&fmt),
+                ls_colors,
+                suffix
+            )
+        }
+    }
+}
+
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let args = args.collect_ignore();
@@ -126,7 +209,12 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     let result;
     if files.is_empty() {
-        result = parse(INTERNAL_DB.lines(), &out_format, "");
+        println!(
+            "{}",
+            generate_ls_colors(&out_format, ExtensionFormat::StarDot, ":")
+        );
+
+        return Ok(());
     } else if files.len() > 1 {
         return Err(UUsageError::new(
             1,
@@ -287,12 +375,9 @@ where
 {
     // 1790 > $(dircolors | wc -m)
     let mut result = String::with_capacity(1790);
-    match fmt {
-        OutputFmt::Shell => result.push_str("LS_COLORS='"),
-        OutputFmt::CShell => result.push_str("setenv LS_COLORS '"),
-        OutputFmt::Display => (),
-        OutputFmt::Unknown => unreachable!(),
-    }
+    let (prefix, suffix) = get_colors_format_strings(&fmt);
+
+    result.push_str(&prefix);
 
     let term = env::var("TERM").unwrap_or_else(|_| "none".to_owned());
     let term = term.as_str();
@@ -331,6 +416,7 @@ where
                 state = ParseState::Continue;
             }
             if state != ParseState::Pass {
+                let search_key = lower.as_str();
                 if key.starts_with('.') {
                     if *fmt == OutputFmt::Display {
                         result.push_str(format!("\x1b[{val}m*{key}\t{val}\x1b[0m\n").as_str());
@@ -345,7 +431,10 @@ where
                     }
                 } else if lower == "options" || lower == "color" || lower == "eightbit" {
                     // Slackware only. Ignore
-                } else if let Some(s) = FILE_ATTRIBUTE_CODES.get(lower.as_str()) {
+                } else if let Some((_, s)) = FILE_ATTRIBUTE_CODES
+                    .iter()
+                    .find(|&&(key, _)| key == search_key)
+                {
                     if *fmt == OutputFmt::Display {
                         result.push_str(format!("\x1b[{val}m{s}\t{val}\x1b[0m\n").as_str());
                     } else {
@@ -363,15 +452,11 @@ where
         }
     }
 
-    match fmt {
-        OutputFmt::Shell => result.push_str("';\nexport LS_COLORS"),
-        OutputFmt::CShell => result.push('\''),
-        OutputFmt::Display => {
-            // remove latest "\n"
-            result.pop();
-        }
-        OutputFmt::Unknown => unreachable!(),
+    if fmt == &OutputFmt::Display {
+        // remove latest "\n"
+        result.pop();
     }
+    result.push_str(&suffix);
 
     Ok(result)
 }
diff --git a/src/uucore/src/lib/features/colors.rs b/src/uucore/src/lib/features/colors.rs
index 69be16ba291..96ca6d45672 100644
--- a/src/uucore/src/lib/features/colors.rs
+++ b/src/uucore/src/lib/features/colors.rs
@@ -4,19 +4,15 @@
 // file that was distributed with this source code.
 
 use once_cell::sync::Lazy;
-use std::collections::HashMap;
 
 /* The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the
  * slackware version of dircolors) are recognized but ignored.
  * Global config options can be specified before TERM or COLORTERM entries
  * below are TERM or COLORTERM entries, which can be glob patterns, which
  * restrict following config to systems with matching environment variables.
- * COLORTERM ?*
 */
-
-pub static TERMS: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
-    let mut m = HashMap::new();
-    [
+pub static TERMS: Lazy<Vec<&str>> = Lazy::new(|| {
+    vec![
         "Eterm",
         "ansi",
         "*color*",
@@ -43,11 +39,6 @@ pub static TERMS: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
         "vt100",
         "xterm*",
     ]
-    .iter()
-    .for_each(|&term| {
-        m.insert(term, "");
-    });
-    m
 });
 
 /*
@@ -64,34 +55,27 @@ pub static TERMS: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
 #NORMAL 00 # no color code at all
 #FILE 00 # regular file: use no color at all
 */
-// FILE_TYPES with Lazy initialization
-pub static FILE_TYPES: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
-    let mut m = HashMap::new();
-    [
-        ("RESET", "0"),                     // reset to "normal" color
-        ("DIR", "01;34"),                   // directory
-        ("LINK", "01;36"),                  // symbolic link
-        ("MULTIHARDLINK", "00"),            // regular file with more than one link
-        ("FIFO", "40;33"),                  // pipe
-        ("SOCK", "01;35"),                  // socket
-        ("DOOR", "01;35"),                  // door
-        ("BLK", "40;33;01"),                // block device driver
-        ("CHR", "40;33;01"),                // character device driver
-        ("ORPHAN", "40;31;01"),             // symlink to nonexistent file, or non-stat'able file
-        ("MISSING", "00"),                  // ... and the files they point to
-        ("SETUID", "37;41"),                // file that is setuid (u+s)
-        ("SETGID", "30;43"),                // file that is setgid (g+s)
-        ("CAPABILITY", "00"),               // file with capability
-        ("STICKY_OTHER_WRITABLE", "30;42"), // dir that is sticky and other-writable (+t,o+w)
-        ("OTHER_WRITABLE", "34;42"),        // dir that is other-writable (o+w) and not sticky
-        ("STICKY", "37;44"), // dir with the sticky bit set (+t) and not other-writable
-        ("EXEC", "01;32"),   // files with execute permission
+pub static FILE_TYPES: Lazy<Vec<(&'static str, &'static str, &'static str)>> = Lazy::new(|| {
+    vec![
+        ("RESET", "rs", "0"),                     // reset to "normal" color
+        ("DIR", "di", "01;34"),                   // directory
+        ("LINK", "ln", "01;36"),                  // symbolic link
+        ("MULTIHARDLINK", "mh", "00"),            // regular file with more than one link
+        ("FIFO", "pi", "40;33"),                  // pipe
+        ("SOCK", "so", "01;35"),                  // socket
+        ("DOOR", "do", "01;35"),                  // door
+        ("BLK", "bd", "40;33;01"),                // block device driver
+        ("CHR", "cd", "40;33;01"),                // character device driver
+        ("ORPHAN", "or", "40;31;01"), // symlink to nonexistent file, or non-stat'able file
+        ("MISSING", "mi", "00"),      // ... and the files they point to
+        ("SETUID", "su", "37;41"),    // file that is setuid (u+s)
+        ("SETGID", "sg", "30;43"),    // file that is setgid (g+s)
+        ("CAPABILITY", "ca", "00"),   // file with capability
+        ("STICKY_OTHER_WRITABLE", "tw", "30;42"), // dir that is sticky and other-writable (+t,o+w)
+        ("OTHER_WRITABLE", "ow", "34;42"), // dir that is other-writable (o+w) and not sticky
+        ("STICKY", "st", "37;44"),    // dir with the sticky bit set (+t) and not other-writable
+        ("EXEC", "ex", "01;32"),      // files with execute permission
     ]
-    .iter()
-    .for_each(|&(k, v)| {
-        m.insert(k, v);
-    });
-    m
 });
 
 /*
@@ -99,9 +83,9 @@ pub static FILE_TYPES: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
 # to color below. Put the extension, a space, and the color init string.
 # (and any comments you want to add after a '#')
 */
-pub static FILE_COLORS: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
-    let mut m = HashMap::new();
-    [
+pub static FILE_COLORS: Lazy<Vec<(&str, &str)>> = Lazy::new(|| {
+    vec![
+        /*
         // Executables (Windows)
         (".cmd", "01;32"),
         (".exe", "01;32"),
@@ -109,7 +93,7 @@ pub static FILE_COLORS: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
         (".btm", "01;32"),
         (".bat", "01;32"),
         (".sh", "01;32"),
-        (".csh", "01;32"),
+        (".csh", "01;32"),*/
         // Archives or compressed
         (".tar", "01;31"),
         (".tgz", "01;31"),
@@ -207,6 +191,7 @@ pub static FILE_COLORS: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
         (".yuv", "01;35"),
         (".cgm", "01;35"),
         (".emf", "01;35"),
+        // https://wiki.xiph.org/MIME_Types_and_File_Extensions
         (".ogv", "01;35"),
         (".ogx", "01;35"),
         // Audio formats
@@ -222,13 +207,14 @@ pub static FILE_COLORS: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
         (".ogg", "00;36"),
         (".ra", "00;36"),
         (".wav", "00;36"),
+        // https://wiki.xiph.org/MIME_Types_and_File_Extensions
         (".oga", "00;36"),
         (".opus", "00;36"),
         (".spx", "00;36"),
         (".xspf", "00;36"),
         // Backup files
-        ("*~", "00;90"),
-        ("*#", "00;90"),
+        ("~", "00;90"),
+        ("#", "00;90"),
         (".bak", "00;90"),
         (".old", "00;90"),
         (".orig", "00;90"),
@@ -245,16 +231,10 @@ pub static FILE_COLORS: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
         (".rpmorig", "00;90"),
         (".rpmsave", "00;90"),
     ]
-    .iter()
-    .for_each(|&(k, v)| {
-        m.insert(k, v);
-    });
-    m
 });
 
-pub static FILE_ATTRIBUTE_CODES: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
-    let mut m = HashMap::new();
-    [
+pub static FILE_ATTRIBUTE_CODES: Lazy<Vec<(&str, &str)>> = Lazy::new(|| {
+    vec![
         ("normal", "no"),
         ("norm", "no"),
         ("file", "fi"),
@@ -293,9 +273,4 @@ pub static FILE_ATTRIBUTE_CODES: Lazy<HashMap<&str, &str>> = Lazy::new(|| {
         ("multihardlink", "mh"),
         ("clrtoeol", "cl"),
     ]
-    .iter()
-    .for_each(|&(k, v)| {
-        m.insert(k, v);
-    });
-    m
 });

From e4b875043429ac78f4ae4b2824caea3e8d180244 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 2 Dec 2023 15:06:09 +0100
Subject: [PATCH 104/429] dircolors -p: generate it dynamically

---
 src/uu/dircolors/src/colors.rs             | 225 ---------------------
 src/uu/dircolors/src/dircolors.rs          |  65 +++++-
 tests/fixtures/dircolors/internal.expected |  60 ++----
 3 files changed, 75 insertions(+), 275 deletions(-)
 delete mode 100644 src/uu/dircolors/src/colors.rs

diff --git a/src/uu/dircolors/src/colors.rs b/src/uu/dircolors/src/colors.rs
deleted file mode 100644
index c0a981db89c..00000000000
--- a/src/uu/dircolors/src/colors.rs
+++ /dev/null
@@ -1,225 +0,0 @@
-// This file is part of the uutils coreutils package.
-//
-// For the full copyright and license information, please view the LICENSE
-// file that was distributed with this source code.
-// spell-checker:ignore (ToDO) EIGHTBIT ETERM MULTIHARDLINK cpio dtterm jfbterm konsole kterm mlterm rmvb rxvt stat'able svgz tmux webm xspf COLORTERM tzst avif tzst mjpg mjpeg webp dpkg rpmnew rpmorig rpmsave
-
-pub const INTERNAL_DB: &str = r#"# Configuration file for dircolors, a utility to help you set the
-# LS_COLORS environment variable used by GNU ls with the --color option.
-# Copyright (C) 1996-2022 Free Software Foundation, Inc.
-# Copying and distribution of this file, with or without modification,
-# are permitted provided the copyright notice and this notice are preserved.
-# The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the
-# slackware version of dircolors) are recognized but ignored.
-# Global config options can be specified before TERM or COLORTERM entries
-# Below are TERM or COLORTERM entries, which can be glob patterns, which
-# restrict following config to systems with matching environment variables.
-COLORTERM ?*
-TERM Eterm
-TERM ansi
-TERM *color*
-TERM con[0-9]*x[0-9]*
-TERM cons25
-TERM console
-TERM cygwin
-TERM *direct*
-TERM dtterm
-TERM gnome
-TERM hurd
-TERM jfbterm
-TERM konsole
-TERM kterm
-TERM linux
-TERM linux-c
-TERM mlterm
-TERM putty
-TERM rxvt*
-TERM screen*
-TERM st
-TERM terminator
-TERM tmux*
-TERM vt100
-TERM xterm*
-# Below are the color init strings for the basic file types.
-# One can use codes for 256 or more colors supported by modern terminals.
-# The default color codes use the capabilities of an 8 color terminal
-# with some additional attributes as per the following codes:
-# Attribute codes:
-# 00=none 01=bold 04=underscore 05=blink 07=reverse 08=concealed
-# Text color codes:
-# 30=black 31=red 32=green 33=yellow 34=blue 35=magenta 36=cyan 37=white
-# Background color codes:
-# 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white
-#NORMAL 00 # no color code at all
-#FILE 00 # regular file: use no color at all
-RESET 0 # reset to "normal" color
-DIR 01;34 # directory
-LINK 01;36 # symbolic link. (If you set this to 'target' instead of a
- # numerical value, the color is as for the file pointed to.)
-MULTIHARDLINK 00 # regular file with more than one link
-FIFO 40;33 # pipe
-SOCK 01;35 # socket
-DOOR 01;35 # door
-BLK 40;33;01 # block device driver
-CHR 40;33;01 # character device driver
-ORPHAN 40;31;01 # symlink to nonexistent file, or non-stat'able file ...
-MISSING 00 # ... and the files they point to
-SETUID 37;41 # file that is setuid (u+s)
-SETGID 30;43 # file that is setgid (g+s)
-CAPABILITY 00 # file with capability (very expensive to lookup)
-STICKY_OTHER_WRITABLE 30;42 # dir that is sticky and other-writable (+t,o+w)
-OTHER_WRITABLE 34;42 # dir that is other-writable (o+w) and not sticky
-STICKY 37;44 # dir with the sticky bit set (+t) and not other-writable
-# This is for files with execute permission:
-EXEC 01;32
-# List any file extensions like '.gz' or '.tar' that you would like ls
-# to color below. Put the extension, a space, and the color init string.
-# (and any comments you want to add after a '#')
-# If you use DOS-style suffixes, you may want to uncomment the following:
-#.cmd 01;32 # executables (bright green)
-#.exe 01;32
-#.com 01;32
-#.btm 01;32
-#.bat 01;32
-# Or if you want to color scripts even if they do not have the
-# executable bit actually set.
-#.sh 01;32
-#.csh 01;32
- # archives or compressed (bright red)
-.tar 01;31
-.tgz 01;31
-.arc 01;31
-.arj 01;31
-.taz 01;31
-.lha 01;31
-.lz4 01;31
-.lzh 01;31
-.lzma 01;31
-.tlz 01;31
-.txz 01;31
-.tzo 01;31
-.t7z 01;31
-.zip 01;31
-.z 01;31
-.dz 01;31
-.gz 01;31
-.lrz 01;31
-.lz 01;31
-.lzo 01;31
-.xz 01;31
-.zst 01;31
-.tzst 01;31
-.bz2 01;31
-.bz 01;31
-.tbz 01;31
-.tbz2 01;31
-.tz 01;31
-.deb 01;31
-.rpm 01;31
-.jar 01;31
-.war 01;31
-.ear 01;31
-.sar 01;31
-.rar 01;31
-.alz 01;31
-.ace 01;31
-.zoo 01;31
-.cpio 01;31
-.7z 01;31
-.rz 01;31
-.cab 01;31
-.wim 01;31
-.swm 01;31
-.dwm 01;31
-.esd 01;31
-# image formats
-.avif 01;35
-.jpg 01;35
-.jpeg 01;35
-.mjpg 01;35
-.mjpeg 01;35
-.gif 01;35
-.bmp 01;35
-.pbm 01;35
-.pgm 01;35
-.ppm 01;35
-.tga 01;35
-.xbm 01;35
-.xpm 01;35
-.tif 01;35
-.tiff 01;35
-.png 01;35
-.svg 01;35
-.svgz 01;35
-.mng 01;35
-.pcx 01;35
-.mov 01;35
-.mpg 01;35
-.mpeg 01;35
-.m2v 01;35
-.mkv 01;35
-.webm 01;35
-.webp 01;35
-.ogm 01;35
-.mp4 01;35
-.m4v 01;35
-.mp4v 01;35
-.vob 01;35
-.qt 01;35
-.nuv 01;35
-.wmv 01;35
-.asf 01;35
-.rm 01;35
-.rmvb 01;35
-.flc 01;35
-.avi 01;35
-.fli 01;35
-.flv 01;35
-.gl 01;35
-.dl 01;35
-.xcf 01;35
-.xwd 01;35
-.yuv 01;35
-.cgm 01;35
-.emf 01;35
-# https://wiki.xiph.org/MIME_Types_and_File_Extensions
-.ogv 01;35
-.ogx 01;35
-# audio formats
-.aac 00;36
-.au 00;36
-.flac 00;36
-.m4a 00;36
-.mid 00;36
-.midi 00;36
-.mka 00;36
-.mp3 00;36
-.mpc 00;36
-.ogg 00;36
-.ra 00;36
-.wav 00;36
-# https://wiki.xiph.org/MIME_Types_and_File_Extensions
-.oga 00;36
-.opus 00;36
-.spx 00;36
-.xspf 00;36
-# backup files
-*~ 00;90
-*# 00;90
-.bak 00;90
-.old 00;90
-.orig 00;90
-.part 00;90
-.rej 00;90
-.swp 00;90
-.tmp 00;90
-.dpkg-dist 00;90
-.dpkg-old 00;90
-.ucf-dist 00;90
-.ucf-new 00;90
-.ucf-old 00;90
-.rpmnew 00;90
-.rpmorig 00;90
-.rpmsave 00;90
-# Subsequent TERM or COLORTERM entries, can be used to add / override
-# config specific to those matching environment variables."#;
diff --git a/src/uu/dircolors/src/dircolors.rs b/src/uu/dircolors/src/dircolors.rs
index 43e35c3d2a9..338bf83e514 100644
--- a/src/uu/dircolors/src/dircolors.rs
+++ b/src/uu/dircolors/src/dircolors.rs
@@ -10,9 +10,10 @@ use std::env;
 use std::fs::File;
 use std::io::{BufRead, BufReader};
 use std::path::Path;
+use std::fmt::Write;
 
 use clap::{crate_version, Arg, ArgAction, Command};
-use uucore::colors::{FILE_ATTRIBUTE_CODES, FILE_COLORS, FILE_TYPES};
+use uucore::colors::{FILE_ATTRIBUTE_CODES, FILE_COLORS, FILE_TYPES, TERMS};
 use uucore::display::Quotable;
 use uucore::error::{UResult, USimpleError, UUsageError};
 use uucore::{help_about, help_section, help_usage};
@@ -29,9 +30,6 @@ const USAGE: &str = help_usage!("dircolors.md");
 const ABOUT: &str = help_about!("dircolors.md");
 const AFTER_HELP: &str = help_section!("after help", "dircolors.md");
 
-mod colors;
-use self::colors::INTERNAL_DB;
-
 #[derive(PartialEq, Eq, Debug)]
 pub enum OutputFmt {
     Shell,
@@ -181,7 +179,8 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
                 ),
             ));
         }
-        println!("{INTERNAL_DB}");
+
+        println!("{}", generate_dircolors_config());
         return Ok(());
     }
 
@@ -222,6 +221,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         ));
     } else if files[0].eq("-") {
         let fin = BufReader::new(std::io::stdin());
+        // For example, for echo "owt 40;33"|dircolors -b -
         result = parse(fin.lines().map_while(Result::ok), &out_format, files[0]);
     } else {
         let path = Path::new(files[0]);
@@ -368,7 +368,7 @@ enum ParseState {
 use uucore::{format_usage, parse_glob};
 
 #[allow(clippy::cognitive_complexity)]
-fn parse<T>(lines: T, fmt: &OutputFmt, fp: &str) -> Result<String, String>
+fn parse<T>(user_input: T, fmt: &OutputFmt, fp: &str) -> Result<String, String>
 where
     T: IntoIterator,
     T::Item: Borrow<str>,
@@ -384,7 +384,7 @@ where
 
     let mut state = ParseState::Global;
 
-    for (num, line) in lines.into_iter().enumerate() {
+    for (num, line) in user_input.into_iter().enumerate() {
         let num = num + 1;
         let line = line.borrow().purify();
         if line.is_empty() {
@@ -396,13 +396,12 @@ where
         let (key, val) = line.split_two();
         if val.is_empty() {
             return Err(format!(
-                "{}:{}: invalid line;  missing second token",
+                "{}:{}: invalid line; missing second token",
                 fp.maybe_quote(),
                 num
             ));
         }
         let lower = key.to_lowercase();
-
         if lower == "term" || lower == "colorterm" {
             if term.fnmatch(val) {
                 state = ParseState::Matched;
@@ -417,6 +416,7 @@ where
             }
             if state != ParseState::Pass {
                 let search_key = lower.as_str();
+
                 if key.starts_with('.') {
                     if *fmt == OutputFmt::Display {
                         result.push_str(format!("\x1b[{val}m*{key}\t{val}\x1b[0m\n").as_str());
@@ -482,6 +482,53 @@ fn escape(s: &str) -> String {
     result
 }
 
+
+pub fn generate_dircolors_config() -> String {
+    let mut config = String::new();
+
+    // Adding the complete header comments as in the original file
+    writeln!(config, "# Configuration file for dircolors, a utility to help you set the").unwrap();
+    writeln!(config, "# LS_COLORS environment variable used by GNU ls with the --color option.").unwrap();
+    writeln!(config, "# The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the").unwrap();
+    writeln!(config, "# slackware version of dircolors) are recognized but ignored.").unwrap();
+    writeln!(config, "# Global config options can be specified before TERM or COLORTERM entries").unwrap();
+    writeln!(config, "# Below are TERM or COLORTERM entries, which can be glob patterns, which").unwrap();
+    writeln!(config, "# restrict following config to systems with matching environment variables.").unwrap();
+    writeln!(config, "COLORTERM ?*").unwrap();
+    for term in TERMS.iter() {
+        writeln!(config, "TERM {}", term).unwrap();
+    }
+
+    // Adding file types and their color codes with header
+    writeln!(config, "# Below are the color init strings for the basic file types.").unwrap();
+    writeln!(config, "# One can use codes for 256 or more colors supported by modern terminals.").unwrap();
+    writeln!(config, "# The default color codes use the capabilities of an 8 color terminal").unwrap();
+    writeln!(config, "# with some additional attributes as per the following codes:").unwrap();
+    writeln!(config, "# Attribute codes:").unwrap();
+    writeln!(config, "# 00=none 01=bold 04=underscore 05=blink 07=reverse 08=concealed").unwrap();
+    writeln!(config, "# Text color codes:").unwrap();
+    writeln!(config, "# 30=black 31=red 32=green 33=yellow 34=blue 35=magenta 36=cyan 37=white").unwrap();
+    writeln!(config, "# Background color codes:").unwrap();
+    writeln!(config, "# 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white").unwrap();
+    writeln!(config, "#NORMAL 00 # no color code at all").unwrap();
+    writeln!(config, "#FILE 00 # regular file: use no color at all").unwrap();
+
+    for (name, _, code) in FILE_TYPES.iter() {
+        writeln!(config, "{} {}", name, code).unwrap();
+    }
+
+    writeln!(config, "# List any file extensions like '.gz' or '.tar' that you would like ls").unwrap();
+    writeln!(config, "# to color below. Put the extension, a space, and the color init string.").unwrap();
+
+    for (ext, color) in FILE_COLORS.iter() {
+        writeln!(config, "{} {}", ext, color).unwrap();
+    }
+    writeln!(config, "# Subsequent TERM or COLORTERM entries, can be used to add / override").unwrap();
+    write!(config, "# config specific to those matching environment variables.").unwrap();
+
+    config
+}
+
 #[cfg(test)]
 mod tests {
     use super::escape;
diff --git a/tests/fixtures/dircolors/internal.expected b/tests/fixtures/dircolors/internal.expected
index 7bc91ef470c..933e70bc470 100644
--- a/tests/fixtures/dircolors/internal.expected
+++ b/tests/fixtures/dircolors/internal.expected
@@ -1,8 +1,5 @@
 # Configuration file for dircolors, a utility to help you set the
 # LS_COLORS environment variable used by GNU ls with the --color option.
-# Copyright (C) 1996-2022 Free Software Foundation, Inc.
-# Copying and distribution of this file, with or without modification,
-# are permitted provided the copyright notice and this notice are preserved.
 # The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the
 # slackware version of dircolors) are recognized but ignored.
 # Global config options can be specified before TERM or COLORTERM entries
@@ -46,40 +43,26 @@ TERM xterm*
 # 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white
 #NORMAL 00 # no color code at all
 #FILE 00 # regular file: use no color at all
-RESET 0 # reset to "normal" color
-DIR 01;34 # directory
-LINK 01;36 # symbolic link. (If you set this to 'target' instead of a
- # numerical value, the color is as for the file pointed to.)
-MULTIHARDLINK 00 # regular file with more than one link
-FIFO 40;33 # pipe
-SOCK 01;35 # socket
-DOOR 01;35 # door
-BLK 40;33;01 # block device driver
-CHR 40;33;01 # character device driver
-ORPHAN 40;31;01 # symlink to nonexistent file, or non-stat'able file ...
-MISSING 00 # ... and the files they point to
-SETUID 37;41 # file that is setuid (u+s)
-SETGID 30;43 # file that is setgid (g+s)
-CAPABILITY 00 # file with capability (very expensive to lookup)
-STICKY_OTHER_WRITABLE 30;42 # dir that is sticky and other-writable (+t,o+w)
-OTHER_WRITABLE 34;42 # dir that is other-writable (o+w) and not sticky
-STICKY 37;44 # dir with the sticky bit set (+t) and not other-writable
-# This is for files with execute permission:
+RESET 0
+DIR 01;34
+LINK 01;36
+MULTIHARDLINK 00
+FIFO 40;33
+SOCK 01;35
+DOOR 01;35
+BLK 40;33;01
+CHR 40;33;01
+ORPHAN 40;31;01
+MISSING 00
+SETUID 37;41
+SETGID 30;43
+CAPABILITY 00
+STICKY_OTHER_WRITABLE 30;42
+OTHER_WRITABLE 34;42
+STICKY 37;44
 EXEC 01;32
 # List any file extensions like '.gz' or '.tar' that you would like ls
 # to color below. Put the extension, a space, and the color init string.
-# (and any comments you want to add after a '#')
-# If you use DOS-style suffixes, you may want to uncomment the following:
-#.cmd 01;32 # executables (bright green)
-#.exe 01;32
-#.com 01;32
-#.btm 01;32
-#.bat 01;32
-# Or if you want to color scripts even if they do not have the
-# executable bit actually set.
-#.sh 01;32
-#.csh 01;32
- # archives or compressed (bright red)
 .tar 01;31
 .tgz 01;31
 .arc 01;31
@@ -126,7 +109,6 @@ EXEC 01;32
 .swm 01;31
 .dwm 01;31
 .esd 01;31
-# image formats
 .avif 01;35
 .jpg 01;35
 .jpeg 01;35
@@ -176,10 +158,8 @@ EXEC 01;32
 .yuv 01;35
 .cgm 01;35
 .emf 01;35
-# https://wiki.xiph.org/MIME_Types_and_File_Extensions
 .ogv 01;35
 .ogx 01;35
-# audio formats
 .aac 00;36
 .au 00;36
 .flac 00;36
@@ -192,14 +172,12 @@ EXEC 01;32
 .ogg 00;36
 .ra 00;36
 .wav 00;36
-# https://wiki.xiph.org/MIME_Types_and_File_Extensions
 .oga 00;36
 .opus 00;36
 .spx 00;36
 .xspf 00;36
-# backup files
-*~ 00;90
-*# 00;90
+~ 00;90
+# 00;90
 .bak 00;90
 .old 00;90
 .orig 00;90

From 1a4ca7e65dc6991f8584c6f03d493bace427ff2d Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 2 Dec 2023 15:18:20 +0100
Subject: [PATCH 105/429] fix clippy warnings

---
 src/uu/dircolors/src/dircolors.rs     | 143 +++++++++++++++++---------
 src/uucore/src/lib/features/colors.rs |   2 +-
 2 files changed, 98 insertions(+), 47 deletions(-)

diff --git a/src/uu/dircolors/src/dircolors.rs b/src/uu/dircolors/src/dircolors.rs
index 338bf83e514..28d74775db8 100644
--- a/src/uu/dircolors/src/dircolors.rs
+++ b/src/uu/dircolors/src/dircolors.rs
@@ -7,10 +7,10 @@
 
 use std::borrow::Borrow;
 use std::env;
+use std::fmt::Write;
 use std::fs::File;
 use std::io::{BufRead, BufReader};
 use std::path::Path;
-use std::fmt::Write;
 
 use clap::{crate_version, Arg, ArgAction, Command};
 use uucore::colors::{FILE_ATTRIBUTE_CODES, FILE_COLORS, FILE_TYPES, TERMS};
@@ -92,13 +92,7 @@ pub fn generate_type_output(fmt: &OutputFmt) -> String {
     }
 }
 
-enum ExtensionFormat {
-    StarDot, // Format as ".*ext"
-    Dot,     // Format as ".ext"
-    NoDot,   // Format as "ext"
-}
-
-fn generate_ls_colors(fmt: &OutputFmt, format: ExtensionFormat, sep: &str) -> String {
+fn generate_ls_colors(fmt: &OutputFmt, sep: &str) -> String {
     match fmt {
         OutputFmt::Display => {
             let mut display_parts = vec![];
@@ -113,25 +107,15 @@ fn generate_ls_colors(fmt: &OutputFmt, format: ExtensionFormat, sep: &str) -> St
             // existing logic for other formats
             let mut parts = vec![];
             for &(extension, code) in FILE_COLORS.iter() {
-                let formatted_extension = match format {
-                    ExtensionFormat::StarDot => format!("*{}", extension),
-                    ExtensionFormat::Dot => extension.to_string(),
-                    ExtensionFormat::NoDot => {
-                        if extension.starts_with('.') {
-                            extension[1..].to_string()
-                        } else {
-                            extension.to_string()
-                        }
-                    }
-                };
+                let formatted_extension = format!("*{}", extension);
                 parts.push(format!("{}={}", formatted_extension, code));
             }
-            let (prefix, suffix) = get_colors_format_strings(&fmt);
+            let (prefix, suffix) = get_colors_format_strings(fmt);
             let ls_colors = parts.join(sep);
             format!(
                 "{}{}:{}:{}",
                 prefix,
-                generate_type_output(&fmt),
+                generate_type_output(fmt),
                 ls_colors,
                 suffix
             )
@@ -208,10 +192,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     let result;
     if files.is_empty() {
-        println!(
-            "{}",
-            generate_ls_colors(&out_format, ExtensionFormat::StarDot, ":")
-        );
+        println!("{}", generate_ls_colors(&out_format, ":"));
 
         return Ok(());
     } else if files.len() > 1 {
@@ -373,9 +354,8 @@ where
     T: IntoIterator,
     T::Item: Borrow<str>,
 {
-    // 1790 > $(dircolors | wc -m)
     let mut result = String::with_capacity(1790);
-    let (prefix, suffix) = get_colors_format_strings(&fmt);
+    let (prefix, suffix) = get_colors_format_strings(fmt);
 
     result.push_str(&prefix);
 
@@ -482,34 +462,89 @@ fn escape(s: &str) -> String {
     result
 }
 
-
 pub fn generate_dircolors_config() -> String {
     let mut config = String::new();
 
     // Adding the complete header comments as in the original file
-    writeln!(config, "# Configuration file for dircolors, a utility to help you set the").unwrap();
-    writeln!(config, "# LS_COLORS environment variable used by GNU ls with the --color option.").unwrap();
-    writeln!(config, "# The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the").unwrap();
-    writeln!(config, "# slackware version of dircolors) are recognized but ignored.").unwrap();
-    writeln!(config, "# Global config options can be specified before TERM or COLORTERM entries").unwrap();
-    writeln!(config, "# Below are TERM or COLORTERM entries, which can be glob patterns, which").unwrap();
-    writeln!(config, "# restrict following config to systems with matching environment variables.").unwrap();
+    writeln!(
+        config,
+        "# Configuration file for dircolors, a utility to help you set the"
+    )
+    .unwrap();
+    writeln!(
+        config,
+        "# LS_COLORS environment variable used by GNU ls with the --color option."
+    )
+    .unwrap();
+    writeln!(
+        config,
+        "# The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the"
+    )
+    .unwrap();
+    writeln!(
+        config,
+        "# slackware version of dircolors) are recognized but ignored."
+    )
+    .unwrap();
+    writeln!(
+        config,
+        "# Global config options can be specified before TERM or COLORTERM entries"
+    )
+    .unwrap();
+    writeln!(
+        config,
+        "# Below are TERM or COLORTERM entries, which can be glob patterns, which"
+    )
+    .unwrap();
+    writeln!(
+        config,
+        "# restrict following config to systems with matching environment variables."
+    )
+    .unwrap();
     writeln!(config, "COLORTERM ?*").unwrap();
     for term in TERMS.iter() {
         writeln!(config, "TERM {}", term).unwrap();
     }
 
     // Adding file types and their color codes with header
-    writeln!(config, "# Below are the color init strings for the basic file types.").unwrap();
-    writeln!(config, "# One can use codes for 256 or more colors supported by modern terminals.").unwrap();
-    writeln!(config, "# The default color codes use the capabilities of an 8 color terminal").unwrap();
-    writeln!(config, "# with some additional attributes as per the following codes:").unwrap();
+    writeln!(
+        config,
+        "# Below are the color init strings for the basic file types."
+    )
+    .unwrap();
+    writeln!(
+        config,
+        "# One can use codes for 256 or more colors supported by modern terminals."
+    )
+    .unwrap();
+    writeln!(
+        config,
+        "# The default color codes use the capabilities of an 8 color terminal"
+    )
+    .unwrap();
+    writeln!(
+        config,
+        "# with some additional attributes as per the following codes:"
+    )
+    .unwrap();
     writeln!(config, "# Attribute codes:").unwrap();
-    writeln!(config, "# 00=none 01=bold 04=underscore 05=blink 07=reverse 08=concealed").unwrap();
+    writeln!(
+        config,
+        "# 00=none 01=bold 04=underscore 05=blink 07=reverse 08=concealed"
+    )
+    .unwrap();
     writeln!(config, "# Text color codes:").unwrap();
-    writeln!(config, "# 30=black 31=red 32=green 33=yellow 34=blue 35=magenta 36=cyan 37=white").unwrap();
+    writeln!(
+        config,
+        "# 30=black 31=red 32=green 33=yellow 34=blue 35=magenta 36=cyan 37=white"
+    )
+    .unwrap();
     writeln!(config, "# Background color codes:").unwrap();
-    writeln!(config, "# 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white").unwrap();
+    writeln!(
+        config,
+        "# 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white"
+    )
+    .unwrap();
     writeln!(config, "#NORMAL 00 # no color code at all").unwrap();
     writeln!(config, "#FILE 00 # regular file: use no color at all").unwrap();
 
@@ -517,14 +552,30 @@ pub fn generate_dircolors_config() -> String {
         writeln!(config, "{} {}", name, code).unwrap();
     }
 
-    writeln!(config, "# List any file extensions like '.gz' or '.tar' that you would like ls").unwrap();
-    writeln!(config, "# to color below. Put the extension, a space, and the color init string.").unwrap();
+    writeln!(
+        config,
+        "# List any file extensions like '.gz' or '.tar' that you would like ls"
+    )
+    .unwrap();
+    writeln!(
+        config,
+        "# to color below. Put the extension, a space, and the color init string."
+    )
+    .unwrap();
 
     for (ext, color) in FILE_COLORS.iter() {
         writeln!(config, "{} {}", ext, color).unwrap();
     }
-    writeln!(config, "# Subsequent TERM or COLORTERM entries, can be used to add / override").unwrap();
-    write!(config, "# config specific to those matching environment variables.").unwrap();
+    writeln!(
+        config,
+        "# Subsequent TERM or COLORTERM entries, can be used to add / override"
+    )
+    .unwrap();
+    write!(
+        config,
+        "# config specific to those matching environment variables."
+    )
+    .unwrap();
 
     config
 }
diff --git a/src/uucore/src/lib/features/colors.rs b/src/uucore/src/lib/features/colors.rs
index 96ca6d45672..81d117a50b3 100644
--- a/src/uucore/src/lib/features/colors.rs
+++ b/src/uucore/src/lib/features/colors.rs
@@ -2,7 +2,7 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
-
+// cSpell:disable
 use once_cell::sync::Lazy;
 
 /* The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the

From 4903b91973005f039f468d0f7740daf24b1ce282 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 6 Nov 2023 09:25:54 +0100
Subject: [PATCH 106/429] du: call unused _du_basics() in test_du_basics()

---
 tests/by-util/test_du.rs | 54 +++++++++++++++++++++++++++++++---------
 1 file changed, 42 insertions(+), 12 deletions(-)

diff --git a/tests/by-util/test_du.rs b/tests/by-util/test_du.rs
index c07de2851ee..8ed7ce8c0c1 100644
--- a/tests/by-util/test_du.rs
+++ b/tests/by-util/test_du.rs
@@ -22,24 +22,54 @@ const SUB_LINK: &str = "subdir/links/sublink.txt";
 
 #[test]
 fn test_du_basics() {
-    new_ucmd!().succeeds().no_stderr();
+    let ts = TestScenario::new(util_name!());
+
+    let result = ts.ucmd().succeeds();
+
+    #[cfg(any(target_os = "linux", target_os = "android"))]
+    {
+        let result_reference = unwrap_or_return!(expected_result(&ts, &[]));
+        if result_reference.succeeded() {
+            assert_eq!(result.stdout_str(), result_reference.stdout_str());
+            return;
+        }
+    }
+    _du_basics(result.stdout_str());
 }
+
 #[cfg(target_vendor = "apple")]
 fn _du_basics(s: &str) {
-    let answer = "32\t./subdir
-8\t./subdir/deeper
-24\t./subdir/links
-40\t.
-";
+    let answer = concat!(
+        "4\t./subdir/deeper/deeper_dir\n",
+        "8\t./subdir/deeper\n",
+        "12\t./subdir/links\n",
+        "20\t./subdir\n",
+        "24\t.\n"
+    );
+    assert_eq!(s, answer);
+}
+
+#[cfg(target_os = "windows")]
+fn _du_basics(s: &str) {
+    let answer = concat!(
+        "0\t.\\subdir\\deeper\\deeper_dir\n",
+        "0\t.\\subdir\\deeper\n",
+        "8\t.\\subdir\\links\n",
+        "8\t.\\subdir\n",
+        "8\t.\n"
+    );
     assert_eq!(s, answer);
 }
-#[cfg(not(target_vendor = "apple"))]
+
+#[cfg(all(not(target_vendor = "apple"), not(target_os = "windows"),))]
 fn _du_basics(s: &str) {
-    let answer = "28\t./subdir
-8\t./subdir/deeper
-16\t./subdir/links
-36\t.
-";
+    let answer = concat!(
+        "8\t./subdir/deeper/deeper_dir\n",
+        "16\t./subdir/deeper\n",
+        "16\t./subdir/links\n",
+        "36\t./subdir\n",
+        "44\t.\n"
+    );
     assert_eq!(s, answer);
 }
 

From 0ea1a7cd88c2a6d02ff4c1e69f5a9fa70c9bc135 Mon Sep 17 00:00:00 2001
From: Nathan Houghton <nathan@brainwerk.org>
Date: Sat, 21 Oct 2023 20:22:25 -0700
Subject: [PATCH 107/429] tests/cp, tests/test: Don't attempt to set sticky
 file bit on FreeBSD

On FreeBSD (and OpenBSD), only the superuser can set the file sticky
bit.
---
 tests/by-util/test_cp.rs   | 20 +++++++++++++++-----
 tests/by-util/test_test.rs |  2 +-
 2 files changed, 16 insertions(+), 6 deletions(-)

diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index 36bca68b0d0..37bec522238 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -13,7 +13,7 @@ use std::os::unix::fs;
 
 #[cfg(unix)]
 use std::os::unix::fs::MetadataExt;
-#[cfg(all(unix, not(target_os = "freebsd")))]
+#[cfg(unix)]
 use std::os::unix::fs::PermissionsExt;
 #[cfg(windows)]
 use std::os::windows::fs::symlink_file;
@@ -2381,13 +2381,18 @@ fn test_copy_symlink_force() {
 }
 
 #[test]
-#[cfg(all(unix, not(target_os = "freebsd")))]
+#[cfg(unix)]
 fn test_no_preserve_mode() {
     use std::os::unix::prelude::MetadataExt;
 
     use uucore::mode::get_umask;
 
-    const PERMS_ALL: u32 = 0o7777;
+    const PERMS_ALL: u32 = if cfg!(target_os = "freebsd") {
+        // Only the superuser can set the sticky bit on a file.
+        0o6777
+    } else {
+        0o7777
+    };
 
     let (at, mut ucmd) = at_and_ucmd!();
     at.touch("file");
@@ -2407,11 +2412,16 @@ fn test_no_preserve_mode() {
 }
 
 #[test]
-#[cfg(all(unix, not(target_os = "freebsd")))]
+#[cfg(unix)]
 fn test_preserve_mode() {
     use std::os::unix::prelude::MetadataExt;
 
-    const PERMS_ALL: u32 = 0o7777;
+    const PERMS_ALL: u32 = if cfg!(target_os = "freebsd") {
+        // Only the superuser can set the sticky bit on a file.
+        0o6777
+    } else {
+        0o7777
+    };
 
     let (at, mut ucmd) = at_and_ucmd!();
     at.touch("file");
diff --git a/tests/by-util/test_test.rs b/tests/by-util/test_test.rs
index 922d854c640..b91bc727d40 100644
--- a/tests/by-util/test_test.rs
+++ b/tests/by-util/test_test.rs
@@ -553,7 +553,7 @@ fn test_nonexistent_file_is_not_symlink() {
 }
 
 #[test]
-// FixME: freebsd fails with 'chmod: sticky_file: Inappropriate file type or format'
+// Only the superuser is allowed to set the sticky bit on files on FreeBSD.
 // Windows has no concept of sticky bit
 #[cfg(not(any(windows, target_os = "freebsd")))]
 fn test_file_is_sticky() {

From 117ab7737ac1aa61ef4759837ee7718ba016f860 Mon Sep 17 00:00:00 2001
From: Arpit Bhadauria <singharpit511@gmail.com>
Date: Sat, 2 Dec 2023 17:25:57 +0000
Subject: [PATCH 108/429] Optimize expr for numerical values

---
 src/uu/expr/src/expr.rs        |   2 +-
 src/uu/expr/src/syntax_tree.rs | 106 +++++++++++++++++++++------------
 2 files changed, 69 insertions(+), 39 deletions(-)

diff --git a/src/uu/expr/src/expr.rs b/src/uu/expr/src/expr.rs
index c271f0935fd..91d7a878820 100644
--- a/src/uu/expr/src/expr.rs
+++ b/src/uu/expr/src/expr.rs
@@ -108,7 +108,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         .map(|v| v.into_iter().map(|s| s.as_ref()).collect::<Vec<_>>())
         .unwrap_or_default();
 
-    let res = AstNode::parse(&token_strings)?.eval()?;
+    let res = AstNode::parse(&token_strings)?.eval()?.to_string();
     println!("{res}");
     if !is_truthy(&res) {
         return Err(1.into());
diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index f81f1da1ec4..705864f3a6c 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -6,6 +6,7 @@
 // spell-checker:ignore (ToDO) ints paren prec multibytes
 
 use num_bigint::BigInt;
+use num_traits::ToPrimitive;
 use onig::{Regex, RegexOptions, Syntax};
 
 use crate::{ExprError, ExprResult};
@@ -45,7 +46,7 @@ pub enum StringOp {
 }
 
 impl BinOp {
-    fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<String> {
+    fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<NumOrStr> {
         match self {
             Self::Relation(op) => op.eval(left, right),
             Self::Numeric(op) => op.eval(left, right),
@@ -55,10 +56,10 @@ impl BinOp {
 }
 
 impl RelationOp {
-    fn eval(&self, a: &AstNode, b: &AstNode) -> ExprResult<String> {
+    fn eval(&self, a: &AstNode, b: &AstNode) -> ExprResult<NumOrStr> {
         let a = a.eval()?;
         let b = b.eval()?;
-        let b = if let (Ok(a), Ok(b)) = (a.parse::<BigInt>(), b.parse::<BigInt>()) {
+        let b = if let (NumOrStr::Num(a), NumOrStr::Num(b)) = (&a, &b) {
             match self {
                 Self::Lt => a < b,
                 Self::Leq => a <= b,
@@ -79,24 +80,22 @@ impl RelationOp {
             }
         };
         if b {
-            Ok("1".into())
+            Ok(NumOrStr::Num(BigInt::from(1)))
         } else {
-            Ok("0".into())
+            Ok(NumOrStr::Num(BigInt::from(0)))
         }
     }
 }
 
 impl NumericOp {
-    fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<String> {
+    fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<NumOrStr> {
         let a: BigInt = left
             .eval()?
-            .parse()
-            .map_err(|_| ExprError::NonIntegerArgument)?;
+            .to_bigint()?;
         let b: BigInt = right
             .eval()?
-            .parse()
-            .map_err(|_| ExprError::NonIntegerArgument)?;
-        Ok(match self {
+            .to_bigint()?;
+        Ok(NumOrStr::Num(match self {
             Self::Add => a + b,
             Self::Sub => a - b,
             Self::Mul => a * b,
@@ -110,67 +109,66 @@ impl NumericOp {
                 };
                 a % b
             }
-        }
-        .to_string())
+        }))
     }
 }
 
 impl StringOp {
-    fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<String> {
+    fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<NumOrStr> {
         match self {
             Self::Or => {
                 let left = left.eval()?;
-                if is_truthy(&left) {
+                if is_truthy(&left.to_string()) {
                     return Ok(left);
                 }
                 let right = right.eval()?;
-                if is_truthy(&right) {
+                if is_truthy(&right.to_string()) {
                     return Ok(right);
                 }
-                Ok("0".into())
+                Ok(NumOrStr::Num(BigInt::from(0)))
             }
             Self::And => {
                 let left = left.eval()?;
-                if !is_truthy(&left) {
-                    return Ok("0".into());
+                if !is_truthy(&left.to_string()) {
+                    return Ok(NumOrStr::Num(BigInt::from(0)));
                 }
                 let right = right.eval()?;
-                if !is_truthy(&right) {
-                    return Ok("0".into());
+                if !is_truthy(&right.to_string()) {
+                    return Ok(NumOrStr::Num(BigInt::from(0)));
                 }
                 Ok(left)
             }
             Self::Match => {
                 let left = left.eval()?;
                 let right = right.eval()?;
-                let re_string = format!("^{}", &right);
+                let re_string = format!("^{}", right.to_string());
                 let re = Regex::with_options(
                     &re_string,
                     RegexOptions::REGEX_OPTION_NONE,
                     Syntax::grep(),
                 )
                 .map_err(|_| ExprError::InvalidRegexExpression)?;
-                Ok(if re.captures_len() > 0 {
-                    re.captures(&left)
+                Ok(NumOrStr::Str(if re.captures_len() > 0 {
+                    re.captures(&left.to_string())
                         .map(|captures| captures.at(1).unwrap())
                         .unwrap_or("")
                         .to_string()
                 } else {
-                    re.find(&left)
+                    re.find(&left.to_string())
                         .map_or("0".to_string(), |(start, end)| (end - start).to_string())
-                })
+                }))
             }
             Self::Index => {
                 let left = left.eval()?;
                 let right = right.eval()?;
-                for (current_idx, ch_h) in left.chars().enumerate() {
-                    for ch_n in right.chars() {
+                for (current_idx, ch_h) in left.to_string().chars().enumerate() {
+                    for ch_n in right.to_string().chars() {
                         if ch_n == ch_h {
-                            return Ok((current_idx + 1).to_string());
+                            return Ok(NumOrStr::Num(BigInt::from(current_idx + 1)));
                         }
                     }
                 }
-                Ok("0".to_string())
+                Ok(NumOrStr::Num(BigInt::from(0)))
             }
         }
     }
@@ -200,6 +198,38 @@ const PRECEDENCE: &[&[(&str, BinOp)]] = &[
     &[(":", BinOp::String(StringOp::Match))],
 ];
 
+#[derive(Debug, PartialEq, Eq, Ord, PartialOrd)]
+pub enum NumOrStr {
+    Num(BigInt),
+    Str(String),
+}
+
+impl NumOrStr {
+    pub fn to_usize(self: NumOrStr) -> Option<usize> {
+        match self.to_bigint() {
+            Ok(num) => {num.to_usize()}
+            Err(_) => {None},
+        }
+    }
+
+    pub fn to_string(self: &NumOrStr) -> String {
+        match self {
+            NumOrStr::Num(num) => {num.to_string()}
+            NumOrStr::Str(str)  => {str.to_string()},
+        }
+    }
+
+    pub fn to_bigint(self: NumOrStr) -> ExprResult<BigInt> {
+        match self {
+            NumOrStr::Num(num) => {Ok(num)}
+            NumOrStr::Str(str) => { match str.parse::<BigInt>() {
+                Ok(val) => {Ok(val)},
+                Err(_) => {Err(ExprError::NonIntegerArgument)}
+            }},
+        }
+    }
+}
+
 #[derive(Debug, PartialEq, Eq)]
 pub enum AstNode {
     Leaf {
@@ -225,9 +255,9 @@ impl AstNode {
         Parser::new(input).parse()
     }
 
-    pub fn eval(&self) -> ExprResult<String> {
+    pub fn eval(&self) -> ExprResult<NumOrStr> {
         match self {
-            Self::Leaf { value } => Ok(value.into()),
+            Self::Leaf { value } => Ok(NumOrStr::Str(value.to_string())),
             Self::BinOp {
                 op_type,
                 left,
@@ -238,7 +268,7 @@ impl AstNode {
                 pos,
                 length,
             } => {
-                let string = string.eval()?;
+                let string = string.eval()?.to_string();
 
                 // The GNU docs say:
                 //
@@ -247,16 +277,16 @@ impl AstNode {
                 //
                 // So we coerce errors into 0 to make that the only case we
                 // have to care about.
-                let pos: usize = pos.eval()?.parse().unwrap_or(0);
-                let length: usize = length.eval()?.parse().unwrap_or(0);
+                let pos: usize = pos.eval()?.to_usize().unwrap_or(0);
+                let length: usize = length.eval()?.to_usize().unwrap_or(0);
 
                 let (Some(pos), Some(_)) = (pos.checked_sub(1), length.checked_sub(1)) else {
-                    return Ok(String::new());
+                    return Ok(NumOrStr::Str(String::new()));
                 };
 
-                Ok(string.chars().skip(pos).take(length).collect())
+                Ok(NumOrStr::Str(string.chars().skip(pos).take(length).collect()))
             }
-            Self::Length { string } => Ok(string.eval()?.chars().count().to_string()),
+            Self::Length { string } => Ok(NumOrStr::Num(BigInt::from(string.eval()?.to_string().chars().count()))),
         }
     }
 }

From f4141100836ff382b1e217b96c278e1d47e01b74 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Sun, 3 Dec 2023 12:49:28 +0000
Subject: [PATCH 109/429] chore(deps): update vmactions/freebsd-vm action to
 v1.0.3

---
 .github/workflows/freebsd.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/freebsd.yml b/.github/workflows/freebsd.yml
index 02c0137e7b2..5261d103c59 100644
--- a/.github/workflows/freebsd.yml
+++ b/.github/workflows/freebsd.yml
@@ -39,7 +39,7 @@ jobs:
     - name: Run sccache-cache
       uses: mozilla-actions/sccache-action@v0.0.3
     - name: Prepare, build and test
-      uses: vmactions/freebsd-vm@v1.0.2
+      uses: vmactions/freebsd-vm@v1.0.3
       with:
         usesh: true
         sync: rsync
@@ -131,7 +131,7 @@ jobs:
     - name: Run sccache-cache
       uses: mozilla-actions/sccache-action@v0.0.3
     - name: Prepare, build and test
-      uses: vmactions/freebsd-vm@v1.0.2
+      uses: vmactions/freebsd-vm@v1.0.3
       with:
         usesh: true
         sync: rsync

From 49fb72ed21ddcb709426159b1336edded3778164 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sun, 3 Dec 2023 14:07:03 +0100
Subject: [PATCH 110/429] du: disable test on Android

---
 tests/by-util/test_du.rs | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/by-util/test_du.rs b/tests/by-util/test_du.rs
index c07de2851ee..10f32caf52e 100644
--- a/tests/by-util/test_du.rs
+++ b/tests/by-util/test_du.rs
@@ -441,6 +441,7 @@ fn test_du_inodes() {
     }
 }
 
+#[cfg(not(target_os = "android"))]
 #[test]
 fn test_du_inodes_with_count_links() {
     let ts = TestScenario::new(util_name!());

From a6d15d67caf13c86aa2973ea45a7ed7758c8f50b Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 1 Dec 2023 15:15:44 +0100
Subject: [PATCH 111/429] ls: cleanup "spell-checker:ignore" entries

---
 src/uu/ls/src/ls.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index cba9cdf5375..6e7fe405b16 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3,7 +3,7 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-// spell-checker:ignore (ToDO) cpio svgz webm somegroup nlink rmvb xspf tabsize dired subdired dtype
+// spell-checker:ignore (ToDO) somegroup nlink tabsize dired subdired dtype
 
 use clap::{
     builder::{NonEmptyStringValueParser, ValueParser},

From c77d389f5b93399bdeb6007f24d745c94e64f454 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 1 Dec 2023 16:19:13 +0100
Subject: [PATCH 112/429] ls: improve some var names related to block sizes

---
 src/uu/ls/src/ls.rs | 34 ++++++++++++++++++----------------
 1 file changed, 18 insertions(+), 16 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 6e7fe405b16..3745cfc9df3 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -741,14 +741,14 @@ impl Config {
 
         let mut needs_color = extract_color(options);
 
-        let cmd_line_bs = options.get_one::<String>(options::size::BLOCK_SIZE);
-        let opt_si = cmd_line_bs.is_some()
+        let opt_block_size = options.get_one::<String>(options::size::BLOCK_SIZE);
+        let opt_si = opt_block_size.is_some()
             && options
                 .get_one::<String>(options::size::BLOCK_SIZE)
                 .unwrap()
                 .eq("si")
             || options.get_flag(options::size::SI);
-        let opt_hr = (cmd_line_bs.is_some()
+        let opt_hr = (opt_block_size.is_some()
             && options
                 .get_one::<String>(options::size::BLOCK_SIZE)
                 .unwrap()
@@ -756,9 +756,9 @@ impl Config {
             || options.get_flag(options::size::HUMAN_READABLE);
         let opt_kb = options.get_flag(options::size::KIBIBYTES);
 
-        let bs_env_var = std::env::var_os("BLOCK_SIZE");
-        let ls_bs_env_var = std::env::var_os("LS_BLOCK_SIZE");
-        let pc_env_var = std::env::var_os("POSIXLY_CORRECT");
+        let env_var_block_size = std::env::var_os("BLOCK_SIZE");
+        let env_var_ls_block_size = std::env::var_os("LS_BLOCK_SIZE");
+        let env_var_posixly_correct = std::env::var_os("POSIXLY_CORRECT");
 
         let size_format = if opt_si {
             SizeFormat::Decimal
@@ -768,13 +768,13 @@ impl Config {
             SizeFormat::Bytes
         };
 
-        let raw_bs = if let Some(cmd_line_bs) = cmd_line_bs {
-            OsString::from(cmd_line_bs)
+        let raw_block_size = if let Some(opt_block_size) = opt_block_size {
+            OsString::from(opt_block_size)
         } else if !opt_kb {
-            if let Some(ls_bs_env_var) = ls_bs_env_var {
-                ls_bs_env_var
-            } else if let Some(bs_env_var) = bs_env_var {
-                bs_env_var
+            if let Some(env_var_ls_block_size) = env_var_ls_block_size {
+                env_var_ls_block_size
+            } else if let Some(env_var_block_size) = env_var_block_size {
+                env_var_block_size
             } else {
                 OsString::from("")
             }
@@ -782,15 +782,17 @@ impl Config {
             OsString::from("")
         };
 
-        let block_size: Option<u64> = if !opt_si && !opt_hr && !raw_bs.is_empty() {
-            match parse_size_u64(&raw_bs.to_string_lossy()) {
+        let block_size: Option<u64> = if !opt_si && !opt_hr && !raw_block_size.is_empty() {
+            match parse_size_u64(&raw_block_size.to_string_lossy()) {
                 Ok(size) => Some(size),
                 Err(_) => {
-                    show!(LsError::BlockSizeParseError(cmd_line_bs.unwrap().clone()));
+                    show!(LsError::BlockSizeParseError(
+                        opt_block_size.unwrap().clone()
+                    ));
                     None
                 }
             }
-        } else if let Some(pc) = pc_env_var {
+        } else if let Some(pc) = env_var_posixly_correct {
             if pc.as_os_str() == OsStr::new("true") || pc == OsStr::new("1") {
                 Some(POSIXLY_CORRECT_BLOCK_SIZE)
             } else {

From 51fc2d7564b29de22936e8ca4a73883aeca77662 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 1 Dec 2023 16:27:05 +0100
Subject: [PATCH 113/429] ls: ignore value of POSIXLY_CORRECT

---
 src/uu/ls/src/ls.rs      | 10 +++-------
 tests/by-util/test_ls.rs | 27 +++++++++++++++++++++++++++
 2 files changed, 30 insertions(+), 7 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 3745cfc9df3..f645e31d3c2 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -20,7 +20,7 @@ use std::os::windows::fs::MetadataExt;
 use std::{
     cmp::Reverse,
     error::Error,
-    ffi::{OsStr, OsString},
+    ffi::OsString,
     fmt::{Display, Write as FmtWrite},
     fs::{self, DirEntry, FileType, Metadata, ReadDir},
     io::{stdout, BufWriter, ErrorKind, Stdout, Write},
@@ -792,12 +792,8 @@ impl Config {
                     None
                 }
             }
-        } else if let Some(pc) = env_var_posixly_correct {
-            if pc.as_os_str() == OsStr::new("true") || pc == OsStr::new("1") {
-                Some(POSIXLY_CORRECT_BLOCK_SIZE)
-            } else {
-                None
-            }
+        } else if env_var_posixly_correct.is_some() {
+            Some(POSIXLY_CORRECT_BLOCK_SIZE)
         } else {
             None
         };
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 19a3f5578fa..fcd57170d48 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -3828,3 +3828,30 @@ fn test_ls_cf_output_should_be_delimited_by_tab() {
         .succeeds()
         .stdout_is("a2345/\tb/\n");
 }
+
+#[cfg(all(unix, feature = "dd"))]
+#[test]
+fn test_posixly_correct() {
+    let scene = TestScenario::new(util_name!());
+
+    scene
+        .ccmd("dd")
+        .arg("if=/dev/zero")
+        .arg("of=file")
+        .arg("bs=1024")
+        .arg("count=1")
+        .succeeds();
+
+    scene
+        .ucmd()
+        .arg("-s")
+        .succeeds()
+        .stdout_contains_line("total 4");
+
+    scene
+        .ucmd()
+        .arg("-s")
+        .env("POSIXLY_CORRECT", "some_value")
+        .succeeds()
+        .stdout_contains_line("total 8");
+}

From d8a64a90ece80fc029860f66d7bf8858c79f9e91 Mon Sep 17 00:00:00 2001
From: Arpit Bhadauria <singharpit511@gmail.com>
Date: Sun, 3 Dec 2023 15:09:12 +0000
Subject: [PATCH 114/429] Formatting fixes in expr

---
 src/uu/expr/src/syntax_tree.rs | 34 +++++++++++++++++-----------------
 1 file changed, 17 insertions(+), 17 deletions(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 705864f3a6c..1c74b97103b 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -89,12 +89,8 @@ impl RelationOp {
 
 impl NumericOp {
     fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<NumOrStr> {
-        let a: BigInt = left
-            .eval()?
-            .to_bigint()?;
-        let b: BigInt = right
-            .eval()?
-            .to_bigint()?;
+        let a: BigInt = left.eval()?.to_bigint()?;
+        let b: BigInt = right.eval()?.to_bigint()?;
         Ok(NumOrStr::Num(match self {
             Self::Add => a + b,
             Self::Sub => a - b,
@@ -207,25 +203,25 @@ pub enum NumOrStr {
 impl NumOrStr {
     pub fn to_usize(self: NumOrStr) -> Option<usize> {
         match self.to_bigint() {
-            Ok(num) => {num.to_usize()}
-            Err(_) => {None},
+            Ok(num) => num.to_usize(),
+            Err(_) => None,
         }
     }
 
     pub fn to_string(self: &NumOrStr) -> String {
         match self {
-            NumOrStr::Num(num) => {num.to_string()}
-            NumOrStr::Str(str)  => {str.to_string()},
+            NumOrStr::Num(num) => num.to_string(),
+            NumOrStr::Str(str) => str.to_string(),
         }
     }
 
     pub fn to_bigint(self: NumOrStr) -> ExprResult<BigInt> {
         match self {
-            NumOrStr::Num(num) => {Ok(num)}
-            NumOrStr::Str(str) => { match str.parse::<BigInt>() {
-                Ok(val) => {Ok(val)},
-                Err(_) => {Err(ExprError::NonIntegerArgument)}
-            }},
+            NumOrStr::Num(num) => Ok(num),
+            NumOrStr::Str(str) => match str.parse::<BigInt>() {
+                Ok(val) => Ok(val),
+                Err(_) => Err(ExprError::NonIntegerArgument),
+            },
         }
     }
 }
@@ -284,9 +280,13 @@ impl AstNode {
                     return Ok(NumOrStr::Str(String::new()));
                 };
 
-                Ok(NumOrStr::Str(string.chars().skip(pos).take(length).collect()))
+                Ok(NumOrStr::Str(
+                    string.chars().skip(pos).take(length).collect(),
+                ))
             }
-            Self::Length { string } => Ok(NumOrStr::Num(BigInt::from(string.eval()?.to_string().chars().count()))),
+            Self::Length { string } => Ok(NumOrStr::Num(BigInt::from(
+                string.eval()?.to_string().chars().count(),
+            ))),
         }
     }
 }

From f8573d555133f22cfdfbfa198a265138277d3f36 Mon Sep 17 00:00:00 2001
From: Arpit Bhadauria <singharpit511@gmail.com>
Date: Sun, 3 Dec 2023 20:03:50 +0000
Subject: [PATCH 115/429] code and styling fixes in expr

---
 src/uu/expr/src/expr.rs        |   4 +-
 src/uu/expr/src/syntax_tree.rs | 126 +++++++++++++++++++++------------
 2 files changed, 81 insertions(+), 49 deletions(-)

diff --git a/src/uu/expr/src/expr.rs b/src/uu/expr/src/expr.rs
index 91d7a878820..b46034f845d 100644
--- a/src/uu/expr/src/expr.rs
+++ b/src/uu/expr/src/expr.rs
@@ -13,7 +13,7 @@ use uucore::{
     format_usage, help_about, help_section, help_usage,
 };
 
-use crate::syntax_tree::is_truthy;
+use crate::syntax_tree::{is_truthy, NumOrStr};
 
 mod syntax_tree;
 
@@ -110,7 +110,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     let res = AstNode::parse(&token_strings)?.eval()?.to_string();
     println!("{res}");
-    if !is_truthy(&res) {
+    if !is_truthy(&NumOrStr::from(res)) {
         return Err(1.into());
     }
     Ok(())
diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 1c74b97103b..79ba8d9ae10 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -57,8 +57,8 @@ impl BinOp {
 
 impl RelationOp {
     fn eval(&self, a: &AstNode, b: &AstNode) -> ExprResult<NumOrStr> {
-        let a = a.eval()?;
-        let b = b.eval()?;
+        let a = a.eval()?.coerce_num();
+        let b = b.eval()?.coerce_num();
         let b = if let (NumOrStr::Num(a), NumOrStr::Num(b)) = (&a, &b) {
             match self {
                 Self::Lt => a < b,
@@ -80,17 +80,17 @@ impl RelationOp {
             }
         };
         if b {
-            Ok(NumOrStr::Num(BigInt::from(1)))
+            Ok(NumOrStr::from(1))
         } else {
-            Ok(NumOrStr::Num(BigInt::from(0)))
+            Ok(NumOrStr::from(0))
         }
     }
 }
 
 impl NumericOp {
     fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<NumOrStr> {
-        let a: BigInt = left.eval()?.to_bigint()?;
-        let b: BigInt = right.eval()?.to_bigint()?;
+        let a = left.eval()?.to_bigint()?;
+        let b = right.eval()?.to_bigint()?;
         Ok(NumOrStr::Num(match self {
             Self::Add => a + b,
             Self::Sub => a - b,
@@ -114,23 +114,23 @@ impl StringOp {
         match self {
             Self::Or => {
                 let left = left.eval()?;
-                if is_truthy(&left.to_string()) {
+                if is_truthy(&left) {
                     return Ok(left);
                 }
                 let right = right.eval()?;
-                if is_truthy(&right.to_string()) {
+                if is_truthy(&right) {
                     return Ok(right);
                 }
-                Ok(NumOrStr::Num(BigInt::from(0)))
+                Ok(NumOrStr::from(0))
             }
             Self::And => {
                 let left = left.eval()?;
-                if !is_truthy(&left.to_string()) {
-                    return Ok(NumOrStr::Num(BigInt::from(0)));
+                if !is_truthy(&left) {
+                    return Ok(NumOrStr::from(0));
                 }
                 let right = right.eval()?;
-                if !is_truthy(&right.to_string()) {
-                    return Ok(NumOrStr::Num(BigInt::from(0)));
+                if !is_truthy(&right) {
+                    return Ok(NumOrStr::from(0));
                 }
                 Ok(left)
             }
@@ -144,7 +144,7 @@ impl StringOp {
                     Syntax::grep(),
                 )
                 .map_err(|_| ExprError::InvalidRegexExpression)?;
-                Ok(NumOrStr::Str(if re.captures_len() > 0 {
+                Ok(NumOrStr::from(if re.captures_len() > 0 {
                     re.captures(&left.to_string())
                         .map(|captures| captures.at(1).unwrap())
                         .unwrap_or("")
@@ -155,16 +155,16 @@ impl StringOp {
                 }))
             }
             Self::Index => {
-                let left = left.eval()?;
-                let right = right.eval()?;
-                for (current_idx, ch_h) in left.to_string().chars().enumerate() {
+                let left = left.eval()?.to_string();
+                let right = right.eval()?.to_string();
+                for (current_idx, ch_h) in left.chars().enumerate() {
                     for ch_n in right.to_string().chars() {
                         if ch_n == ch_h {
-                            return Ok(NumOrStr::Num(BigInt::from(current_idx + 1)));
+                            return Ok(NumOrStr::from(current_idx + 1));
                         }
                     }
                 }
-                Ok(NumOrStr::Num(BigInt::from(0)))
+                Ok(NumOrStr::from(0))
             }
         }
     }
@@ -200,27 +200,54 @@ pub enum NumOrStr {
     Str(String),
 }
 
+impl From<usize> for NumOrStr {
+    fn from(num: usize) -> NumOrStr {
+        NumOrStr::Num(BigInt::from(num))
+    }
+}
+
+impl From<BigInt> for NumOrStr {
+    fn from(num: BigInt) -> NumOrStr {
+        NumOrStr::Num(num)
+    }
+}
+
+impl From<String> for NumOrStr {
+    fn from(str: String) -> NumOrStr {
+        NumOrStr::Str(str)
+    }
+}
+
 impl NumOrStr {
-    pub fn to_usize(self: NumOrStr) -> Option<usize> {
+    pub fn to_usize(self: Self) -> Option<usize> {
         match self.to_bigint() {
             Ok(num) => num.to_usize(),
             Err(_) => None,
         }
     }
 
-    pub fn to_string(self: &NumOrStr) -> String {
+    pub fn to_string(self: Self) -> String {
         match self {
-            NumOrStr::Num(num) => num.to_string(),
-            NumOrStr::Str(str) => str.to_string(),
+            Self::Num(num) => num.to_string(),
+            Self::Str(str) => str.to_string(),
         }
     }
 
-    pub fn to_bigint(self: NumOrStr) -> ExprResult<BigInt> {
+    pub fn to_bigint(self: Self) -> ExprResult<BigInt> {
         match self {
-            NumOrStr::Num(num) => Ok(num),
-            NumOrStr::Str(str) => match str.parse::<BigInt>() {
-                Ok(val) => Ok(val),
-                Err(_) => Err(ExprError::NonIntegerArgument),
+            Self::Num(num) => Ok(num),
+            Self::Str(str) => str
+                .parse::<BigInt>()
+                .map_err(|_| ExprError::NonIntegerArgument),
+        }
+    }
+
+    pub fn coerce_num(self: Self) -> NumOrStr {
+        match self {
+            Self::Num(num) => Self::from(num),
+            Self::Str(str) => match str.parse::<BigInt>() {
+                Ok(num) => Self::from(num),
+                Err(_) => Self::from(str),
             },
         }
     }
@@ -253,7 +280,7 @@ impl AstNode {
 
     pub fn eval(&self) -> ExprResult<NumOrStr> {
         match self {
-            Self::Leaf { value } => Ok(NumOrStr::Str(value.to_string())),
+            Self::Leaf { value } => Ok(NumOrStr::from(value.to_string())),
             Self::BinOp {
                 op_type,
                 left,
@@ -277,16 +304,16 @@ impl AstNode {
                 let length: usize = length.eval()?.to_usize().unwrap_or(0);
 
                 let (Some(pos), Some(_)) = (pos.checked_sub(1), length.checked_sub(1)) else {
-                    return Ok(NumOrStr::Str(String::new()));
+                    return Ok(NumOrStr::from(String::new()));
                 };
 
-                Ok(NumOrStr::Str(
-                    string.chars().skip(pos).take(length).collect(),
+                Ok(NumOrStr::from(
+                    string.chars().skip(pos).take(length).collect::<String>(),
                 ))
             }
-            Self::Length { string } => Ok(NumOrStr::Num(BigInt::from(
-                string.eval()?.to_string().chars().count(),
-            ))),
+            Self::Length { string } => {
+                Ok(NumOrStr::from(string.eval()?.to_string().chars().count()))
+            }
         }
     }
 }
@@ -429,21 +456,26 @@ impl<'a> Parser<'a> {
 /// Determine whether `expr` should evaluate the string as "truthy"
 ///
 /// Truthy strings are either empty or match the regex "-?0+".
-pub fn is_truthy(s: &str) -> bool {
-    // Edge case: `-` followed by nothing is truthy
-    if s == "-" {
-        return true;
-    }
+pub fn is_truthy(s: &NumOrStr) -> bool {
+    match s {
+        NumOrStr::Num(num) => num == &BigInt::from(0),
+        NumOrStr::Str(str) => {
+            // Edge case: `-` followed by nothing is truthy
+            if str == "-" {
+                return true;
+            }
 
-    let mut bytes = s.bytes();
+            let mut bytes = str.bytes();
 
-    // Empty string is falsy
-    let Some(first) = bytes.next() else {
-        return false;
-    };
+            // Empty string is falsy
+            let Some(first) = bytes.next() else {
+                return false;
+            };
 
-    let is_zero = (first == b'-' || first == b'0') && bytes.all(|b| b == b'0');
-    !is_zero
+            let is_zero = (first == b'-' || first == b'0') && bytes.all(|b| b == b'0');
+            !is_zero
+        }
+    }
 }
 
 #[cfg(test)]

From 5672e3d9bdec3acc1d1ab22b0217b5fac17ab10b Mon Sep 17 00:00:00 2001
From: Arpit Bhadauria <singharpit511@gmail.com>
Date: Sun, 3 Dec 2023 22:07:56 +0000
Subject: [PATCH 116/429] Fix errors

---
 src/uu/expr/src/syntax_tree.rs | 19 ++++++++-----------
 1 file changed, 8 insertions(+), 11 deletions(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 79ba8d9ae10..a4cb99a8365 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -5,7 +5,7 @@
 
 // spell-checker:ignore (ToDO) ints paren prec multibytes
 
-use num_bigint::BigInt;
+use num_bigint::{BigInt, ParseBigIntError};
 use num_traits::ToPrimitive;
 use onig::{Regex, RegexOptions, Syntax};
 
@@ -57,9 +57,9 @@ impl BinOp {
 
 impl RelationOp {
     fn eval(&self, a: &AstNode, b: &AstNode) -> ExprResult<NumOrStr> {
-        let a = a.eval()?.coerce_num();
-        let b = b.eval()?.coerce_num();
-        let b = if let (NumOrStr::Num(a), NumOrStr::Num(b)) = (&a, &b) {
+        let a = a.eval()?;
+        let b = b.eval()?;
+        let b = if let (Ok(a), Ok(b)) = (&a.coerce_bigint(), &b.coerce_bigint()) {
             match self {
                 Self::Lt => a < b,
                 Self::Leq => a <= b,
@@ -242,13 +242,10 @@ impl NumOrStr {
         }
     }
 
-    pub fn coerce_num(self: Self) -> NumOrStr {
+    pub fn coerce_bigint(self: &Self) -> Result<BigInt, ParseBigIntError> {
         match self {
-            Self::Num(num) => Self::from(num),
-            Self::Str(str) => match str.parse::<BigInt>() {
-                Ok(num) => Self::from(num),
-                Err(_) => Self::from(str),
-            },
+            Self::Num(num) => Ok(num.clone()),
+            Self::Str(str) => str.parse::<BigInt>(),
         }
     }
 }
@@ -458,7 +455,7 @@ impl<'a> Parser<'a> {
 /// Truthy strings are either empty or match the regex "-?0+".
 pub fn is_truthy(s: &NumOrStr) -> bool {
     match s {
-        NumOrStr::Num(num) => num == &BigInt::from(0),
+        NumOrStr::Num(num) => num != &BigInt::from(0),
         NumOrStr::Str(str) => {
             // Edge case: `-` followed by nothing is truthy
             if str == "-" {

From 21c041fa79b64d9f55b8672c4a74e22dd941fd96 Mon Sep 17 00:00:00 2001
From: Arpit Bhadauria <singharpit511@gmail.com>
Date: Sun, 3 Dec 2023 22:27:13 +0000
Subject: [PATCH 117/429] Fix lint issues in expr

---
 src/uu/expr/src/syntax_tree.rs | 20 ++++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index a4cb99a8365..4f447e60f54 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -201,39 +201,39 @@ pub enum NumOrStr {
 }
 
 impl From<usize> for NumOrStr {
-    fn from(num: usize) -> NumOrStr {
-        NumOrStr::Num(BigInt::from(num))
+    fn from(num: usize) -> Self {
+        Self::Num(BigInt::from(num))
     }
 }
 
 impl From<BigInt> for NumOrStr {
-    fn from(num: BigInt) -> NumOrStr {
-        NumOrStr::Num(num)
+    fn from(num: BigInt) -> Self {
+        Self::Num(num)
     }
 }
 
 impl From<String> for NumOrStr {
-    fn from(str: String) -> NumOrStr {
-        NumOrStr::Str(str)
+    fn from(str: String) -> Self {
+        Self::Str(str)
     }
 }
 
 impl NumOrStr {
-    pub fn to_usize(self: Self) -> Option<usize> {
+    pub fn to_usize(self) -> Option<usize> {
         match self.to_bigint() {
             Ok(num) => num.to_usize(),
             Err(_) => None,
         }
     }
 
-    pub fn to_string(self: Self) -> String {
+    pub fn to_string(self) -> String {
         match self {
             Self::Num(num) => num.to_string(),
             Self::Str(str) => str.to_string(),
         }
     }
 
-    pub fn to_bigint(self: Self) -> ExprResult<BigInt> {
+    pub fn to_bigint(self) -> ExprResult<BigInt> {
         match self {
             Self::Num(num) => Ok(num),
             Self::Str(str) => str
@@ -242,7 +242,7 @@ impl NumOrStr {
         }
     }
 
-    pub fn coerce_bigint(self: &Self) -> Result<BigInt, ParseBigIntError> {
+    pub fn coerce_bigint(&self) -> Result<BigInt, ParseBigIntError> {
         match self {
             Self::Num(num) => Ok(num.clone()),
             Self::Str(str) => str.parse::<BigInt>(),

From 9ecd6a296e06b6f20a5bc29f876a546cdafd020d Mon Sep 17 00:00:00 2001
From: Arpit Bhadauria <singharpit511@gmail.com>
Date: Sun, 3 Dec 2023 23:32:51 +0000
Subject: [PATCH 118/429] Refactoring for lint issues

---
 src/uu/expr/src/expr.rs        |  2 +-
 src/uu/expr/src/syntax_tree.rs | 53 ++++++++++++++++++++--------------
 2 files changed, 32 insertions(+), 23 deletions(-)

diff --git a/src/uu/expr/src/expr.rs b/src/uu/expr/src/expr.rs
index b46034f845d..1a9bb07de4a 100644
--- a/src/uu/expr/src/expr.rs
+++ b/src/uu/expr/src/expr.rs
@@ -108,7 +108,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         .map(|v| v.into_iter().map(|s| s.as_ref()).collect::<Vec<_>>())
         .unwrap_or_default();
 
-    let res = AstNode::parse(&token_strings)?.eval()?.to_string();
+    let res: String = AstNode::parse(&token_strings)?.eval()?.into();
     println!("{res}");
     if !is_truthy(&NumOrStr::from(res)) {
         return Err(1.into());
diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 4f447e60f54..7677b5e7e54 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -59,7 +59,7 @@ impl RelationOp {
     fn eval(&self, a: &AstNode, b: &AstNode) -> ExprResult<NumOrStr> {
         let a = a.eval()?;
         let b = b.eval()?;
-        let b = if let (Ok(a), Ok(b)) = (&a.coerce_bigint(), &b.coerce_bigint()) {
+        let b = if let (Ok(a), Ok(b)) = (&a.to_bigint(), &b.to_bigint()) {
             match self {
                 Self::Lt => a < b,
                 Self::Leq => a <= b,
@@ -89,8 +89,8 @@ impl RelationOp {
 
 impl NumericOp {
     fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<NumOrStr> {
-        let a = left.eval()?.to_bigint()?;
-        let b = right.eval()?.to_bigint()?;
+        let a = <NumOrStr as Into<ExprResult<BigInt>>>::into(left.eval()?)?;
+        let b = <NumOrStr as Into<ExprResult<BigInt>>>::into(right.eval()?)?;
         Ok(NumOrStr::Num(match self {
             Self::Add => a + b,
             Self::Sub => a - b,
@@ -135,9 +135,9 @@ impl StringOp {
                 Ok(left)
             }
             Self::Match => {
-                let left = left.eval()?;
-                let right = right.eval()?;
-                let re_string = format!("^{}", right.to_string());
+                let left: String = left.eval()?.into();
+                let right: String = right.eval()?.into();
+                let re_string = format!("^{}", right);
                 let re = Regex::with_options(
                     &re_string,
                     RegexOptions::REGEX_OPTION_NONE,
@@ -145,18 +145,18 @@ impl StringOp {
                 )
                 .map_err(|_| ExprError::InvalidRegexExpression)?;
                 Ok(NumOrStr::from(if re.captures_len() > 0 {
-                    re.captures(&left.to_string())
+                    re.captures(&left)
                         .map(|captures| captures.at(1).unwrap())
                         .unwrap_or("")
                         .to_string()
                 } else {
-                    re.find(&left.to_string())
+                    re.find(&left)
                         .map_or("0".to_string(), |(start, end)| (end - start).to_string())
                 }))
             }
             Self::Index => {
-                let left = left.eval()?.to_string();
-                let right = right.eval()?.to_string();
+                let left: String = left.eval()?.into();
+                let right: String = right.eval()?.into();
                 for (current_idx, ch_h) in left.chars().enumerate() {
                     for ch_n in right.to_string().chars() {
                         if ch_n == ch_h {
@@ -218,22 +218,26 @@ impl From<String> for NumOrStr {
     }
 }
 
-impl NumOrStr {
-    pub fn to_usize(self) -> Option<usize> {
-        match self.to_bigint() {
+impl Into<Option<usize>> for NumOrStr {
+    fn into(self) -> Option<usize> {
+        match self.into() {
             Ok(num) => num.to_usize(),
             Err(_) => None,
         }
     }
+}
 
-    pub fn to_string(self) -> String {
+impl Into<String> for NumOrStr {
+    fn into(self) -> String {
         match self {
             Self::Num(num) => num.to_string(),
             Self::Str(str) => str.to_string(),
         }
     }
+}
 
-    pub fn to_bigint(self) -> ExprResult<BigInt> {
+impl Into<ExprResult<BigInt>> for NumOrStr {
+    fn into(self) -> ExprResult<BigInt> {
         match self {
             Self::Num(num) => Ok(num),
             Self::Str(str) => str
@@ -241,8 +245,10 @@ impl NumOrStr {
                 .map_err(|_| ExprError::NonIntegerArgument),
         }
     }
+}
 
-    pub fn coerce_bigint(&self) -> Result<BigInt, ParseBigIntError> {
+impl NumOrStr {
+    pub fn to_bigint(&self) -> Result<BigInt, ParseBigIntError> {
         match self {
             Self::Num(num) => Ok(num.clone()),
             Self::Str(str) => str.parse::<BigInt>(),
@@ -288,7 +294,7 @@ impl AstNode {
                 pos,
                 length,
             } => {
-                let string = string.eval()?.to_string();
+                let string: String = string.eval()?.into();
 
                 // The GNU docs say:
                 //
@@ -297,8 +303,9 @@ impl AstNode {
                 //
                 // So we coerce errors into 0 to make that the only case we
                 // have to care about.
-                let pos: usize = pos.eval()?.to_usize().unwrap_or(0);
-                let length: usize = length.eval()?.to_usize().unwrap_or(0);
+                let pos: usize = <NumOrStr as Into<Option<usize>>>::into(pos.eval()?).unwrap_or(0);
+                let length: usize =
+                    <NumOrStr as Into<Option<usize>>>::into(length.eval()?).unwrap_or(0);
 
                 let (Some(pos), Some(_)) = (pos.checked_sub(1), length.checked_sub(1)) else {
                     return Ok(NumOrStr::from(String::new()));
@@ -308,9 +315,11 @@ impl AstNode {
                     string.chars().skip(pos).take(length).collect::<String>(),
                 ))
             }
-            Self::Length { string } => {
-                Ok(NumOrStr::from(string.eval()?.to_string().chars().count()))
-            }
+            Self::Length { string } => Ok(NumOrStr::from(
+                <NumOrStr as Into<String>>::into(string.eval()?)
+                    .chars()
+                    .count(),
+            )),
         }
     }
 }

From cf853df2dcf4309049ad3a0ff3ab531aabcb86ec Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 4 Dec 2023 14:48:25 +0100
Subject: [PATCH 119/429] ls: remove "#[allow(unused_variables)]"

---
 src/uu/ls/src/ls.rs | 1 -
 1 file changed, 1 deletion(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index cba9cdf5375..626e17ca14d 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -2946,7 +2946,6 @@ fn classify_file(path: &PathData, out: &mut BufWriter<Stdout>) -> Option<char> {
 ///
 /// Note that non-unicode sequences in symlink targets are dealt with using
 /// [`std::path::Path::to_string_lossy`].
-#[allow(unused_variables)]
 #[allow(clippy::cognitive_complexity)]
 fn display_file_name(
     path: &PathData,

From d4b22a192d9c4af1ed2b92c0b0197a790536e981 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Mon, 4 Dec 2023 19:09:30 +0000
Subject: [PATCH 120/429] chore(deps): update vmactions/freebsd-vm action to
 v1.0.4

---
 .github/workflows/freebsd.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/freebsd.yml b/.github/workflows/freebsd.yml
index 5261d103c59..27537cf6dab 100644
--- a/.github/workflows/freebsd.yml
+++ b/.github/workflows/freebsd.yml
@@ -39,7 +39,7 @@ jobs:
     - name: Run sccache-cache
       uses: mozilla-actions/sccache-action@v0.0.3
     - name: Prepare, build and test
-      uses: vmactions/freebsd-vm@v1.0.3
+      uses: vmactions/freebsd-vm@v1.0.4
       with:
         usesh: true
         sync: rsync
@@ -131,7 +131,7 @@ jobs:
     - name: Run sccache-cache
       uses: mozilla-actions/sccache-action@v0.0.3
     - name: Prepare, build and test
-      uses: vmactions/freebsd-vm@v1.0.3
+      uses: vmactions/freebsd-vm@v1.0.4
       with:
         usesh: true
         sync: rsync

From 9ef43191ff28af359989848dc65548aa253e4337 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 4 Dec 2023 21:20:47 +0100
Subject: [PATCH 121/429] Document that  \0NNN and \xHH need more work

---
 fuzz/fuzz_targets/fuzz_echo.rs | 1 +
 1 file changed, 1 insertion(+)

diff --git a/fuzz/fuzz_targets/fuzz_echo.rs b/fuzz/fuzz_targets/fuzz_echo.rs
index 826fd6da3eb..fda7fd7276f 100644
--- a/fuzz/fuzz_targets/fuzz_echo.rs
+++ b/fuzz/fuzz_targets/fuzz_echo.rs
@@ -51,6 +51,7 @@ fn generate_escape_sequence(rng: &mut impl Rng) -> String {
     let escape_sequences = [
         "\\\\", "\\a", "\\b", "\\c", "\\e", "\\f", "\\n", "\\r", "\\t", "\\v", "\\0NNN", "\\xHH",
     ];
+    // \0NNN and \xHH need more work
     escape_sequences.choose(rng).unwrap().to_string()
 }
 

From f5776bc511ec0fbe5dac93af190ef8a3c8d610be Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 4 Dec 2023 22:40:18 +0100
Subject: [PATCH 122/429] fix comment

Co-authored-by: Terts Diepraam <terts.diepraam@gmail.com>
---
 src/uucore/src/lib/features/colors.rs | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/src/uucore/src/lib/features/colors.rs b/src/uucore/src/lib/features/colors.rs
index 81d117a50b3..1f55db5a7d2 100644
--- a/src/uucore/src/lib/features/colors.rs
+++ b/src/uucore/src/lib/features/colors.rs
@@ -78,11 +78,11 @@ pub static FILE_TYPES: Lazy<Vec<(&'static str, &'static str, &'static str)>> = L
     ]
 });
 
-/*
-# List any file extensions like '.gz' or '.tar' that you would like ls
-# to color below. Put the extension, a space, and the color init string.
-# (and any comments you want to add after a '#')
-*/
+/// Colors for file types
+///
+/// List any file extensions like '.gz' or '.tar' that you would like ls
+/// to color below. Put the extension, a space, and the color init string.
+/// (and any comments you want to add after a '#')
 pub static FILE_COLORS: Lazy<Vec<(&str, &str)>> = Lazy::new(|| {
     vec![
         /*

From dabbcff9fbbbce7c0ec692431f73fb17657c8199 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 3 Dec 2023 10:34:33 +0100
Subject: [PATCH 123/429] dircolors: manage the --print-ls-colors pipe option

---
 src/uu/dircolors/src/dircolors.rs | 17 +++++++++++++----
 tests/by-util/test_dircolors.rs   | 10 ++++++++++
 2 files changed, 23 insertions(+), 4 deletions(-)

diff --git a/src/uu/dircolors/src/dircolors.rs b/src/uu/dircolors/src/dircolors.rs
index 28d74775db8..cf8ed62922c 100644
--- a/src/uu/dircolors/src/dircolors.rs
+++ b/src/uu/dircolors/src/dircolors.rs
@@ -9,6 +9,7 @@ use std::borrow::Borrow;
 use std::env;
 use std::fmt::Write;
 use std::fs::File;
+use std::io::IsTerminal;
 use std::io::{BufRead, BufReader};
 use std::path::Path;
 
@@ -192,9 +193,16 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     let result;
     if files.is_empty() {
-        println!("{}", generate_ls_colors(&out_format, ":"));
-
-        return Ok(());
+        // Check if data is being piped into the program
+        if std::io::stdin().is_terminal() {
+            // No data piped, use default behavior
+            println!("{}", generate_ls_colors(&out_format, ":"));
+            return Ok(());
+        } else {
+            // Data is piped, process the input from stdin
+            let fin = BufReader::new(std::io::stdin());
+            result = parse(fin.lines().map_while(Result::ok), &out_format, "-");
+        }
     } else if files.len() > 1 {
         return Err(UUsageError::new(
             1,
@@ -376,7 +384,8 @@ where
         let (key, val) = line.split_two();
         if val.is_empty() {
             return Err(format!(
-                "{}:{}: invalid line; missing second token",
+                // The double space is what GNU is doing
+                "{}:{}: invalid line;  missing second token",
                 fp.maybe_quote(),
                 num
             ));
diff --git a/tests/by-util/test_dircolors.rs b/tests/by-util/test_dircolors.rs
index d4fa0a3b0a3..e3752fcde98 100644
--- a/tests/by-util/test_dircolors.rs
+++ b/tests/by-util/test_dircolors.rs
@@ -159,6 +159,16 @@ fn test_quoting() {
         .no_stderr();
 }
 
+#[test]
+fn test_print_ls_colors() {
+    new_ucmd!()
+        .pipe_in("OWT 40;33\n")
+        .args(&["--print-ls-colors"])
+        .succeeds()
+        .stdout_is("\x1B[40;33mtw\t40;33\x1B[0m\n")
+        .no_stderr();
+}
+
 #[test]
 fn test_extra_operand() {
     new_ucmd!()

From 3e354109076eb1f806715e0d5c89006fd2a1a12a Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 4 Dec 2023 22:47:42 +0100
Subject: [PATCH 124/429] dircolors: fix comments

---
 src/uucore/src/lib/features/colors.rs | 512 +++++++++++++-------------
 1 file changed, 250 insertions(+), 262 deletions(-)

diff --git a/src/uucore/src/lib/features/colors.rs b/src/uucore/src/lib/features/colors.rs
index 1f55db5a7d2..81d2fd3f336 100644
--- a/src/uucore/src/lib/features/colors.rs
+++ b/src/uucore/src/lib/features/colors.rs
@@ -3,274 +3,262 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 // cSpell:disable
-use once_cell::sync::Lazy;
 
-/* The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the
- * slackware version of dircolors) are recognized but ignored.
- * Global config options can be specified before TERM or COLORTERM entries
- * below are TERM or COLORTERM entries, which can be glob patterns, which
- * restrict following config to systems with matching environment variables.
-*/
-pub static TERMS: Lazy<Vec<&str>> = Lazy::new(|| {
-    vec![
-        "Eterm",
-        "ansi",
-        "*color*",
-        "con[0-9]*x[0-9]*",
-        "cons25",
-        "console",
-        "cygwin",
-        "*direct*",
-        "dtterm",
-        "gnome",
-        "hurd",
-        "jfbterm",
-        "konsole",
-        "kterm",
-        "linux",
-        "linux-c",
-        "mlterm",
-        "putty",
-        "rxvt*",
-        "screen*",
-        "st",
-        "terminator",
-        "tmux*",
-        "vt100",
-        "xterm*",
-    ]
-});
+/// The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the
+/// slackware version of dircolors) are recognized but ignored.
+/// Global config options can be specified before TERM or COLORTERM entries
+/// below are TERM or COLORTERM entries, which can be glob patterns, which
+/// restrict following config to systems with matching environment variables.
+pub static TERMS: &[&str] = &[
+    "Eterm",
+    "ansi",
+    "*color*",
+    "con[0-9]*x[0-9]*",
+    "cons25",
+    "console",
+    "cygwin",
+    "*direct*",
+    "dtterm",
+    "gnome",
+    "hurd",
+    "jfbterm",
+    "konsole",
+    "kterm",
+    "linux",
+    "linux-c",
+    "mlterm",
+    "putty",
+    "rxvt*",
+    "screen*",
+    "st",
+    "terminator",
+    "tmux*",
+    "vt100",
+    "xterm*",
+];
 
-/*
-# Below are the color init strings for the basic file types.
-# One can use codes for 256 or more colors supported by modern terminals.
-# The default color codes use the capabilities of an 8 color terminal
-# with some additional attributes as per the following codes:
-# Attribute codes:
-# 00=none 01=bold 04=underscore 05=blink 07=reverse 08=concealed
-# Text color codes:
-# 30=black 31=red 32=green 33=yellow 34=blue 35=magenta 36=cyan 37=white
-# Background color codes:
-# 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white
-#NORMAL 00 # no color code at all
-#FILE 00 # regular file: use no color at all
-*/
-pub static FILE_TYPES: Lazy<Vec<(&'static str, &'static str, &'static str)>> = Lazy::new(|| {
-    vec![
-        ("RESET", "rs", "0"),                     // reset to "normal" color
-        ("DIR", "di", "01;34"),                   // directory
-        ("LINK", "ln", "01;36"),                  // symbolic link
-        ("MULTIHARDLINK", "mh", "00"),            // regular file with more than one link
-        ("FIFO", "pi", "40;33"),                  // pipe
-        ("SOCK", "so", "01;35"),                  // socket
-        ("DOOR", "do", "01;35"),                  // door
-        ("BLK", "bd", "40;33;01"),                // block device driver
-        ("CHR", "cd", "40;33;01"),                // character device driver
-        ("ORPHAN", "or", "40;31;01"), // symlink to nonexistent file, or non-stat'able file
-        ("MISSING", "mi", "00"),      // ... and the files they point to
-        ("SETUID", "su", "37;41"),    // file that is setuid (u+s)
-        ("SETGID", "sg", "30;43"),    // file that is setgid (g+s)
-        ("CAPABILITY", "ca", "00"),   // file with capability
-        ("STICKY_OTHER_WRITABLE", "tw", "30;42"), // dir that is sticky and other-writable (+t,o+w)
-        ("OTHER_WRITABLE", "ow", "34;42"), // dir that is other-writable (o+w) and not sticky
-        ("STICKY", "st", "37;44"),    // dir with the sticky bit set (+t) and not other-writable
-        ("EXEC", "ex", "01;32"),      // files with execute permission
-    ]
-});
+/// Below are the color init strings for the basic file types.
+/// One can use codes for 256 or more colors supported by modern terminals.
+/// The default color codes use the capabilities of an 8 color terminal
+/// with some additional attributes as per the following codes:
+/// Attribute codes:
+/// 00=none 01=bold 04=underscore 05=blink 07=reverse 08=concealed
+/// Text color codes:
+/// 30=black 31=red 32=green 33=yellow 34=blue 35=magenta 36=cyan 37=white
+/// Background color codes:
+/// 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white
+/// #NORMAL 00 /// no color code at all
+/// #FILE 00 /// regular file: use no color at all
+pub static FILE_TYPES: &[(&str, &str, &str)] = &[
+    ("RESET", "rs", "0"),                     // reset to "normal" color
+    ("DIR", "di", "01;34"),                   // directory
+    ("LINK", "ln", "01;36"),                  // symbolic link
+    ("MULTIHARDLINK", "mh", "00"),            // regular file with more than one link
+    ("FIFO", "pi", "40;33"),                  // pipe
+    ("SOCK", "so", "01;35"),                  // socket
+    ("DOOR", "do", "01;35"),                  // door
+    ("BLK", "bd", "40;33;01"),                // block device driver
+    ("CHR", "cd", "40;33;01"),                // character device driver
+    ("ORPHAN", "or", "40;31;01"),             // symlink to nonexistent file, or non-stat'able file
+    ("MISSING", "mi", "00"),                  // ... and the files they point to
+    ("SETUID", "su", "37;41"),                // file that is setuid (u+s)
+    ("SETGID", "sg", "30;43"),                // file that is setgid (g+s)
+    ("CAPABILITY", "ca", "00"),               // file with capability
+    ("STICKY_OTHER_WRITABLE", "tw", "30;42"), // dir that is sticky and other-writable (+t,o+w)
+    ("OTHER_WRITABLE", "ow", "34;42"),        // dir that is other-writable (o+w) and not sticky
+    ("STICKY", "st", "37;44"), // dir with the sticky bit set (+t) and not other-writable
+    ("EXEC", "ex", "01;32"),   // files with execute permission
+];
 
 /// Colors for file types
 ///
 /// List any file extensions like '.gz' or '.tar' that you would like ls
 /// to color below. Put the extension, a space, and the color init string.
 /// (and any comments you want to add after a '#')
-pub static FILE_COLORS: Lazy<Vec<(&str, &str)>> = Lazy::new(|| {
-    vec![
-        /*
-        // Executables (Windows)
-        (".cmd", "01;32"),
-        (".exe", "01;32"),
-        (".com", "01;32"),
-        (".btm", "01;32"),
-        (".bat", "01;32"),
-        (".sh", "01;32"),
-        (".csh", "01;32"),*/
-        // Archives or compressed
-        (".tar", "01;31"),
-        (".tgz", "01;31"),
-        (".arc", "01;31"),
-        (".arj", "01;31"),
-        (".taz", "01;31"),
-        (".lha", "01;31"),
-        (".lz4", "01;31"),
-        (".lzh", "01;31"),
-        (".lzma", "01;31"),
-        (".tlz", "01;31"),
-        (".txz", "01;31"),
-        (".tzo", "01;31"),
-        (".t7z", "01;31"),
-        (".zip", "01;31"),
-        (".z", "01;31"),
-        (".dz", "01;31"),
-        (".gz", "01;31"),
-        (".lrz", "01;31"),
-        (".lz", "01;31"),
-        (".lzo", "01;31"),
-        (".xz", "01;31"),
-        (".zst", "01;31"),
-        (".tzst", "01;31"),
-        (".bz2", "01;31"),
-        (".bz", "01;31"),
-        (".tbz", "01;31"),
-        (".tbz2", "01;31"),
-        (".tz", "01;31"),
-        (".deb", "01;31"),
-        (".rpm", "01;31"),
-        (".jar", "01;31"),
-        (".war", "01;31"),
-        (".ear", "01;31"),
-        (".sar", "01;31"),
-        (".rar", "01;31"),
-        (".alz", "01;31"),
-        (".ace", "01;31"),
-        (".zoo", "01;31"),
-        (".cpio", "01;31"),
-        (".7z", "01;31"),
-        (".rz", "01;31"),
-        (".cab", "01;31"),
-        (".wim", "01;31"),
-        (".swm", "01;31"),
-        (".dwm", "01;31"),
-        (".esd", "01;31"),
-        // Image formats
-        (".avif", "01;35"),
-        (".jpg", "01;35"),
-        (".jpeg", "01;35"),
-        (".mjpg", "01;35"),
-        (".mjpeg", "01;35"),
-        (".gif", "01;35"),
-        (".bmp", "01;35"),
-        (".pbm", "01;35"),
-        (".pgm", "01;35"),
-        (".ppm", "01;35"),
-        (".tga", "01;35"),
-        (".xbm", "01;35"),
-        (".xpm", "01;35"),
-        (".tif", "01;35"),
-        (".tiff", "01;35"),
-        (".png", "01;35"),
-        (".svg", "01;35"),
-        (".svgz", "01;35"),
-        (".mng", "01;35"),
-        (".pcx", "01;35"),
-        (".mov", "01;35"),
-        (".mpg", "01;35"),
-        (".mpeg", "01;35"),
-        (".m2v", "01;35"),
-        (".mkv", "01;35"),
-        (".webm", "01;35"),
-        (".webp", "01;35"),
-        (".ogm", "01;35"),
-        (".mp4", "01;35"),
-        (".m4v", "01;35"),
-        (".mp4v", "01;35"),
-        (".vob", "01;35"),
-        (".qt", "01;35"),
-        (".nuv", "01;35"),
-        (".wmv", "01;35"),
-        (".asf", "01;35"),
-        (".rm", "01;35"),
-        (".rmvb", "01;35"),
-        (".flc", "01;35"),
-        (".avi", "01;35"),
-        (".fli", "01;35"),
-        (".flv", "01;35"),
-        (".gl", "01;35"),
-        (".dl", "01;35"),
-        (".xcf", "01;35"),
-        (".xwd", "01;35"),
-        (".yuv", "01;35"),
-        (".cgm", "01;35"),
-        (".emf", "01;35"),
-        // https://wiki.xiph.org/MIME_Types_and_File_Extensions
-        (".ogv", "01;35"),
-        (".ogx", "01;35"),
-        // Audio formats
-        (".aac", "00;36"),
-        (".au", "00;36"),
-        (".flac", "00;36"),
-        (".m4a", "00;36"),
-        (".mid", "00;36"),
-        (".midi", "00;36"),
-        (".mka", "00;36"),
-        (".mp3", "00;36"),
-        (".mpc", "00;36"),
-        (".ogg", "00;36"),
-        (".ra", "00;36"),
-        (".wav", "00;36"),
-        // https://wiki.xiph.org/MIME_Types_and_File_Extensions
-        (".oga", "00;36"),
-        (".opus", "00;36"),
-        (".spx", "00;36"),
-        (".xspf", "00;36"),
-        // Backup files
-        ("~", "00;90"),
-        ("#", "00;90"),
-        (".bak", "00;90"),
-        (".old", "00;90"),
-        (".orig", "00;90"),
-        (".part", "00;90"),
-        (".rej", "00;90"),
-        (".swp", "00;90"),
-        (".tmp", "00;90"),
-        (".dpkg-dist", "00;90"),
-        (".dpkg-old", "00;90"),
-        (".ucf-dist", "00;90"),
-        (".ucf-new", "00;90"),
-        (".ucf-old", "00;90"),
-        (".rpmnew", "00;90"),
-        (".rpmorig", "00;90"),
-        (".rpmsave", "00;90"),
-    ]
-});
+pub static FILE_COLORS: &[(&str, &str)] = &[
+    /*
+    // Executables (Windows)
+    (".cmd", "01;32"),
+    (".exe", "01;32"),
+    (".com", "01;32"),
+    (".btm", "01;32"),
+    (".bat", "01;32"),
+    (".sh", "01;32"),
+    (".csh", "01;32"),*/
+    // Archives or compressed
+    (".tar", "01;31"),
+    (".tgz", "01;31"),
+    (".arc", "01;31"),
+    (".arj", "01;31"),
+    (".taz", "01;31"),
+    (".lha", "01;31"),
+    (".lz4", "01;31"),
+    (".lzh", "01;31"),
+    (".lzma", "01;31"),
+    (".tlz", "01;31"),
+    (".txz", "01;31"),
+    (".tzo", "01;31"),
+    (".t7z", "01;31"),
+    (".zip", "01;31"),
+    (".z", "01;31"),
+    (".dz", "01;31"),
+    (".gz", "01;31"),
+    (".lrz", "01;31"),
+    (".lz", "01;31"),
+    (".lzo", "01;31"),
+    (".xz", "01;31"),
+    (".zst", "01;31"),
+    (".tzst", "01;31"),
+    (".bz2", "01;31"),
+    (".bz", "01;31"),
+    (".tbz", "01;31"),
+    (".tbz2", "01;31"),
+    (".tz", "01;31"),
+    (".deb", "01;31"),
+    (".rpm", "01;31"),
+    (".jar", "01;31"),
+    (".war", "01;31"),
+    (".ear", "01;31"),
+    (".sar", "01;31"),
+    (".rar", "01;31"),
+    (".alz", "01;31"),
+    (".ace", "01;31"),
+    (".zoo", "01;31"),
+    (".cpio", "01;31"),
+    (".7z", "01;31"),
+    (".rz", "01;31"),
+    (".cab", "01;31"),
+    (".wim", "01;31"),
+    (".swm", "01;31"),
+    (".dwm", "01;31"),
+    (".esd", "01;31"),
+    // Image formats
+    (".avif", "01;35"),
+    (".jpg", "01;35"),
+    (".jpeg", "01;35"),
+    (".mjpg", "01;35"),
+    (".mjpeg", "01;35"),
+    (".gif", "01;35"),
+    (".bmp", "01;35"),
+    (".pbm", "01;35"),
+    (".pgm", "01;35"),
+    (".ppm", "01;35"),
+    (".tga", "01;35"),
+    (".xbm", "01;35"),
+    (".xpm", "01;35"),
+    (".tif", "01;35"),
+    (".tiff", "01;35"),
+    (".png", "01;35"),
+    (".svg", "01;35"),
+    (".svgz", "01;35"),
+    (".mng", "01;35"),
+    (".pcx", "01;35"),
+    (".mov", "01;35"),
+    (".mpg", "01;35"),
+    (".mpeg", "01;35"),
+    (".m2v", "01;35"),
+    (".mkv", "01;35"),
+    (".webm", "01;35"),
+    (".webp", "01;35"),
+    (".ogm", "01;35"),
+    (".mp4", "01;35"),
+    (".m4v", "01;35"),
+    (".mp4v", "01;35"),
+    (".vob", "01;35"),
+    (".qt", "01;35"),
+    (".nuv", "01;35"),
+    (".wmv", "01;35"),
+    (".asf", "01;35"),
+    (".rm", "01;35"),
+    (".rmvb", "01;35"),
+    (".flc", "01;35"),
+    (".avi", "01;35"),
+    (".fli", "01;35"),
+    (".flv", "01;35"),
+    (".gl", "01;35"),
+    (".dl", "01;35"),
+    (".xcf", "01;35"),
+    (".xwd", "01;35"),
+    (".yuv", "01;35"),
+    (".cgm", "01;35"),
+    (".emf", "01;35"),
+    // https://wiki.xiph.org/MIME_Types_and_File_Extensions
+    (".ogv", "01;35"),
+    (".ogx", "01;35"),
+    // Audio formats
+    (".aac", "00;36"),
+    (".au", "00;36"),
+    (".flac", "00;36"),
+    (".m4a", "00;36"),
+    (".mid", "00;36"),
+    (".midi", "00;36"),
+    (".mka", "00;36"),
+    (".mp3", "00;36"),
+    (".mpc", "00;36"),
+    (".ogg", "00;36"),
+    (".ra", "00;36"),
+    (".wav", "00;36"),
+    // https://wiki.xiph.org/MIME_Types_and_File_Extensions
+    (".oga", "00;36"),
+    (".opus", "00;36"),
+    (".spx", "00;36"),
+    (".xspf", "00;36"),
+    // Backup files
+    ("~", "00;90"),
+    ("#", "00;90"),
+    (".bak", "00;90"),
+    (".old", "00;90"),
+    (".orig", "00;90"),
+    (".part", "00;90"),
+    (".rej", "00;90"),
+    (".swp", "00;90"),
+    (".tmp", "00;90"),
+    (".dpkg-dist", "00;90"),
+    (".dpkg-old", "00;90"),
+    (".ucf-dist", "00;90"),
+    (".ucf-new", "00;90"),
+    (".ucf-old", "00;90"),
+    (".rpmnew", "00;90"),
+    (".rpmorig", "00;90"),
+    (".rpmsave", "00;90"),
+];
 
-pub static FILE_ATTRIBUTE_CODES: Lazy<Vec<(&str, &str)>> = Lazy::new(|| {
-    vec![
-        ("normal", "no"),
-        ("norm", "no"),
-        ("file", "fi"),
-        ("reset", "rs"),
-        ("dir", "di"),
-        ("lnk", "ln"),
-        ("link", "ln"),
-        ("symlink", "ln"),
-        ("orphan", "or"),
-        ("missing", "mi"),
-        ("fifo", "pi"),
-        ("pipe", "pi"),
-        ("sock", "so"),
-        ("blk", "bd"),
-        ("block", "bd"),
-        ("chr", "cd"),
-        ("char", "cd"),
-        ("door", "do"),
-        ("exec", "ex"),
-        ("left", "lc"),
-        ("leftcode", "lc"),
-        ("right", "rc"),
-        ("rightcode", "rc"),
-        ("end", "ec"),
-        ("endcode", "ec"),
-        ("suid", "su"),
-        ("setuid", "su"),
-        ("sgid", "sg"),
-        ("setgid", "sg"),
-        ("sticky", "st"),
-        ("other_writable", "ow"),
-        ("owr", "ow"),
-        ("sticky_other_writable", "tw"),
-        ("owt", "tw"),
-        ("capability", "ca"),
-        ("multihardlink", "mh"),
-        ("clrtoeol", "cl"),
-    ]
-});
+pub static FILE_ATTRIBUTE_CODES: &[(&str, &str)] = &[
+    ("normal", "no"),
+    ("norm", "no"),
+    ("file", "fi"),
+    ("reset", "rs"),
+    ("dir", "di"),
+    ("lnk", "ln"),
+    ("link", "ln"),
+    ("symlink", "ln"),
+    ("orphan", "or"),
+    ("missing", "mi"),
+    ("fifo", "pi"),
+    ("pipe", "pi"),
+    ("sock", "so"),
+    ("blk", "bd"),
+    ("block", "bd"),
+    ("chr", "cd"),
+    ("char", "cd"),
+    ("door", "do"),
+    ("exec", "ex"),
+    ("left", "lc"),
+    ("leftcode", "lc"),
+    ("right", "rc"),
+    ("rightcode", "rc"),
+    ("end", "ec"),
+    ("endcode", "ec"),
+    ("suid", "su"),
+    ("setuid", "su"),
+    ("sgid", "sg"),
+    ("setgid", "sg"),
+    ("sticky", "st"),
+    ("other_writable", "ow"),
+    ("owr", "ow"),
+    ("sticky_other_writable", "tw"),
+    ("owt", "tw"),
+    ("capability", "ca"),
+    ("multihardlink", "mh"),
+    ("clrtoeol", "cl"),
+];

From 1c9413e185c8eb16175761b929a373578f0607e3 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 4 Dec 2023 22:51:08 +0100
Subject: [PATCH 125/429]  bring back the old format

---
 src/uucore/src/lib/features/colors.rs      | 4 ++--
 tests/fixtures/dircolors/internal.expected | 4 ++--
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/src/uucore/src/lib/features/colors.rs b/src/uucore/src/lib/features/colors.rs
index 81d2fd3f336..e0de8b1e3e3 100644
--- a/src/uucore/src/lib/features/colors.rs
+++ b/src/uucore/src/lib/features/colors.rs
@@ -204,8 +204,8 @@ pub static FILE_COLORS: &[(&str, &str)] = &[
     (".spx", "00;36"),
     (".xspf", "00;36"),
     // Backup files
-    ("~", "00;90"),
-    ("#", "00;90"),
+    ("*~", "00;90"),
+    ("*#", "00;90"),
     (".bak", "00;90"),
     (".old", "00;90"),
     (".orig", "00;90"),
diff --git a/tests/fixtures/dircolors/internal.expected b/tests/fixtures/dircolors/internal.expected
index 933e70bc470..e151973f200 100644
--- a/tests/fixtures/dircolors/internal.expected
+++ b/tests/fixtures/dircolors/internal.expected
@@ -176,8 +176,8 @@ EXEC 01;32
 .opus 00;36
 .spx 00;36
 .xspf 00;36
-~ 00;90
-# 00;90
+*~ 00;90
+*# 00;90
 .bak 00;90
 .old 00;90
 .orig 00;90

From b0fdb1edef1a197c95faf83ffbb325190dfee9c3 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 4 Dec 2023 23:25:13 +0100
Subject: [PATCH 126/429] Rest of the comments

---
 src/uu/dircolors/src/dircolors.rs | 158 +++++++++---------------------
 tests/by-util/test_dircolors.rs   |   2 +
 2 files changed, 48 insertions(+), 112 deletions(-)

diff --git a/src/uu/dircolors/src/dircolors.rs b/src/uu/dircolors/src/dircolors.rs
index cf8ed62922c..41e640b2a5f 100644
--- a/src/uu/dircolors/src/dircolors.rs
+++ b/src/uu/dircolors/src/dircolors.rs
@@ -7,9 +7,8 @@
 
 use std::borrow::Borrow;
 use std::env;
-use std::fmt::Write;
 use std::fs::File;
-use std::io::IsTerminal;
+//use std::io::IsTerminal;
 use std::io::{BufRead, BufReader};
 use std::path::Path;
 
@@ -99,16 +98,20 @@ fn generate_ls_colors(fmt: &OutputFmt, sep: &str) -> String {
             let mut display_parts = vec![];
             let type_output = generate_type_output(fmt);
             display_parts.push(type_output);
-            for &(extension, code) in FILE_COLORS.iter() {
-                display_parts.push(format!("\x1b[{}m*{}\t{}\x1b[0m", code, extension, code));
+            for &(extension, code) in FILE_COLORS {
+                let prefix = if extension.starts_with('*') { "" } else { "*" };
+                let formatted_extension =
+                    format!("\x1b[{}m{}{}\t{}\x1b[0m", code, prefix, extension, code);
+                display_parts.push(formatted_extension);
             }
             display_parts.join("\n")
         }
         _ => {
             // existing logic for other formats
             let mut parts = vec![];
-            for &(extension, code) in FILE_COLORS.iter() {
-                let formatted_extension = format!("*{}", extension);
+            for &(extension, code) in FILE_COLORS {
+                let prefix = if extension.starts_with('*') { "" } else { "*" };
+                let formatted_extension = format!("{}{}", prefix, extension);
                 parts.push(format!("{}={}", formatted_extension, code));
             }
             let (prefix, suffix) = get_colors_format_strings(fmt);
@@ -193,6 +196,9 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     let result;
     if files.is_empty() {
+        println!("{}", generate_ls_colors(&out_format, ":"));
+        return Ok(());
+        /*
         // Check if data is being piped into the program
         if std::io::stdin().is_terminal() {
             // No data piped, use default behavior
@@ -203,6 +209,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
             let fin = BufReader::new(std::io::stdin());
             result = parse(fin.lines().map_while(Result::ok), &out_format, "-");
         }
+         */
     } else if files.len() > 1 {
         return Err(UUsageError::new(
             1,
@@ -474,117 +481,44 @@ fn escape(s: &str) -> String {
 pub fn generate_dircolors_config() -> String {
     let mut config = String::new();
 
-    // Adding the complete header comments as in the original file
-    writeln!(
-        config,
-        "# Configuration file for dircolors, a utility to help you set the"
-    )
-    .unwrap();
-    writeln!(
-        config,
-        "# LS_COLORS environment variable used by GNU ls with the --color option."
-    )
-    .unwrap();
-    writeln!(
-        config,
-        "# The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the"
-    )
-    .unwrap();
-    writeln!(
-        config,
-        "# slackware version of dircolors) are recognized but ignored."
-    )
-    .unwrap();
-    writeln!(
-        config,
-        "# Global config options can be specified before TERM or COLORTERM entries"
-    )
-    .unwrap();
-    writeln!(
-        config,
-        "# Below are TERM or COLORTERM entries, which can be glob patterns, which"
-    )
-    .unwrap();
-    writeln!(
-        config,
-        "# restrict following config to systems with matching environment variables."
-    )
-    .unwrap();
-    writeln!(config, "COLORTERM ?*").unwrap();
-    for term in TERMS.iter() {
-        writeln!(config, "TERM {}", term).unwrap();
+    config.push_str("# Configuration file for dircolors, a utility to help you set the\n");
+    config.push_str("# LS_COLORS environment variable used by GNU ls with the --color option.\n");
+    config.push_str("# The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the\n");
+    config.push_str("# slackware version of dircolors) are recognized but ignored.\n");
+    config.push_str("# Global config options can be specified before TERM or COLORTERM entries\n");
+    config.push_str("# Below are TERM or COLORTERM entries, which can be glob patterns, which\n");
+    config
+        .push_str("# restrict following config to systems with matching environment variables.\n");
+    config.push_str("COLORTERM ?*\n");
+    for term in TERMS {
+        config.push_str(&format!("TERM {}\n", term));
     }
 
-    // Adding file types and their color codes with header
-    writeln!(
-        config,
-        "# Below are the color init strings for the basic file types."
-    )
-    .unwrap();
-    writeln!(
-        config,
-        "# One can use codes for 256 or more colors supported by modern terminals."
-    )
-    .unwrap();
-    writeln!(
-        config,
-        "# The default color codes use the capabilities of an 8 color terminal"
-    )
-    .unwrap();
-    writeln!(
-        config,
-        "# with some additional attributes as per the following codes:"
-    )
-    .unwrap();
-    writeln!(config, "# Attribute codes:").unwrap();
-    writeln!(
-        config,
-        "# 00=none 01=bold 04=underscore 05=blink 07=reverse 08=concealed"
-    )
-    .unwrap();
-    writeln!(config, "# Text color codes:").unwrap();
-    writeln!(
-        config,
-        "# 30=black 31=red 32=green 33=yellow 34=blue 35=magenta 36=cyan 37=white"
-    )
-    .unwrap();
-    writeln!(config, "# Background color codes:").unwrap();
-    writeln!(
-        config,
-        "# 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white"
-    )
-    .unwrap();
-    writeln!(config, "#NORMAL 00 # no color code at all").unwrap();
-    writeln!(config, "#FILE 00 # regular file: use no color at all").unwrap();
-
-    for (name, _, code) in FILE_TYPES.iter() {
-        writeln!(config, "{} {}", name, code).unwrap();
+    config.push_str("# Below are the color init strings for the basic file types.\n");
+    config.push_str("# One can use codes for 256 or more colors supported by modern terminals.\n");
+    config.push_str("# The default color codes use the capabilities of an 8 color terminal\n");
+    config.push_str("# with some additional attributes as per the following codes:\n");
+    config.push_str("# Attribute codes:\n");
+    config.push_str("# 00=none 01=bold 04=underscore 05=blink 07=reverse 08=concealed\n");
+    config.push_str("# Text color codes:\n");
+    config.push_str("# 30=black 31=red 32=green 33=yellow 34=blue 35=magenta 36=cyan 37=white\n");
+    config.push_str("# Background color codes:\n");
+    config.push_str("# 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white\n");
+    config.push_str("#NORMAL 00 # no color code at all\n");
+    config.push_str("#FILE 00 # regular file: use no color at all\n");
+
+    for (name, _, code) in FILE_TYPES {
+        config.push_str(&format!("{} {}\n", name, code));
     }
 
-    writeln!(
-        config,
-        "# List any file extensions like '.gz' or '.tar' that you would like ls"
-    )
-    .unwrap();
-    writeln!(
-        config,
-        "# to color below. Put the extension, a space, and the color init string."
-    )
-    .unwrap();
-
-    for (ext, color) in FILE_COLORS.iter() {
-        writeln!(config, "{} {}", ext, color).unwrap();
+    config.push_str("# List any file extensions like '.gz' or '.tar' that you would like ls\n");
+    config.push_str("# to color below. Put the extension, a space, and the color init string.\n");
+
+    for (ext, color) in FILE_COLORS {
+        config.push_str(&format!("{} {}\n", ext, color));
     }
-    writeln!(
-        config,
-        "# Subsequent TERM or COLORTERM entries, can be used to add / override"
-    )
-    .unwrap();
-    write!(
-        config,
-        "# config specific to those matching environment variables."
-    )
-    .unwrap();
+    config.push_str("# Subsequent TERM or COLORTERM entries, can be used to add / override\n");
+    config.push_str("# config specific to those matching environment variables.");
 
     config
 }
diff --git a/tests/by-util/test_dircolors.rs b/tests/by-util/test_dircolors.rs
index e3752fcde98..4a256352c76 100644
--- a/tests/by-util/test_dircolors.rs
+++ b/tests/by-util/test_dircolors.rs
@@ -159,6 +159,7 @@ fn test_quoting() {
         .no_stderr();
 }
 
+/*
 #[test]
 fn test_print_ls_colors() {
     new_ucmd!()
@@ -168,6 +169,7 @@ fn test_print_ls_colors() {
         .stdout_is("\x1B[40;33mtw\t40;33\x1B[0m\n")
         .no_stderr();
 }
+*/
 
 #[test]
 fn test_extra_operand() {

From 4d2ae8485cd65429e64606119acac3156158ea2b Mon Sep 17 00:00:00 2001
From: Arpit Bhadauria <singharpit511@gmail.com>
Date: Mon, 4 Dec 2023 22:44:18 +0000
Subject: [PATCH 127/429] impl from trait instead of into

---
 src/uu/expr/src/syntax_tree.rs | 43 ++++++++++++++++------------------
 1 file changed, 20 insertions(+), 23 deletions(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 7677b5e7e54..ae2a44e5205 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -89,8 +89,8 @@ impl RelationOp {
 
 impl NumericOp {
     fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<NumOrStr> {
-        let a = <NumOrStr as Into<ExprResult<BigInt>>>::into(left.eval()?)?;
-        let b = <NumOrStr as Into<ExprResult<BigInt>>>::into(right.eval()?)?;
+        let a = ExprResult::<BigInt>::from(left.eval()?)?;
+        let b = ExprResult::<BigInt>::from(right.eval()?)?;
         Ok(NumOrStr::Num(match self {
             Self::Add => a + b,
             Self::Sub => a - b,
@@ -218,29 +218,29 @@ impl From<String> for NumOrStr {
     }
 }
 
-impl Into<Option<usize>> for NumOrStr {
-    fn into(self) -> Option<usize> {
-        match self.into() {
+impl From<NumOrStr> for Option<usize> {
+    fn from(s: NumOrStr) -> Self {
+        match s.into() {
             Ok(num) => num.to_usize(),
             Err(_) => None,
         }
     }
 }
 
-impl Into<String> for NumOrStr {
-    fn into(self) -> String {
-        match self {
-            Self::Num(num) => num.to_string(),
-            Self::Str(str) => str.to_string(),
+impl From<NumOrStr> for String {
+    fn from(s: NumOrStr) -> Self {
+        match s {
+            NumOrStr::Num(num) => num.to_string(),
+            NumOrStr::Str(str) => str.to_string(),
         }
     }
 }
 
-impl Into<ExprResult<BigInt>> for NumOrStr {
-    fn into(self) -> ExprResult<BigInt> {
-        match self {
-            Self::Num(num) => Ok(num),
-            Self::Str(str) => str
+impl From<NumOrStr> for ExprResult<BigInt> {
+    fn from(s: NumOrStr) -> Self {
+        match s {
+            NumOrStr::Num(num) => Ok(num),
+            NumOrStr::Str(str) => str
                 .parse::<BigInt>()
                 .map_err(|_| ExprError::NonIntegerArgument),
         }
@@ -303,9 +303,8 @@ impl AstNode {
                 //
                 // So we coerce errors into 0 to make that the only case we
                 // have to care about.
-                let pos: usize = <NumOrStr as Into<Option<usize>>>::into(pos.eval()?).unwrap_or(0);
-                let length: usize =
-                    <NumOrStr as Into<Option<usize>>>::into(length.eval()?).unwrap_or(0);
+                let pos: usize = Option::<usize>::from(pos.eval()?).unwrap_or(0);
+                let length: usize = Option::<usize>::from(length.eval()?).unwrap_or(0);
 
                 let (Some(pos), Some(_)) = (pos.checked_sub(1), length.checked_sub(1)) else {
                     return Ok(NumOrStr::from(String::new()));
@@ -315,11 +314,9 @@ impl AstNode {
                     string.chars().skip(pos).take(length).collect::<String>(),
                 ))
             }
-            Self::Length { string } => Ok(NumOrStr::from(
-                <NumOrStr as Into<String>>::into(string.eval()?)
-                    .chars()
-                    .count(),
-            )),
+            Self::Length { string } => {
+                Ok(NumOrStr::from(String::from(string.eval()?).chars().count()))
+            }
         }
     }
 }

From 2fcfec6490f87af117a03ccd77ebf487192d548c Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Tue, 5 Dec 2023 21:50:38 +0100
Subject: [PATCH 128/429] fuzz seq

---
 .github/workflows/fuzzing.yml |  1 +
 fuzz/Cargo.toml               |  8 +++-
 fuzz/fuzz_targets/fuzz_seq.rs | 78 +++++++++++++++++++++++++++++++++++
 3 files changed, 86 insertions(+), 1 deletion(-)
 create mode 100644 fuzz/fuzz_targets/fuzz_seq.rs

diff --git a/.github/workflows/fuzzing.yml b/.github/workflows/fuzzing.yml
index 623a03f65c7..eed2ae2fc99 100644
--- a/.github/workflows/fuzzing.yml
+++ b/.github/workflows/fuzzing.yml
@@ -47,6 +47,7 @@ jobs:
           - { name: fuzz_expr, should_pass: true }
           - { name: fuzz_printf, should_pass: false }
           - { name: fuzz_echo, should_pass: false }
+          - { name: fuzz_seq, should_pass: false }
           - { name: fuzz_parse_glob, should_pass: true }
           - { name: fuzz_parse_size, should_pass: true }
           - { name: fuzz_parse_time, should_pass: true }
diff --git a/fuzz/Cargo.toml b/fuzz/Cargo.toml
index b27f5b58677..c98f105ad19 100644
--- a/fuzz/Cargo.toml
+++ b/fuzz/Cargo.toml
@@ -18,7 +18,7 @@ uu_test = { path = "../src/uu/test/" }
 uu_expr = { path = "../src/uu/expr/" }
 uu_printf = { path = "../src/uu/printf/" }
 uu_echo = { path = "../src/uu/echo/" }
-
+uu_seq = { path = "../src/uu/seq/" }
 
 # Prevent this from interfering with workspaces
 [workspace]
@@ -42,6 +42,12 @@ path = "fuzz_targets/fuzz_echo.rs"
 test = false
 doc = false
 
+[[bin]]
+name = "fuzz_seq"
+path = "fuzz_targets/fuzz_seq.rs"
+test = false
+doc = false
+
 [[bin]]
 name = "fuzz_expr"
 path = "fuzz_targets/fuzz_expr.rs"
diff --git a/fuzz/fuzz_targets/fuzz_seq.rs b/fuzz/fuzz_targets/fuzz_seq.rs
new file mode 100644
index 00000000000..2e4ff1a4662
--- /dev/null
+++ b/fuzz/fuzz_targets/fuzz_seq.rs
@@ -0,0 +1,78 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+// spell-checker:ignore parens
+
+#![no_main]
+use libfuzzer_sys::fuzz_target;
+use uu_seq::uumain;
+
+use rand::Rng;
+use std::ffi::OsString;
+
+mod fuzz_common;
+use crate::fuzz_common::CommandResult;
+use crate::fuzz_common::{
+    compare_result, generate_and_run_uumain, generate_random_string, run_gnu_cmd,
+};
+static CMD_PATH: &str = "seq";
+
+fn generate_seq() -> String {
+    let mut rng = rand::thread_rng();
+
+    // Generate 1 to 3 numbers for seq arguments
+    let arg_count = rng.gen_range(1..=3);
+    let mut args = Vec::new();
+
+    for _ in 0..arg_count {
+        if rng.gen_ratio(1, 100) {
+            // 1% chance to add a random string
+            args.push(generate_random_string(rng.gen_range(1..=10)));
+        } else {
+            // 99% chance to add a numeric value
+            match rng.gen_range(0..=3) {
+                0 => args.push(rng.gen_range(-10000..=10000).to_string()), // Large or small integers
+                1 => args.push(rng.gen_range(-100.0..100.0).to_string()),  // Floating-point numbers
+                2 => args.push(rng.gen_range(-100..0).to_string()),        // Negative integers
+                _ => args.push(rng.gen_range(1..=100).to_string()),        // Regular integers
+            }
+        }
+    }
+
+    args.join(" ")
+}
+
+fuzz_target!(|_data: &[u8]| {
+    let seq = generate_seq();
+    let mut args = vec![OsString::from("seq")];
+    args.extend(seq.split_whitespace().map(OsString::from));
+
+    let rust_result = generate_and_run_uumain(&args, uumain);
+
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false) {
+        Ok(result) => result,
+        Err(error_result) => {
+            eprintln!("Failed to run GNU command:");
+            eprintln!("Stderr: {}", error_result.stderr);
+            eprintln!("Exit Code: {}", error_result.exit_code);
+            CommandResult {
+                stdout: String::new(),
+                stderr: error_result.stderr,
+                exit_code: error_result.exit_code,
+            }
+        }
+    };
+
+    compare_result(
+        "seq",
+        &format!("{:?}", &args[1..]),
+        &rust_result.stdout,
+        &gnu_result.stdout,
+        &rust_result.stderr,
+        &gnu_result.stderr,
+        rust_result.exit_code,
+        gnu_result.exit_code,
+        false, // Set to true if you want to fail on stderr diff
+    );
+});

From 97ec99cf28d7b699e7d89793bad93f7ca0976053 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 6 Dec 2023 21:14:59 +0100
Subject: [PATCH 129/429] use a single push_str

Co-authored-by: Terts Diepraam <terts.diepraam@gmail.com>
---
 src/uu/dircolors/src/dircolors.rs | 19 +++++++++++--------
 1 file changed, 11 insertions(+), 8 deletions(-)

diff --git a/src/uu/dircolors/src/dircolors.rs b/src/uu/dircolors/src/dircolors.rs
index 41e640b2a5f..91544dc7353 100644
--- a/src/uu/dircolors/src/dircolors.rs
+++ b/src/uu/dircolors/src/dircolors.rs
@@ -481,14 +481,17 @@ fn escape(s: &str) -> String {
 pub fn generate_dircolors_config() -> String {
     let mut config = String::new();
 
-    config.push_str("# Configuration file for dircolors, a utility to help you set the\n");
-    config.push_str("# LS_COLORS environment variable used by GNU ls with the --color option.\n");
-    config.push_str("# The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the\n");
-    config.push_str("# slackware version of dircolors) are recognized but ignored.\n");
-    config.push_str("# Global config options can be specified before TERM or COLORTERM entries\n");
-    config.push_str("# Below are TERM or COLORTERM entries, which can be glob patterns, which\n");
-    config
-        .push_str("# restrict following config to systems with matching environment variables.\n");
+   config.push_str(
+        "\
+         # Configuration file for dircolors, a utility to help you set the\n\
+         # LS_COLORS environment variable used by GNU ls with the --color option.\n\
+         # The keywords COLOR, OPTIONS, and EIGHTBIT (honored by the\n\
+         # slackware version of dircolors) are recognized but ignored.\n\
+         # Global config options can be specified before TERM or COLORTERM entries\n\
+         # Below are TERM or COLORTERM entries, which can be glob patterns, which\n\
+         # restrict following config to systems with matching environment variables.\n\
+        ",
+    );
     config.push_str("COLORTERM ?*\n");
     for term in TERMS {
         config.push_str(&format!("TERM {}\n", term));

From bd667efa7b1daf9a38edc5272c3bdab8e5743f56 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 6 Dec 2023 21:15:43 +0100
Subject: [PATCH 130/429] simplify the declaration

Co-authored-by: Terts Diepraam <terts.diepraam@gmail.com>
---
 src/uu/dircolors/src/dircolors.rs | 28 ++++++++++++++++------------
 1 file changed, 16 insertions(+), 12 deletions(-)

diff --git a/src/uu/dircolors/src/dircolors.rs b/src/uu/dircolors/src/dircolors.rs
index 91544dc7353..fa523451b29 100644
--- a/src/uu/dircolors/src/dircolors.rs
+++ b/src/uu/dircolors/src/dircolors.rs
@@ -497,18 +497,22 @@ pub fn generate_dircolors_config() -> String {
         config.push_str(&format!("TERM {}\n", term));
     }
 
-    config.push_str("# Below are the color init strings for the basic file types.\n");
-    config.push_str("# One can use codes for 256 or more colors supported by modern terminals.\n");
-    config.push_str("# The default color codes use the capabilities of an 8 color terminal\n");
-    config.push_str("# with some additional attributes as per the following codes:\n");
-    config.push_str("# Attribute codes:\n");
-    config.push_str("# 00=none 01=bold 04=underscore 05=blink 07=reverse 08=concealed\n");
-    config.push_str("# Text color codes:\n");
-    config.push_str("# 30=black 31=red 32=green 33=yellow 34=blue 35=magenta 36=cyan 37=white\n");
-    config.push_str("# Background color codes:\n");
-    config.push_str("# 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white\n");
-    config.push_str("#NORMAL 00 # no color code at all\n");
-    config.push_str("#FILE 00 # regular file: use no color at all\n");
+    config.push_str(
+        "\
+        # Below are the color init strings for the basic file types.\n\
+        # One can use codes for 256 or more colors supported by modern terminals.\n\
+        # The default color codes use the capabilities of an 8 color terminal\n\
+        # with some additional attributes as per the following codes:\n\
+        # Attribute codes:\n\
+        # 00=none 01=bold 04=underscore 05=blink 07=reverse 08=concealed\n\
+        # Text color codes:\n\
+        # 30=black 31=red 32=green 33=yellow 34=blue 35=magenta 36=cyan 37=white\n\
+        # Background color codes:\n\
+        # 40=black 41=red 42=green 43=yellow 44=blue 45=magenta 46=cyan 47=white\n\
+        #NORMAL 00 # no color code at all\n\
+        #FILE 00 # regular file: use no color at all\n\
+        ",
+    );
 
     for (name, _, code) in FILE_TYPES {
         config.push_str(&format!("{} {}\n", name, code));

From f99987bb35aade972e187ad3b7df6b039f5b72c2 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 6 Dec 2023 21:19:59 +0100
Subject: [PATCH 131/429] fix rustfmt

---
 src/uu/dircolors/src/dircolors.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/dircolors/src/dircolors.rs b/src/uu/dircolors/src/dircolors.rs
index fa523451b29..ecca9d16033 100644
--- a/src/uu/dircolors/src/dircolors.rs
+++ b/src/uu/dircolors/src/dircolors.rs
@@ -481,7 +481,7 @@ fn escape(s: &str) -> String {
 pub fn generate_dircolors_config() -> String {
     let mut config = String::new();
 
-   config.push_str(
+    config.push_str(
         "\
          # Configuration file for dircolors, a utility to help you set the\n\
          # LS_COLORS environment variable used by GNU ls with the --color option.\n\

From 5a32ab8004304fe5434bf42e1faf066a58b95736 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Wed, 6 Dec 2023 15:35:38 +0100
Subject: [PATCH 132/429] ls: implement --hyperlink

---
 Cargo.lock                 |  1 +
 Cargo.toml                 |  1 +
 src/uu/hostname/Cargo.toml |  2 +-
 src/uu/ls/Cargo.toml       |  1 +
 src/uu/ls/src/ls.rs        | 50 ++++++++++++++++++++++++++++++++++++--
 tests/by-util/test_ls.rs   | 30 +++++++++++++++++++++++
 6 files changed, 82 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index bf638b421a1..5060da44116 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -2618,6 +2618,7 @@ dependencies = [
  "chrono",
  "clap",
  "glob",
+ "hostname",
  "lscolors",
  "number_prefix",
  "once_cell",
diff --git a/Cargo.toml b/Cargo.toml
index 14e700ee0a6..13b99700851 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -284,6 +284,7 @@ fundu = "2.0.0"
 gcd = "2.3"
 glob = "0.3.1"
 half = "2.3"
+hostname = "0.3"
 indicatif = "0.17"
 itertools = "0.12.0"
 libc = "0.2.150"
diff --git a/src/uu/hostname/Cargo.toml b/src/uu/hostname/Cargo.toml
index a9b033d123b..1fe10170964 100644
--- a/src/uu/hostname/Cargo.toml
+++ b/src/uu/hostname/Cargo.toml
@@ -16,7 +16,7 @@ path = "src/hostname.rs"
 
 [dependencies]
 clap = { workspace = true }
-hostname = { version = "0.3", features = ["set"] }
+hostname = { workspace = true, features = ["set"] }
 uucore = { workspace = true, features = ["wide"] }
 
 [target.'cfg(target_os = "windows")'.dependencies]
diff --git a/src/uu/ls/Cargo.toml b/src/uu/ls/Cargo.toml
index 96cf7df1a0d..a82a1f37e07 100644
--- a/src/uu/ls/Cargo.toml
+++ b/src/uu/ls/Cargo.toml
@@ -31,6 +31,7 @@ uucore = { workspace = true, features = [
 ] }
 once_cell = { workspace = true }
 selinux = { workspace = true, optional = true }
+hostname = { workspace = true }
 
 [[bin]]
 name = "ls"
diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index c6b10677c6e..deb8aac3dfe 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -155,6 +155,7 @@ pub mod options {
     pub static GROUP_DIRECTORIES_FIRST: &str = "group-directories-first";
     pub static ZERO: &str = "zero";
     pub static DIRED: &str = "dired";
+    pub static HYPERLINK: &str = "hyperlink";
 }
 
 const DEFAULT_TERM_WIDTH: u16 = 80;
@@ -418,6 +419,7 @@ pub struct Config {
     group_directories_first: bool,
     line_ending: LineEnding,
     dired: bool,
+    hyperlink: bool,
 }
 
 // Fields that can be removed or added to the long format
@@ -566,6 +568,25 @@ fn extract_color(options: &clap::ArgMatches) -> bool {
     }
 }
 
+/// Extracts the hyperlink option to use based on the options provided.
+///
+/// # Returns
+///
+/// A boolean representing whether to hyperlink files.
+fn extract_hyperlink(options: &clap::ArgMatches) -> bool {
+    let hyperlink = options
+        .get_one::<String>(options::HYPERLINK)
+        .unwrap()
+        .as_str();
+
+    match hyperlink {
+        "always" | "yes" | "force" => true,
+        "auto" | "tty" | "if-tty" => std::io::stdout().is_terminal(),
+        "never" | "no" | "none" => false,
+        _ => unreachable!("should be handled by clap"),
+    }
+}
+
 /// Extracts the quoting style to use based on the options provided.
 ///
 /// # Arguments
@@ -736,10 +757,9 @@ impl Config {
         }
 
         let sort = extract_sort(options);
-
         let time = extract_time(options);
-
         let mut needs_color = extract_color(options);
+        let hyperlink = extract_hyperlink(options);
 
         let opt_block_size = options.get_one::<String>(options::size::BLOCK_SIZE);
         let opt_si = opt_block_size.is_some()
@@ -1020,6 +1040,7 @@ impl Config {
             group_directories_first: options.get_flag(options::GROUP_DIRECTORIES_FIRST),
             line_ending: LineEnding::from_zero_flag(options.get_flag(options::ZERO)),
             dired,
+            hyperlink,
         })
     }
 }
@@ -1154,6 +1175,19 @@ pub fn uu_app() -> Command {
                 .help("generate output designed for Emacs' dired (Directory Editor) mode")
                 .action(ArgAction::SetTrue),
         )
+        .arg(
+            Arg::new(options::HYPERLINK)
+                .long(options::HYPERLINK)
+                .help("hyperlink file names WHEN")
+                .value_parser([
+                    "always", "yes", "force", "auto", "tty", "if-tty", "never", "no", "none",
+                ])
+                .require_equals(true)
+                .num_args(0..=1)
+                .default_missing_value("always")
+                .default_value("never")
+                .value_name("WHEN"),
+        )
         // The next four arguments do not override with the other format
         // options, see the comment in Config::from for the reason.
         // Ideally, they would use Arg::override_with, with their own name
@@ -2959,6 +2993,18 @@ fn display_file_name(
     // infer it because the color codes mess up term_grid's width calculation.
     let mut width = name.width();
 
+    if config.hyperlink {
+        let hostname = hostname::get().unwrap_or(OsString::from(""));
+        let hostname = hostname.to_string_lossy();
+
+        let absolute_path = fs::canonicalize(&path.p_buf).unwrap_or_default();
+        let absolute_path = absolute_path.to_string_lossy();
+
+        // TODO encode path
+        // \x1b = ESC, \x07 = BEL
+        name = format!("\x1b]8;;file://{hostname}{absolute_path}\x07{name}\x1b]8;;\x07");
+    }
+
     if let Some(ls_colors) = &config.color {
         let md = path.md(out);
         name = if md.is_some() {
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index fcd57170d48..8bc2b75ac77 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -3855,3 +3855,33 @@ fn test_posixly_correct() {
         .succeeds()
         .stdout_contains_line("total 8");
 }
+
+#[test]
+fn test_ls_hyperlink() {
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+    let file = "a.txt";
+
+    at.touch(file);
+
+    let path = at.root_dir_resolved();
+    let separator = std::path::MAIN_SEPARATOR_STR;
+
+    let result = scene.ucmd().arg("--hyperlink").succeeds();
+    assert!(result.stdout_str().contains("\x1b]8;;file://"));
+    assert!(result
+        .stdout_str()
+        .contains(&format!("{path}{separator}{file}\x07{file}\x1b]8;;\x07")));
+
+    let result = scene.ucmd().arg("--hyperlink=always").succeeds();
+    assert!(result.stdout_str().contains("\x1b]8;;file://"));
+    assert!(result
+        .stdout_str()
+        .contains(&format!("{path}{separator}{file}\x07{file}\x1b]8;;\x07")));
+
+    scene
+        .ucmd()
+        .arg("--hyperlink=never")
+        .succeeds()
+        .stdout_is(format!("{file}\n"));
+}

From 09999427ccfb822918fc6969e16d0fc656087ff1 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Thu, 7 Dec 2023 10:02:29 +0100
Subject: [PATCH 133/429] du: merge imports

---
 src/uu/du/src/du.rs | 21 ++++++++-------------
 1 file changed, 8 insertions(+), 13 deletions(-)

diff --git a/src/uu/du/src/du.rs b/src/uu/du/src/du.rs
index dc03a64f218..989e663e46c 100644
--- a/src/uu/du/src/du.rs
+++ b/src/uu/du/src/du.rs
@@ -3,35 +3,30 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-use chrono::prelude::DateTime;
-use chrono::Local;
-use clap::ArgAction;
-use clap::{crate_version, Arg, ArgMatches, Command};
+use chrono::{DateTime, Local};
+use clap::{crate_version, Arg, ArgAction, ArgMatches, Command};
 use glob::Pattern;
 use std::collections::HashSet;
 use std::env;
-use std::fs;
-use std::fs::File;
+use std::error::Error;
+use std::fmt::Display;
 #[cfg(not(windows))]
 use std::fs::Metadata;
-use std::io::BufRead;
-use std::io::BufReader;
+use std::fs::{self, File};
+use std::io::{BufRead, BufReader};
 #[cfg(not(windows))]
 use std::os::unix::fs::MetadataExt;
 #[cfg(windows)]
 use std::os::windows::fs::MetadataExt;
 #[cfg(windows)]
 use std::os::windows::io::AsRawHandle;
-use std::path::Path;
-use std::path::PathBuf;
+use std::path::{Path, PathBuf};
 use std::str::FromStr;
 use std::sync::mpsc;
 use std::thread;
 use std::time::{Duration, UNIX_EPOCH};
-use std::{error::Error, fmt::Display};
 use uucore::display::{print_verbatim, Quotable};
-use uucore::error::FromIo;
-use uucore::error::{UError, UResult, USimpleError};
+use uucore::error::{FromIo, UError, UResult, USimpleError};
 use uucore::line_ending::LineEnding;
 use uucore::parse_glob;
 use uucore::parse_size::{parse_size_u64, ParseSizeError};

From 6cae19156926ef0ca68e1e3657dd51e2066d4e8b Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Thu, 7 Dec 2023 11:06:04 +0100
Subject: [PATCH 134/429] du: remove ArgMatches from StatPrinter

---
 src/uu/du/src/du.rs | 165 ++++++++++++++++++++++----------------------
 1 file changed, 84 insertions(+), 81 deletions(-)

diff --git a/src/uu/du/src/du.rs b/src/uu/du/src/du.rs
index 989e663e46c..26e697abb46 100644
--- a/src/uu/du/src/du.rs
+++ b/src/uu/du/src/du.rs
@@ -87,6 +87,18 @@ struct Options {
     count_links: bool,
     inodes: bool,
     verbose: bool,
+    threshold: Option<Threshold>,
+    apparent_size: bool,
+    // TODO: the size conversion fields should be unified
+    si: bool,
+    bytes: bool,
+    human_readable: bool,
+    block_size_1k: bool,
+    block_size_1m: bool,
+    block_size: u64,
+    time: Option<Time>,
+    time_format: String,
+    line_ending: LineEnding,
 }
 
 #[derive(PartialEq, Clone)]
@@ -96,6 +108,13 @@ enum Deref {
     None,
 }
 
+#[derive(Clone, Copy)]
+enum Time {
+    Accessed,
+    Modified,
+    Created,
+}
+
 #[derive(PartialEq, Eq, Hash, Clone, Copy)]
 struct FileInfo {
     file_id: u128,
@@ -273,10 +292,10 @@ fn read_block_size(s: Option<&str>) -> UResult<u64> {
     }
 }
 
-fn choose_size(matches: &ArgMatches, stat: &Stat) -> u64 {
-    if matches.get_flag(options::INODES) {
+fn choose_size(options: &Options, stat: &Stat) -> u64 {
+    if options.inodes {
         stat.inodes
-    } else if matches.get_flag(options::APPARENT_SIZE) || matches.get_flag(options::BYTES) {
+    } else if options.apparent_size || options.bytes {
         stat.size
     } else {
         // The st_blocks field indicates the number of blocks allocated to the file, 512-byte units.
@@ -423,14 +442,14 @@ fn convert_size_other(size: u64, _multiplier: u64, block_size: u64) -> String {
     format!("{}", ((size as f64) / (block_size as f64)).ceil())
 }
 
-fn get_convert_size_fn(matches: &ArgMatches) -> Box<dyn Fn(u64, u64, u64) -> String + Send> {
-    if matches.get_flag(options::HUMAN_READABLE) || matches.get_flag(options::SI) {
+fn get_convert_size_fn(options: &Options) -> Box<dyn Fn(u64, u64, u64) -> String + Send> {
+    if options.human_readable || options.si {
         Box::new(convert_size_human)
-    } else if matches.get_flag(options::BYTES) {
+    } else if options.bytes {
         Box::new(convert_size_b)
-    } else if matches.get_flag(options::BLOCK_SIZE_1K) {
+    } else if options.block_size_1k {
         Box::new(convert_size_k)
-    } else if matches.get_flag(options::BLOCK_SIZE_1M) {
+    } else if options.block_size_1m {
         Box::new(convert_size_m)
     } else {
         Box::new(convert_size_other)
@@ -442,7 +461,7 @@ enum DuError {
     InvalidMaxDepthArg(String),
     SummarizeDepthConflict(String),
     InvalidTimeStyleArg(String),
-    InvalidTimeArg(String),
+    InvalidTimeArg,
     InvalidGlob(String),
 }
 
@@ -468,11 +487,9 @@ Try '{} --help' for more information.",
                 s.quote(),
                 uucore::execution_phrase()
             ),
-            Self::InvalidTimeArg(s) => write!(
+            Self::InvalidTimeArg => write!(
                 f,
-                "Invalid argument {} for --time.
-'birth' and 'creation' arguments are not supported on this platform.",
-                s.quote()
+                "'birth' and 'creation' arguments for --time are not supported on this platform.",
             ),
             Self::InvalidGlob(s) => write!(f, "Invalid exclude syntax: {s}"),
         }
@@ -487,7 +504,7 @@ impl UError for DuError {
             Self::InvalidMaxDepthArg(_)
             | Self::SummarizeDepthConflict(_)
             | Self::InvalidTimeStyleArg(_)
-            | Self::InvalidTimeArg(_)
+            | Self::InvalidTimeArg
             | Self::InvalidGlob(_) => 1,
         }
     }
@@ -535,62 +552,25 @@ struct StatPrintInfo {
 }
 
 struct StatPrinter {
-    matches: ArgMatches,
-    threshold: Option<Threshold>,
     summarize: bool,
-    time_format_str: String,
-    line_ending: LineEnding,
     options: Options,
     convert_size: Box<dyn Fn(u64) -> String + Send>,
 }
 
 impl StatPrinter {
-    fn new(matches: ArgMatches, options: Options, summarize: bool) -> UResult<Self> {
-        let block_size = read_block_size(
-            matches
-                .get_one::<String>(options::BLOCK_SIZE)
-                .map(|s| s.as_str()),
-        )?;
-
-        let multiplier: u64 = if matches.get_flag(options::SI) {
-            1000
-        } else {
-            1024
-        };
+    fn new(options: Options, summarize: bool) -> UResult<Self> {
+        let multiplier: u64 = if options.si { 1000 } else { 1024 };
 
-        let convert_size_fn = get_convert_size_fn(&matches);
+        let convert_size_fn = get_convert_size_fn(&options);
 
         let convert_size: Box<dyn Fn(u64) -> String + Send> = if options.inodes {
             Box::new(|size: u64| size.to_string())
         } else {
-            Box::new(move |size: u64| convert_size_fn(size, multiplier, block_size))
-        };
-
-        let threshold = match matches.get_one::<String>(options::THRESHOLD) {
-            Some(s) => match Threshold::from_str(s) {
-                Ok(t) => Some(t),
-                Err(e) => {
-                    return Err(USimpleError::new(
-                        1,
-                        format_error_message(&e, s, options::THRESHOLD),
-                    ))
-                }
-            },
-            None => None,
+            Box::new(move |size: u64| convert_size_fn(size, multiplier, options.block_size))
         };
 
-        let time_format_str =
-            parse_time_style(matches.get_one::<String>("time-style").map(|s| s.as_str()))?
-                .to_string();
-
-        let line_ending = LineEnding::from_zero_flag(matches.get_flag(options::NULL));
-
         Ok(Self {
-            matches,
-            threshold,
             summarize,
-            time_format_str,
-            line_ending,
             options,
             convert_size,
         })
@@ -604,13 +584,14 @@ impl StatPrinter {
             match received {
                 Ok(message) => match message {
                     Ok(stat_info) => {
-                        let size = choose_size(&self.matches, &stat_info.stat);
+                        let size = choose_size(&self.options, &stat_info.stat);
 
                         if stat_info.depth == 0 {
                             grand_total += size;
                         }
 
                         if !self
+                            .options
                             .threshold
                             .map_or(false, |threshold| threshold.should_exclude(size))
                             && self
@@ -630,31 +611,24 @@ impl StatPrinter {
 
         if self.options.total {
             print!("{}\ttotal", (self.convert_size)(grand_total));
-            print!("{}", self.line_ending);
+            print!("{}", self.options.line_ending);
         }
 
         Ok(())
     }
 
     fn print_stat(&self, stat: &Stat, size: u64) -> UResult<()> {
-        if self.matches.contains_id(options::TIME) {
-            let tm = {
-                let secs = self
-                    .matches
-                    .get_one::<String>(options::TIME)
-                    .map(|s| get_time_secs(s, stat))
-                    .transpose()?
-                    .unwrap_or(stat.modified);
-                DateTime::<Local>::from(UNIX_EPOCH + Duration::from_secs(secs))
-            };
-            let time_str = tm.format(&self.time_format_str).to_string();
+        if let Some(time) = self.options.time {
+            let secs = get_time_secs(time, stat)?;
+            let tm = DateTime::<Local>::from(UNIX_EPOCH + Duration::from_secs(secs));
+            let time_str = tm.format(&self.options.time_format).to_string();
             print!("{}\t{}\t", (self.convert_size)(size), time_str);
         } else {
             print!("{}\t", (self.convert_size)(size));
         }
 
         print_verbatim(&stat.path).unwrap();
-        print!("{}", self.line_ending);
+        print!("{}", self.options.line_ending);
 
         Ok(())
     }
@@ -685,6 +659,21 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         None => vec![PathBuf::from(".")],
     };
 
+    let time = matches.contains_id(options::TIME).then(|| {
+        match matches.get_one::<String>(options::TIME).map(AsRef::as_ref) {
+            None | Some("ctime" | "status") => Time::Modified,
+            Some("access" | "atime" | "use") => Time::Accessed,
+            Some("birth" | "creation") => Time::Created,
+            _ => unreachable!("should be caught by clap"),
+        }
+    });
+
+    let block_size = read_block_size(
+        matches
+            .get_one::<String>(options::BLOCK_SIZE)
+            .map(|s| s.as_str()),
+    )?;
+
     let options = Options {
         all: matches.get_flag(options::ALL),
         max_depth,
@@ -702,6 +691,25 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         count_links: matches.get_flag(options::COUNT_LINKS),
         inodes: matches.get_flag(options::INODES),
         verbose: matches.get_flag(options::VERBOSE),
+        si: matches.get_flag(options::SI),
+        threshold: matches
+            .get_one::<String>(options::THRESHOLD)
+            .map(|s| {
+                Threshold::from_str(s).map_err(|e| {
+                    USimpleError::new(1, format_error_message(&e, s, options::THRESHOLD))
+                })
+            })
+            .transpose()?,
+        apparent_size: matches.get_flag(options::APPARENT_SIZE),
+        bytes: matches.get_flag(options::BYTES),
+        time,
+        block_size,
+        human_readable: matches.get_flag(options::HUMAN_READABLE),
+        block_size_1k: matches.get_flag(options::BLOCK_SIZE_1K),
+        block_size_1m: matches.get_flag(options::BLOCK_SIZE_1M),
+        time_format: parse_time_style(matches.get_one::<String>("time-style").map(|s| s.as_str()))?
+            .to_string(),
+        line_ending: LineEnding::from_zero_flag(matches.get_flag(options::NULL)),
     };
 
     if options.inodes
@@ -711,7 +719,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     }
 
     // Use separate thread to print output, so we can print finished results while computation is still running
-    let stat_printer = StatPrinter::new(matches.clone(), options.clone(), summarize)?;
+    let stat_printer = StatPrinter::new(options.clone(), summarize)?;
     let (print_tx, rx) = mpsc::channel::<UResult<StatPrintInfo>>();
     let printing_thread = thread::spawn(move || stat_printer.print_stats(&rx));
 
@@ -767,17 +775,12 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     Ok(())
 }
 
-fn get_time_secs(s: &str, stat: &Stat) -> Result<u64, DuError> {
-    let secs = match s {
-        "ctime" | "status" => stat.modified,
-        "access" | "atime" | "use" => stat.accessed,
-        "birth" | "creation" => stat
-            .created
-            .ok_or_else(|| DuError::InvalidTimeArg(s.into()))?,
-        // below should never happen as clap already restricts the values.
-        _ => unreachable!("Invalid field for --time"),
-    };
-    Ok(secs)
+fn get_time_secs(time: Time, stat: &Stat) -> Result<u64, DuError> {
+    match time {
+        Time::Modified => Ok(stat.modified),
+        Time::Accessed => Ok(stat.accessed),
+        Time::Created => stat.created.ok_or_else(|| DuError::InvalidTimeArg),
+    }
 }
 
 fn parse_time_style(s: Option<&str>) -> UResult<&str> {

From d6b10d4d720df1dfb85340ed7cda531c0e8b45bf Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Thu, 7 Dec 2023 11:26:44 +0100
Subject: [PATCH 135/429] du: split traversal and printing options

---
 src/uu/du/src/du.rs | 57 ++++++++++++++++++++++++++++-----------------
 1 file changed, 35 insertions(+), 22 deletions(-)

diff --git a/src/uu/du/src/du.rs b/src/uu/du/src/du.rs
index 26e697abb46..14c7fe5d4b3 100644
--- a/src/uu/du/src/du.rs
+++ b/src/uu/du/src/du.rs
@@ -76,17 +76,20 @@ const USAGE: &str = help_usage!("du.md");
 // TODO: Support Z & Y (currently limited by size of u64)
 const UNITS: [(char, u32); 6] = [('E', 6), ('P', 5), ('T', 4), ('G', 3), ('M', 2), ('K', 1)];
 
-#[derive(Clone)]
-struct Options {
+struct TraversalOptions {
     all: bool,
-    max_depth: Option<usize>,
-    total: bool,
     separate_dirs: bool,
     one_file_system: bool,
     dereference: Deref,
     count_links: bool,
-    inodes: bool,
     verbose: bool,
+}
+
+#[derive(Clone)]
+struct PrintingOptions {
+    total: bool,
+    inodes: bool,
+    max_depth: Option<usize>,
     threshold: Option<Threshold>,
     apparent_size: bool,
     // TODO: the size conversion fields should be unified
@@ -134,7 +137,7 @@ struct Stat {
 }
 
 impl Stat {
-    fn new(path: &Path, options: &Options) -> std::io::Result<Self> {
+    fn new(path: &Path, options: &TraversalOptions) -> std::io::Result<Self> {
         // Determine whether to dereference (follow) the symbolic link
         let should_dereference = match &options.dereference {
             Deref::All => true,
@@ -292,7 +295,7 @@ fn read_block_size(s: Option<&str>) -> UResult<u64> {
     }
 }
 
-fn choose_size(options: &Options, stat: &Stat) -> u64 {
+fn choose_size(options: &PrintingOptions, stat: &Stat) -> u64 {
     if options.inodes {
         stat.inodes
     } else if options.apparent_size || options.bytes {
@@ -308,7 +311,7 @@ fn choose_size(options: &Options, stat: &Stat) -> u64 {
 #[allow(clippy::cognitive_complexity)]
 fn du(
     mut my_stat: Stat,
-    options: &Options,
+    options: &TraversalOptions,
     depth: usize,
     seen_inodes: &mut HashSet<FileInfo>,
     exclude: &[Pattern],
@@ -442,7 +445,7 @@ fn convert_size_other(size: u64, _multiplier: u64, block_size: u64) -> String {
     format!("{}", ((size as f64) / (block_size as f64)).ceil())
 }
 
-fn get_convert_size_fn(options: &Options) -> Box<dyn Fn(u64, u64, u64) -> String + Send> {
+fn get_convert_size_fn(options: &PrintingOptions) -> Box<dyn Fn(u64, u64, u64) -> String + Send> {
     if options.human_readable || options.si {
         Box::new(convert_size_human)
     } else if options.bytes {
@@ -553,12 +556,12 @@ struct StatPrintInfo {
 
 struct StatPrinter {
     summarize: bool,
-    options: Options,
+    options: PrintingOptions,
     convert_size: Box<dyn Fn(u64) -> String + Send>,
 }
 
 impl StatPrinter {
-    fn new(options: Options, summarize: bool) -> UResult<Self> {
+    fn new(options: PrintingOptions, summarize: bool) -> UResult<Self> {
         let multiplier: u64 = if options.si { 1000 } else { 1024 };
 
         let convert_size_fn = get_convert_size_fn(&options);
@@ -674,10 +677,8 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
             .map(|s| s.as_str()),
     )?;
 
-    let options = Options {
+    let traversal_options = TraversalOptions {
         all: matches.get_flag(options::ALL),
-        max_depth,
-        total: matches.get_flag(options::TOTAL),
         separate_dirs: matches.get_flag(options::SEPARATE_DIRS),
         one_file_system: matches.get_flag(options::ONE_FILE_SYSTEM),
         dereference: if matches.get_flag(options::DEREFERENCE) {
@@ -689,8 +690,13 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
             Deref::None
         },
         count_links: matches.get_flag(options::COUNT_LINKS),
-        inodes: matches.get_flag(options::INODES),
         verbose: matches.get_flag(options::VERBOSE),
+    };
+
+    let printing_options = PrintingOptions {
+        max_depth,
+        total: matches.get_flag(options::TOTAL),
+        inodes: matches.get_flag(options::INODES),
         si: matches.get_flag(options::SI),
         threshold: matches
             .get_one::<String>(options::THRESHOLD)
@@ -712,14 +718,14 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         line_ending: LineEnding::from_zero_flag(matches.get_flag(options::NULL)),
     };
 
-    if options.inodes
+    if printing_options.inodes
         && (matches.get_flag(options::APPARENT_SIZE) || matches.get_flag(options::BYTES))
     {
         show_warning!("options --apparent-size and -b are ineffective with --inodes");
     }
 
     // Use separate thread to print output, so we can print finished results while computation is still running
-    let stat_printer = StatPrinter::new(options.clone(), summarize)?;
+    let stat_printer = StatPrinter::new(printing_options.clone(), summarize)?;
     let (print_tx, rx) = mpsc::channel::<UResult<StatPrintInfo>>();
     let printing_thread = thread::spawn(move || stat_printer.print_stats(&rx));
 
@@ -732,7 +738,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
             for pattern in &excludes {
                 if pattern.matches(&path_string) {
                     // if the directory is ignored, leave early
-                    if options.verbose {
+                    if traversal_options.verbose {
                         println!("{} ignored", path_string.quote());
                     }
                     continue 'loop_file;
@@ -741,14 +747,21 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         }
 
         // Check existence of path provided in argument
-        if let Ok(stat) = Stat::new(&path, &options) {
+        if let Ok(stat) = Stat::new(&path, &traversal_options) {
             // Kick off the computation of disk usage from the initial path
             let mut seen_inodes: HashSet<FileInfo> = HashSet::new();
             if let Some(inode) = stat.inode {
                 seen_inodes.insert(inode);
             }
-            let stat = du(stat, &options, 0, &mut seen_inodes, &excludes, &print_tx)
-                .map_err(|e| USimpleError::new(1, e.to_string()))?;
+            let stat = du(
+                stat,
+                &traversal_options,
+                0,
+                &mut seen_inodes,
+                &excludes,
+                &print_tx,
+            )
+            .map_err(|e| USimpleError::new(1, e.to_string()))?;
 
             print_tx
                 .send(Ok(StatPrintInfo { stat, depth: 0 }))
@@ -779,7 +792,7 @@ fn get_time_secs(time: Time, stat: &Stat) -> Result<u64, DuError> {
     match time {
         Time::Modified => Ok(stat.modified),
         Time::Accessed => Ok(stat.accessed),
-        Time::Created => stat.created.ok_or_else(|| DuError::InvalidTimeArg),
+        Time::Created => stat.created.ok_or(DuError::InvalidTimeArg),
     }
 }
 

From cc26e55af28baa6ab5571bd87f004bf431d56c22 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Thu, 7 Dec 2023 12:27:43 +0000
Subject: [PATCH 136/429] chore(deps): update rust crate once_cell to 1.19.0

---
 Cargo.lock | 4 ++--
 Cargo.toml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 5060da44116..e9fcf327652 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1409,9 +1409,9 @@ checksum = "830b246a0e5f20af87141b25c173cd1b609bd7779a4617d6ec582abaf90870f3"
 
 [[package]]
 name = "once_cell"
-version = "1.18.0"
+version = "1.19.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "dd8b5dd2ae5ed71462c540258bedcb51965123ad7e7ccf4b9a8cafaa4a63576d"
+checksum = "3fdb12b2476b595f9358c5161aa467c2438859caa136dec86c26fdd2efe17b92"
 
 [[package]]
 name = "onig"
diff --git a/Cargo.toml b/Cargo.toml
index 13b99700851..f88285a1f36 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -299,7 +299,7 @@ notify = { version = "=6.0.1", features = ["macos_kqueue"] }
 num-bigint = "0.4.4"
 num-traits = "0.2.17"
 number_prefix = "0.4"
-once_cell = "1.18.0"
+once_cell = "1.19.0"
 onig = { version = "~6.4", default-features = false }
 parse_datetime = "0.5.0"
 phf = "0.11.2"

From 054ca4a6b517cd86893a92362f152b7cde0071a1 Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Sun, 26 Nov 2023 17:01:22 -0500
Subject: [PATCH 137/429] wc: better handle files in pseudo-filesystems

---
 src/uu/wc/src/count_fast.rs | 26 +++++++++++++++++++++-----
 tests/by-util/test_wc.rs    |  8 ++++++++
 2 files changed, 29 insertions(+), 5 deletions(-)

diff --git a/src/uu/wc/src/count_fast.rs b/src/uu/wc/src/count_fast.rs
index 863625921bf..3872e60bf54 100644
--- a/src/uu/wc/src/count_fast.rs
+++ b/src/uu/wc/src/count_fast.rs
@@ -2,6 +2,8 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
+
+// cSpell:ignore sysconf
 use crate::word_count::WordCount;
 
 use super::WordCountable;
@@ -11,7 +13,7 @@ use std::fs::OpenOptions;
 use std::io::{self, ErrorKind, Read};
 
 #[cfg(unix)]
-use libc::S_IFREG;
+use libc::{sysconf, S_IFREG, _SC_PAGESIZE};
 #[cfg(unix)]
 use nix::sys::stat;
 #[cfg(any(target_os = "linux", target_os = "android"))]
@@ -87,11 +89,25 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
             // If stat.st_size = 0 then
             //  - either the size is 0
             //  - or the size is unknown.
-            // The second case happens for files in pseudo-filesystems. For
-            // example with /proc/version and /sys/kernel/profiling. So,
-            // if it is 0 we don't report that and instead do a full read.
+            // The second case happens for files in pseudo-filesystems.
+            // For example with /proc/version.
+            // So, if it is 0 we don't report that and instead do a full read.
+            //
+            // Another thing to consider for files in pseudo-filesystems like /proc, /sys
+            // and similar is that they could report `st_size` greater than actual content.
+            // For example /sys/kernel/profiling could report `st_size` equal to
+            // system page size (typically 4096 on 64bit system), while it's file content
+            // would count up only to a couple of bytes.
+            // This condition usually occurs for files in pseudo-filesystems like /proc, /sys
+            // that report `st_size` in the multiples of system page size.
+            // In such cases - fall back on full read
             if (stat.st_mode as libc::mode_t & S_IFREG) != 0 && stat.st_size > 0 {
-                return (stat.st_size as usize, None);
+                let sys_page_size = unsafe { sysconf(_SC_PAGESIZE) as usize };
+                if stat.st_size as usize % sys_page_size > 0 {
+                    // regular file or file from /proc, /sys and similar pseudo-filesystems
+                    // with size that is NOT a multiple of system page size
+                    return (stat.st_size as usize, None);
+                }
             }
             #[cfg(any(target_os = "linux", target_os = "android"))]
             {
diff --git a/tests/by-util/test_wc.rs b/tests/by-util/test_wc.rs
index 8358a542a23..c365b13b952 100644
--- a/tests/by-util/test_wc.rs
+++ b/tests/by-util/test_wc.rs
@@ -419,6 +419,14 @@ fn test_files_from_pseudo_filesystem() {
     use pretty_assertions::assert_ne;
     let result = new_ucmd!().arg("-c").arg("/proc/cpuinfo").succeeds();
     assert_ne!(result.stdout_str(), "0 /proc/cpuinfo\n");
+
+    let (at, mut ucmd) = at_and_ucmd!();
+    let result = ucmd.arg("-c").arg("/sys/kernel/profiling").succeeds();
+    let actual = at.read("/sys/kernel/profiling").len();
+    assert_eq!(
+        result.stdout_str(),
+        format!("{} /sys/kernel/profiling\n", actual)
+    );
 }
 
 #[test]

From 253926f2e2ae39613db744d3a5f0f15671c93b8a Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Fri, 1 Dec 2023 16:20:25 -0500
Subject: [PATCH 138/429] wc: unix input redirect

---
 src/uu/wc/src/count_fast.rs | 21 ++++++++++++++++++++-
 1 file changed, 20 insertions(+), 1 deletion(-)

diff --git a/src/uu/wc/src/count_fast.rs b/src/uu/wc/src/count_fast.rs
index 3872e60bf54..5fa1a978f38 100644
--- a/src/uu/wc/src/count_fast.rs
+++ b/src/uu/wc/src/count_fast.rs
@@ -101,7 +101,26 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
             // This condition usually occurs for files in pseudo-filesystems like /proc, /sys
             // that report `st_size` in the multiples of system page size.
             // In such cases - fall back on full read
-            if (stat.st_mode as libc::mode_t & S_IFREG) != 0 && stat.st_size > 0 {
+            //
+            // And finally a special case of input redirection in *nix shell:
+            // `( wc -c ; wc -c ) < file` should return
+            // ```
+            // size_of_file
+            // 0
+            // ```
+            // Similarly
+            // `( head -c1 ; wc -c ) < file` should return
+            // ```
+            // first_byte_of_file
+            // size_of_file - 1
+            // ```
+            // Since the input stream from file is treated as continuous across both commands inside ().
+            // In cases like this, due to `<` redirect, the `stat.st_mode` would report input as a regular file
+            // and `stat.st_size` would report the size of file on disk
+            // and NOT the remaining number of bytes in the input stream. The raw file descriptor
+            // in this situation would be equal to `0` for STDIN in both invocations.
+            // Therefore we cannot rely of `st_size` here and should fall back on full read.
+            if fd > 0 && (stat.st_mode as libc::mode_t & S_IFREG) != 0 && stat.st_size > 0 {
                 let sys_page_size = unsafe { sysconf(_SC_PAGESIZE) as usize };
                 if stat.st_size as usize % sys_page_size > 0 {
                     // regular file or file from /proc, /sys and similar pseudo-filesystems

From 6186153a0856eae9b631a82c3b9b05666405b953 Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Fri, 1 Dec 2023 19:19:42 -0500
Subject: [PATCH 139/429] wc: count_fast optimization using seek

---
 src/uu/wc/src/count_fast.rs | 8 ++++++--
 src/uu/wc/src/countable.rs  | 9 +++++++++
 2 files changed, 15 insertions(+), 2 deletions(-)

diff --git a/src/uu/wc/src/count_fast.rs b/src/uu/wc/src/count_fast.rs
index 5fa1a978f38..1eb1d912724 100644
--- a/src/uu/wc/src/count_fast.rs
+++ b/src/uu/wc/src/count_fast.rs
@@ -10,7 +10,7 @@ use super::WordCountable;
 
 #[cfg(any(target_os = "linux", target_os = "android"))]
 use std::fs::OpenOptions;
-use std::io::{self, ErrorKind, Read};
+use std::io::{self, ErrorKind, Read, Seek, SeekFrom};
 
 #[cfg(unix)]
 use libc::{sysconf, S_IFREG, _SC_PAGESIZE};
@@ -100,7 +100,7 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
             // would count up only to a couple of bytes.
             // This condition usually occurs for files in pseudo-filesystems like /proc, /sys
             // that report `st_size` in the multiples of system page size.
-            // In such cases - fall back on full read
+            // In such cases - attempt `seek()` for the end of file
             //
             // And finally a special case of input redirection in *nix shell:
             // `( wc -c ; wc -c ) < file` should return
@@ -126,6 +126,10 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
                     // regular file or file from /proc, /sys and similar pseudo-filesystems
                     // with size that is NOT a multiple of system page size
                     return (stat.st_size as usize, None);
+                } else if let Some(file) = handle.inner_file() {
+                    if let Ok(n) = file.seek(SeekFrom::End(0)) {
+                        return (n as usize, None);
+                    }
                 }
             }
             #[cfg(any(target_os = "linux", target_os = "android"))]
diff --git a/src/uu/wc/src/countable.rs b/src/uu/wc/src/countable.rs
index 64397446491..d27c7fb5968 100644
--- a/src/uu/wc/src/countable.rs
+++ b/src/uu/wc/src/countable.rs
@@ -17,12 +17,14 @@ use std::os::unix::io::AsRawFd;
 pub trait WordCountable: AsRawFd + Read {
     type Buffered: BufRead;
     fn buffered(self) -> Self::Buffered;
+    fn inner_file(&mut self) -> Option<&mut File>;
 }
 
 #[cfg(not(unix))]
 pub trait WordCountable: Read {
     type Buffered: BufRead;
     fn buffered(self) -> Self::Buffered;
+    fn inner_file(&mut self) -> Option<&mut File>;
 }
 
 impl WordCountable for StdinLock<'_> {
@@ -31,6 +33,9 @@ impl WordCountable for StdinLock<'_> {
     fn buffered(self) -> Self::Buffered {
         self
     }
+    fn inner_file(&mut self) -> Option<&mut File> {
+        None
+    }
 }
 
 impl WordCountable for File {
@@ -39,4 +44,8 @@ impl WordCountable for File {
     fn buffered(self) -> Self::Buffered {
         BufReader::new(self)
     }
+
+    fn inner_file(&mut self) -> Option<&mut File> {
+        Some(self)
+    }
 }

From 85e78376fe932e168b6a891b829d55394330014b Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Fri, 1 Dec 2023 20:18:15 -0500
Subject: [PATCH 140/429] wc: count_fast seek optimization

---
 src/uu/wc/src/count_fast.rs | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/src/uu/wc/src/count_fast.rs b/src/uu/wc/src/count_fast.rs
index 1eb1d912724..1d3102f9975 100644
--- a/src/uu/wc/src/count_fast.rs
+++ b/src/uu/wc/src/count_fast.rs
@@ -100,7 +100,8 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
             // would count up only to a couple of bytes.
             // This condition usually occurs for files in pseudo-filesystems like /proc, /sys
             // that report `st_size` in the multiples of system page size.
-            // In such cases - attempt `seek()` for the end of file
+            // In such cases - attempt `seek()` almost to the end of the file
+            // and then fall back on read to count the rest.
             //
             // And finally a special case of input redirection in *nix shell:
             // `( wc -c ; wc -c ) < file` should return
@@ -127,8 +128,9 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
                     // with size that is NOT a multiple of system page size
                     return (stat.st_size as usize, None);
                 } else if let Some(file) = handle.inner_file() {
-                    if let Ok(n) = file.seek(SeekFrom::End(0)) {
-                        return (n as usize, None);
+                    let offset = stat.st_size - stat.st_size % (stat.st_blksize as i64 + 1);
+                    if let Ok(n) = file.seek(SeekFrom::Start(offset as u64)) {
+                        byte_count = n as usize;
                     }
                 }
             }

From 9c4d88009d1990fc52126eee43155310a104c9c3 Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Fri, 1 Dec 2023 20:49:49 -0500
Subject: [PATCH 141/429] wc: clippy

---
 src/uu/wc/src/count_fast.rs | 9 ++++++++-
 1 file changed, 8 insertions(+), 1 deletion(-)

diff --git a/src/uu/wc/src/count_fast.rs b/src/uu/wc/src/count_fast.rs
index 1d3102f9975..0d93967400d 100644
--- a/src/uu/wc/src/count_fast.rs
+++ b/src/uu/wc/src/count_fast.rs
@@ -10,12 +10,14 @@ use super::WordCountable;
 
 #[cfg(any(target_os = "linux", target_os = "android"))]
 use std::fs::OpenOptions;
-use std::io::{self, ErrorKind, Read, Seek, SeekFrom};
+use std::io::{self, ErrorKind, Read};
 
 #[cfg(unix)]
 use libc::{sysconf, S_IFREG, _SC_PAGESIZE};
 #[cfg(unix)]
 use nix::sys::stat;
+#[cfg(unix)]
+use std::io::{Seek, SeekFrom};
 #[cfg(any(target_os = "linux", target_os = "android"))]
 use std::os::unix::io::AsRawFd;
 
@@ -128,7 +130,12 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
                     // with size that is NOT a multiple of system page size
                     return (stat.st_size as usize, None);
                 } else if let Some(file) = handle.inner_file() {
+                    // On some platforms `stat.st_blksize` is of i32 type,
+                    // i.e. MacOS on Apple Silicon (aarch64-apple-darwin),
+                    // as well as Debian Linux on ARM (aarch64-unknown-linux-gnu)
+                    #[allow(clippy::unnecessary_cast)]
                     let offset = stat.st_size - stat.st_size % (stat.st_blksize as i64 + 1);
+
                     if let Ok(n) = file.seek(SeekFrom::Start(offset as u64)) {
                         byte_count = n as usize;
                     }

From 9ff7b42d832fdc21ef20b02608e9623a4be50f8d Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Fri, 1 Dec 2023 21:00:39 -0500
Subject: [PATCH 142/429] wc: stat casting

---
 src/uu/wc/src/count_fast.rs | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/src/uu/wc/src/count_fast.rs b/src/uu/wc/src/count_fast.rs
index 0d93967400d..09b48b21e72 100644
--- a/src/uu/wc/src/count_fast.rs
+++ b/src/uu/wc/src/count_fast.rs
@@ -130,11 +130,12 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
                     // with size that is NOT a multiple of system page size
                     return (stat.st_size as usize, None);
                 } else if let Some(file) = handle.inner_file() {
-                    // On some platforms `stat.st_blksize` is of i32 type,
+                    // On some platforms `stat.st_blksize` and/or `st.st_size` is of i32 type,
                     // i.e. MacOS on Apple Silicon (aarch64-apple-darwin),
-                    // as well as Debian Linux on ARM (aarch64-unknown-linux-gnu)
+                    // as well as Debian Linux on ARM (aarch64-unknown-linux-gnu), etc.
                     #[allow(clippy::unnecessary_cast)]
-                    let offset = stat.st_size - stat.st_size % (stat.st_blksize as i64 + 1);
+                    let offset =
+                        stat.st_size as i64 - stat.st_size as i64 % (stat.st_blksize as i64 + 1);
 
                     if let Ok(n) = file.seek(SeekFrom::Start(offset as u64)) {
                         byte_count = n as usize;

From 54ac5a7e1ac804bc57496faf31877da82d5b4be4 Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Sat, 2 Dec 2023 16:06:19 -0500
Subject: [PATCH 143/429] wc: count_fast windows optimization

---
 src/uu/wc/src/count_fast.rs | 31 +++++++++++++++++++++++++++++--
 1 file changed, 29 insertions(+), 2 deletions(-)

diff --git a/src/uu/wc/src/count_fast.rs b/src/uu/wc/src/count_fast.rs
index 09b48b21e72..59bde31c331 100644
--- a/src/uu/wc/src/count_fast.rs
+++ b/src/uu/wc/src/count_fast.rs
@@ -20,6 +20,12 @@ use nix::sys::stat;
 use std::io::{Seek, SeekFrom};
 #[cfg(any(target_os = "linux", target_os = "android"))]
 use std::os::unix::io::AsRawFd;
+#[cfg(windows)]
+use std::os::windows::fs::MetadataExt;
+#[cfg(windows)]
+const FILE_ATTRIBUTE_ARCHIVE: u32 = 32;
+#[cfg(windows)]
+const FILE_ATTRIBUTE_NORMAL: u32 = 128;
 
 #[cfg(any(target_os = "linux", target_os = "android"))]
 use libc::S_IFIFO;
@@ -76,6 +82,8 @@ fn count_bytes_using_splice(fd: &impl AsRawFd) -> Result<usize, usize> {
 ///   1. On Unix,  we can simply `stat` the file if it is regular.
 ///   2. On Linux -- if the above did not work -- we can use splice to count
 ///      the number of bytes if the file is a FIFO.
+///   3. On Windows we can use `std::os::windows::fs::MetadataExt` to get file size
+///      for regular files
 ///   3. Otherwise, we just read normally, but without the overhead of counting
 ///      other things such as lines and words.
 #[inline]
@@ -130,9 +138,12 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
                     // with size that is NOT a multiple of system page size
                     return (stat.st_size as usize, None);
                 } else if let Some(file) = handle.inner_file() {
-                    // On some platforms `stat.st_blksize` and/or `st.st_size` is of i32 type,
+                    // On some platforms `stat.st_blksize` and `st.st_size`
+                    // are of different types: i64 vs i32
                     // i.e. MacOS on Apple Silicon (aarch64-apple-darwin),
-                    // as well as Debian Linux on ARM (aarch64-unknown-linux-gnu), etc.
+                    // Debian Linux on ARM (aarch64-unknown-linux-gnu),
+                    // 32bit i686 targets, etc.
+                    // While on the others they are of the same type.
                     #[allow(clippy::unnecessary_cast)]
                     let offset =
                         stat.st_size as i64 - stat.st_size as i64 % (stat.st_blksize as i64 + 1);
@@ -156,6 +167,22 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
         }
     }
 
+    #[cfg(windows)]
+    {
+        if let Some(file) = handle.inner_file() {
+            if let Ok(metadata) = file.metadata() {
+                let attributes = metadata.file_attributes();
+                let size = metadata.file_size();
+
+                if (attributes & FILE_ATTRIBUTE_ARCHIVE) != 0
+                    || (attributes & FILE_ATTRIBUTE_NORMAL) != 0
+                {
+                    return (size as usize, None);
+                }
+            }
+        }
+    }
+
     // Fall back on `read`, but without the overhead of counting words and lines.
     let mut buf = [0_u8; BUF_SIZE];
     loop {

From b7f708b23326d4914b84b0e363cdff35a3ab4507 Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Sat, 2 Dec 2023 16:50:30 -0500
Subject: [PATCH 144/429] wc: comments

---
 src/uu/wc/src/count_fast.rs | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/src/uu/wc/src/count_fast.rs b/src/uu/wc/src/count_fast.rs
index 59bde31c331..d7875933d17 100644
--- a/src/uu/wc/src/count_fast.rs
+++ b/src/uu/wc/src/count_fast.rs
@@ -128,8 +128,9 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
             // Since the input stream from file is treated as continuous across both commands inside ().
             // In cases like this, due to `<` redirect, the `stat.st_mode` would report input as a regular file
             // and `stat.st_size` would report the size of file on disk
-            // and NOT the remaining number of bytes in the input stream. The raw file descriptor
-            // in this situation would be equal to `0` for STDIN in both invocations.
+            // and NOT the remaining number of bytes in the input stream. 
+            // However, the raw file descriptor in this situation would be equal to `0` 
+            // for STDIN in both invocations.
             // Therefore we cannot rely of `st_size` here and should fall back on full read.
             if fd > 0 && (stat.st_mode as libc::mode_t & S_IFREG) != 0 && stat.st_size > 0 {
                 let sys_page_size = unsafe { sysconf(_SC_PAGESIZE) as usize };
@@ -138,7 +139,7 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
                     // with size that is NOT a multiple of system page size
                     return (stat.st_size as usize, None);
                 } else if let Some(file) = handle.inner_file() {
-                    // On some platforms `stat.st_blksize` and `st.st_size`
+                    // On some platforms `stat.st_blksize` and `stat.st_size`
                     // are of different types: i64 vs i32
                     // i.e. MacOS on Apple Silicon (aarch64-apple-darwin),
                     // Debian Linux on ARM (aarch64-unknown-linux-gnu),

From a97b574fec16ad40d5f3ffc97b9e256d83c36718 Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Sat, 2 Dec 2023 16:52:04 -0500
Subject: [PATCH 145/429] wc: comments

---
 src/uu/wc/src/count_fast.rs | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/uu/wc/src/count_fast.rs b/src/uu/wc/src/count_fast.rs
index d7875933d17..487893b9f43 100644
--- a/src/uu/wc/src/count_fast.rs
+++ b/src/uu/wc/src/count_fast.rs
@@ -128,8 +128,8 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
             // Since the input stream from file is treated as continuous across both commands inside ().
             // In cases like this, due to `<` redirect, the `stat.st_mode` would report input as a regular file
             // and `stat.st_size` would report the size of file on disk
-            // and NOT the remaining number of bytes in the input stream. 
-            // However, the raw file descriptor in this situation would be equal to `0` 
+            // and NOT the remaining number of bytes in the input stream.
+            // However, the raw file descriptor in this situation would be equal to `0`
             // for STDIN in both invocations.
             // Therefore we cannot rely of `st_size` here and should fall back on full read.
             if fd > 0 && (stat.st_mode as libc::mode_t & S_IFREG) != 0 && stat.st_size > 0 {

From 967c539cc6ccd08fda8b6d1de0d49f45b4311f0d Mon Sep 17 00:00:00 2001
From: zhitkoff <zhitkoff@gmail.com>
Date: Sun, 3 Dec 2023 16:00:18 -0500
Subject: [PATCH 146/429] wc: more tests

---
 tests/by-util/test_wc.rs | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/tests/by-util/test_wc.rs b/tests/by-util/test_wc.rs
index c365b13b952..9c55bd3bca5 100644
--- a/tests/by-util/test_wc.rs
+++ b/tests/by-util/test_wc.rs
@@ -243,6 +243,14 @@ fn test_single_only_lines() {
         .stdout_is("18 moby_dick.txt\n");
 }
 
+#[test]
+fn test_single_only_bytes() {
+    new_ucmd!()
+        .args(&["-c", "lorem_ipsum.txt"])
+        .run()
+        .stdout_is("772 lorem_ipsum.txt\n");
+}
+
 #[test]
 fn test_single_all_counts() {
     new_ucmd!()

From 0076c9f64c37aad2033867487462beb342cf1e13 Mon Sep 17 00:00:00 2001
From: Yury Zhytkou <54360928+zhitkoff@users.noreply.github.com>
Date: Thu, 7 Dec 2023 12:13:34 -0500
Subject: [PATCH 147/429] Update src/uu/wc/src/count_fast.rs

Co-authored-by: Sylvestre Ledru <sledru@mozilla.com>
---
 src/uu/wc/src/count_fast.rs | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/src/uu/wc/src/count_fast.rs b/src/uu/wc/src/count_fast.rs
index 487893b9f43..85d3d1d2b36 100644
--- a/src/uu/wc/src/count_fast.rs
+++ b/src/uu/wc/src/count_fast.rs
@@ -173,12 +173,11 @@ pub(crate) fn count_bytes_fast<T: WordCountable>(handle: &mut T) -> (usize, Opti
         if let Some(file) = handle.inner_file() {
             if let Ok(metadata) = file.metadata() {
                 let attributes = metadata.file_attributes();
-                let size = metadata.file_size();
 
                 if (attributes & FILE_ATTRIBUTE_ARCHIVE) != 0
                     || (attributes & FILE_ATTRIBUTE_NORMAL) != 0
                 {
-                    return (size as usize, None);
+                    return (metadata.file_size() as usize, None);
                 }
             }
         }

From 7861559f880e6fff3576bf4ac00afbf0d5489807 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Thu, 7 Dec 2023 11:58:11 +0100
Subject: [PATCH 148/429] du: put excludes in traversaloptions and make
 size_format enum

---
 src/uu/du/src/du.rs | 223 +++++++++++++++++---------------------------
 1 file changed, 86 insertions(+), 137 deletions(-)

diff --git a/src/uu/du/src/du.rs b/src/uu/du/src/du.rs
index 14c7fe5d4b3..7114ccc2668 100644
--- a/src/uu/du/src/du.rs
+++ b/src/uu/du/src/du.rs
@@ -83,25 +83,20 @@ struct TraversalOptions {
     dereference: Deref,
     count_links: bool,
     verbose: bool,
+    excludes: Vec<Pattern>,
 }
 
-#[derive(Clone)]
-struct PrintingOptions {
+struct StatPrinter {
     total: bool,
     inodes: bool,
     max_depth: Option<usize>,
     threshold: Option<Threshold>,
     apparent_size: bool,
-    // TODO: the size conversion fields should be unified
-    si: bool,
-    bytes: bool,
-    human_readable: bool,
-    block_size_1k: bool,
-    block_size_1m: bool,
-    block_size: u64,
+    size_format: SizeFormat,
     time: Option<Time>,
     time_format: String,
     line_ending: LineEnding,
+    summarize: bool,
 }
 
 #[derive(PartialEq, Clone)]
@@ -118,6 +113,12 @@ enum Time {
     Created,
 }
 
+#[derive(Clone)]
+enum SizeFormat {
+    Human(u64),
+    BlockSize(u64),
+}
+
 #[derive(PartialEq, Eq, Hash, Clone, Copy)]
 struct FileInfo {
     file_id: u128,
@@ -295,18 +296,6 @@ fn read_block_size(s: Option<&str>) -> UResult<u64> {
     }
 }
 
-fn choose_size(options: &PrintingOptions, stat: &Stat) -> u64 {
-    if options.inodes {
-        stat.inodes
-    } else if options.apparent_size || options.bytes {
-        stat.size
-    } else {
-        // The st_blocks field indicates the number of blocks allocated to the file, 512-byte units.
-        // See: http://linux.die.net/man/2/stat
-        stat.blocks * 512
-    }
-}
-
 // this takes `my_stat` to avoid having to stat files multiple times.
 #[allow(clippy::cognitive_complexity)]
 fn du(
@@ -314,7 +303,6 @@ fn du(
     options: &TraversalOptions,
     depth: usize,
     seen_inodes: &mut HashSet<FileInfo>,
-    exclude: &[Pattern],
     print_tx: &mpsc::Sender<UResult<StatPrintInfo>>,
 ) -> Result<Stat, Box<mpsc::SendError<UResult<StatPrintInfo>>>> {
     if my_stat.is_dir {
@@ -334,7 +322,7 @@ fn du(
                     match Stat::new(&entry.path(), options) {
                         Ok(this_stat) => {
                             // We have an exclude list
-                            for pattern in exclude {
+                            for pattern in &options.excludes {
                                 // Look at all patterns with both short and long paths
                                 // if we have 'du foo' but search to exclude 'foo/bar'
                                 // we need the full path
@@ -370,14 +358,8 @@ fn du(
                                     }
                                 }
 
-                                let this_stat = du(
-                                    this_stat,
-                                    options,
-                                    depth + 1,
-                                    seen_inodes,
-                                    exclude,
-                                    print_tx,
-                                )?;
+                                let this_stat =
+                                    du(this_stat, options, depth + 1, seen_inodes, print_tx)?;
 
                                 if !options.separate_dirs {
                                     my_stat.size += this_stat.size;
@@ -413,52 +395,6 @@ fn du(
     Ok(my_stat)
 }
 
-fn convert_size_human(size: u64, multiplier: u64, _block_size: u64) -> String {
-    for &(unit, power) in &UNITS {
-        let limit = multiplier.pow(power);
-        if size >= limit {
-            return format!("{:.1}{}", (size as f64) / (limit as f64), unit);
-        }
-    }
-    if size == 0 {
-        return "0".to_string();
-    }
-    format!("{size}B")
-}
-
-fn convert_size_b(size: u64, _multiplier: u64, _block_size: u64) -> String {
-    format!("{}", ((size as f64) / (1_f64)).ceil())
-}
-
-fn convert_size_k(size: u64, multiplier: u64, _block_size: u64) -> String {
-    format!("{}", ((size as f64) / (multiplier as f64)).ceil())
-}
-
-fn convert_size_m(size: u64, multiplier: u64, _block_size: u64) -> String {
-    format!(
-        "{}",
-        ((size as f64) / ((multiplier * multiplier) as f64)).ceil()
-    )
-}
-
-fn convert_size_other(size: u64, _multiplier: u64, block_size: u64) -> String {
-    format!("{}", ((size as f64) / (block_size as f64)).ceil())
-}
-
-fn get_convert_size_fn(options: &PrintingOptions) -> Box<dyn Fn(u64, u64, u64) -> String + Send> {
-    if options.human_readable || options.si {
-        Box::new(convert_size_human)
-    } else if options.bytes {
-        Box::new(convert_size_b)
-    } else if options.block_size_1k {
-        Box::new(convert_size_k)
-    } else if options.block_size_1m {
-        Box::new(convert_size_m)
-    } else {
-        Box::new(convert_size_other)
-    }
-}
-
 #[derive(Debug)]
 enum DuError {
     InvalidMaxDepthArg(String),
@@ -554,29 +490,17 @@ struct StatPrintInfo {
     depth: usize,
 }
 
-struct StatPrinter {
-    summarize: bool,
-    options: PrintingOptions,
-    convert_size: Box<dyn Fn(u64) -> String + Send>,
-}
-
 impl StatPrinter {
-    fn new(options: PrintingOptions, summarize: bool) -> UResult<Self> {
-        let multiplier: u64 = if options.si { 1000 } else { 1024 };
-
-        let convert_size_fn = get_convert_size_fn(&options);
-
-        let convert_size: Box<dyn Fn(u64) -> String + Send> = if options.inodes {
-            Box::new(|size: u64| size.to_string())
+    fn choose_size(&self, stat: &Stat) -> u64 {
+        if self.inodes {
+            stat.inodes
+        } else if self.apparent_size {
+            stat.size
         } else {
-            Box::new(move |size: u64| convert_size_fn(size, multiplier, options.block_size))
-        };
-
-        Ok(Self {
-            summarize,
-            options,
-            convert_size,
-        })
+            // The st_blocks field indicates the number of blocks allocated to the file, 512-byte units.
+            // See: http://linux.die.net/man/2/stat
+            stat.blocks * 512
+        }
     }
 
     fn print_stats(&self, rx: &mpsc::Receiver<UResult<StatPrintInfo>>) -> UResult<()> {
@@ -587,18 +511,16 @@ impl StatPrinter {
             match received {
                 Ok(message) => match message {
                     Ok(stat_info) => {
-                        let size = choose_size(&self.options, &stat_info.stat);
+                        let size = self.choose_size(&stat_info.stat);
 
                         if stat_info.depth == 0 {
                             grand_total += size;
                         }
 
                         if !self
-                            .options
                             .threshold
                             .map_or(false, |threshold| threshold.should_exclude(size))
                             && self
-                                .options
                                 .max_depth
                                 .map_or(true, |max_depth| stat_info.depth <= max_depth)
                             && (!self.summarize || stat_info.depth == 0)
@@ -612,31 +534,59 @@ impl StatPrinter {
             }
         }
 
-        if self.options.total {
-            print!("{}\ttotal", (self.convert_size)(grand_total));
-            print!("{}", self.options.line_ending);
+        if self.total {
+            print!("{}\ttotal", self.convert_size(grand_total));
+            print!("{}", self.line_ending);
         }
 
         Ok(())
     }
 
+    fn convert_size(&self, size: u64) -> String {
+        if self.inodes {
+            return size.to_string();
+        }
+        match self.size_format {
+            SizeFormat::Human(multiplier) => {
+                if size == 0 {
+                    return "0".to_string();
+                }
+                for &(unit, power) in &UNITS {
+                    let limit = multiplier.pow(power);
+                    if size >= limit {
+                        return format!("{:.1}{}", (size as f64) / (limit as f64), unit);
+                    }
+                }
+                format!("{size}B")
+            }
+            SizeFormat::BlockSize(block_size) => div_ceil(size, block_size).to_string(),
+        }
+    }
+
     fn print_stat(&self, stat: &Stat, size: u64) -> UResult<()> {
-        if let Some(time) = self.options.time {
+        if let Some(time) = self.time {
             let secs = get_time_secs(time, stat)?;
             let tm = DateTime::<Local>::from(UNIX_EPOCH + Duration::from_secs(secs));
-            let time_str = tm.format(&self.options.time_format).to_string();
-            print!("{}\t{}\t", (self.convert_size)(size), time_str);
+            let time_str = tm.format(&self.time_format).to_string();
+            print!("{}\t{}\t", self.convert_size(size), time_str);
         } else {
-            print!("{}\t", (self.convert_size)(size));
+            print!("{}\t", self.convert_size(size));
         }
 
         print_verbatim(&stat.path).unwrap();
-        print!("{}", self.options.line_ending);
+        print!("{}", self.line_ending);
 
         Ok(())
     }
 }
 
+// This can be replaced with u64::div_ceil once it is stabilized.
+// This implementation approach is optimized for when `b` is a constant,
+// particularly a power of two.
+pub fn div_ceil(a: u64, b: u64) -> u64 {
+    (a + b - 1) / b
+}
+
 #[uucore::main]
 #[allow(clippy::cognitive_complexity)]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
@@ -671,11 +621,23 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         }
     });
 
-    let block_size = read_block_size(
-        matches
-            .get_one::<String>(options::BLOCK_SIZE)
-            .map(|s| s.as_str()),
-    )?;
+    let size_format = if matches.get_flag(options::HUMAN_READABLE) {
+        SizeFormat::Human(1024)
+    } else if matches.get_flag(options::SI) {
+        SizeFormat::Human(1000)
+    } else if matches.get_flag(options::BYTES) {
+        SizeFormat::BlockSize(1)
+    } else if matches.get_flag(options::BLOCK_SIZE_1K) {
+        SizeFormat::BlockSize(1024)
+    } else if matches.get_flag(options::BLOCK_SIZE_1M) {
+        SizeFormat::BlockSize(1024 * 1024)
+    } else {
+        SizeFormat::BlockSize(read_block_size(
+            matches
+                .get_one::<String>(options::BLOCK_SIZE)
+                .map(AsRef::as_ref),
+        )?)
+    };
 
     let traversal_options = TraversalOptions {
         all: matches.get_flag(options::ALL),
@@ -691,13 +653,15 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         },
         count_links: matches.get_flag(options::COUNT_LINKS),
         verbose: matches.get_flag(options::VERBOSE),
+        excludes: build_exclude_patterns(&matches)?,
     };
 
-    let printing_options = PrintingOptions {
+    let stat_printer = StatPrinter {
         max_depth,
+        size_format,
+        summarize,
         total: matches.get_flag(options::TOTAL),
         inodes: matches.get_flag(options::INODES),
-        si: matches.get_flag(options::SI),
         threshold: matches
             .get_one::<String>(options::THRESHOLD)
             .map(|s| {
@@ -706,36 +670,28 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
                 })
             })
             .transpose()?,
-        apparent_size: matches.get_flag(options::APPARENT_SIZE),
-        bytes: matches.get_flag(options::BYTES),
+        apparent_size: matches.get_flag(options::APPARENT_SIZE) || matches.get_flag(options::BYTES),
         time,
-        block_size,
-        human_readable: matches.get_flag(options::HUMAN_READABLE),
-        block_size_1k: matches.get_flag(options::BLOCK_SIZE_1K),
-        block_size_1m: matches.get_flag(options::BLOCK_SIZE_1M),
         time_format: parse_time_style(matches.get_one::<String>("time-style").map(|s| s.as_str()))?
             .to_string(),
         line_ending: LineEnding::from_zero_flag(matches.get_flag(options::NULL)),
     };
 
-    if printing_options.inodes
+    if stat_printer.inodes
         && (matches.get_flag(options::APPARENT_SIZE) || matches.get_flag(options::BYTES))
     {
         show_warning!("options --apparent-size and -b are ineffective with --inodes");
     }
 
     // Use separate thread to print output, so we can print finished results while computation is still running
-    let stat_printer = StatPrinter::new(printing_options.clone(), summarize)?;
     let (print_tx, rx) = mpsc::channel::<UResult<StatPrintInfo>>();
     let printing_thread = thread::spawn(move || stat_printer.print_stats(&rx));
 
-    let excludes = build_exclude_patterns(&matches)?;
-
     'loop_file: for path in files {
         // Skip if we don't want to ignore anything
-        if !&excludes.is_empty() {
+        if !&traversal_options.excludes.is_empty() {
             let path_string = path.to_string_lossy();
-            for pattern in &excludes {
+            for pattern in &traversal_options.excludes {
                 if pattern.matches(&path_string) {
                     // if the directory is ignored, leave early
                     if traversal_options.verbose {
@@ -753,15 +709,8 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
             if let Some(inode) = stat.inode {
                 seen_inodes.insert(inode);
             }
-            let stat = du(
-                stat,
-                &traversal_options,
-                0,
-                &mut seen_inodes,
-                &excludes,
-                &print_tx,
-            )
-            .map_err(|e| USimpleError::new(1, e.to_string()))?;
+            let stat = du(stat, &traversal_options, 0, &mut seen_inodes, &print_tx)
+                .map_err(|e| USimpleError::new(1, e.to_string()))?;
 
             print_tx
                 .send(Ok(StatPrintInfo { stat, depth: 0 }))

From c111dc88ac914b0f542501e014f0aa82e3570709 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 8 Dec 2023 10:23:15 +0100
Subject: [PATCH 149/429] du: fix issue with dereference in test

---
 tests/by-util/test_du.rs | 19 +++++++++++++------
 1 file changed, 13 insertions(+), 6 deletions(-)

diff --git a/tests/by-util/test_du.rs b/tests/by-util/test_du.rs
index 10f32caf52e..cb1341432a0 100644
--- a/tests/by-util/test_du.rs
+++ b/tests/by-util/test_du.rs
@@ -365,12 +365,19 @@ fn test_du_no_dereference() {
             .stdout_does_not_contain(symlink);
 
         // ensure dereference "wins"
-        ts.ucmd()
-            .arg(arg)
-            .arg("--dereference")
-            .succeeds()
-            .stdout_contains(symlink)
-            .stdout_does_not_contain(dir);
+        let result = ts.ucmd().arg(arg).arg("--dereference").succeeds();
+
+        #[cfg(target_os = "linux")]
+        {
+            let result_reference = unwrap_or_return!(expected_result(&ts, &[arg, "--dereference"]));
+
+            if result_reference.succeeded() {
+                assert_eq!(result.stdout_str(), result_reference.stdout_str());
+            }
+        }
+
+        #[cfg(not(target_os = "linux"))]
+        result.stdout_contains(symlink).stdout_does_not_contain(dir);
     }
 }
 

From e9dc2930ee8260b3c3f7863ade3426239eb0332f Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 8 Dec 2023 15:10:48 +0100
Subject: [PATCH 150/429] ls: handle invalid block size as GNU does

---
 src/uu/ls/src/ls.rs      |  9 ++++-----
 tests/by-util/test_ls.rs | 10 ++++++++++
 2 files changed, 14 insertions(+), 5 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index deb8aac3dfe..074210576b0 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -182,7 +182,7 @@ impl UError for LsError {
             Self::IOError(_) => 1,
             Self::IOErrorContext(_, _, false) => 1,
             Self::IOErrorContext(_, _, true) => 2,
-            Self::BlockSizeParseError(_) => 1,
+            Self::BlockSizeParseError(_) => 2,
             Self::ConflictingArgumentDired => 1,
             Self::DiredAndZeroAreIncompatible => 2,
             Self::AlreadyListedError(_) => 2,
@@ -806,10 +806,9 @@ impl Config {
             match parse_size_u64(&raw_block_size.to_string_lossy()) {
                 Ok(size) => Some(size),
                 Err(_) => {
-                    show!(LsError::BlockSizeParseError(
-                        opt_block_size.unwrap().clone()
-                    ));
-                    None
+                    return Err(Box::new(LsError::BlockSizeParseError(
+                        opt_block_size.unwrap().clone(),
+                    )));
                 }
             }
         } else if env_var_posixly_correct.is_some() {
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 8bc2b75ac77..887f90e0f5a 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -3856,6 +3856,16 @@ fn test_posixly_correct() {
         .stdout_contains_line("total 8");
 }
 
+#[test]
+fn test_ls_invalid_block_size() {
+    new_ucmd!()
+        .arg("--block-size=invalid")
+        .fails()
+        .code_is(2)
+        .no_stdout()
+        .stderr_is("ls: invalid --block-size argument 'invalid'\n");
+}
+
 #[test]
 fn test_ls_hyperlink() {
     let scene = TestScenario::new(util_name!());

From b676216f9b54f2fc38ad07bc6019417e306dd60d Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 30 Nov 2023 11:04:14 +0100
Subject: [PATCH 151/429] ls: use the gnu_legacy feature from lscolors

---
 Cargo.toml               |  1 +
 src/uu/ls/Cargo.toml     |  2 +-
 src/uu/ls/src/ls.rs      |  6 ++-
 tests/by-util/test_ls.rs | 88 ++++++++++++++++++++++++----------------
 4 files changed, 60 insertions(+), 37 deletions(-)

diff --git a/Cargo.toml b/Cargo.toml
index f88285a1f36..abc3f26b0ab 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -290,6 +290,7 @@ itertools = "0.12.0"
 libc = "0.2.150"
 lscolors = { version = "0.16.0", default-features = false, features = [
   "nu-ansi-term",
+  "gnu_legacy",
 ] }
 memchr = "2"
 memmap2 = "0.9"
diff --git a/src/uu/ls/Cargo.toml b/src/uu/ls/Cargo.toml
index a82a1f37e07..56b642a1a43 100644
--- a/src/uu/ls/Cargo.toml
+++ b/src/uu/ls/Cargo.toml
@@ -22,7 +22,7 @@ number_prefix = { workspace = true }
 uutils_term_grid = { workspace = true }
 terminal_size = { workspace = true }
 glob = { workspace = true }
-lscolors = { workspace = true }
+lscolors = { workspace = true, features = ["gnu_legacy"] }
 uucore = { workspace = true, features = [
   "entries",
   "fs",
diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index deb8aac3dfe..d93620967d1 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3140,7 +3140,11 @@ fn display_file_name(
 fn color_name(name: String, path: &Path, md: Option<&Metadata>, ls_colors: &LsColors) -> String {
     match ls_colors.style_for_path_with_metadata(path, md) {
         Some(style) => {
-            return style.to_nu_ansi_term_style().paint(name).to_string();
+            return style
+                .to_nu_ansi_term_style()
+                .reset_before_style()
+                .paint(name)
+                .to_string();
         }
         None => name,
     }
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 8bc2b75ac77..5061778aed3 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -2,7 +2,7 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
-// spell-checker:ignore (words) READMECAREFULLY birthtime doesntexist oneline somebackup lrwx somefile somegroup somehiddenbackup somehiddenfile tabsize aaaaaaaa bbbb cccc dddddddd ncccc neee naaaaa nbcdef nfffff dired subdired tmpfs
+// spell-checker:ignore (words) READMECAREFULLY birthtime doesntexist oneline somebackup lrwx somefile somegroup somehiddenbackup somehiddenfile tabsize aaaaaaaa bbbb cccc dddddddd ncccc neee naaaaa nbcdef nfffff dired subdired tmpfs mdir1
 
 #[cfg(any(unix, feature = "feat_selinux"))]
 use crate::common::util::expected_result;
@@ -864,11 +864,11 @@ fn test_ls_zero() {
         .succeeds()
         .stdout_only("\"0-test-zero\"\x00\"2-test-zero\"\x00\"3-test-zero\"\x00");
 
-    scene
-        .ucmd()
-        .args(&["--zero", "--color=always"])
-        .succeeds()
-        .stdout_only("\x1b[1;34m0-test-zero\x1b[0m\x002-test-zero\x003-test-zero\x00");
+    let result = scene.ucmd().args(&["--zero", "--color=always"]).succeeds();
+    assert_eq!(
+        result.stdout_str(),
+        "\u{1b}[0m\u{1b}[01;34m0-test-zero\x1b[0m\x002-test-zero\x003-test-zero\x00"
+    );
 
     scene
         .ucmd()
@@ -921,12 +921,9 @@ fn test_ls_zero() {
                 "\"0-test-zero\"\x00\"1\\ntest-zero\"\x00\"2-test-zero\"\x00\"3-test-zero\"\x00",
             );
 
-        scene
-            .ucmd()
-            .args(&["--zero", "--color=always"])
-            .succeeds()
-            .stdout_only(
-                "\x1b[1;34m0-test-zero\x1b[0m\x001\ntest-zero\x002-test-zero\x003-test-zero\x00",
+        let result = scene.ucmd().args(&["--zero", "--color=always"]).succeeds();
+        assert_eq!(result.stdout_str(),
+                "\u{1b}[0m\u{1b}[01;34m0-test-zero\x1b[0m\x001\ntest-zero\x002-test-zero\x003-test-zero\x00",
             );
 
         scene
@@ -1202,12 +1199,21 @@ fn test_ls_long_symlink_color() {
     }
 
     fn capture_colored_string(input: &str) -> (Color, Name) {
-        let colored_name = Regex::new(r"\x1b\[([0-9;]+)m(.+)\x1b\[0m").unwrap();
+        // Input can be:
+        // \u{1b}[0m\u{1b}[01;36mln-dir3\u{1b}[0m
+        // \u{1b}[0m\u{1b}[01;34m./dir1/dir2/dir3\u{1b}[0m
+        // \u{1b}[0m\u{1b}[01;36mln-file-invalid\u{1b}[0m
+        // \u{1b}[01;36mdir1/invalid-target\u{1b}[0m
+        let colored_name = Regex::new(r"(?:\x1b\[0m\x1b)?\[([0-9;]+)m(.+)\x1b\[0m").unwrap();
         match colored_name.captures(input) {
-            Some(captures) => (
-                captures.get(1).unwrap().as_str().to_string(),
-                captures.get(2).unwrap().as_str().to_string(),
-            ),
+            Some(captures) => {
+                dbg!(captures.get(1).unwrap().as_str().to_string());
+                dbg!(captures.get(2).unwrap().as_str().to_string());
+                return (
+                    captures.get(1).unwrap().as_str().to_string(),
+                    captures.get(2).unwrap().as_str().to_string(),
+                );
+            }
             None => (String::new(), input.to_string()),
         }
     }
@@ -1977,6 +1983,20 @@ fn test_ls_recursive_1() {
         .stdout_is(out);
 }
 
+// Function to convert a string to its ASCII representation
+fn to_ascii_representation(input: &str) -> String {
+    input
+        .chars()
+        .map(|c| {
+            if c.is_ascii_control() || !c.is_ascii() {
+                format!("\\x{:02x}", c as u32)
+            } else {
+                c.to_string()
+            }
+        })
+        .collect::<String>()
+}
+
 #[test]
 fn test_ls_color() {
     let scene = TestScenario::new(util_name!());
@@ -1995,9 +2015,9 @@ fn test_ls_color() {
     at.touch(nested_file);
     at.touch("test-color");
 
-    let a_with_colors = "\x1b[1;34ma\x1b[0m";
-    let z_with_colors = "\x1b[1;34mz\x1b[0m";
-    let nested_dir_with_colors = "\x1b[1;34mnested_dir\x1b[0m"; // spell-checker:disable-line
+    let a_with_colors = "\x1b[0m\x1b[01;34ma\x1b[0m";
+    let z_with_colors = "\x1b[01;34mz\x1b[0m\n";
+    let nested_dir_with_colors = "\x1b[0m\x1b[01;34mnested_dir\x1b[0m\x0anested_file"; // spell-checker:disable-line
 
     // Color is disabled by default
     let result = scene.ucmd().succeeds();
@@ -2006,12 +2026,9 @@ fn test_ls_color() {
 
     // Color should be enabled
     for param in ["--color", "--col", "--color=always", "--col=always"] {
-        scene
-            .ucmd()
-            .arg(param)
-            .succeeds()
-            .stdout_contains(a_with_colors)
-            .stdout_contains(z_with_colors);
+        let result = scene.ucmd().arg(param).succeeds();
+        assert!(result.stdout_str().contains(a_with_colors));
+        assert!(result.stdout_str().contains(z_with_colors));
     }
 
     // Color should be disabled
@@ -2020,12 +2037,8 @@ fn test_ls_color() {
     assert!(!result.stdout_str().contains(z_with_colors));
 
     // Nested dir should be shown and colored
-    scene
-        .ucmd()
-        .arg("--color")
-        .arg("a")
-        .succeeds()
-        .stdout_contains(nested_dir_with_colors);
+    let result = scene.ucmd().arg("--color").arg("a").succeeds();
+    assert!(result.stdout_str().contains(nested_dir_with_colors));
 
     // No output
     scene
@@ -2037,13 +2050,18 @@ fn test_ls_color() {
 
     // The colors must not mess up the grid layout
     at.touch("b");
-    scene
+    let result = scene
         .ucmd()
         .arg("--color")
         .arg("-w=15")
         .arg("-C")
-        .succeeds()
-        .stdout_only(format!("{a_with_colors}  test-color\nb  {z_with_colors}\n"));
+        .succeeds();
+    let expected = format!("{}  test-color\x0ab  {}", a_with_colors, z_with_colors);
+    assert_eq!(
+        to_ascii_representation(result.stdout_str()),
+        to_ascii_representation(&expected)
+    );
+    assert_eq!(result.stdout_str(), expected);
 }
 
 #[cfg(unix)]

From 268b180416d0249b232a762ff408ffe8a29babb4 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 9 Dec 2023 13:06:09 +0100
Subject: [PATCH 152/429] ls colors: create a stylemanager to carry the
 previous style to know if we need to reset or not

---
 src/uu/ls/src/ls.rs      | 88 ++++++++++++++++++++++++++++++++--------
 tests/by-util/test_ls.rs | 20 +++++++++
 2 files changed, 91 insertions(+), 17 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index d93620967d1..e3176ec72c6 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -10,7 +10,8 @@ use clap::{
     crate_version, Arg, ArgAction, Command,
 };
 use glob::{MatchOptions, Pattern};
-use lscolors::LsColors;
+use lscolors::{LsColors, Style};
+
 use number_prefix::NumberPrefix;
 use std::{cell::OnceCell, num::IntErrorKind};
 use std::{collections::HashSet, io::IsTerminal};
@@ -1900,6 +1901,7 @@ pub fn list(locs: Vec<&Path>, config: &Config) -> UResult<()> {
     let mut dirs = Vec::<PathData>::new();
     let mut out = BufWriter::new(stdout());
     let mut dired = DiredOutput::default();
+    let mut style_manager = StyleManager::new();
     let initial_locs_len = locs.len();
 
     for loc in locs {
@@ -1933,7 +1935,7 @@ pub fn list(locs: Vec<&Path>, config: &Config) -> UResult<()> {
     sort_entries(&mut files, config, &mut out);
     sort_entries(&mut dirs, config, &mut out);
 
-    display_items(&files, config, &mut out, &mut dired)?;
+    display_items(&files, config, &mut out, &mut dired, &mut style_manager)?;
 
     for (pos, path_data) in dirs.iter().enumerate() {
         // Do read_dir call here to match GNU semantics by printing
@@ -1985,6 +1987,7 @@ pub fn list(locs: Vec<&Path>, config: &Config) -> UResult<()> {
             &mut out,
             &mut listed_ancestors,
             &mut dired,
+            &mut style_manager,
         )?;
     }
     if config.dired {
@@ -2101,6 +2104,7 @@ fn enter_directory(
     out: &mut BufWriter<Stdout>,
     listed_ancestors: &mut HashSet<FileInformation>,
     dired: &mut DiredOutput,
+    style_manager: &mut StyleManager,
 ) -> UResult<()> {
     // Create vec of entries with initial dot files
     let mut entries: Vec<PathData> = if config.files == Files::All {
@@ -2153,7 +2157,7 @@ fn enter_directory(
         }
     }
 
-    display_items(&entries, config, out, dired)?;
+    display_items(&entries, config, out, dired, style_manager)?;
 
     if config.recursive {
         for e in entries
@@ -2194,7 +2198,15 @@ fn enter_directory(
 
                         show_dir_name(&e.p_buf, out);
                         writeln!(out)?;
-                        enter_directory(e, rd, config, out, listed_ancestors, dired)?;
+                        enter_directory(
+                            e,
+                            rd,
+                            config,
+                            out,
+                            listed_ancestors,
+                            dired,
+                            style_manager,
+                        )?;
                         listed_ancestors
                             .remove(&FileInformation::from_path(&e.p_buf, e.must_dereference)?);
                     } else {
@@ -2316,6 +2328,7 @@ fn display_items(
     config: &Config,
     out: &mut BufWriter<Stdout>,
     dired: &mut DiredOutput,
+    style_manager: &mut StyleManager,
 ) -> UResult<()> {
     // `-Z`, `--context`:
     // Display the SELinux security context or '?' if none is found. When used with the `-l`
@@ -2338,7 +2351,7 @@ fn display_items(
                     display_additional_leading_info(item, &padding_collection, config, out)?;
                 write!(out, "{more_info}")?;
             }
-            display_item_long(item, &padding_collection, config, out, dired)?;
+            display_item_long(item, &padding_collection, config, out, dired, style_manager)?;
         }
     } else {
         let mut longest_context_len = 1;
@@ -2358,7 +2371,7 @@ fn display_items(
 
         for i in items {
             let more_info = display_additional_leading_info(i, &padding, config, out)?;
-            let cell = display_file_name(i, config, prefix_context, more_info, out);
+            let cell = display_file_name(i, config, prefix_context, more_info, out, style_manager);
             names_vec.push(cell);
         }
 
@@ -2513,6 +2526,7 @@ fn display_item_long(
     config: &Config,
     out: &mut BufWriter<Stdout>,
     dired: &mut DiredOutput,
+    style_manager: &mut StyleManager,
 ) -> UResult<()> {
     let mut output_display: String = String::new();
     if config.dired {
@@ -2605,7 +2619,8 @@ fn display_item_long(
 
         write!(output_display, " {} ", display_date(md, config)).unwrap();
 
-        let displayed_file = display_file_name(item, config, None, String::new(), out).contents;
+        let displayed_file =
+            display_file_name(item, config, None, String::new(), out, style_manager).contents;
         if config.dired {
             let (start, end) = dired::calculate_dired(
                 &dired.dired_positions,
@@ -2687,7 +2702,8 @@ fn display_item_long(
             write!(output_display, " {}", pad_right("?", padding.uname)).unwrap();
         }
 
-        let displayed_file = display_file_name(item, config, None, String::new(), out).contents;
+        let displayed_file =
+            display_file_name(item, config, None, String::new(), out, style_manager).contents;
         let date_len = 12;
 
         write!(
@@ -2985,6 +3001,7 @@ fn display_file_name(
     prefix_context: Option<usize>,
     more_info: String,
     out: &mut BufWriter<Stdout>,
+    style_manager: &mut StyleManager,
 ) -> Cell {
     // This is our return value. We start by `&path.display_name` and modify it along the way.
     let mut name = escape_name(&path.display_name, &config.quoting_style);
@@ -3008,13 +3025,14 @@ fn display_file_name(
     if let Some(ls_colors) = &config.color {
         let md = path.md(out);
         name = if md.is_some() {
-            color_name(name, &path.p_buf, md, ls_colors)
+            color_name(name, &path.p_buf, md, ls_colors, style_manager)
         } else {
             color_name(
                 name,
                 &path.p_buf,
                 path.p_buf.symlink_metadata().ok().as_ref(),
                 ls_colors,
+                style_manager,
             )
         };
     }
@@ -3103,6 +3121,7 @@ fn display_file_name(
                             &target_data.p_buf,
                             Some(&target_metadata),
                             ls_colors,
+                            style_manager,
                         ));
                     }
                 } else {
@@ -3137,15 +3156,50 @@ fn display_file_name(
     }
 }
 
-fn color_name(name: String, path: &Path, md: Option<&Metadata>, ls_colors: &LsColors) -> String {
-    match ls_colors.style_for_path_with_metadata(path, md) {
-        Some(style) => {
-            return style
-                .to_nu_ansi_term_style()
-                .reset_before_style()
-                .paint(name)
-                .to_string();
+/// We need this struct to be able to store the previous style.
+/// This because we need to check the previous value in case we don't need
+/// the reset
+struct StyleManager {
+    current_style: Option<Style>,
+}
+
+impl StyleManager {
+    fn new() -> Self {
+        Self {
+            current_style: None,
         }
+    }
+
+    fn apply_style(&mut self, new_style: &Style, name: &str) -> String {
+        if let Some(current) = &self.current_style {
+            if *current == *new_style {
+                // Current style is the same as new style, apply without reset.
+                let mut style = new_style.to_nu_ansi_term_style();
+                style.prefix_with_reset = false;
+                return style.paint(name).to_string();
+            }
+        }
+
+        // We are getting a new style, we need to reset it
+        self.current_style = Some(new_style.clone());
+        new_style
+            .to_nu_ansi_term_style()
+            .reset_before_style()
+            .paint(name)
+            .to_string()
+    }
+}
+
+/// Colors the provided name based on the style determined for the given path.
+fn color_name(
+    name: String,
+    path: &Path,
+    md: Option<&Metadata>,
+    ls_colors: &LsColors,
+    style_manager: &mut StyleManager,
+) -> String {
+    match ls_colors.style_for_path_with_metadata(path, md) {
+        Some(style) => style_manager.apply_style(style, &name),
         None => name,
     }
 }
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 5061778aed3..4f56f2a0d54 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -3903,3 +3903,23 @@ fn test_ls_hyperlink() {
         .succeeds()
         .stdout_is(format!("{file}\n"));
 }
+
+#[test]
+fn test_ls_color_do_not_reset() {
+    let scene: TestScenario = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+    at.mkdir("example");
+    at.mkdir("example/a");
+    at.mkdir("example/b");
+
+    let result = scene
+        .ucmd()
+        .arg("--color=always")
+        .arg("example/")
+        .succeeds();
+    // the second color code should not have a reset
+    assert_eq!(
+        result.stdout_str().escape_default().to_string(),
+        "\\u{1b}[0m\\u{1b}[01;34ma\\u{1b}[0m\\n\\u{1b}[01;34mb\\u{1b}[0m\\n"
+    );
+}

From e071286eb05104ed043cdaf5496c4db02044391e Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 9 Dec 2023 09:53:50 +0100
Subject: [PATCH 153/429] address review comments

---
 Cargo.toml               |  1 -
 src/uu/ls/Cargo.toml     |  2 +-
 tests/by-util/test_ls.rs | 18 ++----------------
 3 files changed, 3 insertions(+), 18 deletions(-)

diff --git a/Cargo.toml b/Cargo.toml
index abc3f26b0ab..90157833431 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -289,7 +289,6 @@ indicatif = "0.17"
 itertools = "0.12.0"
 libc = "0.2.150"
 lscolors = { version = "0.16.0", default-features = false, features = [
-  "nu-ansi-term",
   "gnu_legacy",
 ] }
 memchr = "2"
diff --git a/src/uu/ls/Cargo.toml b/src/uu/ls/Cargo.toml
index 56b642a1a43..a82a1f37e07 100644
--- a/src/uu/ls/Cargo.toml
+++ b/src/uu/ls/Cargo.toml
@@ -22,7 +22,7 @@ number_prefix = { workspace = true }
 uutils_term_grid = { workspace = true }
 terminal_size = { workspace = true }
 glob = { workspace = true }
-lscolors = { workspace = true, features = ["gnu_legacy"] }
+lscolors = { workspace = true }
 uucore = { workspace = true, features = [
   "entries",
   "fs",
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 4f56f2a0d54..f5858dcea85 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -1983,20 +1983,6 @@ fn test_ls_recursive_1() {
         .stdout_is(out);
 }
 
-// Function to convert a string to its ASCII representation
-fn to_ascii_representation(input: &str) -> String {
-    input
-        .chars()
-        .map(|c| {
-            if c.is_ascii_control() || !c.is_ascii() {
-                format!("\\x{:02x}", c as u32)
-            } else {
-                c.to_string()
-            }
-        })
-        .collect::<String>()
-}
-
 #[test]
 fn test_ls_color() {
     let scene = TestScenario::new(util_name!());
@@ -2058,8 +2044,8 @@ fn test_ls_color() {
         .succeeds();
     let expected = format!("{}  test-color\x0ab  {}", a_with_colors, z_with_colors);
     assert_eq!(
-        to_ascii_representation(result.stdout_str()),
-        to_ascii_representation(&expected)
+        result.stdout_str().escape_default().to_string(),
+        expected.escape_default().to_string()
     );
     assert_eq!(result.stdout_str(), expected);
 }

From 5d8c49ff079de6ce41fb9d4fcd2358c99e4d16a3 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Sat, 9 Dec 2023 12:52:02 +0000
Subject: [PATCH 154/429] chore(deps): update rust crate xattr to 1.1.1

---
 Cargo.lock | 4 ++--
 Cargo.toml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index e9fcf327652..a7f87cf2756 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -3519,9 +3519,9 @@ checksum = "1a515f5799fe4961cb532f983ce2b23082366b898e52ffbce459c86f67c8378a"
 
 [[package]]
 name = "xattr"
-version = "1.0.1"
+version = "1.1.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "f4686009f71ff3e5c4dbcf1a282d0a44db3f021ba69350cd42086b3e5f1c6985"
+checksum = "fbc6ab6ec1907d1a901cdbcd2bd4cb9e7d64ce5c9739cbb97d3c391acd8c7fae"
 dependencies = [
  "libc",
 ]
diff --git a/Cargo.toml b/Cargo.toml
index f88285a1f36..28c422e2cd7 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -330,7 +330,7 @@ utf-8 = "0.7.6"
 walkdir = "2.4"
 winapi-util = "0.1.6"
 windows-sys = { version = "0.48.0", default-features = false }
-xattr = "1.0.1"
+xattr = "1.1.1"
 zip = { version = "0.6.6", default-features = false, features = ["deflate"] }
 
 hex = "0.4.3"

From 1d4c919b97d53cca4842ff323e2298a7b9888d73 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 9 Dec 2023 16:33:19 +0100
Subject: [PATCH 155/429] Add mdir to the spell ignore

---
 tests/by-util/test_ls.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index f5858dcea85..6c56eff7cf9 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -2,7 +2,7 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
-// spell-checker:ignore (words) READMECAREFULLY birthtime doesntexist oneline somebackup lrwx somefile somegroup somehiddenbackup somehiddenfile tabsize aaaaaaaa bbbb cccc dddddddd ncccc neee naaaaa nbcdef nfffff dired subdired tmpfs mdir1
+// spell-checker:ignore (words) READMECAREFULLY birthtime doesntexist oneline somebackup lrwx somefile somegroup somehiddenbackup somehiddenfile tabsize aaaaaaaa bbbb cccc dddddddd ncccc neee naaaaa nbcdef nfffff dired subdired tmpfs mdir
 
 #[cfg(any(unix, feature = "feat_selinux"))]
 use crate::common::util::expected_result;

From 7279fbe91c12acb9346314c43a76e4a40c8d900b Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Sun, 10 Dec 2023 01:38:33 +0000
Subject: [PATCH 156/429] chore(deps): update vmactions/freebsd-vm action to
 v1.0.5

---
 .github/workflows/freebsd.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/freebsd.yml b/.github/workflows/freebsd.yml
index 27537cf6dab..c4d441a5572 100644
--- a/.github/workflows/freebsd.yml
+++ b/.github/workflows/freebsd.yml
@@ -39,7 +39,7 @@ jobs:
     - name: Run sccache-cache
       uses: mozilla-actions/sccache-action@v0.0.3
     - name: Prepare, build and test
-      uses: vmactions/freebsd-vm@v1.0.4
+      uses: vmactions/freebsd-vm@v1.0.5
       with:
         usesh: true
         sync: rsync
@@ -131,7 +131,7 @@ jobs:
     - name: Run sccache-cache
       uses: mozilla-actions/sccache-action@v0.0.3
     - name: Prepare, build and test
-      uses: vmactions/freebsd-vm@v1.0.4
+      uses: vmactions/freebsd-vm@v1.0.5
       with:
         usesh: true
         sync: rsync

From 673093f8429d24832f760ec7bffc9abbe6bdf220 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Dorian=20P=C3=A9ron?=
 <72708393+RenjiSann@users.noreply.github.com>
Date: Sun, 10 Dec 2023 16:07:41 +0100
Subject: [PATCH 157/429] ls: set default quoting style to literal when not TTY
 (#5553)

* ls: set default quoting style to literal if output is not TTY

* tests/ls: Fix quoting tests that now run with Literal as default

* ls: Fix formatting/linting/spelling issues

* tests/ls: Fix windows escaped tests
---
 src/uu/ls/src/ls.rs      |  4 +++-
 tests/by-util/test_ls.rs | 22 +++++++++++++---------
 2 files changed, 16 insertions(+), 10 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index e3176ec72c6..4feb70db789 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -642,7 +642,9 @@ fn extract_quoting_style(options: &clap::ArgMatches, show_control: bool) -> Quot
         QuotingStyle::C {
             quotes: quoting_style::Quotes::Double,
         }
-    } else if options.get_flag(options::DIRED) {
+    } else if options.get_flag(options::DIRED) || !std::io::stdout().is_terminal() {
+        // By default, `ls` uses Literal quoting when
+        // writing to a non-terminal file descriptor
         QuotingStyle::Literal { show_control }
     } else {
         // TODO: use environment variable if available
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 6c56eff7cf9..0e817511f4e 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -2472,13 +2472,16 @@ fn test_ls_quoting_style() {
     {
         at.touch("one\ntwo");
         at.touch("one\\two");
-        // Default is shell-escape
+        // Default is literal, when stdout is not a TTY.
+        // Otherwise, it is shell-escape
         scene
             .ucmd()
             .arg("--hide-control-chars")
             .arg("one\ntwo")
             .succeeds()
-            .stdout_only("'one'$'\\n''two'\n");
+            .stdout_only("one?two\n");
+        // TODO: TTY-expected output, find a way to check this as well
+        // .stdout_only("'one'$'\\n''two'\n");
 
         for (arg, correct) in [
             ("--quoting-style=literal", "one?two"),
@@ -2565,7 +2568,9 @@ fn test_ls_quoting_style() {
         .ucmd()
         .arg("one two")
         .succeeds()
-        .stdout_only("'one two'\n");
+        .stdout_only("one two\n");
+    // TODO: TTY-expected output
+    // .stdout_only("'one two'\n");
 
     for (arg, correct) in [
         ("--quoting-style=literal", "one two"),
@@ -2628,7 +2633,9 @@ fn test_ls_quoting_and_color() {
         .arg("--color")
         .arg("one two")
         .succeeds()
-        .stdout_only("'one two'\n");
+        .stdout_only("one two\n");
+    // TODO: TTY-expected output
+    // .stdout_only("'one two'\n");
 }
 
 #[test]
@@ -3160,11 +3167,8 @@ fn test_ls_path() {
         .stdout_is(expected_stdout);
 
     let abs_path = format!("{}/{}", at.as_string(), path);
-    let expected_stdout = if cfg!(windows) {
-        format!("\'{abs_path}\'\n")
-    } else {
-        format!("{abs_path}\n")
-    };
+    let expected_stdout = format!("{abs_path}\n");
+
     scene.ucmd().arg(&abs_path).run().stdout_is(expected_stdout);
 
     let expected_stdout = format!("{path}\n{file1}\n");

From 0491a97a33eedd2d41e5074ee3905085524b3252 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Sun, 10 Dec 2023 18:51:09 +0000
Subject: [PATCH 158/429] chore(deps): update rust crate libc to 0.2.151

---
 Cargo.lock | 4 ++--
 Cargo.toml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index a7f87cf2756..c943a26117b 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1187,9 +1187,9 @@ checksum = "830d08ce1d1d941e6b30645f1a0eb5643013d835ce3779a5fc208261dbe10f55"
 
 [[package]]
 name = "libc"
-version = "0.2.150"
+version = "0.2.151"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "89d92a4743f9a61002fae18374ed11e7973f530cb3a3255fb354818118b2203c"
+checksum = "302d7ab3130588088d277783b1e2d2e10c9e9e4a16dd9050e6ec93fb3e7048f4"
 
 [[package]]
 name = "libloading"
diff --git a/Cargo.toml b/Cargo.toml
index 3df108e4e11..0a65185a84b 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -287,7 +287,7 @@ half = "2.3"
 hostname = "0.3"
 indicatif = "0.17"
 itertools = "0.12.0"
-libc = "0.2.150"
+libc = "0.2.151"
 lscolors = { version = "0.16.0", default-features = false, features = [
   "gnu_legacy",
 ] }

From fa0c64ddde2d08103c8e682815ec9f5924a716a5 Mon Sep 17 00:00:00 2001
From: Arpit Bhadauria <singharpit511@gmail.com>
Date: Mon, 11 Dec 2023 02:05:55 +0000
Subject: [PATCH 159/429] review fixes

---
 src/uu/expr/src/expr.rs        |  6 +--
 src/uu/expr/src/syntax_tree.rs | 76 +++++++++++++++++-----------------
 2 files changed, 40 insertions(+), 42 deletions(-)

diff --git a/src/uu/expr/src/expr.rs b/src/uu/expr/src/expr.rs
index 1a9bb07de4a..6adedd9eccc 100644
--- a/src/uu/expr/src/expr.rs
+++ b/src/uu/expr/src/expr.rs
@@ -13,7 +13,7 @@ use uucore::{
     format_usage, help_about, help_section, help_usage,
 };
 
-use crate::syntax_tree::{is_truthy, NumOrStr};
+use crate::syntax_tree::is_truthy;
 
 mod syntax_tree;
 
@@ -108,9 +108,9 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         .map(|v| v.into_iter().map(|s| s.as_ref()).collect::<Vec<_>>())
         .unwrap_or_default();
 
-    let res: String = AstNode::parse(&token_strings)?.eval()?.into();
+    let res: String = AstNode::parse(&token_strings)?.eval()?.eval_as_string();
     println!("{res}");
-    if !is_truthy(&NumOrStr::from(res)) {
+    if !is_truthy(&res.into()) {
         return Err(1.into());
     }
     Ok(())
diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index ae2a44e5205..4514b2a6707 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -80,17 +80,17 @@ impl RelationOp {
             }
         };
         if b {
-            Ok(NumOrStr::from(1))
+            Ok(1.into())
         } else {
-            Ok(NumOrStr::from(0))
+            Ok(0.into())
         }
     }
 }
 
 impl NumericOp {
     fn eval(&self, left: &AstNode, right: &AstNode) -> ExprResult<NumOrStr> {
-        let a = ExprResult::<BigInt>::from(left.eval()?)?;
-        let b = ExprResult::<BigInt>::from(right.eval()?)?;
+        let a = left.eval()?.eval_as_bigint()?;
+        let b = right.eval()?.eval_as_bigint()?;
         Ok(NumOrStr::Num(match self {
             Self::Add => a + b,
             Self::Sub => a - b,
@@ -121,22 +121,22 @@ impl StringOp {
                 if is_truthy(&right) {
                     return Ok(right);
                 }
-                Ok(NumOrStr::from(0))
+                Ok(0.into())
             }
             Self::And => {
                 let left = left.eval()?;
                 if !is_truthy(&left) {
-                    return Ok(NumOrStr::from(0));
+                    return Ok(0.into());
                 }
                 let right = right.eval()?;
                 if !is_truthy(&right) {
-                    return Ok(NumOrStr::from(0));
+                    return Ok(0.into());
                 }
                 Ok(left)
             }
             Self::Match => {
-                let left: String = left.eval()?.into();
-                let right: String = right.eval()?.into();
+                let left = left.eval()?.eval_as_string();
+                let right = right.eval()?.eval_as_string();
                 let re_string = format!("^{}", right);
                 let re = Regex::with_options(
                     &re_string,
@@ -144,7 +144,7 @@ impl StringOp {
                     Syntax::grep(),
                 )
                 .map_err(|_| ExprError::InvalidRegexExpression)?;
-                Ok(NumOrStr::from(if re.captures_len() > 0 {
+                Ok(if re.captures_len() > 0 {
                     re.captures(&left)
                         .map(|captures| captures.at(1).unwrap())
                         .unwrap_or("")
@@ -152,19 +152,20 @@ impl StringOp {
                 } else {
                     re.find(&left)
                         .map_or("0".to_string(), |(start, end)| (end - start).to_string())
-                }))
+                }
+                .into())
             }
             Self::Index => {
-                let left: String = left.eval()?.into();
-                let right: String = right.eval()?.into();
+                let left = left.eval()?.eval_as_string();
+                let right = right.eval()?.eval_as_string();
                 for (current_idx, ch_h) in left.chars().enumerate() {
                     for ch_n in right.to_string().chars() {
                         if ch_n == ch_h {
-                            return Ok(NumOrStr::from(current_idx + 1));
+                            return Ok((current_idx + 1).into());
                         }
                     }
                 }
-                Ok(NumOrStr::from(0))
+                Ok(0.into())
             }
         }
     }
@@ -220,38 +221,34 @@ impl From<String> for NumOrStr {
 
 impl From<NumOrStr> for Option<usize> {
     fn from(s: NumOrStr) -> Self {
-        match s.into() {
+        match s.eval_as_bigint() {
             Ok(num) => num.to_usize(),
             Err(_) => None,
         }
     }
 }
 
-impl From<NumOrStr> for String {
-    fn from(s: NumOrStr) -> Self {
-        match s {
-            NumOrStr::Num(num) => num.to_string(),
-            NumOrStr::Str(str) => str.to_string(),
+impl NumOrStr {
+    pub fn to_bigint(&self) -> Result<BigInt, ParseBigIntError> {
+        match self {
+            Self::Num(num) => Ok(num.clone()),
+            Self::Str(str) => str.parse::<BigInt>(),
         }
     }
-}
 
-impl From<NumOrStr> for ExprResult<BigInt> {
-    fn from(s: NumOrStr) -> Self {
-        match s {
+    pub fn eval_as_bigint(self) -> ExprResult<BigInt> {
+        match self {
             NumOrStr::Num(num) => Ok(num),
             NumOrStr::Str(str) => str
                 .parse::<BigInt>()
                 .map_err(|_| ExprError::NonIntegerArgument),
         }
     }
-}
 
-impl NumOrStr {
-    pub fn to_bigint(&self) -> Result<BigInt, ParseBigIntError> {
+    pub fn eval_as_string(self) -> String {
         match self {
-            Self::Num(num) => Ok(num.clone()),
-            Self::Str(str) => str.parse::<BigInt>(),
+            NumOrStr::Num(num) => num.to_string(),
+            NumOrStr::Str(str) => str,
         }
     }
 }
@@ -283,7 +280,7 @@ impl AstNode {
 
     pub fn eval(&self) -> ExprResult<NumOrStr> {
         match self {
-            Self::Leaf { value } => Ok(NumOrStr::from(value.to_string())),
+            Self::Leaf { value } => Ok(value.to_string().into()),
             Self::BinOp {
                 op_type,
                 left,
@@ -294,7 +291,7 @@ impl AstNode {
                 pos,
                 length,
             } => {
-                let string: String = string.eval()?.into();
+                let string: String = string.eval()?.eval_as_string();
 
                 // The GNU docs say:
                 //
@@ -307,16 +304,17 @@ impl AstNode {
                 let length: usize = Option::<usize>::from(length.eval()?).unwrap_or(0);
 
                 let (Some(pos), Some(_)) = (pos.checked_sub(1), length.checked_sub(1)) else {
-                    return Ok(NumOrStr::from(String::new()));
+                    return Ok(String::new().into());
                 };
 
-                Ok(NumOrStr::from(
-                    string.chars().skip(pos).take(length).collect::<String>(),
-                ))
-            }
-            Self::Length { string } => {
-                Ok(NumOrStr::from(String::from(string.eval()?).chars().count()))
+                Ok(string
+                    .chars()
+                    .skip(pos)
+                    .take(length)
+                    .collect::<String>()
+                    .into())
             }
+            Self::Length { string } => Ok(string.eval()?.eval_as_string().chars().count().into()),
         }
     }
 }

From 824371d8841f1652de5a8b4d865a175af2a91d5b Mon Sep 17 00:00:00 2001
From: Arpit Bhadauria <singharpit511@gmail.com>
Date: Mon, 11 Dec 2023 02:12:24 +0000
Subject: [PATCH 160/429] style lint fixes

---
 src/uu/expr/src/syntax_tree.rs | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 4514b2a6707..820911cd306 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -238,8 +238,8 @@ impl NumOrStr {
 
     pub fn eval_as_bigint(self) -> ExprResult<BigInt> {
         match self {
-            NumOrStr::Num(num) => Ok(num),
-            NumOrStr::Str(str) => str
+            Self::Num(num) => Ok(num),
+            Self::Str(str) => str
                 .parse::<BigInt>()
                 .map_err(|_| ExprError::NonIntegerArgument),
         }
@@ -247,8 +247,8 @@ impl NumOrStr {
 
     pub fn eval_as_string(self) -> String {
         match self {
-            NumOrStr::Num(num) => num.to_string(),
-            NumOrStr::Str(str) => str,
+            Self::Num(num) => num.to_string(),
+            Self::Str(str) => str,
         }
     }
 }

From db91e12a1dce69c020bb97de5b88d330115aedbd Mon Sep 17 00:00:00 2001
From: Ian Douglas Scott <ian@iandouglasscott.com>
Date: Sun, 5 Nov 2023 18:11:04 -0800
Subject: [PATCH 161/429] Fix build on Redox, and add `stat` to Redox feature

---
 Cargo.toml                             |  1 +
 src/uu/cp/src/cp.rs                    |  2 ++
 src/uu/date/src/date.rs                |  1 -
 src/uu/df/src/df.rs                    |  2 +-
 src/uu/shred/src/shred.rs              |  8 ++++----
 src/uucore/src/lib/features/entries.rs |  5 -----
 src/uucore/src/lib/features/fsext.rs   | 11 ++++++++---
 src/uucore/src/lib/features/mode.rs    | 17 ++++++++++++-----
 src/uucore/src/lib/features/signals.rs |  2 +-
 9 files changed, 29 insertions(+), 20 deletions(-)

diff --git a/Cargo.toml b/Cargo.toml
index 3df108e4e11..55dcb378fd0 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -240,6 +240,7 @@ feat_os_unix_redox = [
   "feat_common_core",
   #
   "chmod",
+  "stat",
   "uname",
 ]
 # "feat_os_windows_legacy" == slightly restricted set of utilities which can be built/run on early windows platforms (eg, "WinXP")
diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index 7265e89f12a..de01a5ef38c 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -1896,6 +1896,7 @@ fn handle_no_preserve_mode(options: &Options, org_mode: u32) -> u32 {
             target_os = "macos",
             target_os = "macos-12",
             target_os = "freebsd",
+            target_os = "redox",
         )))]
         {
             const MODE_RW_UGO: u32 = S_IRUSR | S_IWUSR | S_IRGRP | S_IWGRP | S_IROTH | S_IWOTH;
@@ -1911,6 +1912,7 @@ fn handle_no_preserve_mode(options: &Options, org_mode: u32) -> u32 {
             target_os = "macos",
             target_os = "macos-12",
             target_os = "freebsd",
+            target_os = "redox",
         ))]
         {
             const MODE_RW_UGO: u32 =
diff --git a/src/uu/date/src/date.rs b/src/uu/date/src/date.rs
index b5ab8993acd..ee3c7bfdfae 100644
--- a/src/uu/date/src/date.rs
+++ b/src/uu/date/src/date.rs
@@ -16,7 +16,6 @@ use std::fs::File;
 use std::io::{BufRead, BufReader};
 use std::path::PathBuf;
 use uucore::display::Quotable;
-#[cfg(not(any(target_os = "redox")))]
 use uucore::error::FromIo;
 use uucore::error::{UResult, USimpleError};
 use uucore::{format_usage, help_about, help_usage, show};
diff --git a/src/uu/df/src/df.rs b/src/uu/df/src/df.rs
index 78325f3d2ad..c21ba98471a 100644
--- a/src/uu/df/src/df.rs
+++ b/src/uu/df/src/df.rs
@@ -336,7 +336,7 @@ fn filter_mount_list(vmi: Vec<MountInfo>, opt: &Options) -> Vec<MountInfo> {
 fn get_all_filesystems(opt: &Options) -> Result<Vec<Filesystem>, std::io::Error> {
     // Run a sync call before any operation if so instructed.
     if opt.sync {
-        #[cfg(not(windows))]
+        #[cfg(not(any(windows, target_os = "redox")))]
         unsafe {
             #[cfg(not(target_os = "android"))]
             uucore::libc::sync();
diff --git a/src/uu/shred/src/shred.rs b/src/uu/shred/src/shred.rs
index 04f81bf23fd..711fd0485cc 100644
--- a/src/uu/shred/src/shred.rs
+++ b/src/uu/shred/src/shred.rs
@@ -369,12 +369,12 @@ fn wipe_file(
         let metadata = fs::metadata(path).map_err_context(String::new)?;
         let mut perms = metadata.permissions();
         #[cfg(unix)]
-        #[allow(clippy::useless_conversion)]
+        #[allow(clippy::useless_conversion, clippy::unnecessary_cast)]
         {
             // NOTE: set_readonly(false) makes the file world-writable on Unix.
-            // NOTE: S_IWUSR type is u16 on macOS.
-            if (perms.mode() & u32::from(S_IWUSR)) == 0 {
-                perms.set_mode(u32::from(S_IWUSR));
+            // NOTE: S_IWUSR type is u16 on macOS, i32 on Redox.
+            if (perms.mode() & (S_IWUSR as u32)) == 0 {
+                perms.set_mode(S_IWUSR as u32);
             }
         }
         #[cfg(not(unix))]
diff --git a/src/uucore/src/lib/features/entries.rs b/src/uucore/src/lib/features/entries.rs
index 29c9b437234..fa10ba2decb 100644
--- a/src/uucore/src/lib/features/entries.rs
+++ b/src/uucore/src/lib/features/entries.rs
@@ -35,7 +35,6 @@
 #[cfg(any(target_os = "freebsd", target_vendor = "apple"))]
 use libc::time_t;
 use libc::{c_char, c_int, gid_t, uid_t};
-#[cfg(not(target_os = "redox"))]
 use libc::{getgrgid, getgrnam, getgroups};
 use libc::{getpwnam, getpwuid, group, passwd};
 
@@ -67,7 +66,6 @@ extern "C" {
 /// > supplementary group IDs for the process is returned.  This allows
 /// > the caller to determine the size of a dynamically allocated list
 /// > to be used in a further call to getgroups().
-#[cfg(not(target_os = "redox"))]
 pub fn get_groups() -> IOResult<Vec<gid_t>> {
     let mut groups = Vec::new();
     loop {
@@ -337,7 +335,6 @@ macro_rules! f {
 }
 
 f!(getpwnam, getpwuid, uid_t, Passwd);
-#[cfg(not(target_os = "redox"))]
 f!(getgrnam, getgrgid, gid_t, Group);
 
 #[inline]
@@ -345,7 +342,6 @@ pub fn uid2usr(id: uid_t) -> IOResult<String> {
     Passwd::locate(id).map(|p| p.name)
 }
 
-#[cfg(not(target_os = "redox"))]
 #[inline]
 pub fn gid2grp(id: gid_t) -> IOResult<String> {
     Group::locate(id).map(|p| p.name)
@@ -356,7 +352,6 @@ pub fn usr2uid(name: &str) -> IOResult<uid_t> {
     Passwd::locate(name).map(|p| p.uid)
 }
 
-#[cfg(not(target_os = "redox"))]
 #[inline]
 pub fn grp2gid(name: &str) -> IOResult<gid_t> {
     Group::locate(name).map(|p| p.gid)
diff --git a/src/uucore/src/lib/features/fsext.rs b/src/uucore/src/lib/features/fsext.rs
index 93fedb44b7c..9ee5e2464e5 100644
--- a/src/uucore/src/lib/features/fsext.rs
+++ b/src/uucore/src/lib/features/fsext.rs
@@ -71,6 +71,7 @@ use std::convert::{AsRef, From};
     target_os = "android",
     target_os = "illumos",
     target_os = "solaris",
+    target_os = "redox",
 ))]
 use std::ffi::CStr;
 #[cfg(not(windows))]
@@ -106,7 +107,6 @@ pub use libc::statvfs as StatFs;
     target_vendor = "apple",
     target_os = "freebsd",
     target_os = "openbsd",
-    target_os = "redox"
 ))]
 pub use libc::statfs as statfs_fn;
 #[cfg(any(
@@ -114,7 +114,8 @@ pub use libc::statfs as statfs_fn;
     target_os = "bitrig",
     target_os = "illumos",
     target_os = "solaris",
-    target_os = "dragonfly"
+    target_os = "dragonfly",
+    target_os = "redox"
 ))]
 pub use libc::statvfs as statfs_fn;
 
@@ -639,6 +640,7 @@ impl FsMeta for StatFs {
             not(target_os = "openbsd"),
             not(target_os = "illumos"),
             not(target_os = "solaris"),
+            not(target_os = "redox"),
             not(target_arch = "s390x"),
             target_pointer_width = "64"
         ))]
@@ -646,6 +648,7 @@ impl FsMeta for StatFs {
         #[cfg(all(
             not(target_env = "musl"),
             not(target_os = "freebsd"),
+            not(target_os = "redox"),
             any(
                 target_arch = "s390x",
                 target_vendor = "apple",
@@ -659,7 +662,8 @@ impl FsMeta for StatFs {
             target_env = "musl",
             target_os = "freebsd",
             target_os = "illumos",
-            target_os = "solaris"
+            target_os = "solaris",
+            target_os = "redox"
         ))]
         return self.f_bsize.try_into().unwrap();
     }
@@ -875,6 +879,7 @@ pub fn pretty_time(sec: i64, nsec: i64) -> String {
     // the date was set
     let local_offset = match UtcOffset::local_offset_at(tm) {
         Ok(lo) => lo,
+        Err(_) if cfg!(target_os = "redox") => UtcOffset::UTC,
         Err(e) => {
             panic!("error: {e}");
         }
diff --git a/src/uucore/src/lib/features/mode.rs b/src/uucore/src/lib/features/mode.rs
index 147624891bd..c2da380bf0f 100644
--- a/src/uucore/src/lib/features/mode.rs
+++ b/src/uucore/src/lib/features/mode.rs
@@ -137,6 +137,7 @@ fn parse_change(mode: &str, fperm: u32, considering_dir: bool) -> (u32, usize) {
     (srwx, pos)
 }
 
+#[allow(clippy::unnecessary_cast)]
 pub fn parse_mode(mode: &str) -> Result<mode_t, String> {
     #[cfg(all(
         not(target_os = "freebsd"),
@@ -148,9 +149,9 @@ pub fn parse_mode(mode: &str) -> Result<mode_t, String> {
     let fperm = (S_IRUSR | S_IWUSR | S_IRGRP | S_IWGRP | S_IROTH | S_IWOTH) as u32;
 
     let result = if mode.chars().any(|c| c.is_ascii_digit()) {
-        parse_numeric(fperm, mode, true)
+        parse_numeric(fperm as u32, mode, true)
     } else {
-        parse_symbolic(fperm, mode, get_umask(), true)
+        parse_symbolic(fperm as u32, mode, get_umask(), true)
     };
     result.map(|mode| mode as mode_t)
 }
@@ -168,11 +169,17 @@ pub fn get_umask() -> u32 {
     #[cfg(all(
         not(target_os = "freebsd"),
         not(target_vendor = "apple"),
-        not(target_os = "android")
+        not(target_os = "android"),
+        not(target_os = "redox")
     ))]
     return mask;
-    #[cfg(any(target_os = "freebsd", target_vendor = "apple", target_os = "android"))]
-    return mask.into();
+    #[cfg(any(
+        target_os = "freebsd",
+        target_vendor = "apple",
+        target_os = "android",
+        target_os = "redox"
+    ))]
+    return mask as u32;
 }
 
 // Iterate 'args' and delete the first occurrence
diff --git a/src/uucore/src/lib/features/signals.rs b/src/uucore/src/lib/features/signals.rs
index 2e8c26a4598..a4c85647ba4 100644
--- a/src/uucore/src/lib/features/signals.rs
+++ b/src/uucore/src/lib/features/signals.rs
@@ -27,7 +27,7 @@ Linux Programmer's Manual
 
 */
 
-#[cfg(any(target_os = "linux", target_os = "android"))]
+#[cfg(any(target_os = "linux", target_os = "android", target_os = "redox"))]
 pub static ALL_SIGNALS: [&str; 32] = [
     "EXIT", "HUP", "INT", "QUIT", "ILL", "TRAP", "ABRT", "BUS", "FPE", "KILL", "USR1", "SEGV",
     "USR2", "PIPE", "ALRM", "TERM", "STKFLT", "CHLD", "CONT", "STOP", "TSTP", "TTIN", "TTOU",

From 3dab2b739072efec893bbf50445a8529db55d78d Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 11 Dec 2023 09:33:36 +0100
Subject: [PATCH 162/429] ls: use show_dir_name to output dir name

---
 src/uu/ls/src/ls.rs | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 3b34cf15eba..a5fe3d6246d 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -1961,7 +1961,8 @@ pub fn list(locs: Vec<&Path>, config: &Config) -> UResult<()> {
                 if config.dired {
                     dired::indent(&mut out)?;
                 }
-                writeln!(out, "{}:", path_data.p_buf.display())?;
+                show_dir_name(&path_data.p_buf, &mut out);
+                writeln!(out)?;
                 if config.dired {
                     // First directory displayed
                     let dir_len = path_data.display_name.len();

From 191eb9ac126361a26597502a997e1ce2c3116f2b Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 11 Dec 2023 10:49:38 +0100
Subject: [PATCH 163/429] echo: make -e and -E override each other

---
 src/uu/echo/src/echo.rs    |  6 ++++--
 tests/by-util/test_echo.rs | 13 +++++++++++++
 2 files changed, 17 insertions(+), 2 deletions(-)

diff --git a/src/uu/echo/src/echo.rs b/src/uu/echo/src/echo.rs
index b3707b6f898..7c03159d538 100644
--- a/src/uu/echo/src/echo.rs
+++ b/src/uu/echo/src/echo.rs
@@ -154,13 +154,15 @@ pub fn uu_app() -> Command {
             Arg::new(options::ENABLE_BACKSLASH_ESCAPE)
                 .short('e')
                 .help("enable interpretation of backslash escapes")
-                .action(ArgAction::SetTrue),
+                .action(ArgAction::SetTrue)
+                .overrides_with(options::DISABLE_BACKSLASH_ESCAPE),
         )
         .arg(
             Arg::new(options::DISABLE_BACKSLASH_ESCAPE)
                 .short('E')
                 .help("disable interpretation of backslash escapes (default)")
-                .action(ArgAction::SetTrue),
+                .action(ArgAction::SetTrue)
+                .overrides_with(options::ENABLE_BACKSLASH_ESCAPE),
         )
         .arg(Arg::new(options::STRING).action(ArgAction::Append))
 }
diff --git a/tests/by-util/test_echo.rs b/tests/by-util/test_echo.rs
index 875ff66cb14..ac6bd74d1e0 100644
--- a/tests/by-util/test_echo.rs
+++ b/tests/by-util/test_echo.rs
@@ -117,6 +117,19 @@ fn test_escape_newline() {
         .stdout_only("\na\n");
 }
 
+#[test]
+fn test_escape_override() {
+    new_ucmd!()
+        .args(&["-e", "-E", "\\na"])
+        .succeeds()
+        .stdout_only("\\na\n");
+
+    new_ucmd!()
+        .args(&["-E", "-e", "\\na"])
+        .succeeds()
+        .stdout_only("\na\n");
+}
+
 #[test]
 fn test_escape_no_further_output() {
     new_ucmd!()

From 9d0c1b3482f3876c18cc69e95ccd13902a20f483 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 11 Dec 2023 11:02:50 +0100
Subject: [PATCH 164/429] fuzzing: quick timeout because seq is freezing

---
 .github/workflows/fuzzing.yml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.github/workflows/fuzzing.yml b/.github/workflows/fuzzing.yml
index eed2ae2fc99..fb100d716ee 100644
--- a/.github/workflows/fuzzing.yml
+++ b/.github/workflows/fuzzing.yml
@@ -36,6 +36,7 @@ jobs:
     needs: fuzz-build
     name: Run the fuzzers
     runs-on: ubuntu-latest
+    timeout-minutes: 5
     env:
       RUN_FOR: 60
     strategy:

From 2faab59aa4abce17e04158fc2a74e1daf8f8d9f1 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Mon, 11 Dec 2023 12:45:16 +0100
Subject: [PATCH 165/429] tests/hostname: disable failing
 test_hostname::test_hostname_ip on OpenBSD

  - On OpenBSD, test_hostname::test_hostname_ip fails with "failed to lookup address information:
    Name does not resolve" error

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 tests/by-util/test_hostname.rs | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/by-util/test_hostname.rs b/tests/by-util/test_hostname.rs
index 84cb73e2ecf..972ec4aabbf 100644
--- a/tests/by-util/test_hostname.rs
+++ b/tests/by-util/test_hostname.rs
@@ -14,8 +14,8 @@ fn test_hostname() {
     assert!(ls_default_res.stdout().len() >= ls_domain_res.stdout().len());
 }
 
-// FixME: fails for "MacOS" and "freebsd" "failed to lookup address information: Name does not resolve"
-#[cfg(not(any(target_os = "macos", target_os = "freebsd")))]
+// FixME: fails for "MacOS", "freebsd" and "openbsd" "failed to lookup address information: Name does not resolve"
+#[cfg(not(any(target_os = "macos", target_os = "freebsd", target_os = "openbsd")))]
 #[test]
 fn test_hostname_ip() {
     let result = new_ucmd!().arg("-i").succeeds();

From bc5b5e013acee31187cfa1bd9d20340dcdc90ead Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 11 Dec 2023 13:35:17 +0100
Subject: [PATCH 166/429] tr: operate on bytes instead of chars

---
 src/uu/tr/src/convert.rs       |  36 -------
 src/uu/tr/src/operation.rs     | 173 ++++++++++++++++-----------------
 src/uu/tr/src/tr.rs            |  20 ++--
 src/uu/tr/src/unicode_table.rs |  20 ++--
 tests/by-util/test_tr.rs       |  17 ++--
 5 files changed, 115 insertions(+), 151 deletions(-)
 delete mode 100644 src/uu/tr/src/convert.rs

diff --git a/src/uu/tr/src/convert.rs b/src/uu/tr/src/convert.rs
deleted file mode 100644
index 28a80e9f52e..00000000000
--- a/src/uu/tr/src/convert.rs
+++ /dev/null
@@ -1,36 +0,0 @@
-// This file is part of the uutils coreutils package.
-//
-// For the full copyright and license information, please view the LICENSE
-// file that was distributed with this source code.
-
-// spell-checker:ignore (strings) anychar combinator
-
-use nom::{
-    branch::alt,
-    bytes::complete::tag,
-    character::complete::{anychar, one_of},
-    combinator::{map_opt, recognize},
-    multi::{many0, many_m_n},
-    sequence::preceded,
-    IResult,
-};
-
-fn parse_octal(input: &str) -> IResult<&str, char> {
-    map_opt(
-        preceded(tag("\\"), recognize(many_m_n(1, 3, one_of("01234567")))),
-        |out: &str| {
-            u32::from_str_radix(out, 8)
-                .map(std::char::from_u32)
-                .ok()
-                .flatten()
-        },
-    )(input)
-}
-
-pub fn reduce_octal_to_char(input: &str) -> String {
-    many0(alt((parse_octal, anychar)))(input)
-        .map(|(_, r)| r)
-        .unwrap()
-        .into_iter()
-        .collect()
-}
diff --git a/src/uu/tr/src/operation.rs b/src/uu/tr/src/operation.rs
index b7d74427a9e..cd6a83de6c9 100644
--- a/src/uu/tr/src/operation.rs
+++ b/src/uu/tr/src/operation.rs
@@ -7,10 +7,10 @@
 
 use nom::{
     branch::alt,
-    bytes::complete::tag,
-    character::complete::{anychar, digit1},
-    combinator::{map, peek, value},
-    multi::many0,
+    bytes::complete::{tag, take},
+    character::complete::{digit1, one_of},
+    combinator::{map, map_opt, peek, recognize, value},
+    multi::{many0, many_m_n},
     sequence::{delimited, preceded, separated_pair},
     IResult,
 };
@@ -62,10 +62,10 @@ impl UError for BadSequence {}
 
 #[derive(Debug, Clone, Copy)]
 pub enum Sequence {
-    Char(char),
-    CharRange(u32, u32),
-    CharStar(char),
-    CharRepeat(char, usize),
+    Char(u8),
+    CharRange(u8, u8),
+    CharStar(u8),
+    CharRepeat(u8, usize),
     Alnum,
     Alpha,
     Blank,
@@ -81,21 +81,17 @@ pub enum Sequence {
 }
 
 impl Sequence {
-    pub fn flatten(&self) -> Box<dyn Iterator<Item = char>> {
+    pub fn flatten(&self) -> Box<dyn Iterator<Item = u8>> {
         match self {
             Self::Char(c) => Box::new(std::iter::once(*c)),
-            Self::CharRange(l, r) => Box::new((*l..=*r).flat_map(std::char::from_u32)),
+            Self::CharRange(l, r) => Box::new(*l..=*r),
             Self::CharStar(c) => Box::new(std::iter::repeat(*c)),
             Self::CharRepeat(c, n) => Box::new(std::iter::repeat(*c).take(*n)),
-            Self::Alnum => Box::new(('0'..='9').chain('A'..='Z').chain('a'..='z')),
-            Self::Alpha => Box::new(('A'..='Z').chain('a'..='z')),
+            Self::Alnum => Box::new((b'0'..=b'9').chain(b'A'..=b'Z').chain(b'a'..=b'z')),
+            Self::Alpha => Box::new((b'A'..=b'Z').chain(b'a'..=b'z')),
             Self::Blank => Box::new(unicode_table::BLANK.iter().cloned()),
-            Self::Control => Box::new(
-                (0..=31)
-                    .chain(std::iter::once(127))
-                    .flat_map(std::char::from_u32),
-            ),
-            Self::Digit => Box::new('0'..='9'),
+            Self::Control => Box::new((0..=31).chain(std::iter::once(127))),
+            Self::Digit => Box::new(b'0'..=b'9'),
             Self::Graph => Box::new(
                 (48..=57) // digit
                     .chain(65..=90) // uppercase
@@ -105,10 +101,9 @@ impl Sequence {
                     .chain(58..=64)
                     .chain(91..=96)
                     .chain(123..=126)
-                    .chain(std::iter::once(32)) // space
-                    .flat_map(std::char::from_u32),
+                    .chain(std::iter::once(32)), // space
             ),
-            Self::Lower => Box::new('a'..='z'),
+            Self::Lower => Box::new(b'a'..=b'z'),
             Self::Print => Box::new(
                 (48..=57) // digit
                     .chain(65..=90) // uppercase
@@ -117,29 +112,22 @@ impl Sequence {
                     .chain(33..=47)
                     .chain(58..=64)
                     .chain(91..=96)
-                    .chain(123..=126)
-                    .flat_map(std::char::from_u32),
-            ),
-            Self::Punct => Box::new(
-                (33..=47)
-                    .chain(58..=64)
-                    .chain(91..=96)
-                    .chain(123..=126)
-                    .flat_map(std::char::from_u32),
+                    .chain(123..=126),
             ),
+            Self::Punct => Box::new((33..=47).chain(58..=64).chain(91..=96).chain(123..=126)),
             Self::Space => Box::new(unicode_table::SPACES.iter().cloned()),
-            Self::Upper => Box::new('A'..='Z'),
-            Self::Xdigit => Box::new(('0'..='9').chain('A'..='F').chain('a'..='f')),
+            Self::Upper => Box::new(b'A'..=b'Z'),
+            Self::Xdigit => Box::new((b'0'..=b'9').chain(b'A'..=b'F').chain(b'a'..=b'f')),
         }
     }
 
     // Hide all the nasty sh*t in here
     // TODO: Make the 2 set lazily generate the character mapping as necessary.
     pub fn solve_set_characters(
-        set1_str: &str,
-        set2_str: &str,
+        set1_str: &[u8],
+        set2_str: &[u8],
         truncate_set1_flag: bool,
-    ) -> Result<(Vec<char>, Vec<char>), BadSequence> {
+    ) -> Result<(Vec<u8>, Vec<u8>), BadSequence> {
         let set1 = Self::from_str(set1_str)?;
         let set2 = Self::from_str(set2_str)?;
 
@@ -164,7 +152,7 @@ impl Sequence {
                     .count();
                 let star_compensate_len = set1_len.saturating_sub(set2_len);
                 let (left, right) = (partition.next(), partition.next());
-                let set2_solved: Vec<char> = match (left, right) {
+                let set2_solved: Vec<_> = match (left, right) {
                     (None, None) => match char_star {
                         Some(c) => std::iter::repeat(*c).take(star_compensate_len).collect(),
                         None => std::iter::empty().collect(),
@@ -201,7 +189,7 @@ impl Sequence {
                             .collect(),
                     },
                 };
-                let mut set1_solved: Vec<char> = set1.iter().flat_map(Self::flatten).collect();
+                let mut set1_solved: Vec<_> = set1.iter().flat_map(Self::flatten).collect();
                 if truncate_set1_flag {
                     set1_solved.truncate(set2_solved.len());
                 }
@@ -216,7 +204,7 @@ impl Sequence {
 }
 
 impl Sequence {
-    pub fn from_str(input: &str) -> Result<Vec<Self>, BadSequence> {
+    pub fn from_str(input: &[u8]) -> Result<Vec<Self>, BadSequence> {
         many0(alt((
             Self::parse_char_range,
             Self::parse_char_star,
@@ -232,27 +220,38 @@ impl Sequence {
         .collect::<Result<Vec<_>, _>>()
     }
 
-    fn parse_backslash(input: &str) -> IResult<&str, char> {
-        preceded(tag("\\"), anychar)(input).map(|(l, a)| {
+    fn parse_octal(input: &[u8]) -> IResult<&[u8], u8> {
+        map_opt(
+            preceded(tag("\\"), recognize(many_m_n(1, 3, one_of("01234567")))),
+            |out: &[u8]| u8::from_str_radix(std::str::from_utf8(out).expect("boop"), 8).ok(),
+        )(input)
+    }
+
+    fn parse_backslash(input: &[u8]) -> IResult<&[u8], u8> {
+        preceded(tag("\\"), Self::single_char)(input).map(|(l, a)| {
             let c = match a {
-                'a' => unicode_table::BEL,
-                'b' => unicode_table::BS,
-                'f' => unicode_table::FF,
-                'n' => unicode_table::LF,
-                'r' => unicode_table::CR,
-                't' => unicode_table::HT,
-                'v' => unicode_table::VT,
+                b'a' => unicode_table::BEL,
+                b'b' => unicode_table::BS,
+                b'f' => unicode_table::FF,
+                b'n' => unicode_table::LF,
+                b'r' => unicode_table::CR,
+                b't' => unicode_table::HT,
+                b'v' => unicode_table::VT,
                 x => x,
             };
             (l, c)
         })
     }
 
-    fn parse_backslash_or_char(input: &str) -> IResult<&str, char> {
-        alt((Self::parse_backslash, anychar))(input)
+    fn parse_backslash_or_char(input: &[u8]) -> IResult<&[u8], u8> {
+        alt((Self::parse_octal, Self::parse_backslash, Self::single_char))(input)
+    }
+
+    fn single_char(input: &[u8]) -> IResult<&[u8], u8> {
+        take(1usize)(input).map(|(l, a)| (l, a[0]))
     }
 
-    fn parse_char_range(input: &str) -> IResult<&str, Result<Self, BadSequence>> {
+    fn parse_char_range(input: &[u8]) -> IResult<&[u8], Result<Self, BadSequence>> {
         separated_pair(
             Self::parse_backslash_or_char,
             tag("-"),
@@ -261,41 +260,42 @@ impl Sequence {
         .map(|(l, (a, b))| {
             (l, {
                 let (start, end) = (u32::from(a), u32::from(b));
-                Ok(Self::CharRange(start, end))
+                Ok(Self::CharRange(start as u8, end as u8))
             })
         })
     }
 
-    fn parse_char_star(input: &str) -> IResult<&str, Result<Self, BadSequence>> {
+    fn parse_char_star(input: &[u8]) -> IResult<&[u8], Result<Self, BadSequence>> {
         delimited(tag("["), Self::parse_backslash_or_char, tag("*]"))(input)
             .map(|(l, a)| (l, Ok(Self::CharStar(a))))
     }
 
-    fn parse_char_repeat(input: &str) -> IResult<&str, Result<Self, BadSequence>> {
+    fn parse_char_repeat(input: &[u8]) -> IResult<&[u8], Result<Self, BadSequence>> {
         delimited(
             tag("["),
             separated_pair(Self::parse_backslash_or_char, tag("*"), digit1),
             tag("]"),
         )(input)
         .map(|(l, (c, cnt_str))| {
-            let result = if cnt_str.starts_with('0') {
-                match usize::from_str_radix(cnt_str, 8) {
+            let s = String::from_utf8_lossy(cnt_str);
+            let result = if cnt_str.starts_with(b"0") {
+                match usize::from_str_radix(&s, 8) {
                     Ok(0) => Ok(Self::CharStar(c)),
                     Ok(count) => Ok(Self::CharRepeat(c, count)),
-                    Err(_) => Err(BadSequence::InvalidRepeatCount(cnt_str.to_string())),
+                    Err(_) => Err(BadSequence::InvalidRepeatCount(s.to_string())),
                 }
             } else {
-                match cnt_str.parse::<usize>() {
+                match s.parse::<usize>() {
                     Ok(0) => Ok(Self::CharStar(c)),
                     Ok(count) => Ok(Self::CharRepeat(c, count)),
-                    Err(_) => Err(BadSequence::InvalidRepeatCount(cnt_str.to_string())),
+                    Err(_) => Err(BadSequence::InvalidRepeatCount(s.to_string())),
                 }
             };
             (l, result)
         })
     }
 
-    fn parse_class(input: &str) -> IResult<&str, Result<Self, BadSequence>> {
+    fn parse_class(input: &[u8]) -> IResult<&[u8], Result<Self, BadSequence>> {
         delimited(
             tag("[:"),
             alt((
@@ -322,7 +322,7 @@ impl Sequence {
         )(input)
     }
 
-    fn parse_char_equal(input: &str) -> IResult<&str, Result<Self, BadSequence>> {
+    fn parse_char_equal(input: &[u8]) -> IResult<&[u8], Result<Self, BadSequence>> {
         delimited(
             tag("[="),
             alt((
@@ -338,17 +338,17 @@ impl Sequence {
 }
 
 pub trait SymbolTranslator {
-    fn translate(&mut self, current: char) -> Option<char>;
+    fn translate(&mut self, current: u8) -> Option<u8>;
 }
 
 #[derive(Debug)]
 pub struct DeleteOperation {
-    set: Vec<char>,
+    set: Vec<u8>,
     complement_flag: bool,
 }
 
 impl DeleteOperation {
-    pub fn new(set: Vec<char>, complement_flag: bool) -> Self {
+    pub fn new(set: Vec<u8>, complement_flag: bool) -> Self {
         Self {
             set,
             complement_flag,
@@ -357,8 +357,8 @@ impl DeleteOperation {
 }
 
 impl SymbolTranslator for DeleteOperation {
-    fn translate(&mut self, current: char) -> Option<char> {
-        let found = self.set.iter().any(|sequence| sequence.eq(&current));
+    fn translate(&mut self, current: u8) -> Option<u8> {
+        let found = self.set.iter().any(|sequence| *sequence == current);
         if self.complement_flag == found {
             Some(current)
         } else {
@@ -368,15 +368,15 @@ impl SymbolTranslator for DeleteOperation {
 }
 
 pub struct TranslateOperationComplement {
-    iter: u32,
+    iter: u8,
     set2_iter: usize,
-    set1: Vec<char>,
-    set2: Vec<char>,
-    translation_map: HashMap<char, char>,
+    set1: Vec<u8>,
+    set2: Vec<u8>,
+    translation_map: HashMap<u8, u8>,
 }
 
 impl TranslateOperationComplement {
-    fn new(set1: Vec<char>, set2: Vec<char>) -> Self {
+    fn new(set1: Vec<u8>, set2: Vec<u8>) -> Self {
         Self {
             iter: 0,
             set2_iter: 0,
@@ -389,11 +389,11 @@ impl TranslateOperationComplement {
 
 #[derive(Debug)]
 pub struct TranslateOperationStandard {
-    translation_map: HashMap<char, char>,
+    translation_map: HashMap<u8, u8>,
 }
 
 impl TranslateOperationStandard {
-    fn new(set1: Vec<char>, set2: Vec<char>) -> Result<Self, BadSequence> {
+    fn new(set1: Vec<u8>, set2: Vec<u8>) -> Result<Self, BadSequence> {
         if let Some(fallback) = set2.last().copied() {
             Ok(Self {
                 translation_map: set1
@@ -417,18 +417,17 @@ pub enum TranslateOperation {
 }
 
 impl TranslateOperation {
-    fn next_complement_char(iter: u32, ignore_list: &[char]) -> (u32, char) {
+    fn next_complement_char(iter: u8, ignore_list: &[u8]) -> (u8, u8) {
         (iter..)
-            .filter_map(std::char::from_u32)
-            .filter(|c| !ignore_list.iter().any(|s| s.eq(c)))
-            .map(|c| (u32::from(c) + 1, c))
+            .filter(|c| !ignore_list.iter().any(|s| s == c))
+            .map(|c| (c + 1, c))
             .next()
             .expect("exhausted all possible characters")
     }
 }
 
 impl TranslateOperation {
-    pub fn new(set1: Vec<char>, set2: Vec<char>, complement: bool) -> Result<Self, BadSequence> {
+    pub fn new(set1: Vec<u8>, set2: Vec<u8>, complement: bool) -> Result<Self, BadSequence> {
         if complement {
             Ok(Self::Complement(TranslateOperationComplement::new(
                 set1, set2,
@@ -440,7 +439,7 @@ impl TranslateOperation {
 }
 
 impl SymbolTranslator for TranslateOperation {
-    fn translate(&mut self, current: char) -> Option<char> {
+    fn translate(&mut self, current: u8) -> Option<u8> {
         match self {
             Self::Standard(TranslateOperationStandard { translation_map }) => Some(
                 translation_map
@@ -482,13 +481,13 @@ impl SymbolTranslator for TranslateOperation {
 
 #[derive(Debug, Clone)]
 pub struct SqueezeOperation {
-    set1: HashSet<char>,
+    set1: HashSet<u8>,
     complement: bool,
-    previous: Option<char>,
+    previous: Option<u8>,
 }
 
 impl SqueezeOperation {
-    pub fn new(set1: Vec<char>, complement: bool) -> Self {
+    pub fn new(set1: Vec<u8>, complement: bool) -> Self {
         Self {
             set1: set1.into_iter().collect(),
             complement,
@@ -498,7 +497,7 @@ impl SqueezeOperation {
 }
 
 impl SymbolTranslator for SqueezeOperation {
-    fn translate(&mut self, current: char) -> Option<char> {
+    fn translate(&mut self, current: u8) -> Option<u8> {
         if self.complement {
             let next = if self.set1.contains(&current) {
                 Some(current)
@@ -537,15 +536,15 @@ where
     R: BufRead,
     W: Write,
 {
-    let mut buf = String::new();
-    let mut output_buf = String::new();
-    while let Ok(length) = input.read_line(&mut buf) {
+    let mut buf = Vec::new();
+    let mut output_buf = Vec::new();
+    while let Ok(length) = input.read_until(b'\n', &mut buf) {
         if length == 0 {
             break;
         } else {
-            let filtered = buf.chars().filter_map(|c| translator.translate(c));
+            let filtered = buf.iter().filter_map(|c| translator.translate(*c));
             output_buf.extend(filtered);
-            output.write_all(output_buf.as_bytes()).unwrap();
+            output.write_all(&output_buf).unwrap();
         }
         buf.clear();
         output_buf.clear();
diff --git a/src/uu/tr/src/tr.rs b/src/uu/tr/src/tr.rs
index 9c6e7a7da58..4fddf8d50af 100644
--- a/src/uu/tr/src/tr.rs
+++ b/src/uu/tr/src/tr.rs
@@ -5,7 +5,6 @@
 
 // spell-checker:ignore (ToDO) allocs bset dflag cflag sflag tflag
 
-mod convert;
 mod operation;
 mod unicode_table;
 
@@ -42,14 +41,15 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let squeeze_flag = matches.get_flag(options::SQUEEZE);
     let truncate_set1_flag = matches.get_flag(options::TRUNCATE_SET1);
 
-    let sets = matches
+    // Ultimately this should be OsString, but we might want to wait for the
+    // pattern API on OsStr
+    let sets: Vec<_> = matches
         .get_many::<String>(options::SETS)
-        .map(|v| {
-            v.map(ToString::to_string)
-                .map(|input| convert::reduce_octal_to_char(&input))
-                .collect::<Vec<_>>()
-        })
-        .unwrap_or_default();
+        .into_iter()
+        .flatten()
+        .map(ToOwned::to_owned)
+        .collect();
+
     let sets_len = sets.len();
 
     if sets.is_empty() {
@@ -80,8 +80,8 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     let mut sets_iter = sets.iter().map(|c| c.as_str());
     let (set1, set2) = Sequence::solve_set_characters(
-        sets_iter.next().unwrap_or_default(),
-        sets_iter.next().unwrap_or_default(),
+        sets_iter.next().unwrap_or_default().as_bytes(),
+        sets_iter.next().unwrap_or_default().as_bytes(),
         truncate_set1_flag,
     )?;
 
diff --git a/src/uu/tr/src/unicode_table.rs b/src/uu/tr/src/unicode_table.rs
index a00a30b8bee..5d31ab37569 100644
--- a/src/uu/tr/src/unicode_table.rs
+++ b/src/uu/tr/src/unicode_table.rs
@@ -3,13 +3,13 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-pub static BEL: char = '\u{0007}';
-pub static BS: char = '\u{0008}';
-pub static HT: char = '\u{0009}';
-pub static LF: char = '\u{000A}';
-pub static VT: char = '\u{000B}';
-pub static FF: char = '\u{000C}';
-pub static CR: char = '\u{000D}';
-pub static SPACE: char = '\u{0020}';
-pub static SPACES: &[char] = &[HT, LF, VT, FF, CR, SPACE];
-pub static BLANK: &[char] = &[SPACE, HT];
+pub static BEL: u8 = 0x7;
+pub static BS: u8 = 0x8;
+pub static HT: u8 = 0x9;
+pub static LF: u8 = 0xA;
+pub static VT: u8 = 0xB;
+pub static FF: u8 = 0xC;
+pub static CR: u8 = 0xD;
+pub static SPACE: u8 = 0x20;
+pub static SPACES: &[u8] = &[HT, LF, VT, FF, CR, SPACE];
+pub static BLANK: &[u8] = &[SPACE, HT];
diff --git a/tests/by-util/test_tr.rs b/tests/by-util/test_tr.rs
index 7c475a492ef..01d062cab7b 100644
--- a/tests/by-util/test_tr.rs
+++ b/tests/by-util/test_tr.rs
@@ -29,12 +29,12 @@ fn test_small_set2() {
 }
 
 #[test]
-fn test_unicode() {
+fn test_invalid_unicode() {
     new_ucmd!()
-        .args(&[", ┬─┬", "╯︵┻━┻"])
-        .pipe_in("(,°□°）, ┬─┬")
-        .run()
-        .stdout_is("(╯°□°）╯︵┻━┻");
+        .args(&["-dc", "abc"])
+        .pipe_in([0o200, b'a', b'b', b'c'])
+        .succeeds()
+        .stdout_is("abc");
 }
 
 #[test]
@@ -733,10 +733,11 @@ fn check_against_gnu_tr_tests_w() {
     //  {IN=>"\300\301\377\345\345\350\345"},
     //  {OUT=>"\300\301\377\345"}],
     new_ucmd!()
-        .args(&["-ds", "\u{350}", "\u{345}"])
-        .pipe_in("\u{300}\u{301}\u{377}\u{345}\u{345}\u{350}\u{345}")
+        .arg("-ds")
+        .args(&["\\350", "\\345"])
+        .pipe_in([0o300, 0o301, 0o377, 0o345, 0o345, 0o350, 0o345])
         .succeeds()
-        .stdout_is("\u{300}\u{301}\u{377}\u{345}");
+        .stdout_is_bytes([0o300, 0o301, 0o377, 0o345]);
 }
 
 #[test]

From f165c8e1fd9655737e4d78a9d656927e6b32ad38 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 11 Dec 2023 13:40:55 +0100
Subject: [PATCH 167/429] fuzz/echo: set should_pass to true

---
 .github/workflows/fuzzing.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/fuzzing.yml b/.github/workflows/fuzzing.yml
index eed2ae2fc99..dcf08dba5cf 100644
--- a/.github/workflows/fuzzing.yml
+++ b/.github/workflows/fuzzing.yml
@@ -46,7 +46,7 @@ jobs:
           - { name: fuzz_date, should_pass: false }
           - { name: fuzz_expr, should_pass: true }
           - { name: fuzz_printf, should_pass: false }
-          - { name: fuzz_echo, should_pass: false }
+          - { name: fuzz_echo, should_pass: true }
           - { name: fuzz_seq, should_pass: false }
           - { name: fuzz_parse_glob, should_pass: true }
           - { name: fuzz_parse_size, should_pass: true }

From 6711dd569480c63ed1c6acb9de59b360a665a84c Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 11 Dec 2023 16:38:55 +0100
Subject: [PATCH 168/429] ls: make --block-size and --human-readable/--si

override each other
---
 src/uu/ls/src/ls.rs      |  6 +++--
 tests/by-util/test_ls.rs | 50 ++++++++++++++++++++++++++++++++++++++++
 2 files changed, 54 insertions(+), 2 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index a5fe3d6246d..2aa4bad067b 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -1552,7 +1552,7 @@ pub fn uu_app() -> Command {
                 .short('h')
                 .long(options::size::HUMAN_READABLE)
                 .help("Print human readable file sizes (e.g. 1K 234M 56G).")
-                .overrides_with(options::size::SI)
+                .overrides_with_all([options::size::BLOCK_SIZE, options::size::SI])
                 .action(ArgAction::SetTrue),
         )
         .arg(
@@ -1569,6 +1569,7 @@ pub fn uu_app() -> Command {
             Arg::new(options::size::SI)
                 .long(options::size::SI)
                 .help("Print human readable file sizes using powers of 1000 instead of 1024.")
+                .overrides_with_all([options::size::BLOCK_SIZE, options::size::HUMAN_READABLE])
                 .action(ArgAction::SetTrue),
         )
         .arg(
@@ -1576,7 +1577,8 @@ pub fn uu_app() -> Command {
                 .long(options::size::BLOCK_SIZE)
                 .require_equals(true)
                 .value_name("BLOCK_SIZE")
-                .help("scale sizes by BLOCK_SIZE when printing them"),
+                .help("scale sizes by BLOCK_SIZE when printing them")
+                .overrides_with_all([options::size::SI, options::size::HUMAN_READABLE]),
         )
         .arg(
             Arg::new(options::INODE)
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index c9f43028c9c..179941e7878 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -3874,6 +3874,56 @@ fn test_ls_invalid_block_size() {
         .stderr_is("ls: invalid --block-size argument 'invalid'\n");
 }
 
+#[cfg(all(unix, feature = "dd"))]
+#[test]
+fn test_ls_block_size_override() {
+    let scene = TestScenario::new(util_name!());
+
+    scene
+        .ccmd("dd")
+        .arg("if=/dev/zero")
+        .arg("of=file")
+        .arg("bs=1024")
+        .arg("count=1")
+        .succeeds();
+
+    // --si "wins"
+    scene
+        .ucmd()
+        .arg("-s")
+        .arg("--block-size=512")
+        .arg("--si")
+        .succeeds()
+        .stdout_contains_line("total 4.1k");
+
+    // --block-size "wins"
+    scene
+        .ucmd()
+        .arg("-s")
+        .arg("--si")
+        .arg("--block-size=512")
+        .succeeds()
+        .stdout_contains_line("total 8");
+
+    // --human-readable "wins"
+    scene
+        .ucmd()
+        .arg("-s")
+        .arg("--block-size=512")
+        .arg("--human-readable")
+        .succeeds()
+        .stdout_contains_line("total 4.0K");
+
+    // --block-size "wins"
+    scene
+        .ucmd()
+        .arg("-s")
+        .arg("--human-readable")
+        .arg("--block-size=512")
+        .succeeds()
+        .stdout_contains_line("total 8");
+}
+
 #[test]
 fn test_ls_hyperlink() {
     let scene = TestScenario::new(util_name!());

From d239b2f47b9a690905b60a51be5e4805e79af581 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Sun, 3 Dec 2023 09:41:03 +0100
Subject: [PATCH 169/429] chroot: add OpenBSD support for set_groups function

---
 src/uu/chroot/src/chroot.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/chroot/src/chroot.rs b/src/uu/chroot/src/chroot.rs
index 6366775c36d..b0469ae0451 100644
--- a/src/uu/chroot/src/chroot.rs
+++ b/src/uu/chroot/src/chroot.rs
@@ -253,7 +253,7 @@ fn set_main_group(group: &str) -> UResult<()> {
     Ok(())
 }
 
-#[cfg(any(target_vendor = "apple", target_os = "freebsd"))]
+#[cfg(any(target_vendor = "apple", target_os = "freebsd", target_os = "openbsd"))]
 fn set_groups(groups: &[libc::gid_t]) -> libc::c_int {
     unsafe { setgroups(groups.len() as libc::c_int, groups.as_ptr()) }
 }

From 94537d3b34d5bf5979c0953f281684786009deb9 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Sun, 3 Dec 2023 09:42:27 +0100
Subject: [PATCH 170/429] id: fix support for OpenBSD

  - add target_os cfg for pline function
  - add target_os cfg for auditd function (void on OpenBSD)
---
 src/uu/id/src/id.rs | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/src/uu/id/src/id.rs b/src/uu/id/src/id.rs
index 8b16ba8b733..b8fb51d79db 100644
--- a/src/uu/id/src/id.rs
+++ b/src/uu/id/src/id.rs
@@ -507,7 +507,7 @@ fn pline(possible_uid: Option<uid_t>) {
     );
 }
 
-#[cfg(any(target_os = "linux", target_os = "android"))]
+#[cfg(any(target_os = "linux", target_os = "android", target_os = "openbsd"))]
 fn pline(possible_uid: Option<uid_t>) {
     let uid = possible_uid.unwrap_or_else(getuid);
     let pw = Passwd::locate(uid).unwrap();
@@ -524,10 +524,10 @@ fn pline(possible_uid: Option<uid_t>) {
     );
 }
 
-#[cfg(any(target_os = "linux", target_os = "android"))]
+#[cfg(any(target_os = "linux", target_os = "android", target_os = "openbsd"))]
 fn auditid() {}
 
-#[cfg(not(any(target_os = "linux", target_os = "android")))]
+#[cfg(not(any(target_os = "linux", target_os = "android", target_os = "openbsd")))]
 fn auditid() {
     use std::mem::MaybeUninit;
 
@@ -624,7 +624,7 @@ fn id_print(state: &State, groups: &[u32]) {
     }
 }
 
-#[cfg(not(any(target_os = "linux", target_os = "android")))]
+#[cfg(not(any(target_os = "linux", target_os = "android", target_os = "openbsd")))]
 mod audit {
     use super::libc::{c_int, c_uint, dev_t, pid_t, uid_t};
 

From 38ea40d0bf2e0d2632a1f0b0c3a428f5c7b40d9c Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Sun, 3 Dec 2023 09:44:19 +0100
Subject: [PATCH 171/429] nohup: fix for OpenBSD with
 _vprocmgr_detach_from_console function

---
 src/uu/nohup/src/nohup.rs | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/src/uu/nohup/src/nohup.rs b/src/uu/nohup/src/nohup.rs
index c64f7bf71ba..a93f1ba7024 100644
--- a/src/uu/nohup/src/nohup.rs
+++ b/src/uu/nohup/src/nohup.rs
@@ -200,7 +200,12 @@ extern "C" {
     fn _vprocmgr_detach_from_console(flags: u32) -> *const libc::c_int;
 }
 
-#[cfg(any(target_os = "linux", target_os = "android", target_os = "freebsd"))]
+#[cfg(any(
+    target_os = "linux",
+    target_os = "android",
+    target_os = "freebsd",
+    target_os = "openbsd"
+))]
 unsafe fn _vprocmgr_detach_from_console(_: u32) -> *const libc::c_int {
     std::ptr::null()
 }

From e6d12732f517db75df728ea47b4340609438eb11 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Mon, 4 Dec 2023 18:53:04 +0100
Subject: [PATCH 172/429] uucore: disable utmpx feature on OpenBSD

  - See issue uutils/coreutils#5596 for details
---
 src/uucore/src/lib/features.rs | 1 +
 src/uucore/src/lib/lib.rs      | 1 +
 2 files changed, 2 insertions(+)

diff --git a/src/uucore/src/lib/features.rs b/src/uucore/src/lib/features.rs
index a28e8a7bfc9..e26de487b57 100644
--- a/src/uucore/src/lib/features.rs
+++ b/src/uucore/src/lib/features.rs
@@ -52,6 +52,7 @@ pub mod signals;
     unix,
     not(target_os = "android"),
     not(target_os = "fuchsia"),
+    not(target_os = "openbsd"),
     not(target_os = "redox"),
     not(target_env = "musl"),
     feature = "utmpx"
diff --git a/src/uucore/src/lib/lib.rs b/src/uucore/src/lib/lib.rs
index 426b4216ca2..dcef26443ea 100644
--- a/src/uucore/src/lib/lib.rs
+++ b/src/uucore/src/lib/lib.rs
@@ -79,6 +79,7 @@ pub use crate::features::signals;
     unix,
     not(target_os = "android"),
     not(target_os = "fuchsia"),
+    not(target_os = "openbsd"),
     not(target_os = "redox"),
     not(target_env = "musl"),
     feature = "utmpx"

From d3e6e7a947a3987d66433421716b032ab292fa50 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Sat, 9 Dec 2023 18:31:58 +0100
Subject: [PATCH 173/429] pinky: tool unsupported on OpenBSD

  - utmpx not supported on OpenBSD

  - add src/uu/pinky/src/platform directory and platform/mod.rs for conditional compilation
    according to target_os
  - platform/openbsd.rs: implementation on OpenBSD (unsupported tool)
  - platform/unix.rs: implementation on other OS
  - src/uu/pinky/src/pinky.rs: use platform module for uucore::main function
---
 src/uu/pinky/src/pinky.rs            | 284 +-------------------------
 src/uu/pinky/src/platform/mod.rs     |  14 ++
 src/uu/pinky/src/platform/openbsd.rs |  17 ++
 src/uu/pinky/src/platform/unix.rs    | 293 +++++++++++++++++++++++++++
 4 files changed, 327 insertions(+), 281 deletions(-)
 create mode 100644 src/uu/pinky/src/platform/mod.rs
 create mode 100644 src/uu/pinky/src/platform/openbsd.rs
 create mode 100644 src/uu/pinky/src/platform/unix.rs

diff --git a/src/uu/pinky/src/pinky.rs b/src/uu/pinky/src/pinky.rs
index 8ac8f6c8446..6b393b905d6 100644
--- a/src/uu/pinky/src/pinky.rs
+++ b/src/uu/pinky/src/pinky.rs
@@ -5,21 +5,11 @@
 
 // spell-checker:ignore (ToDO) BUFSIZE gecos fullname, mesg iobuf
 
-use uucore::entries::{Locate, Passwd};
-use uucore::error::{FromIo, UResult};
-use uucore::libc::S_IWGRP;
-use uucore::utmpx::{self, time, Utmpx};
-
-use std::io::prelude::*;
-use std::io::BufReader;
-
-use std::fs::File;
-use std::os::unix::fs::MetadataExt;
-
 use clap::{crate_version, Arg, ArgAction, Command};
-use std::path::PathBuf;
 use uucore::{format_usage, help_about, help_usage};
 
+mod platform;
+
 const ABOUT: &str = help_about!("pinky.md");
 const USAGE: &str = help_usage!("pinky.md");
 
@@ -37,88 +27,8 @@ mod options {
     pub const HELP: &str = "help";
 }
 
-fn get_long_usage() -> String {
-    format!(
-        "A lightweight 'finger' program;  print user information.\n\
-         The utmp file will be {}.",
-        utmpx::DEFAULT_FILE
-    )
-}
-
 #[uucore::main]
-pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
-    let matches = uu_app()
-        .after_help(get_long_usage())
-        .try_get_matches_from(args)?;
-
-    let users: Vec<String> = matches
-        .get_many::<String>(options::USER)
-        .map(|v| v.map(ToString::to_string).collect())
-        .unwrap_or_default();
-
-    // If true, display the hours:minutes since each user has touched
-    // the keyboard, or blank if within the last minute, or days followed
-    // by a 'd' if not within the last day.
-    let mut include_idle = true;
-
-    // If true, display a line at the top describing each field.
-    let include_heading = !matches.get_flag(options::OMIT_HEADINGS);
-
-    // if true, display the user's full name from pw_gecos.
-    let mut include_fullname = true;
-
-    // if true, display the user's ~/.project file when doing long format.
-    let include_project = !matches.get_flag(options::OMIT_PROJECT_FILE);
-
-    // if true, display the user's ~/.plan file when doing long format.
-    let include_plan = !matches.get_flag(options::OMIT_PLAN_FILE);
-
-    // if true, display the user's home directory and shell
-    // when doing long format.
-    let include_home_and_shell = !matches.get_flag(options::OMIT_HOME_DIR);
-
-    // if true, use the "short" output format.
-    let do_short_format = !matches.get_flag(options::LONG_FORMAT);
-
-    /* if true, display the ut_host field. */
-    let mut include_where = true;
-
-    if matches.get_flag(options::OMIT_NAME) {
-        include_fullname = false;
-    }
-    if matches.get_flag(options::OMIT_NAME_HOST) {
-        include_fullname = false;
-        include_where = false;
-    }
-    if matches.get_flag(options::OMIT_NAME_HOST_TIME) {
-        include_fullname = false;
-        include_idle = false;
-        include_where = false;
-    }
-
-    let pk = Pinky {
-        include_idle,
-        include_heading,
-        include_fullname,
-        include_project,
-        include_plan,
-        include_home_and_shell,
-        include_where,
-        names: users,
-    };
-
-    if do_short_format {
-        match pk.short_pinky() {
-            Ok(_) => Ok(()),
-            Err(e) => Err(e.map_err_context(String::new)),
-        }
-    } else {
-        pk.long_pinky();
-        Ok(())
-    }
-}
+use platform::uumain;
 
 pub fn uu_app() -> Command {
     Command::new(uucore::util_name())
@@ -197,17 +107,6 @@ pub fn uu_app() -> Command {
         )
 }
 
-struct Pinky {
-    include_idle: bool,
-    include_heading: bool,
-    include_fullname: bool,
-    include_project: bool,
-    include_plan: bool,
-    include_where: bool,
-    include_home_and_shell: bool,
-    names: Vec<String>,
-}
-
 pub trait Capitalize {
     fn capitalize(&self) -> String;
 }
@@ -225,180 +124,3 @@ impl Capitalize for str {
             })
     }
 }
-
-fn idle_string(when: i64) -> String {
-    thread_local! {
-        static NOW: time::OffsetDateTime = time::OffsetDateTime::now_local().unwrap();
-    }
-    NOW.with(|n| {
-        let duration = n.unix_timestamp() - when;
-        if duration < 60 {
-            // less than 1min
-            "     ".to_owned()
-        } else if duration < 24 * 3600 {
-            // less than 1day
-            let hours = duration / (60 * 60);
-            let minutes = (duration % (60 * 60)) / 60;
-            format!("{hours:02}:{minutes:02}")
-        } else {
-            // more than 1day
-            let days = duration / (24 * 3600);
-            format!("{days}d")
-        }
-    })
-}
-
-fn time_string(ut: &Utmpx) -> String {
-    // "%b %e %H:%M"
-    let time_format: Vec<time::format_description::FormatItem> =
-        time::format_description::parse("[month repr:short] [day padding:space] [hour]:[minute]")
-            .unwrap();
-    ut.login_time().format(&time_format).unwrap() // LC_ALL=C
-}
-
-fn gecos_to_fullname(pw: &Passwd) -> Option<String> {
-    let mut gecos = if let Some(gecos) = &pw.user_info {
-        gecos.clone()
-    } else {
-        return None;
-    };
-    if let Some(n) = gecos.find(',') {
-        gecos.truncate(n);
-    }
-    Some(gecos.replace('&', &pw.name.capitalize()))
-}
-
-impl Pinky {
-    fn print_entry(&self, ut: &Utmpx) -> std::io::Result<()> {
-        let mut pts_path = PathBuf::from("/dev");
-        pts_path.push(ut.tty_device().as_str());
-
-        let mesg;
-        let last_change;
-
-        match pts_path.metadata() {
-            #[allow(clippy::unnecessary_cast)]
-            Ok(meta) => {
-                mesg = if meta.mode() & S_IWGRP as u32 == 0 {
-                    '*'
-                } else {
-                    ' '
-                };
-                last_change = meta.atime();
-            }
-            _ => {
-                mesg = '?';
-                last_change = 0;
-            }
-        }
-
-        print!("{1:<8.0$}", utmpx::UT_NAMESIZE, ut.user());
-
-        if self.include_fullname {
-            let fullname = if let Ok(pw) = Passwd::locate(ut.user().as_ref()) {
-                gecos_to_fullname(&pw)
-            } else {
-                None
-            };
-            if let Some(fullname) = fullname {
-                print!(" {fullname:<19.19}");
-            } else {
-                print!(" {:19}", "        ???");
-            }
-        }
-
-        print!(" {}{:<8.*}", mesg, utmpx::UT_LINESIZE, ut.tty_device());
-
-        if self.include_idle {
-            if last_change == 0 {
-                print!(" {:<6}", "?????");
-            } else {
-                print!(" {:<6}", idle_string(last_change));
-            }
-        }
-
-        print!(" {}", time_string(ut));
-
-        let mut s = ut.host();
-        if self.include_where && !s.is_empty() {
-            s = ut.canon_host()?;
-            print!(" {s}");
-        }
-
-        println!();
-        Ok(())
-    }
-
-    fn print_heading(&self) {
-        print!("{:<8}", "Login");
-        if self.include_fullname {
-            print!(" {:<19}", "Name");
-        }
-        print!(" {:<9}", " TTY");
-        if self.include_idle {
-            print!(" {:<6}", "Idle");
-        }
-        print!(" {:<16}", "When");
-        if self.include_where {
-            print!(" Where");
-        }
-        println!();
-    }
-
-    fn short_pinky(&self) -> std::io::Result<()> {
-        if self.include_heading {
-            self.print_heading();
-        }
-        for ut in Utmpx::iter_all_records() {
-            if ut.is_user_process()
-                && (self.names.is_empty() || self.names.iter().any(|n| n.as_str() == ut.user()))
-            {
-                self.print_entry(&ut)?;
-            }
-        }
-        Ok(())
-    }
-
-    fn long_pinky(&self) {
-        for u in &self.names {
-            print!("Login name: {u:<28}In real life: ");
-            if let Ok(pw) = Passwd::locate(u.as_str()) {
-                let fullname = gecos_to_fullname(&pw).unwrap_or_default();
-                let user_dir = pw.user_dir.unwrap_or_default();
-                let user_shell = pw.user_shell.unwrap_or_default();
-                println!(" {fullname}");
-                if self.include_home_and_shell {
-                    print!("Directory: {user_dir:<29}");
-                    println!("Shell:  {user_shell}");
-                }
-                if self.include_project {
-                    let mut p = PathBuf::from(&user_dir);
-                    p.push(".project");
-                    if let Ok(f) = File::open(p) {
-                        print!("Project: ");
-                        read_to_console(f);
-                    }
-                }
-                if self.include_plan {
-                    let mut p = PathBuf::from(&user_dir);
-                    p.push(".plan");
-                    if let Ok(f) = File::open(p) {
-                        println!("Plan:");
-                        read_to_console(f);
-                    }
-                }
-                println!();
-            } else {
-                println!(" ???");
-            }
-        }
-    }
-}
-
-fn read_to_console<F: Read>(f: F) {
-    let mut reader = BufReader::new(f);
-    let mut iobuf = Vec::new();
-    if reader.read_to_end(&mut iobuf).is_ok() {
-        print!("{}", String::from_utf8_lossy(&iobuf));
-    }
-}
diff --git a/src/uu/pinky/src/platform/mod.rs b/src/uu/pinky/src/platform/mod.rs
new file mode 100644
index 00000000000..e0e87dca1bf
--- /dev/null
+++ b/src/uu/pinky/src/platform/mod.rs
@@ -0,0 +1,14 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+#[cfg(not(target_os = "openbsd"))]
+mod unix;
+#[cfg(not(target_os = "openbsd"))]
+pub use self::unix::*;
+
+#[cfg(target_os = "openbsd")]
+mod openbsd;
+#[cfg(target_os = "openbsd")]
+pub use self::openbsd::*;
diff --git a/src/uu/pinky/src/platform/openbsd.rs b/src/uu/pinky/src/platform/openbsd.rs
new file mode 100644
index 00000000000..7e6970c1f09
--- /dev/null
+++ b/src/uu/pinky/src/platform/openbsd.rs
@@ -0,0 +1,17 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+// Specific implementation for OpenBSD: tool unsupported (utmpx not supported)
+
+use crate::uu_app;
+
+use uucore::error::UResult;
+
+pub fn uumain(args: impl uucore::Args) -> UResult<()> {
+    let _matches = uu_app().try_get_matches_from(args)?;
+
+    println!("unsupported command on OpenBSD");
+    Ok(())
+}
diff --git a/src/uu/pinky/src/platform/unix.rs b/src/uu/pinky/src/platform/unix.rs
new file mode 100644
index 00000000000..381acacd2f6
--- /dev/null
+++ b/src/uu/pinky/src/platform/unix.rs
@@ -0,0 +1,293 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+// spell-checker:ignore (ToDO) BUFSIZE gecos fullname, mesg iobuf
+
+use crate::options;
+use crate::uu_app;
+use crate::Capitalize;
+
+use uucore::entries::{Locate, Passwd};
+use uucore::error::{FromIo, UResult};
+use uucore::libc::S_IWGRP;
+use uucore::utmpx::{self, time, Utmpx};
+
+use std::io::prelude::*;
+use std::io::BufReader;
+
+use std::fs::File;
+use std::os::unix::fs::MetadataExt;
+
+use std::path::PathBuf;
+
+fn get_long_usage() -> String {
+    format!(
+        "A lightweight 'finger' program;  print user information.\n\
+         The utmp file will be {}.",
+        utmpx::DEFAULT_FILE
+    )
+}
+
+pub fn uumain(args: impl uucore::Args) -> UResult<()> {
+    let args = args.collect_ignore();
+
+    let matches = uu_app()
+        .after_help(get_long_usage())
+        .try_get_matches_from(args)?;
+
+    let users: Vec<String> = matches
+        .get_many::<String>(options::USER)
+        .map(|v| v.map(ToString::to_string).collect())
+        .unwrap_or_default();
+
+    // If true, display the hours:minutes since each user has touched
+    // the keyboard, or blank if within the last minute, or days followed
+    // by a 'd' if not within the last day.
+    let mut include_idle = true;
+
+    // If true, display a line at the top describing each field.
+    let include_heading = !matches.get_flag(options::OMIT_HEADINGS);
+
+    // if true, display the user's full name from pw_gecos.
+    let mut include_fullname = true;
+
+    // if true, display the user's ~/.project file when doing long format.
+    let include_project = !matches.get_flag(options::OMIT_PROJECT_FILE);
+
+    // if true, display the user's ~/.plan file when doing long format.
+    let include_plan = !matches.get_flag(options::OMIT_PLAN_FILE);
+
+    // if true, display the user's home directory and shell
+    // when doing long format.
+    let include_home_and_shell = !matches.get_flag(options::OMIT_HOME_DIR);
+
+    // if true, use the "short" output format.
+    let do_short_format = !matches.get_flag(options::LONG_FORMAT);
+
+    /* if true, display the ut_host field. */
+    let mut include_where = true;
+
+    if matches.get_flag(options::OMIT_NAME) {
+        include_fullname = false;
+    }
+    if matches.get_flag(options::OMIT_NAME_HOST) {
+        include_fullname = false;
+        include_where = false;
+    }
+    if matches.get_flag(options::OMIT_NAME_HOST_TIME) {
+        include_fullname = false;
+        include_idle = false;
+        include_where = false;
+    }
+
+    let pk = Pinky {
+        include_idle,
+        include_heading,
+        include_fullname,
+        include_project,
+        include_plan,
+        include_home_and_shell,
+        include_where,
+        names: users,
+    };
+
+    if do_short_format {
+        match pk.short_pinky() {
+            Ok(_) => Ok(()),
+            Err(e) => Err(e.map_err_context(String::new)),
+        }
+    } else {
+        pk.long_pinky();
+        Ok(())
+    }
+}
+
+struct Pinky {
+    include_idle: bool,
+    include_heading: bool,
+    include_fullname: bool,
+    include_project: bool,
+    include_plan: bool,
+    include_where: bool,
+    include_home_and_shell: bool,
+    names: Vec<String>,
+}
+
+fn idle_string(when: i64) -> String {
+    thread_local! {
+        static NOW: time::OffsetDateTime = time::OffsetDateTime::now_local().unwrap();
+    }
+    NOW.with(|n| {
+        let duration = n.unix_timestamp() - when;
+        if duration < 60 {
+            // less than 1min
+            "     ".to_owned()
+        } else if duration < 24 * 3600 {
+            // less than 1day
+            let hours = duration / (60 * 60);
+            let minutes = (duration % (60 * 60)) / 60;
+            format!("{hours:02}:{minutes:02}")
+        } else {
+            // more than 1day
+            let days = duration / (24 * 3600);
+            format!("{days}d")
+        }
+    })
+}
+
+fn time_string(ut: &Utmpx) -> String {
+    // "%b %e %H:%M"
+    let time_format: Vec<time::format_description::FormatItem> =
+        time::format_description::parse("[month repr:short] [day padding:space] [hour]:[minute]")
+            .unwrap();
+    ut.login_time().format(&time_format).unwrap() // LC_ALL=C
+}
+
+fn gecos_to_fullname(pw: &Passwd) -> Option<String> {
+    let mut gecos = if let Some(gecos) = &pw.user_info {
+        gecos.clone()
+    } else {
+        return None;
+    };
+    if let Some(n) = gecos.find(',') {
+        gecos.truncate(n);
+    }
+    Some(gecos.replace('&', &pw.name.capitalize()))
+}
+
+impl Pinky {
+    fn print_entry(&self, ut: &Utmpx) -> std::io::Result<()> {
+        let mut pts_path = PathBuf::from("/dev");
+        pts_path.push(ut.tty_device().as_str());
+
+        let mesg;
+        let last_change;
+
+        match pts_path.metadata() {
+            #[allow(clippy::unnecessary_cast)]
+            Ok(meta) => {
+                mesg = if meta.mode() & S_IWGRP as u32 == 0 {
+                    '*'
+                } else {
+                    ' '
+                };
+                last_change = meta.atime();
+            }
+            _ => {
+                mesg = '?';
+                last_change = 0;
+            }
+        }
+
+        print!("{1:<8.0$}", utmpx::UT_NAMESIZE, ut.user());
+
+        if self.include_fullname {
+            let fullname = if let Ok(pw) = Passwd::locate(ut.user().as_ref()) {
+                gecos_to_fullname(&pw)
+            } else {
+                None
+            };
+            if let Some(fullname) = fullname {
+                print!(" {fullname:<19.19}");
+            } else {
+                print!(" {:19}", "        ???");
+            }
+        }
+
+        print!(" {}{:<8.*}", mesg, utmpx::UT_LINESIZE, ut.tty_device());
+
+        if self.include_idle {
+            if last_change == 0 {
+                print!(" {:<6}", "?????");
+            } else {
+                print!(" {:<6}", idle_string(last_change));
+            }
+        }
+
+        print!(" {}", time_string(ut));
+
+        let mut s = ut.host();
+        if self.include_where && !s.is_empty() {
+            s = ut.canon_host()?;
+            print!(" {s}");
+        }
+
+        println!();
+        Ok(())
+    }
+
+    fn print_heading(&self) {
+        print!("{:<8}", "Login");
+        if self.include_fullname {
+            print!(" {:<19}", "Name");
+        }
+        print!(" {:<9}", " TTY");
+        if self.include_idle {
+            print!(" {:<6}", "Idle");
+        }
+        print!(" {:<16}", "When");
+        if self.include_where {
+            print!(" Where");
+        }
+        println!();
+    }
+
+    fn short_pinky(&self) -> std::io::Result<()> {
+        if self.include_heading {
+            self.print_heading();
+        }
+        for ut in Utmpx::iter_all_records() {
+            if ut.is_user_process()
+                && (self.names.is_empty() || self.names.iter().any(|n| n.as_str() == ut.user()))
+            {
+                self.print_entry(&ut)?;
+            }
+        }
+        Ok(())
+    }
+
+    fn long_pinky(&self) {
+        for u in &self.names {
+            print!("Login name: {u:<28}In real life: ");
+            if let Ok(pw) = Passwd::locate(u.as_str()) {
+                let fullname = gecos_to_fullname(&pw).unwrap_or_default();
+                let user_dir = pw.user_dir.unwrap_or_default();
+                let user_shell = pw.user_shell.unwrap_or_default();
+                println!(" {fullname}");
+                if self.include_home_and_shell {
+                    print!("Directory: {user_dir:<29}");
+                    println!("Shell:  {user_shell}");
+                }
+                if self.include_project {
+                    let mut p = PathBuf::from(&user_dir);
+                    p.push(".project");
+                    if let Ok(f) = File::open(p) {
+                        print!("Project: ");
+                        read_to_console(f);
+                    }
+                }
+                if self.include_plan {
+                    let mut p = PathBuf::from(&user_dir);
+                    p.push(".plan");
+                    if let Ok(f) = File::open(p) {
+                        println!("Plan:");
+                        read_to_console(f);
+                    }
+                }
+                println!();
+            } else {
+                println!(" ???");
+            }
+        }
+    }
+}
+
+fn read_to_console<F: Read>(f: F) {
+    let mut reader = BufReader::new(f);
+    let mut iobuf = Vec::new();
+    if reader.read_to_end(&mut iobuf).is_ok() {
+        print!("{}", String::from_utf8_lossy(&iobuf));
+    }
+}

From 8c6d72291638bfac7a33c3bdd708a07fb4f74d1e Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Sat, 9 Dec 2023 18:39:10 +0100
Subject: [PATCH 174/429] uptime: tool unsupported on OpenBSD

  - utmpx not supported on OpenBSD

  - add src/uu/uptime/src/platform directory and platform/mod.rs for conditional compilation
    according to target_os
  - platform/openbsd.rs: implementation on OpenBSD (unsupported tool)
  - platform/unix.rs: implementation on other OS
  - src/uu/uptime/src/uptime.rs: use platform module for uucore::main function
---
 src/uu/uptime/src/platform/mod.rs     |  14 +++
 src/uu/uptime/src/platform/openbsd.rs |  17 +++
 src/uu/uptime/src/platform/unix.rs    | 161 ++++++++++++++++++++++++++
 src/uu/uptime/src/uptime.rs           | 152 +-----------------------
 4 files changed, 194 insertions(+), 150 deletions(-)
 create mode 100644 src/uu/uptime/src/platform/mod.rs
 create mode 100644 src/uu/uptime/src/platform/openbsd.rs
 create mode 100644 src/uu/uptime/src/platform/unix.rs

diff --git a/src/uu/uptime/src/platform/mod.rs b/src/uu/uptime/src/platform/mod.rs
new file mode 100644
index 00000000000..e0e87dca1bf
--- /dev/null
+++ b/src/uu/uptime/src/platform/mod.rs
@@ -0,0 +1,14 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+#[cfg(not(target_os = "openbsd"))]
+mod unix;
+#[cfg(not(target_os = "openbsd"))]
+pub use self::unix::*;
+
+#[cfg(target_os = "openbsd")]
+mod openbsd;
+#[cfg(target_os = "openbsd")]
+pub use self::openbsd::*;
diff --git a/src/uu/uptime/src/platform/openbsd.rs b/src/uu/uptime/src/platform/openbsd.rs
new file mode 100644
index 00000000000..7e6970c1f09
--- /dev/null
+++ b/src/uu/uptime/src/platform/openbsd.rs
@@ -0,0 +1,17 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+// Specific implementation for OpenBSD: tool unsupported (utmpx not supported)
+
+use crate::uu_app;
+
+use uucore::error::UResult;
+
+pub fn uumain(args: impl uucore::Args) -> UResult<()> {
+    let _matches = uu_app().try_get_matches_from(args)?;
+
+    println!("unsupported command on OpenBSD");
+    Ok(())
+}
diff --git a/src/uu/uptime/src/platform/unix.rs b/src/uu/uptime/src/platform/unix.rs
new file mode 100644
index 00000000000..df3e5e6536f
--- /dev/null
+++ b/src/uu/uptime/src/platform/unix.rs
@@ -0,0 +1,161 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+// spell-checker:ignore (ToDO) getloadavg upsecs updays nusers loadavg boottime uphours upmins
+
+use crate::options;
+use crate::uu_app;
+
+use chrono::{Local, TimeZone, Utc};
+
+use uucore::libc::time_t;
+
+use uucore::error::{UResult, USimpleError};
+
+#[cfg(unix)]
+use uucore::libc::getloadavg;
+
+#[cfg(windows)]
+extern "C" {
+    fn GetTickCount() -> uucore::libc::uint32_t;
+}
+
+pub fn uumain(args: impl uucore::Args) -> UResult<()> {
+    let matches = uu_app().try_get_matches_from(args)?;
+
+    let (boot_time, user_count) = process_utmpx();
+    let uptime = get_uptime(boot_time);
+    if uptime < 0 {
+        Err(USimpleError::new(1, "could not retrieve system uptime"))
+    } else {
+        if matches.get_flag(options::SINCE) {
+            let initial_date = Local
+                .timestamp_opt(Utc::now().timestamp() - uptime, 0)
+                .unwrap();
+            println!("{}", initial_date.format("%Y-%m-%d %H:%M:%S"));
+            return Ok(());
+        }
+
+        print_time();
+        let upsecs = uptime;
+        print_uptime(upsecs);
+        print_nusers(user_count);
+        print_loadavg();
+
+        Ok(())
+    }
+}
+
+#[cfg(unix)]
+fn print_loadavg() {
+    use uucore::libc::c_double;
+
+    let mut avg: [c_double; 3] = [0.0; 3];
+    let loads: i32 = unsafe { getloadavg(avg.as_mut_ptr(), 3) };
+
+    if loads == -1 {
+        println!();
+    } else {
+        print!("load average: ");
+        for n in 0..loads {
+            print!(
+                "{:.2}{}",
+                avg[n as usize],
+                if n == loads - 1 { "\n" } else { ", " }
+            );
+        }
+    }
+}
+
+#[cfg(windows)]
+fn print_loadavg() {
+    // XXX: currently this is a noop as Windows does not seem to have anything comparable to
+    //      getloadavg()
+}
+
+#[cfg(unix)]
+fn process_utmpx() -> (Option<time_t>, usize) {
+    use uucore::utmpx::*;
+
+    let mut nusers = 0;
+    let mut boot_time = None;
+
+    for line in Utmpx::iter_all_records() {
+        match line.record_type() {
+            USER_PROCESS => nusers += 1,
+            BOOT_TIME => {
+                let dt = line.login_time();
+                if dt.unix_timestamp() > 0 {
+                    boot_time = Some(dt.unix_timestamp() as time_t);
+                }
+            }
+            _ => continue,
+        }
+    }
+    (boot_time, nusers)
+}
+
+#[cfg(windows)]
+fn process_utmpx() -> (Option<time_t>, usize) {
+    (None, 0) // TODO: change 0 to number of users
+}
+
+fn print_nusers(nusers: usize) {
+    match nusers.cmp(&1) {
+        std::cmp::Ordering::Equal => print!("1 user,  "),
+        std::cmp::Ordering::Greater => print!("{nusers} users,  "),
+        _ => {}
+    };
+}
+
+fn print_time() {
+    let local_time = Local::now().time();
+
+    print!(" {} ", local_time.format("%H:%M:%S"));
+}
+
+#[cfg(unix)]
+fn get_uptime(boot_time: Option<time_t>) -> i64 {
+    use std::fs::File;
+    use std::io::Read;
+
+    let mut proc_uptime_s = String::new();
+
+    let proc_uptime = File::open("/proc/uptime")
+        .ok()
+        .and_then(|mut f| f.read_to_string(&mut proc_uptime_s).ok())
+        .and_then(|_| proc_uptime_s.split_whitespace().next())
+        .and_then(|s| s.split('.').next().unwrap_or("0").parse().ok());
+
+    proc_uptime.unwrap_or_else(|| match boot_time {
+        Some(t) => {
+            let now = Local::now().timestamp();
+            #[cfg(target_pointer_width = "64")]
+            let boottime: i64 = t;
+            #[cfg(not(target_pointer_width = "64"))]
+            let boottime: i64 = t.into();
+            now - boottime
+        }
+        None => -1,
+    })
+}
+
+#[cfg(windows)]
+fn get_uptime(_boot_time: Option<time_t>) -> i64 {
+    unsafe { GetTickCount() as i64 }
+}
+
+fn print_uptime(upsecs: i64) {
+    let updays = upsecs / 86400;
+    let uphours = (upsecs - (updays * 86400)) / 3600;
+    let upmins = (upsecs - (updays * 86400) - (uphours * 3600)) / 60;
+    match updays.cmp(&1) {
+        std::cmp::Ordering::Equal => print!("up {updays:1} day, {uphours:2}:{upmins:02},  "),
+        std::cmp::Ordering::Greater => {
+            print!("up {updays:1} days, {uphours:2}:{upmins:02},  ");
+        }
+        _ => print!("up  {uphours:2}:{upmins:02}, "),
+    };
+}
diff --git a/src/uu/uptime/src/uptime.rs b/src/uu/uptime/src/uptime.rs
index 778fbc92047..196ae60bae0 100644
--- a/src/uu/uptime/src/uptime.rs
+++ b/src/uu/uptime/src/uptime.rs
@@ -3,15 +3,11 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-// spell-checker:ignore (ToDO) getloadavg upsecs updays nusers loadavg boottime uphours upmins
-
-use chrono::{Local, TimeZone, Utc};
 use clap::{crate_version, Arg, ArgAction, Command};
 
-use uucore::libc::time_t;
 use uucore::{format_usage, help_about, help_usage};
 
-use uucore::error::{UResult, USimpleError};
+mod platform;
 
 const ABOUT: &str = help_about!("uptime.md");
 const USAGE: &str = help_usage!("uptime.md");
@@ -19,40 +15,8 @@ pub mod options {
     pub static SINCE: &str = "since";
 }
 
-#[cfg(unix)]
-use uucore::libc::getloadavg;
-
-#[cfg(windows)]
-extern "C" {
-    fn GetTickCount() -> uucore::libc::uint32_t;
-}
-
 #[uucore::main]
-pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let matches = uu_app().try_get_matches_from(args)?;
-
-    let (boot_time, user_count) = process_utmpx();
-    let uptime = get_uptime(boot_time);
-    if uptime < 0 {
-        Err(USimpleError::new(1, "could not retrieve system uptime"))
-    } else {
-        if matches.get_flag(options::SINCE) {
-            let initial_date = Local
-                .timestamp_opt(Utc::now().timestamp() - uptime, 0)
-                .unwrap();
-            println!("{}", initial_date.format("%Y-%m-%d %H:%M:%S"));
-            return Ok(());
-        }
-
-        print_time();
-        let upsecs = uptime;
-        print_uptime(upsecs);
-        print_nusers(user_count);
-        print_loadavg();
-
-        Ok(())
-    }
-}
+use platform::uumain;
 
 pub fn uu_app() -> Command {
     Command::new(uucore::util_name())
@@ -68,115 +32,3 @@ pub fn uu_app() -> Command {
                 .action(ArgAction::SetTrue),
         )
 }
-
-#[cfg(unix)]
-fn print_loadavg() {
-    use uucore::libc::c_double;
-
-    let mut avg: [c_double; 3] = [0.0; 3];
-    let loads: i32 = unsafe { getloadavg(avg.as_mut_ptr(), 3) };
-
-    if loads == -1 {
-        println!();
-    } else {
-        print!("load average: ");
-        for n in 0..loads {
-            print!(
-                "{:.2}{}",
-                avg[n as usize],
-                if n == loads - 1 { "\n" } else { ", " }
-            );
-        }
-    }
-}
-
-#[cfg(windows)]
-fn print_loadavg() {
-    // XXX: currently this is a noop as Windows does not seem to have anything comparable to
-    //      getloadavg()
-}
-
-#[cfg(unix)]
-fn process_utmpx() -> (Option<time_t>, usize) {
-    use uucore::utmpx::*;
-
-    let mut nusers = 0;
-    let mut boot_time = None;
-
-    for line in Utmpx::iter_all_records() {
-        match line.record_type() {
-            USER_PROCESS => nusers += 1,
-            BOOT_TIME => {
-                let dt = line.login_time();
-                if dt.unix_timestamp() > 0 {
-                    boot_time = Some(dt.unix_timestamp() as time_t);
-                }
-            }
-            _ => continue,
-        }
-    }
-    (boot_time, nusers)
-}
-
-#[cfg(windows)]
-fn process_utmpx() -> (Option<time_t>, usize) {
-    (None, 0) // TODO: change 0 to number of users
-}
-
-fn print_nusers(nusers: usize) {
-    match nusers.cmp(&1) {
-        std::cmp::Ordering::Equal => print!("1 user,  "),
-        std::cmp::Ordering::Greater => print!("{nusers} users,  "),
-        _ => {}
-    };
-}
-
-fn print_time() {
-    let local_time = Local::now().time();
-
-    print!(" {} ", local_time.format("%H:%M:%S"));
-}
-
-#[cfg(unix)]
-fn get_uptime(boot_time: Option<time_t>) -> i64 {
-    use std::fs::File;
-    use std::io::Read;
-
-    let mut proc_uptime_s = String::new();
-
-    let proc_uptime = File::open("/proc/uptime")
-        .ok()
-        .and_then(|mut f| f.read_to_string(&mut proc_uptime_s).ok())
-        .and_then(|_| proc_uptime_s.split_whitespace().next())
-        .and_then(|s| s.split('.').next().unwrap_or("0").parse().ok());
-
-    proc_uptime.unwrap_or_else(|| match boot_time {
-        Some(t) => {
-            let now = Local::now().timestamp();
-            #[cfg(target_pointer_width = "64")]
-            let boottime: i64 = t;
-            #[cfg(not(target_pointer_width = "64"))]
-            let boottime: i64 = t.into();
-            now - boottime
-        }
-        None => -1,
-    })
-}
-
-#[cfg(windows)]
-fn get_uptime(_boot_time: Option<time_t>) -> i64 {
-    unsafe { GetTickCount() as i64 }
-}
-
-fn print_uptime(upsecs: i64) {
-    let updays = upsecs / 86400;
-    let uphours = (upsecs - (updays * 86400)) / 3600;
-    let upmins = (upsecs - (updays * 86400) - (uphours * 3600)) / 60;
-    match updays.cmp(&1) {
-        std::cmp::Ordering::Equal => print!("up {updays:1} day, {uphours:2}:{upmins:02},  "),
-        std::cmp::Ordering::Greater => {
-            print!("up {updays:1} days, {uphours:2}:{upmins:02},  ");
-        }
-        _ => print!("up  {uphours:2}:{upmins:02}, "),
-    };
-}

From fdd6ecb71321a64a5debba8085503c26ee29b1da Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Sat, 9 Dec 2023 18:41:10 +0100
Subject: [PATCH 175/429] users: tool unsupported on OpenBSD

  - utmpx not supported on OpenBSD

  - add src/uu/users/src/platform directory and platform/mod.rs for conditional compilation
    according to target_os
  - platform/openbsd.rs: implementation on OpenBSD (unsupported tool)
  - platform/unix.rs: implementation on other OS
  - src/uu/users/src/users.rs: use platform module for uucore::main function
---
 src/uu/users/src/platform/mod.rs     | 14 ++++++++
 src/uu/users/src/platform/openbsd.rs | 17 +++++++++
 src/uu/users/src/platform/unix.rs    | 53 ++++++++++++++++++++++++++++
 src/uu/users/src/users.rs            | 44 ++---------------------
 4 files changed, 87 insertions(+), 41 deletions(-)
 create mode 100644 src/uu/users/src/platform/mod.rs
 create mode 100644 src/uu/users/src/platform/openbsd.rs
 create mode 100644 src/uu/users/src/platform/unix.rs

diff --git a/src/uu/users/src/platform/mod.rs b/src/uu/users/src/platform/mod.rs
new file mode 100644
index 00000000000..e0e87dca1bf
--- /dev/null
+++ b/src/uu/users/src/platform/mod.rs
@@ -0,0 +1,14 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+#[cfg(not(target_os = "openbsd"))]
+mod unix;
+#[cfg(not(target_os = "openbsd"))]
+pub use self::unix::*;
+
+#[cfg(target_os = "openbsd")]
+mod openbsd;
+#[cfg(target_os = "openbsd")]
+pub use self::openbsd::*;
diff --git a/src/uu/users/src/platform/openbsd.rs b/src/uu/users/src/platform/openbsd.rs
new file mode 100644
index 00000000000..7e6970c1f09
--- /dev/null
+++ b/src/uu/users/src/platform/openbsd.rs
@@ -0,0 +1,17 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+// Specific implementation for OpenBSD: tool unsupported (utmpx not supported)
+
+use crate::uu_app;
+
+use uucore::error::UResult;
+
+pub fn uumain(args: impl uucore::Args) -> UResult<()> {
+    let _matches = uu_app().try_get_matches_from(args)?;
+
+    println!("unsupported command on OpenBSD");
+    Ok(())
+}
diff --git a/src/uu/users/src/platform/unix.rs b/src/uu/users/src/platform/unix.rs
new file mode 100644
index 00000000000..99c9ce776bb
--- /dev/null
+++ b/src/uu/users/src/platform/unix.rs
@@ -0,0 +1,53 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+// spell-checker:ignore (paths) wtmp
+
+use crate::uu_app;
+
+use std::ffi::OsString;
+use std::path::Path;
+
+use uucore::error::UResult;
+use uucore::utmpx::{self, Utmpx};
+
+static ARG_FILES: &str = "files";
+
+fn get_long_usage() -> String {
+    format!(
+        "Output who is currently logged in according to FILE.
+If FILE is not specified, use {}.  /var/log/wtmp as FILE is common.",
+        utmpx::DEFAULT_FILE
+    )
+}
+
+pub fn uumain(args: impl uucore::Args) -> UResult<()> {
+    let matches = uu_app()
+        .after_help(get_long_usage())
+        .try_get_matches_from(args)?;
+
+    let files: Vec<&Path> = matches
+        .get_many::<OsString>(ARG_FILES)
+        .map(|v| v.map(AsRef::as_ref).collect())
+        .unwrap_or_default();
+
+    let filename = if files.is_empty() {
+        utmpx::DEFAULT_FILE.as_ref()
+    } else {
+        files[0]
+    };
+
+    let mut users = Utmpx::iter_all_records_from(filename)
+        .filter(Utmpx::is_user_process)
+        .map(|ut| ut.user())
+        .collect::<Vec<_>>();
+
+    if !users.is_empty() {
+        users.sort();
+        println!("{}", users.join(" "));
+    }
+
+    Ok(())
+}
diff --git a/src/uu/users/src/users.rs b/src/uu/users/src/users.rs
index 199882b7eab..d299399f311 100644
--- a/src/uu/users/src/users.rs
+++ b/src/uu/users/src/users.rs
@@ -5,57 +5,19 @@
 
 // spell-checker:ignore (paths) wtmp
 
-use std::ffi::OsString;
-use std::path::Path;
-
 use clap::builder::ValueParser;
 use clap::{crate_version, Arg, Command};
-use uucore::error::UResult;
-use uucore::utmpx::{self, Utmpx};
 use uucore::{format_usage, help_about, help_usage};
 
+mod platform;
+
 const ABOUT: &str = help_about!("users.md");
 const USAGE: &str = help_usage!("users.md");
 
 static ARG_FILES: &str = "files";
 
-fn get_long_usage() -> String {
-    format!(
-        "Output who is currently logged in according to FILE.
-If FILE is not specified, use {}.  /var/log/wtmp as FILE is common.",
-        utmpx::DEFAULT_FILE
-    )
-}
-
 #[uucore::main]
-pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let matches = uu_app()
-        .after_help(get_long_usage())
-        .try_get_matches_from(args)?;
-
-    let files: Vec<&Path> = matches
-        .get_many::<OsString>(ARG_FILES)
-        .map(|v| v.map(AsRef::as_ref).collect())
-        .unwrap_or_default();
-
-    let filename = if files.is_empty() {
-        utmpx::DEFAULT_FILE.as_ref()
-    } else {
-        files[0]
-    };
-
-    let mut users = Utmpx::iter_all_records_from(filename)
-        .filter(Utmpx::is_user_process)
-        .map(|ut| ut.user())
-        .collect::<Vec<_>>();
-
-    if !users.is_empty() {
-        users.sort();
-        println!("{}", users.join(" "));
-    }
-
-    Ok(())
-}
+use platform::uumain;
 
 pub fn uu_app() -> Command {
     Command::new(uucore::util_name())

From e1032e1f065e29b836c9bded3d272b0cb3d143c7 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Sat, 9 Dec 2023 18:43:12 +0100
Subject: [PATCH 176/429] who: tool unsupported on OpenBSD

  - utmpx not supported on OpenBSD

  - add src/uu/who/src/platform directory and platform/mod.rs for conditional compilation according
    to target_os
  - platform/openbsd.rs: implementation on OpenBSD (unsupported tool)
  - platform/unix.rs: implementation on other OS
  - src/uu/who/src/who.rs: use platform module for uucore::main function
---
 src/uu/who/src/platform/mod.rs     |  14 +
 src/uu/who/src/platform/openbsd.rs |  17 ++
 src/uu/who/src/platform/unix.rs    | 432 +++++++++++++++++++++++++++++
 src/uu/who/src/who.rs              | 424 +---------------------------
 4 files changed, 466 insertions(+), 421 deletions(-)
 create mode 100644 src/uu/who/src/platform/mod.rs
 create mode 100644 src/uu/who/src/platform/openbsd.rs
 create mode 100644 src/uu/who/src/platform/unix.rs

diff --git a/src/uu/who/src/platform/mod.rs b/src/uu/who/src/platform/mod.rs
new file mode 100644
index 00000000000..e0e87dca1bf
--- /dev/null
+++ b/src/uu/who/src/platform/mod.rs
@@ -0,0 +1,14 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+#[cfg(not(target_os = "openbsd"))]
+mod unix;
+#[cfg(not(target_os = "openbsd"))]
+pub use self::unix::*;
+
+#[cfg(target_os = "openbsd")]
+mod openbsd;
+#[cfg(target_os = "openbsd")]
+pub use self::openbsd::*;
diff --git a/src/uu/who/src/platform/openbsd.rs b/src/uu/who/src/platform/openbsd.rs
new file mode 100644
index 00000000000..7e6970c1f09
--- /dev/null
+++ b/src/uu/who/src/platform/openbsd.rs
@@ -0,0 +1,17 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+// Specific implementation for OpenBSD: tool unsupported (utmpx not supported)
+
+use crate::uu_app;
+
+use uucore::error::UResult;
+
+pub fn uumain(args: impl uucore::Args) -> UResult<()> {
+    let _matches = uu_app().try_get_matches_from(args)?;
+
+    println!("unsupported command on OpenBSD");
+    Ok(())
+}
diff --git a/src/uu/who/src/platform/unix.rs b/src/uu/who/src/platform/unix.rs
new file mode 100644
index 00000000000..17eaa9af961
--- /dev/null
+++ b/src/uu/who/src/platform/unix.rs
@@ -0,0 +1,432 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+// spell-checker:ignore (ToDO) ttyname hostnames runlevel mesg wtmp statted boottime deadprocs initspawn clockchange curr runlvline pidstr exitstr hoststr
+
+use crate::options;
+use crate::uu_app;
+
+use uucore::display::Quotable;
+use uucore::error::{FromIo, UResult};
+use uucore::libc::{ttyname, STDIN_FILENO, S_IWGRP};
+use uucore::utmpx::{self, time, Utmpx};
+
+use std::borrow::Cow;
+use std::ffi::CStr;
+use std::fmt::Write;
+use std::os::unix::fs::MetadataExt;
+use std::path::PathBuf;
+
+fn get_long_usage() -> String {
+    format!(
+        "If FILE is not specified, use {}.  /var/log/wtmp as FILE is common.\n\
+         If ARG1 ARG2 given, -m presumed: 'am i' or 'mom likes' are usual.",
+        utmpx::DEFAULT_FILE,
+    )
+}
+
+pub fn uumain(args: impl uucore::Args) -> UResult<()> {
+    let args = args.collect_ignore();
+
+    let matches = uu_app()
+        .after_help(get_long_usage())
+        .try_get_matches_from(args)?;
+
+    let files: Vec<String> = matches
+        .get_many::<String>(options::FILE)
+        .map(|v| v.map(ToString::to_string).collect())
+        .unwrap_or_default();
+
+    // If true, attempt to canonicalize hostnames via a DNS lookup.
+    let do_lookup = matches.get_flag(options::LOOKUP);
+
+    // If true, display only a list of usernames and count of
+    // the users logged on.
+    // Ignored for 'who am i'.
+    let short_list = matches.get_flag(options::COUNT);
+
+    let all = matches.get_flag(options::ALL);
+
+    // If true, display a line at the top describing each field.
+    let include_heading = matches.get_flag(options::HEADING);
+
+    // If true, display a '+' for each user if mesg y, a '-' if mesg n,
+    // or a '?' if their tty cannot be statted.
+    let include_mesg = all || matches.get_flag(options::MESG);
+
+    // If true, display the last boot time.
+    let need_boottime = all || matches.get_flag(options::BOOT);
+
+    // If true, display dead processes.
+    let need_deadprocs = all || matches.get_flag(options::DEAD);
+
+    // If true, display processes waiting for user login.
+    let need_login = all || matches.get_flag(options::LOGIN);
+
+    // If true, display processes started by init.
+    let need_initspawn = all || matches.get_flag(options::PROCESS);
+
+    // If true, display the last clock change.
+    let need_clockchange = all || matches.get_flag(options::TIME);
+
+    // If true, display the current runlevel.
+    let need_runlevel = all || matches.get_flag(options::RUNLEVEL);
+
+    let use_defaults = !(all
+        || need_boottime
+        || need_deadprocs
+        || need_login
+        || need_initspawn
+        || need_runlevel
+        || need_clockchange
+        || matches.get_flag(options::USERS));
+
+    // If true, display user processes.
+    let need_users = all || matches.get_flag(options::USERS) || use_defaults;
+
+    // If true, display the hours:minutes since each user has touched
+    // the keyboard, or "." if within the last minute, or "old" if
+    // not within the last day.
+    let include_idle = need_deadprocs || need_login || need_runlevel || need_users;
+
+    // If true, display process termination & exit status.
+    let include_exit = need_deadprocs;
+
+    // If true, display only name, line, and time fields.
+    let short_output = !include_exit && use_defaults;
+
+    // If true, display info only for the controlling tty.
+    let my_line_only = matches.get_flag(options::ONLY_HOSTNAME_USER) || files.len() == 2;
+
+    let mut who = Who {
+        do_lookup,
+        short_list,
+        short_output,
+        include_idle,
+        include_heading,
+        include_mesg,
+        include_exit,
+        need_boottime,
+        need_deadprocs,
+        need_login,
+        need_initspawn,
+        need_clockchange,
+        need_runlevel,
+        need_users,
+        my_line_only,
+        args: files,
+    };
+
+    who.exec()
+}
+
+struct Who {
+    do_lookup: bool,
+    short_list: bool,
+    short_output: bool,
+    include_idle: bool,
+    include_heading: bool,
+    include_mesg: bool,
+    include_exit: bool,
+    need_boottime: bool,
+    need_deadprocs: bool,
+    need_login: bool,
+    need_initspawn: bool,
+    need_clockchange: bool,
+    need_runlevel: bool,
+    need_users: bool,
+    my_line_only: bool,
+    args: Vec<String>,
+}
+
+fn idle_string<'a>(when: i64, boottime: i64) -> Cow<'a, str> {
+    thread_local! {
+        static NOW: time::OffsetDateTime = time::OffsetDateTime::now_local().unwrap();
+    }
+    NOW.with(|n| {
+        let now = n.unix_timestamp();
+        if boottime < when && now - 24 * 3600 < when && when <= now {
+            let seconds_idle = now - when;
+            if seconds_idle < 60 {
+                "  .  ".into()
+            } else {
+                format!(
+                    "{:02}:{:02}",
+                    seconds_idle / 3600,
+                    (seconds_idle % 3600) / 60
+                )
+                .into()
+            }
+        } else {
+            " old ".into()
+        }
+    })
+}
+
+fn time_string(ut: &Utmpx) -> String {
+    // "%b %e %H:%M"
+    let time_format: Vec<time::format_description::FormatItem> =
+        time::format_description::parse("[month repr:short] [day padding:space] [hour]:[minute]")
+            .unwrap();
+    ut.login_time().format(&time_format).unwrap() // LC_ALL=C
+}
+
+#[inline]
+fn current_tty() -> String {
+    unsafe {
+        let res = ttyname(STDIN_FILENO);
+        if res.is_null() {
+            String::new()
+        } else {
+            CStr::from_ptr(res as *const _)
+                .to_string_lossy()
+                .trim_start_matches("/dev/")
+                .to_owned()
+        }
+    }
+}
+
+impl Who {
+    #[allow(clippy::cognitive_complexity)]
+    fn exec(&mut self) -> UResult<()> {
+        let run_level_chk = |_record: i16| {
+            #[cfg(not(target_os = "linux"))]
+            return false;
+
+            #[cfg(target_os = "linux")]
+            return _record == utmpx::RUN_LVL;
+        };
+
+        let f = if self.args.len() == 1 {
+            self.args[0].as_ref()
+        } else {
+            utmpx::DEFAULT_FILE
+        };
+        if self.short_list {
+            let users = Utmpx::iter_all_records_from(f)
+                .filter(Utmpx::is_user_process)
+                .map(|ut| ut.user())
+                .collect::<Vec<_>>();
+            println!("{}", users.join(" "));
+            println!("# users={}", users.len());
+        } else {
+            let records = Utmpx::iter_all_records_from(f);
+
+            if self.include_heading {
+                self.print_heading();
+            }
+            let cur_tty = if self.my_line_only {
+                current_tty()
+            } else {
+                String::new()
+            };
+
+            for ut in records {
+                if !self.my_line_only || cur_tty == ut.tty_device() {
+                    if self.need_users && ut.is_user_process() {
+                        self.print_user(&ut)?;
+                    } else if self.need_runlevel && run_level_chk(ut.record_type()) {
+                        if cfg!(target_os = "linux") {
+                            self.print_runlevel(&ut);
+                        }
+                    } else if self.need_boottime && ut.record_type() == utmpx::BOOT_TIME {
+                        self.print_boottime(&ut);
+                    } else if self.need_clockchange && ut.record_type() == utmpx::NEW_TIME {
+                        self.print_clockchange(&ut);
+                    } else if self.need_initspawn && ut.record_type() == utmpx::INIT_PROCESS {
+                        self.print_initspawn(&ut);
+                    } else if self.need_login && ut.record_type() == utmpx::LOGIN_PROCESS {
+                        self.print_login(&ut);
+                    } else if self.need_deadprocs && ut.record_type() == utmpx::DEAD_PROCESS {
+                        self.print_deadprocs(&ut);
+                    }
+                }
+
+                if ut.record_type() == utmpx::BOOT_TIME {}
+            }
+        }
+        Ok(())
+    }
+
+    #[inline]
+    fn print_runlevel(&self, ut: &Utmpx) {
+        let last = (ut.pid() / 256) as u8 as char;
+        let curr = (ut.pid() % 256) as u8 as char;
+        let runlvline = format!("run-level {curr}");
+        let comment = format!("last={}", if last == 'N' { 'S' } else { 'N' });
+
+        self.print_line(
+            "",
+            ' ',
+            &runlvline,
+            &time_string(ut),
+            "",
+            "",
+            if last.is_control() { "" } else { &comment },
+            "",
+        );
+    }
+
+    #[inline]
+    fn print_clockchange(&self, ut: &Utmpx) {
+        self.print_line("", ' ', "clock change", &time_string(ut), "", "", "", "");
+    }
+
+    #[inline]
+    fn print_login(&self, ut: &Utmpx) {
+        let comment = format!("id={}", ut.terminal_suffix());
+        let pidstr = format!("{}", ut.pid());
+        self.print_line(
+            "LOGIN",
+            ' ',
+            &ut.tty_device(),
+            &time_string(ut),
+            "",
+            &pidstr,
+            &comment,
+            "",
+        );
+    }
+
+    #[inline]
+    fn print_deadprocs(&self, ut: &Utmpx) {
+        let comment = format!("id={}", ut.terminal_suffix());
+        let pidstr = format!("{}", ut.pid());
+        let e = ut.exit_status();
+        let exitstr = format!("term={} exit={}", e.0, e.1);
+        self.print_line(
+            "",
+            ' ',
+            &ut.tty_device(),
+            &time_string(ut),
+            "",
+            &pidstr,
+            &comment,
+            &exitstr,
+        );
+    }
+
+    #[inline]
+    fn print_initspawn(&self, ut: &Utmpx) {
+        let comment = format!("id={}", ut.terminal_suffix());
+        let pidstr = format!("{}", ut.pid());
+        self.print_line(
+            "",
+            ' ',
+            &ut.tty_device(),
+            &time_string(ut),
+            "",
+            &pidstr,
+            &comment,
+            "",
+        );
+    }
+
+    #[inline]
+    fn print_boottime(&self, ut: &Utmpx) {
+        self.print_line("", ' ', "system boot", &time_string(ut), "", "", "", "");
+    }
+
+    fn print_user(&self, ut: &Utmpx) -> UResult<()> {
+        let mut p = PathBuf::from("/dev");
+        p.push(ut.tty_device().as_str());
+        let mesg;
+        let last_change;
+        match p.metadata() {
+            Ok(meta) => {
+                #[cfg(all(
+                    not(target_os = "android"),
+                    not(target_os = "freebsd"),
+                    not(target_vendor = "apple")
+                ))]
+                let iwgrp = S_IWGRP;
+                #[cfg(any(target_os = "android", target_os = "freebsd", target_vendor = "apple"))]
+                let iwgrp = S_IWGRP as u32;
+                mesg = if meta.mode() & iwgrp == 0 { '-' } else { '+' };
+                last_change = meta.atime();
+            }
+            _ => {
+                mesg = '?';
+                last_change = 0;
+            }
+        }
+
+        let idle = if last_change == 0 {
+            "  ?".into()
+        } else {
+            idle_string(last_change, 0)
+        };
+
+        let s = if self.do_lookup {
+            ut.canon_host().map_err_context(|| {
+                let host = ut.host();
+                format!(
+                    "failed to canonicalize {}",
+                    host.split(':').next().unwrap_or(&host).quote()
+                )
+            })?
+        } else {
+            ut.host()
+        };
+        let hoststr = if s.is_empty() { s } else { format!("({s})") };
+
+        self.print_line(
+            ut.user().as_ref(),
+            mesg,
+            ut.tty_device().as_ref(),
+            time_string(ut).as_str(),
+            idle.as_ref(),
+            format!("{}", ut.pid()).as_str(),
+            hoststr.as_str(),
+            "",
+        );
+
+        Ok(())
+    }
+
+    #[allow(clippy::too_many_arguments)]
+    fn print_line(
+        &self,
+        user: &str,
+        state: char,
+        line: &str,
+        time: &str,
+        idle: &str,
+        pid: &str,
+        comment: &str,
+        exit: &str,
+    ) {
+        let mut buf = String::with_capacity(64);
+        let msg = vec![' ', state].into_iter().collect::<String>();
+
+        write!(buf, "{user:<8}").unwrap();
+        if self.include_mesg {
+            buf.push_str(&msg);
+        }
+        write!(buf, " {line:<12}").unwrap();
+        // "%b %e %H:%M" (LC_ALL=C)
+        let time_size = 3 + 2 + 2 + 1 + 2;
+        write!(buf, " {time:<time_size$}").unwrap();
+
+        if !self.short_output {
+            if self.include_idle {
+                write!(buf, " {idle:<6}").unwrap();
+            }
+            write!(buf, " {pid:>10}").unwrap();
+        }
+        write!(buf, " {comment:<8}").unwrap();
+        if self.include_exit {
+            write!(buf, " {exit:<12}").unwrap();
+        }
+        println!("{}", buf.trim_end());
+    }
+
+    #[inline]
+    fn print_heading(&self) {
+        self.print_line(
+            "NAME", ' ', "LINE", "TIME", "IDLE", "PID", "COMMENT", "EXIT",
+        );
+    }
+}
diff --git a/src/uu/who/src/who.rs b/src/uu/who/src/who.rs
index 5d952efffb2..1eb28e874e8 100644
--- a/src/uu/who/src/who.rs
+++ b/src/uu/who/src/who.rs
@@ -5,19 +5,11 @@
 
 // spell-checker:ignore (ToDO) ttyname hostnames runlevel mesg wtmp statted boottime deadprocs initspawn clockchange curr runlvline pidstr exitstr hoststr
 
-use uucore::display::Quotable;
-use uucore::error::{FromIo, UResult};
-use uucore::libc::{ttyname, STDIN_FILENO, S_IWGRP};
-use uucore::utmpx::{self, time, Utmpx};
-
 use clap::{crate_version, Arg, ArgAction, Command};
-use std::borrow::Cow;
-use std::ffi::CStr;
-use std::fmt::Write;
-use std::os::unix::fs::MetadataExt;
-use std::path::PathBuf;
 use uucore::{format_usage, help_about, help_usage};
 
+mod platform;
+
 mod options {
     pub const ALL: &str = "all";
     pub const BOOT: &str = "boot";
@@ -44,109 +36,8 @@ static RUNLEVEL_HELP: &str = "print current runlevel";
 #[cfg(not(target_os = "linux"))]
 static RUNLEVEL_HELP: &str = "print current runlevel (This is meaningless on non Linux)";
 
-fn get_long_usage() -> String {
-    format!(
-        "If FILE is not specified, use {}.  /var/log/wtmp as FILE is common.\n\
-         If ARG1 ARG2 given, -m presumed: 'am i' or 'mom likes' are usual.",
-        utmpx::DEFAULT_FILE,
-    )
-}
-
 #[uucore::main]
-pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
-    let matches = uu_app()
-        .after_help(get_long_usage())
-        .try_get_matches_from(args)?;
-
-    let files: Vec<String> = matches
-        .get_many::<String>(options::FILE)
-        .map(|v| v.map(ToString::to_string).collect())
-        .unwrap_or_default();
-
-    // If true, attempt to canonicalize hostnames via a DNS lookup.
-    let do_lookup = matches.get_flag(options::LOOKUP);
-
-    // If true, display only a list of usernames and count of
-    // the users logged on.
-    // Ignored for 'who am i'.
-    let short_list = matches.get_flag(options::COUNT);
-
-    let all = matches.get_flag(options::ALL);
-
-    // If true, display a line at the top describing each field.
-    let include_heading = matches.get_flag(options::HEADING);
-
-    // If true, display a '+' for each user if mesg y, a '-' if mesg n,
-    // or a '?' if their tty cannot be statted.
-    let include_mesg = all || matches.get_flag(options::MESG);
-
-    // If true, display the last boot time.
-    let need_boottime = all || matches.get_flag(options::BOOT);
-
-    // If true, display dead processes.
-    let need_deadprocs = all || matches.get_flag(options::DEAD);
-
-    // If true, display processes waiting for user login.
-    let need_login = all || matches.get_flag(options::LOGIN);
-
-    // If true, display processes started by init.
-    let need_initspawn = all || matches.get_flag(options::PROCESS);
-
-    // If true, display the last clock change.
-    let need_clockchange = all || matches.get_flag(options::TIME);
-
-    // If true, display the current runlevel.
-    let need_runlevel = all || matches.get_flag(options::RUNLEVEL);
-
-    let use_defaults = !(all
-        || need_boottime
-        || need_deadprocs
-        || need_login
-        || need_initspawn
-        || need_runlevel
-        || need_clockchange
-        || matches.get_flag(options::USERS));
-
-    // If true, display user processes.
-    let need_users = all || matches.get_flag(options::USERS) || use_defaults;
-
-    // If true, display the hours:minutes since each user has touched
-    // the keyboard, or "." if within the last minute, or "old" if
-    // not within the last day.
-    let include_idle = need_deadprocs || need_login || need_runlevel || need_users;
-
-    // If true, display process termination & exit status.
-    let include_exit = need_deadprocs;
-
-    // If true, display only name, line, and time fields.
-    let short_output = !include_exit && use_defaults;
-
-    // If true, display info only for the controlling tty.
-    let my_line_only = matches.get_flag(options::ONLY_HOSTNAME_USER) || files.len() == 2;
-
-    let mut who = Who {
-        do_lookup,
-        short_list,
-        short_output,
-        include_idle,
-        include_heading,
-        include_mesg,
-        include_exit,
-        need_boottime,
-        need_deadprocs,
-        need_login,
-        need_initspawn,
-        need_clockchange,
-        need_runlevel,
-        need_users,
-        my_line_only,
-        args: files,
-    };
-
-    who.exec()
-}
+use platform::uumain;
 
 pub fn uu_app() -> Command {
     Command::new(uucore::util_name())
@@ -258,312 +149,3 @@ pub fn uu_app() -> Command {
                 .value_hint(clap::ValueHint::FilePath),
         )
 }
-
-struct Who {
-    do_lookup: bool,
-    short_list: bool,
-    short_output: bool,
-    include_idle: bool,
-    include_heading: bool,
-    include_mesg: bool,
-    include_exit: bool,
-    need_boottime: bool,
-    need_deadprocs: bool,
-    need_login: bool,
-    need_initspawn: bool,
-    need_clockchange: bool,
-    need_runlevel: bool,
-    need_users: bool,
-    my_line_only: bool,
-    args: Vec<String>,
-}
-
-fn idle_string<'a>(when: i64, boottime: i64) -> Cow<'a, str> {
-    thread_local! {
-        static NOW: time::OffsetDateTime = time::OffsetDateTime::now_local().unwrap();
-    }
-    NOW.with(|n| {
-        let now = n.unix_timestamp();
-        if boottime < when && now - 24 * 3600 < when && when <= now {
-            let seconds_idle = now - when;
-            if seconds_idle < 60 {
-                "  .  ".into()
-            } else {
-                format!(
-                    "{:02}:{:02}",
-                    seconds_idle / 3600,
-                    (seconds_idle % 3600) / 60
-                )
-                .into()
-            }
-        } else {
-            " old ".into()
-        }
-    })
-}
-
-fn time_string(ut: &Utmpx) -> String {
-    // "%b %e %H:%M"
-    let time_format: Vec<time::format_description::FormatItem> =
-        time::format_description::parse("[month repr:short] [day padding:space] [hour]:[minute]")
-            .unwrap();
-    ut.login_time().format(&time_format).unwrap() // LC_ALL=C
-}
-
-#[inline]
-fn current_tty() -> String {
-    unsafe {
-        let res = ttyname(STDIN_FILENO);
-        if res.is_null() {
-            String::new()
-        } else {
-            CStr::from_ptr(res as *const _)
-                .to_string_lossy()
-                .trim_start_matches("/dev/")
-                .to_owned()
-        }
-    }
-}
-
-impl Who {
-    #[allow(clippy::cognitive_complexity)]
-    fn exec(&mut self) -> UResult<()> {
-        let run_level_chk = |_record: i16| {
-            #[cfg(not(target_os = "linux"))]
-            return false;
-
-            #[cfg(target_os = "linux")]
-            return _record == utmpx::RUN_LVL;
-        };
-
-        let f = if self.args.len() == 1 {
-            self.args[0].as_ref()
-        } else {
-            utmpx::DEFAULT_FILE
-        };
-        if self.short_list {
-            let users = Utmpx::iter_all_records_from(f)
-                .filter(Utmpx::is_user_process)
-                .map(|ut| ut.user())
-                .collect::<Vec<_>>();
-            println!("{}", users.join(" "));
-            println!("# users={}", users.len());
-        } else {
-            let records = Utmpx::iter_all_records_from(f);
-
-            if self.include_heading {
-                self.print_heading();
-            }
-            let cur_tty = if self.my_line_only {
-                current_tty()
-            } else {
-                String::new()
-            };
-
-            for ut in records {
-                if !self.my_line_only || cur_tty == ut.tty_device() {
-                    if self.need_users && ut.is_user_process() {
-                        self.print_user(&ut)?;
-                    } else if self.need_runlevel && run_level_chk(ut.record_type()) {
-                        if cfg!(target_os = "linux") {
-                            self.print_runlevel(&ut);
-                        }
-                    } else if self.need_boottime && ut.record_type() == utmpx::BOOT_TIME {
-                        self.print_boottime(&ut);
-                    } else if self.need_clockchange && ut.record_type() == utmpx::NEW_TIME {
-                        self.print_clockchange(&ut);
-                    } else if self.need_initspawn && ut.record_type() == utmpx::INIT_PROCESS {
-                        self.print_initspawn(&ut);
-                    } else if self.need_login && ut.record_type() == utmpx::LOGIN_PROCESS {
-                        self.print_login(&ut);
-                    } else if self.need_deadprocs && ut.record_type() == utmpx::DEAD_PROCESS {
-                        self.print_deadprocs(&ut);
-                    }
-                }
-
-                if ut.record_type() == utmpx::BOOT_TIME {}
-            }
-        }
-        Ok(())
-    }
-
-    #[inline]
-    fn print_runlevel(&self, ut: &Utmpx) {
-        let last = (ut.pid() / 256) as u8 as char;
-        let curr = (ut.pid() % 256) as u8 as char;
-        let runlvline = format!("run-level {curr}");
-        let comment = format!("last={}", if last == 'N' { 'S' } else { 'N' });
-
-        self.print_line(
-            "",
-            ' ',
-            &runlvline,
-            &time_string(ut),
-            "",
-            "",
-            if last.is_control() { "" } else { &comment },
-            "",
-        );
-    }
-
-    #[inline]
-    fn print_clockchange(&self, ut: &Utmpx) {
-        self.print_line("", ' ', "clock change", &time_string(ut), "", "", "", "");
-    }
-
-    #[inline]
-    fn print_login(&self, ut: &Utmpx) {
-        let comment = format!("id={}", ut.terminal_suffix());
-        let pidstr = format!("{}", ut.pid());
-        self.print_line(
-            "LOGIN",
-            ' ',
-            &ut.tty_device(),
-            &time_string(ut),
-            "",
-            &pidstr,
-            &comment,
-            "",
-        );
-    }
-
-    #[inline]
-    fn print_deadprocs(&self, ut: &Utmpx) {
-        let comment = format!("id={}", ut.terminal_suffix());
-        let pidstr = format!("{}", ut.pid());
-        let e = ut.exit_status();
-        let exitstr = format!("term={} exit={}", e.0, e.1);
-        self.print_line(
-            "",
-            ' ',
-            &ut.tty_device(),
-            &time_string(ut),
-            "",
-            &pidstr,
-            &comment,
-            &exitstr,
-        );
-    }
-
-    #[inline]
-    fn print_initspawn(&self, ut: &Utmpx) {
-        let comment = format!("id={}", ut.terminal_suffix());
-        let pidstr = format!("{}", ut.pid());
-        self.print_line(
-            "",
-            ' ',
-            &ut.tty_device(),
-            &time_string(ut),
-            "",
-            &pidstr,
-            &comment,
-            "",
-        );
-    }
-
-    #[inline]
-    fn print_boottime(&self, ut: &Utmpx) {
-        self.print_line("", ' ', "system boot", &time_string(ut), "", "", "", "");
-    }
-
-    fn print_user(&self, ut: &Utmpx) -> UResult<()> {
-        let mut p = PathBuf::from("/dev");
-        p.push(ut.tty_device().as_str());
-        let mesg;
-        let last_change;
-        match p.metadata() {
-            Ok(meta) => {
-                #[cfg(all(
-                    not(target_os = "android"),
-                    not(target_os = "freebsd"),
-                    not(target_vendor = "apple")
-                ))]
-                let iwgrp = S_IWGRP;
-                #[cfg(any(target_os = "android", target_os = "freebsd", target_vendor = "apple"))]
-                let iwgrp = S_IWGRP as u32;
-                mesg = if meta.mode() & iwgrp == 0 { '-' } else { '+' };
-                last_change = meta.atime();
-            }
-            _ => {
-                mesg = '?';
-                last_change = 0;
-            }
-        }
-
-        let idle = if last_change == 0 {
-            "  ?".into()
-        } else {
-            idle_string(last_change, 0)
-        };
-
-        let s = if self.do_lookup {
-            ut.canon_host().map_err_context(|| {
-                let host = ut.host();
-                format!(
-                    "failed to canonicalize {}",
-                    host.split(':').next().unwrap_or(&host).quote()
-                )
-            })?
-        } else {
-            ut.host()
-        };
-        let hoststr = if s.is_empty() { s } else { format!("({s})") };
-
-        self.print_line(
-            ut.user().as_ref(),
-            mesg,
-            ut.tty_device().as_ref(),
-            time_string(ut).as_str(),
-            idle.as_ref(),
-            format!("{}", ut.pid()).as_str(),
-            hoststr.as_str(),
-            "",
-        );
-
-        Ok(())
-    }
-
-    #[allow(clippy::too_many_arguments)]
-    fn print_line(
-        &self,
-        user: &str,
-        state: char,
-        line: &str,
-        time: &str,
-        idle: &str,
-        pid: &str,
-        comment: &str,
-        exit: &str,
-    ) {
-        let mut buf = String::with_capacity(64);
-        let msg = vec![' ', state].into_iter().collect::<String>();
-
-        write!(buf, "{user:<8}").unwrap();
-        if self.include_mesg {
-            buf.push_str(&msg);
-        }
-        write!(buf, " {line:<12}").unwrap();
-        // "%b %e %H:%M" (LC_ALL=C)
-        let time_size = 3 + 2 + 2 + 1 + 2;
-        write!(buf, " {time:<time_size$}").unwrap();
-
-        if !self.short_output {
-            if self.include_idle {
-                write!(buf, " {idle:<6}").unwrap();
-            }
-            write!(buf, " {pid:>10}").unwrap();
-        }
-        write!(buf, " {comment:<8}").unwrap();
-        if self.include_exit {
-            write!(buf, " {exit:<12}").unwrap();
-        }
-        println!("{}", buf.trim_end());
-    }
-
-    #[inline]
-    fn print_heading(&self) {
-        self.print_line(
-            "NAME", ' ', "LINE", "TIME", "IDLE", "PID", "COMMENT", "EXIT",
-        );
-    }
-}

From 3bf966df56a435a99e05e8802a85be16f42bf100 Mon Sep 17 00:00:00 2001
From: Arpit Bhadauria <singharpit511@gmail.com>
Date: Mon, 11 Dec 2023 20:47:36 +0000
Subject: [PATCH 177/429] remove from trait for NumOrStr

---
 src/uu/expr/src/syntax_tree.rs | 21 ++++++++++-----------
 1 file changed, 10 insertions(+), 11 deletions(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 820911cd306..7817b172137 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -219,15 +219,6 @@ impl From<String> for NumOrStr {
     }
 }
 
-impl From<NumOrStr> for Option<usize> {
-    fn from(s: NumOrStr) -> Self {
-        match s.eval_as_bigint() {
-            Ok(num) => num.to_usize(),
-            Err(_) => None,
-        }
-    }
-}
-
 impl NumOrStr {
     pub fn to_bigint(&self) -> Result<BigInt, ParseBigIntError> {
         match self {
@@ -300,8 +291,16 @@ impl AstNode {
                 //
                 // So we coerce errors into 0 to make that the only case we
                 // have to care about.
-                let pos: usize = Option::<usize>::from(pos.eval()?).unwrap_or(0);
-                let length: usize = Option::<usize>::from(length.eval()?).unwrap_or(0);
+                let pos = pos
+                    .eval()?
+                    .eval_as_bigint()
+                    .map_or(0.into(), |n| n.to_usize())
+                    .unwrap_or(0);
+                let length = length
+                    .eval()?
+                    .eval_as_bigint()
+                    .map_or(0.into(), |n| n.to_usize())
+                    .unwrap_or(0);
 
                 let (Some(pos), Some(_)) = (pos.checked_sub(1), length.checked_sub(1)) else {
                     return Ok(String::new().into());

From 1919b3ba1702f9836fb38bc2490b418981e4faae Mon Sep 17 00:00:00 2001
From: Jeremy Soller <jackpot51@gmail.com>
Date: Mon, 11 Dec 2023 10:08:02 -0700
Subject: [PATCH 178/429] Add Redox OS CI

---
 .github/workflows/CICD.yml | 19 ++++++++++++++-----
 1 file changed, 14 insertions(+), 5 deletions(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index 8c96ce693ee..f52ead1f6ca 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -473,6 +473,7 @@ jobs:
           - { os: ubuntu-latest  , target: i686-unknown-linux-musl     , features: feat_os_unix_musl      , use-cross: use-cross }
           - { os: ubuntu-latest  , target: x86_64-unknown-linux-gnu    , features: feat_os_unix           , use-cross: use-cross }
           - { os: ubuntu-latest  , target: x86_64-unknown-linux-musl   , features: feat_os_unix_musl      , use-cross: use-cross }
+          - { os: ubuntu-latest  , target: x86_64-unknown-redox        , features: feat_os_unix_redox     , use-cross: redoxer  , skip-tests: true }
           - { os: macos-latest   , target: aarch64-apple-darwin        , features: feat_os_macos          , use-cross: use-cross, skip-tests: true} # Hopefully github provides free M1 runners soon...
           - { os: macos-latest   , target: x86_64-apple-darwin         , features: feat_os_macos }
           - { os: windows-latest , target: i686-pc-windows-msvc        , features: feat_os_windows }
@@ -525,7 +526,7 @@ jobs:
           i686-*) TARGET_ARCH=i686 ;;
           x86_64-*) TARGET_ARCH=x86_64 ;;
         esac;
-        unset TARGET_OS ; case '${{ matrix.job.target }}' in *-linux-*) TARGET_OS=linux ;; *-apple-*) TARGET_OS=macos ;; *-windows-*) TARGET_OS=windows ;; esac;
+        unset TARGET_OS ; case '${{ matrix.job.target }}' in *-linux-*) TARGET_OS=linux ;; *-apple-*) TARGET_OS=macos ;; *-windows-*) TARGET_OS=windows ;; *-redox*) TARGET_OS=redox ;; esac;
         outputs TARGET_ARCH TARGET_OS
         # package name
         PKG_suffix=".tar.gz" ; case '${{ matrix.job.target }}' in *-pc-windows-*) PKG_suffix=".zip" ;; esac;
@@ -560,8 +561,11 @@ jobs:
         if [ -n "${{ matrix.job.features }}" ]; then CARGO_FEATURES_OPTION='--features=${{ matrix.job.features }}' ; fi
         outputs CARGO_FEATURES_OPTION
         # * CARGO_CMD
-        CARGO_CMD='cross' ; case '${{ matrix.job.use-cross }}' in ''|0|f|false|n|no) CARGO_CMD='cargo' ;; esac;
+        CARGO_CMD='cross' ; case '${{ matrix.job.use-cross }}' in ''|0|f|false|n|no) CARGO_CMD='cargo' ;; redoxer) CARGO_CMD='redoxer' ;; esac;
         outputs CARGO_CMD
+        # * CARGO_CMD_OPTIONS
+        CARGO_CMD_OPTIONS='+${{ env.RUST_MIN_SRV }}' ; case '${{ matrix.job.target }}' in *-redox*) CARGO_CMD_OPTIONS="" ;; esac;
+        outputs CARGO_CMD_OPTIONS
         # ** pass needed environment into `cross` container (iff `cross` not already configured via "Cross.toml")
         if [ "${CARGO_CMD}" = 'cross' ] && [ ! -e "Cross.toml" ] ; then
           printf "[build.env]\npassthrough = [\"CI\", \"RUST_BACKTRACE\", \"CARGO_TERM_COLOR\"]\n" > Cross.toml
@@ -595,6 +599,7 @@ jobs:
         case '${{ matrix.job.target }}' in
           arm-unknown-linux-gnueabihf) sudo apt-get -y update ; sudo apt-get -y install gcc-arm-linux-gnueabihf ;;
           aarch64-unknown-linux-gnu) sudo apt-get -y update ; sudo apt-get -y install gcc-aarch64-linux-gnu ;;
+          *-redox*) sudo apt-get -y update ; sudo apt-get -y install fuse3 libfuse-dev ;;
         esac
         case '${{ matrix.job.os }}' in
           macos-latest) brew install coreutils ;; # needed for testing
@@ -614,6 +619,10 @@ jobs:
             echo "foo" > /home/runner/.plan
             ;;
         esac
+    - uses: taiki-e/install-action@v2
+      if: steps.vars.outputs.CARGO_CMD == 'redoxer'
+      with:
+        tool: redoxer@0.2.37
     - name: Initialize toolchain-dependent workflow variables
       id: dep_vars
       shell: bash
@@ -652,14 +661,14 @@ jobs:
       shell: bash
       run: |
         ## Build
-        ${{ steps.vars.outputs.CARGO_CMD }} +${{ env.RUST_MIN_SRV }} build --release \
+        ${{ steps.vars.outputs.CARGO_CMD }} ${{ steps.vars.outputs.CARGO_CMD_OPTIONS }} build --release \
         --target=${{ matrix.job.target }} ${{ matrix.job.cargo-options }} ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }}
     - name: Test
       if: matrix.job.skip-tests != true
       shell: bash
       run: |
         ## Test
-        ${{ steps.vars.outputs.CARGO_CMD }} +${{ env.RUST_MIN_SRV }} test --target=${{ matrix.job.target }} \
+        ${{ steps.vars.outputs.CARGO_CMD }} ${{ steps.vars.outputs.CARGO_CMD_OPTIONS }} test --target=${{ matrix.job.target }} \
         ${{ steps.vars.outputs.CARGO_TEST_OPTIONS}} ${{ matrix.job.cargo-options }} ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }}
       env:
         RUST_BACKTRACE: "1"
@@ -668,7 +677,7 @@ jobs:
       shell: bash
       run: |
         ## Test individual utilities
-        ${{ steps.vars.outputs.CARGO_CMD }} +${{ env.RUST_MIN_SRV }} test --target=${{ matrix.job.target }} \
+        ${{ steps.vars.outputs.CARGO_CMD }} ${{ steps.vars.outputs.CARGO_CMD_OPTIONS }} test --target=${{ matrix.job.target }} \
         ${{ steps.vars.outputs.CARGO_TEST_OPTIONS}} ${{ matrix.job.cargo-options }} ${{ steps.dep_vars.outputs.CARGO_UTILITY_LIST_OPTIONS }}
       env:
         RUST_BACKTRACE: "1"

From 89cb4acb99593b6a85a9cc75e7623a3b1de82737 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sat, 9 Dec 2023 17:05:36 +0100
Subject: [PATCH 179/429] ls: encode path when using --hyperlink

---
 src/uu/ls/src/ls.rs      | 18 +++++++++++++++++-
 tests/by-util/test_ls.rs | 32 ++++++++++++++++++++++++++++++++
 2 files changed, 49 insertions(+), 1 deletion(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index a5fe3d6246d..3cf848ae2c2 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3019,7 +3019,23 @@ fn display_file_name(
         let absolute_path = fs::canonicalize(&path.p_buf).unwrap_or_default();
         let absolute_path = absolute_path.to_string_lossy();
 
-        // TODO encode path
+        #[cfg(not(target_os = "windows"))]
+        let unencoded_chars = "_-.:~/";
+        #[cfg(target_os = "windows")]
+        let unencoded_chars = "_-.:~/\\";
+
+        // percentage encoding of path
+        let absolute_path: String = absolute_path
+            .chars()
+            .map(|c| {
+                if c.is_alphanumeric() || unencoded_chars.contains(c) {
+                    c.to_string()
+                } else {
+                    format!("%{:02x}", c as u8)
+                }
+            })
+            .collect();
+
         // \x1b = ESC, \x07 = BEL
         name = format!("\x1b]8;;file://{hostname}{absolute_path}\x07{name}\x1b]8;;\x07");
     }
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index c9f43028c9c..76cb0d21677 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -3904,6 +3904,38 @@ fn test_ls_hyperlink() {
         .stdout_is(format!("{file}\n"));
 }
 
+// spell-checker: disable
+#[test]
+fn test_ls_hyperlink_encode_link() {
+    let (at, mut ucmd) = at_and_ucmd!();
+
+    #[cfg(not(target_os = "windows"))]
+    {
+        at.touch("back\\slash");
+        at.touch("ques?tion");
+    }
+    at.touch("encoded%3Fquestion");
+    at.touch("sp ace");
+
+    let result = ucmd.arg("--hyperlink").succeeds();
+    #[cfg(not(target_os = "windows"))]
+    {
+        assert!(result
+            .stdout_str()
+            .contains("back%5cslash\x07back\\slash\x1b]8;;\x07"));
+        assert!(result
+            .stdout_str()
+            .contains("ques%3ftion\x07ques?tion\x1b]8;;\x07"));
+    }
+    assert!(result
+        .stdout_str()
+        .contains("encoded%253Fquestion\x07encoded%3Fquestion\x1b]8;;\x07"));
+    assert!(result
+        .stdout_str()
+        .contains("sp%20ace\x07sp ace\x1b]8;;\x07"));
+}
+// spell-checker: enable
+
 #[test]
 fn test_ls_color_do_not_reset() {
     let scene: TestScenario = TestScenario::new(util_name!());

From 42558344f155f085acdc7b3b18e5a97fb479beb7 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 12 Dec 2023 14:23:51 +0100
Subject: [PATCH 180/429] ls: enable "args override self"

---
 src/uu/ls/src/ls.rs      |  1 +
 tests/by-util/test_ls.rs | 15 +++++++++++++++
 2 files changed, 16 insertions(+)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 2aa4bad067b..1fceefe17fb 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -1070,6 +1070,7 @@ pub fn uu_app() -> Command {
         .about(ABOUT)
         .infer_long_args(true)
         .disable_help_flag(true)
+        .args_override_self(true)
         .arg(
             Arg::new(options::HELP)
                 .long(options::HELP)
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 179941e7878..c3460633a22 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -3924,6 +3924,21 @@ fn test_ls_block_size_override() {
         .stdout_contains_line("total 8");
 }
 
+#[test]
+fn test_ls_block_size_override_self() {
+    new_ucmd!()
+        .arg("--block-size=512")
+        .arg("--block-size=512")
+        .succeeds();
+
+    new_ucmd!()
+        .arg("--human-readable")
+        .arg("--human-readable")
+        .succeeds();
+
+    new_ucmd!().arg("--si").arg("--si").succeeds();
+}
+
 #[test]
 fn test_ls_hyperlink() {
     let scene = TestScenario::new(util_name!());

From c32fb25b1faac8bd38bd3474d89ebb30e708eab7 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 11 Dec 2023 10:55:37 +0100
Subject: [PATCH 181/429] Bump xattr from 1.1.1 to 1.1.3

---
 Cargo.lock | 96 ++++++++++++++++++++++++++++++++++++++++++++++--------
 Cargo.toml |  2 +-
 2 files changed, 83 insertions(+), 15 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index c943a26117b..446b1724768 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -781,12 +781,12 @@ dependencies = [
 
 [[package]]
 name = "errno"
-version = "0.3.5"
+version = "0.3.8"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "ac3e13f66a2f95e32a39eaa81f6b95d42878ca0e1db0c7543723dfe12557e860"
+checksum = "a258e46cdc063eb8519c00b9fc845fc47bcfca4130e2f08e88665ceda8474245"
 dependencies = [
  "libc",
- "windows-sys 0.48.0",
+ "windows-sys 0.52.0",
 ]
 
 [[package]]
@@ -1215,9 +1215,9 @@ checksum = "ef53942eb7bf7ff43a617b3e2c1c4a5ecf5944a7c1bc12d7ee39bbb15e5c1519"
 
 [[package]]
 name = "linux-raw-sys"
-version = "0.4.10"
+version = "0.4.12"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "da2479e8c062e40bf0066ffa0bc823de0a9368974af99c9f6df941d2c231e03f"
+checksum = "c4cd1a83af159aa67994778be9070f0ae1bd732942279cabb14f86f986a21456"
 
 [[package]]
 name = "lock_api"
@@ -1600,7 +1600,7 @@ dependencies = [
  "hex",
  "lazy_static",
  "procfs-core",
- "rustix 0.38.21",
+ "rustix 0.38.28",
 ]
 
 [[package]]
@@ -1842,15 +1842,15 @@ dependencies = [
 
 [[package]]
 name = "rustix"
-version = "0.38.21"
+version = "0.38.28"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "2b426b0506e5d50a7d8dafcf2e81471400deb602392c7dd110815afb4eaf02a3"
+checksum = "72e572a5e8ca657d7366229cdde4bd14c4eb5499a9573d4d366fe1b599daa316"
 dependencies = [
  "bitflags 2.4.0",
  "errno",
  "libc",
- "linux-raw-sys 0.4.10",
- "windows-sys 0.48.0",
+ "linux-raw-sys 0.4.12",
+ "windows-sys 0.52.0",
 ]
 
 [[package]]
@@ -2063,7 +2063,7 @@ dependencies = [
  "cfg-if",
  "fastrand",
  "redox_syscall 0.4.0",
- "rustix 0.38.21",
+ "rustix 0.38.28",
  "windows-sys 0.48.0",
 ]
 
@@ -2083,7 +2083,7 @@ version = "0.3.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "21bebf2b7c9e0a515f6e0f8c51dc0f8e4696391e6f1ff30379559f8365fb0df7"
 dependencies = [
- "rustix 0.38.21",
+ "rustix 0.38.28",
  "windows-sys 0.48.0",
 ]
 
@@ -3403,6 +3403,15 @@ dependencies = [
  "windows-targets 0.48.0",
 ]
 
+[[package]]
+name = "windows-sys"
+version = "0.52.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "282be5f36a8ce781fad8c8ae18fa3f9beff57ec1b52cb3de0789201425d9a33d"
+dependencies = [
+ "windows-targets 0.52.0",
+]
+
 [[package]]
 name = "windows-targets"
 version = "0.42.2"
@@ -3433,6 +3442,21 @@ dependencies = [
  "windows_x86_64_msvc 0.48.0",
 ]
 
+[[package]]
+name = "windows-targets"
+version = "0.52.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8a18201040b24831fbb9e4eb208f8892e1f50a37feb53cc7ff887feb8f50e7cd"
+dependencies = [
+ "windows_aarch64_gnullvm 0.52.0",
+ "windows_aarch64_msvc 0.52.0",
+ "windows_i686_gnu 0.52.0",
+ "windows_i686_msvc 0.52.0",
+ "windows_x86_64_gnu 0.52.0",
+ "windows_x86_64_gnullvm 0.52.0",
+ "windows_x86_64_msvc 0.52.0",
+]
+
 [[package]]
 name = "windows_aarch64_gnullvm"
 version = "0.42.2"
@@ -3445,6 +3469,12 @@ version = "0.48.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "91ae572e1b79dba883e0d315474df7305d12f569b400fcf90581b06062f7e1bc"
 
+[[package]]
+name = "windows_aarch64_gnullvm"
+version = "0.52.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cb7764e35d4db8a7921e09562a0304bf2f93e0a51bfccee0bd0bb0b666b015ea"
+
 [[package]]
 name = "windows_aarch64_msvc"
 version = "0.42.2"
@@ -3457,6 +3487,12 @@ version = "0.48.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "b2ef27e0d7bdfcfc7b868b317c1d32c641a6fe4629c171b8928c7b08d98d7cf3"
 
+[[package]]
+name = "windows_aarch64_msvc"
+version = "0.52.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bbaa0368d4f1d2aaefc55b6fcfee13f41544ddf36801e793edbbfd7d7df075ef"
+
 [[package]]
 name = "windows_i686_gnu"
 version = "0.42.2"
@@ -3469,6 +3505,12 @@ version = "0.48.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "622a1962a7db830d6fd0a69683c80a18fda201879f0f447f065a3b7467daa241"
 
+[[package]]
+name = "windows_i686_gnu"
+version = "0.52.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a28637cb1fa3560a16915793afb20081aba2c92ee8af57b4d5f28e4b3e7df313"
+
 [[package]]
 name = "windows_i686_msvc"
 version = "0.42.2"
@@ -3481,6 +3523,12 @@ version = "0.48.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "4542c6e364ce21bf45d69fdd2a8e455fa38d316158cfd43b3ac1c5b1b19f8e00"
 
+[[package]]
+name = "windows_i686_msvc"
+version = "0.52.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ffe5e8e31046ce6230cc7215707b816e339ff4d4d67c65dffa206fd0f7aa7b9a"
+
 [[package]]
 name = "windows_x86_64_gnu"
 version = "0.42.2"
@@ -3493,6 +3541,12 @@ version = "0.48.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "ca2b8a661f7628cbd23440e50b05d705db3686f894fc9580820623656af974b1"
 
+[[package]]
+name = "windows_x86_64_gnu"
+version = "0.52.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3d6fa32db2bc4a2f5abeacf2b69f7992cd09dca97498da74a151a3132c26befd"
+
 [[package]]
 name = "windows_x86_64_gnullvm"
 version = "0.42.2"
@@ -3505,6 +3559,12 @@ version = "0.48.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "7896dbc1f41e08872e9d5e8f8baa8fdd2677f29468c4e156210174edc7f7b953"
 
+[[package]]
+name = "windows_x86_64_gnullvm"
+version = "0.52.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1a657e1e9d3f514745a572a6846d3c7aa7dbe1658c056ed9c3344c4109a6949e"
+
 [[package]]
 name = "windows_x86_64_msvc"
 version = "0.42.2"
@@ -3517,13 +3577,21 @@ version = "0.48.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "1a515f5799fe4961cb532f983ce2b23082366b898e52ffbce459c86f67c8378a"
 
+[[package]]
+name = "windows_x86_64_msvc"
+version = "0.52.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "dff9641d1cd4be8d1a070daf9e3773c5f67e78b4d9d42263020c057706765c04"
+
 [[package]]
 name = "xattr"
-version = "1.1.1"
+version = "1.1.3"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "fbc6ab6ec1907d1a901cdbcd2bd4cb9e7d64ce5c9739cbb97d3c391acd8c7fae"
+checksum = "a7dae5072fe1f8db8f8d29059189ac175196e410e40ba42d5d4684ae2f750995"
 dependencies = [
  "libc",
+ "linux-raw-sys 0.4.12",
+ "rustix 0.38.28",
 ]
 
 [[package]]
diff --git a/Cargo.toml b/Cargo.toml
index 53e5ce32e96..332131bbe50 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -331,7 +331,7 @@ utf-8 = "0.7.6"
 walkdir = "2.4"
 winapi-util = "0.1.6"
 windows-sys = { version = "0.48.0", default-features = false }
-xattr = "1.1.1"
+xattr = "1.1.3"
 zip = { version = "0.6.6", default-features = false, features = ["deflate"] }
 
 hex = "0.4.3"

From 116245b8eff208c2540fb7a9477d8f3c9842ebc1 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 11 Dec 2023 11:02:22 +0100
Subject: [PATCH 182/429] deny.toml: allow three versions of windows-sys

---
 deny.toml | 18 ++++++++++++++++++
 1 file changed, 18 insertions(+)

diff --git a/deny.toml b/deny.toml
index 03301ad7cd4..df970c2c6e8 100644
--- a/deny.toml
+++ b/deny.toml
@@ -64,8 +64,12 @@ skip = [
   { name = "rustix", version = "0.37.26" },
   # various crates
   { name = "windows-sys", version = "0.45.0" },
+  # various crates
+  { name = "windows-sys", version = "0.48.0" },
   # windows-sys
   { name = "windows-targets", version = "0.42.2" },
+  # windows-sys
+  { name = "windows-targets", version = "0.48.0" },
   # windows-targets
   { name = "windows_aarch64_gnullvm", version = "0.42.2" },
   # windows-targets
@@ -80,6 +84,20 @@ skip = [
   { name = "windows_x86_64_gnullvm", version = "0.42.2" },
   # windows-targets
   { name = "windows_x86_64_msvc", version = "0.42.2" },
+  # windows-targets
+  { name = "windows_aarch64_gnullvm", version = "0.48.0" },
+  # windows-targets
+  { name = "windows_aarch64_msvc", version = "0.48.0" },
+  # windows-targets
+  { name = "windows_i686_gnu", version = "0.48.0" },
+  # windows-targets
+  { name = "windows_i686_msvc", version = "0.48.0" },
+  # windows-targets
+  { name = "windows_x86_64_gnu", version = "0.48.0" },
+  # windows-targets
+  { name = "windows_x86_64_gnullvm", version = "0.48.0" },
+  # windows-targets
+  { name = "windows_x86_64_msvc", version = "0.48.0" },
   # various crates
   { name = "syn", version = "1.0.109" },
   # various crates

From 5d57fdc7f8cf9195c5bbe94ac6cb092087c168f7 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Wed, 13 Dec 2023 09:25:44 +0000
Subject: [PATCH 183/429] chore(deps): update dawidd6/action-download-artifact
 action to v3

---
 .github/workflows/CICD.yml     | 4 ++--
 .github/workflows/GnuTests.yml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index 8c96ce693ee..7629725eef4 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -395,14 +395,14 @@ jobs:
               --arg multisize "$SIZE_MULTI" \
               '{($date): { sha: $sha, size: $size, multisize: $multisize, }}' > size-result.json
     - name: Download the previous individual size result
-      uses: dawidd6/action-download-artifact@v2
+      uses: dawidd6/action-download-artifact@v3
       with:
         workflow: CICD.yml
         name: individual-size-result
         repo: uutils/coreutils
         path: dl
     - name: Download the previous size result
-      uses: dawidd6/action-download-artifact@v2
+      uses: dawidd6/action-download-artifact@v3
       with:
         workflow: CICD.yml
         name: size-result
diff --git a/.github/workflows/GnuTests.yml b/.github/workflows/GnuTests.yml
index 87e4373eddc..f889e5a858b 100644
--- a/.github/workflows/GnuTests.yml
+++ b/.github/workflows/GnuTests.yml
@@ -77,7 +77,7 @@ jobs:
         ref: ${{ steps.vars.outputs.repo_GNU_ref }}
         submodules: recursive
     - name: Retrieve reference artifacts
-      uses: dawidd6/action-download-artifact@v2
+      uses: dawidd6/action-download-artifact@v3
       # ref: <https://github.com/dawidd6/action-download-artifact>
       continue-on-error: true ## don't break the build for missing reference artifacts (may be expired or just not generated yet)
       with:

From 6fb3bbb8a0051b4ef091a781599a1347cdc57705 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Wed, 13 Dec 2023 14:27:19 +0100
Subject: [PATCH 184/429] mv: rename two tests

---
 tests/by-util/test_mv.rs | 20 ++++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/tests/by-util/test_mv.rs b/tests/by-util/test_mv.rs
index 571de769125..3fb002dc3e0 100644
--- a/tests/by-util/test_mv.rs
+++ b/tests/by-util/test_mv.rs
@@ -10,31 +10,31 @@ use std::thread::sleep;
 use std::time::Duration;
 
 #[test]
-fn test_invalid_arg() {
+fn test_mv_invalid_arg() {
     new_ucmd!().arg("--definitely-invalid").fails().code_is(1);
 }
 
 #[test]
-fn test_mv_rename_dir() {
+fn test_mv_missing_dest() {
     let (at, mut ucmd) = at_and_ucmd!();
-    let dir1 = "test_mv_rename_dir";
-    let dir2 = "test_mv_rename_dir2";
+    let dir = "dir";
 
-    at.mkdir(dir1);
-
-    ucmd.arg(dir1).arg(dir2).succeeds().no_stderr();
+    at.mkdir(dir);
 
-    assert!(at.dir_exists(dir2));
+    ucmd.arg(dir).fails();
 }
 
 #[test]
-fn test_mv_fail() {
+fn test_mv_rename_dir() {
     let (at, mut ucmd) = at_and_ucmd!();
     let dir1 = "test_mv_rename_dir";
+    let dir2 = "test_mv_rename_dir2";
 
     at.mkdir(dir1);
 
-    ucmd.arg(dir1).fails();
+    ucmd.arg(dir1).arg(dir2).succeeds().no_stderr();
+
+    assert!(at.dir_exists(dir2));
 }
 
 #[test]

From ebe5c51cee2f9a221df1c3dcd3881c39d6f503d2 Mon Sep 17 00:00:00 2001
From: Jeremy Soller <jackpot51@gmail.com>
Date: Wed, 13 Dec 2023 08:47:16 -0700
Subject: [PATCH 185/429] Format case statements

---
 .github/workflows/CICD.yml | 22 ++++++++++++++++++----
 1 file changed, 18 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index f52ead1f6ca..dc25e58b6e8 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -526,7 +526,13 @@ jobs:
           i686-*) TARGET_ARCH=i686 ;;
           x86_64-*) TARGET_ARCH=x86_64 ;;
         esac;
-        unset TARGET_OS ; case '${{ matrix.job.target }}' in *-linux-*) TARGET_OS=linux ;; *-apple-*) TARGET_OS=macos ;; *-windows-*) TARGET_OS=windows ;; *-redox*) TARGET_OS=redox ;; esac;
+        unset TARGET_OS
+        case '${{ matrix.job.target }}' in
+          *-linux-*) TARGET_OS=linux ;;
+          *-apple-*) TARGET_OS=macos ;;
+          *-windows-*) TARGET_OS=windows ;;
+          *-redox*) TARGET_OS=redox ;;
+        esac
         outputs TARGET_ARCH TARGET_OS
         # package name
         PKG_suffix=".tar.gz" ; case '${{ matrix.job.target }}' in *-pc-windows-*) PKG_suffix=".zip" ;; esac;
@@ -561,10 +567,18 @@ jobs:
         if [ -n "${{ matrix.job.features }}" ]; then CARGO_FEATURES_OPTION='--features=${{ matrix.job.features }}' ; fi
         outputs CARGO_FEATURES_OPTION
         # * CARGO_CMD
-        CARGO_CMD='cross' ; case '${{ matrix.job.use-cross }}' in ''|0|f|false|n|no) CARGO_CMD='cargo' ;; redoxer) CARGO_CMD='redoxer' ;; esac;
+        CARGO_CMD='cross'
+        CARGO_CMD_OPTIONS='+${{ env.RUST_MIN_SRV }}'
+        case '${{ matrix.job.use-cross }}' in
+          ''|0|f|false|n|no)
+            CARGO_CMD='cargo'
+            ;;
+          redoxer)
+            CARGO_CMD='redoxer'
+            CARGO_CMD_OPTIONS=''
+            ;;
+        esac
         outputs CARGO_CMD
-        # * CARGO_CMD_OPTIONS
-        CARGO_CMD_OPTIONS='+${{ env.RUST_MIN_SRV }}' ; case '${{ matrix.job.target }}' in *-redox*) CARGO_CMD_OPTIONS="" ;; esac;
         outputs CARGO_CMD_OPTIONS
         # ** pass needed environment into `cross` container (iff `cross` not already configured via "Cross.toml")
         if [ "${CARGO_CMD}" = 'cross' ] && [ ! -e "Cross.toml" ] ; then

From 7f23faf8999069b283a370991f1f3220619304ba Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Thu, 14 Dec 2023 16:35:56 +0100
Subject: [PATCH 186/429] expr: clean up conversion from bigint to usize

---
 src/uu/expr/src/syntax_tree.rs | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 7817b172137..28e4ff0bd65 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -294,12 +294,14 @@ impl AstNode {
                 let pos = pos
                     .eval()?
                     .eval_as_bigint()
-                    .map_or(0.into(), |n| n.to_usize())
+                    .ok()
+                    .and_then(|n| n.to_usize())
                     .unwrap_or(0);
                 let length = length
                     .eval()?
                     .eval_as_bigint()
-                    .map_or(0.into(), |n| n.to_usize())
+                    .ok()
+                    .and_then(|n| n.to_usize())
                     .unwrap_or(0);
 
                 let (Some(pos), Some(_)) = (pos.checked_sub(1), length.checked_sub(1)) else {

From 97857d5be08d4901508cf5f6bdecf09399b4e8bc Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Thu, 14 Dec 2023 17:51:36 +0000
Subject: [PATCH 187/429] chore(deps): update actions/upload-artifact action to
 v4

---
 .github/workflows/CICD.yml     | 18 +++++++++---------
 .github/workflows/GnuTests.yml | 10 +++++-----
 2 files changed, 14 insertions(+), 14 deletions(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index 7629725eef4..965e2606271 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -439,12 +439,12 @@ jobs:
         previous_multisize=$(cat dl/size-result.json | jq -r '.[] | .multisize')
         check 'multicall binary' "$multisize" "$previous_multisize" 'size-result.json'
     - name: Upload the individual size result
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: individual-size-result
         path: individual-size-result.json
     - name: Upload the size result
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: size-result
         path: size-result.json
@@ -673,7 +673,7 @@ jobs:
       env:
         RUST_BACKTRACE: "1"
     - name: Archive executable artifacts
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: ${{ env.PROJECT_NAME }}-${{ matrix.job.target }}
         path: target/${{ matrix.job.target }}/release/${{ env.PROJECT_NAME }}${{ steps.vars.outputs.EXE_suffix }}
@@ -784,17 +784,17 @@ jobs:
           HASH=$(sha1sum '${{ steps.vars.outputs.TEST_SUMMARY_FILE }}' | cut --delim=" " -f 1)
           echo "HASH=${HASH}" >> $GITHUB_OUTPUT
     - name: Reserve SHA1/ID of 'test-summary'
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: "${{ steps.summary.outputs.HASH }}"
         path: "${{ steps.vars.outputs.TEST_SUMMARY_FILE }}"
     - name: Reserve test results summary
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: test-summary
         path: "${{ steps.vars.outputs.TEST_SUMMARY_FILE }}"
     - name: Upload json results
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: busybox-result.json
         path: ${{ steps.vars.outputs.TEST_SUMMARY_FILE }}
@@ -872,17 +872,17 @@ jobs:
         HASH=$(sha1sum '${{ steps.vars.outputs.TEST_SUMMARY_FILE }}' | cut --delim=" " -f 1)
           echo "HASH=${HASH}" >> $GITHUB_OUTPUT
     - name: Reserve SHA1/ID of 'test-summary'
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: "${{ steps.summary.outputs.HASH }}"
         path: "${{ steps.vars.outputs.TEST_SUMMARY_FILE }}"
     - name: Reserve test results summary
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: test-summary
         path: "${{ steps.vars.outputs.TEST_SUMMARY_FILE }}"
     - name: Upload json results
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: toybox-result.json
         path: ${{ steps.vars.outputs.TEST_SUMMARY_FILE }}
diff --git a/.github/workflows/GnuTests.yml b/.github/workflows/GnuTests.yml
index f889e5a858b..5215ab24f83 100644
--- a/.github/workflows/GnuTests.yml
+++ b/.github/workflows/GnuTests.yml
@@ -179,22 +179,22 @@ jobs:
           # Compress logs before upload (fails otherwise)
           gzip ${{ steps.vars.outputs.TEST_LOGS_GLOB }}
     - name: Reserve SHA1/ID of 'test-summary'
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: "${{ steps.summary.outputs.HASH }}"
         path: "${{ steps.vars.outputs.TEST_SUMMARY_FILE }}"
     - name: Reserve test results summary
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: test-summary
         path: "${{ steps.vars.outputs.TEST_SUMMARY_FILE }}"
     - name: Reserve test logs
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: test-logs
         path: "${{ steps.vars.outputs.TEST_LOGS_GLOB }}"
     - name: Upload full json results
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: gnu-full-result.json
         path: ${{ steps.vars.outputs.TEST_FULL_SUMMARY_FILE }}
@@ -288,7 +288,7 @@ jobs:
         if test -n "${have_new_failures}" ; then exit -1 ; fi
     - name: Upload comparison log (for GnuComment workflow)
       if: success() || failure() # run regardless of prior step success/failure
-      uses: actions/upload-artifact@v3
+      uses: actions/upload-artifact@v4
       with:
         name: comment
         path: ${{ steps.vars.outputs.path_reference }}/comment/

From 3a7a3bf63941492c7885ba0287c78854a6950c12 Mon Sep 17 00:00:00 2001
From: Arpit Bhadauria <singharpit511@gmail.com>
Date: Fri, 15 Dec 2023 16:44:31 +0530
Subject: [PATCH 188/429] fmt: remove crash! macro (#5589)

* fmt: remove crash! macro

* Fix styling in fmt

* Revert "Fix styling in fmt"

This reverts commit 002e02f50c5bfebfc69fb1acb86d39a36d96d97d.

* Revert "fmt: remove crash! macro"

This reverts commit d65a3f85a1840d0c1d2e32f927e951a62258370f.

* Replace crash! with unreachable! macro

* Remove crash! import

* Remove unreachable! from fmt

* keep the helpful comment

* Fix lint and format issues

* review fixes
---
 src/uu/fmt/src/linebreak.rs | 40 +++++++++++++++++--------------------
 1 file changed, 18 insertions(+), 22 deletions(-)

diff --git a/src/uu/fmt/src/linebreak.rs b/src/uu/fmt/src/linebreak.rs
index 306c15f3614..7393589d0b3 100644
--- a/src/uu/fmt/src/linebreak.rs
+++ b/src/uu/fmt/src/linebreak.rs
@@ -8,8 +8,6 @@
 use std::io::{BufWriter, Stdout, Write};
 use std::{cmp, i64, mem};
 
-use uucore::crash;
-
 use crate::parasplit::{ParaWords, Paragraph, WordInfo};
 use crate::FmtOptions;
 
@@ -363,28 +361,26 @@ fn find_kp_breakpoints<'a, T: Iterator<Item = &'a WordInfo<'a>>>(
 }
 
 fn build_best_path<'a>(paths: &[LineBreak<'a>], active: &[usize]) -> Vec<(&'a WordInfo<'a>, bool)> {
-    let mut breakwords = vec![];
     // of the active paths, we select the one with the fewest demerits
-    let mut best_idx = match active.iter().min_by_key(|&&a| paths[a].demerits) {
-        None => crash!(
-            1,
-            "Failed to find a k-p linebreak solution. This should never happen."
-        ),
-        Some(&s) => s,
-    };
-
-    // now, chase the pointers back through the break list, recording
-    // the words at which we should break
-    loop {
-        let next_best = &paths[best_idx];
-        match next_best.linebreak {
-            None => return breakwords,
-            Some(prev) => {
-                breakwords.push((prev, next_best.break_before));
-                best_idx = next_best.prev;
+    active
+        .iter()
+        .min_by_key(|&&a| paths[a].demerits)
+        .map(|&(mut best_idx)| {
+            let mut breakwords = vec![];
+            // now, chase the pointers back through the break list, recording
+            // the words at which we should break
+            loop {
+                let next_best = &paths[best_idx];
+                match next_best.linebreak {
+                    None => return breakwords,
+                    Some(prev) => {
+                        breakwords.push((prev, next_best.break_before));
+                        best_idx = next_best.prev;
+                    }
+                }
             }
-        }
-    }
+        })
+        .unwrap_or_default()
 }
 
 // "infinite" badness is more like (1+BAD_INFTY)^2 because of how demerits are computed

From c32e730a1f0f0625158571dd528cde7519515f81 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 15 Dec 2023 14:38:27 +0100
Subject: [PATCH 189/429] all: remove collect_{lossy,ignore} calls where
 possible

---
 src/uu/base32/src/base_common.rs  | 3 +--
 src/uu/cat/src/cat.rs             | 2 --
 src/uu/chroot/src/chroot.rs       | 2 --
 src/uu/cksum/src/cksum.rs         | 2 --
 src/uu/comm/src/comm.rs           | 2 --
 src/uu/csplit/src/csplit.rs       | 2 --
 src/uu/dd/src/dd.rs               | 2 --
 src/uu/dircolors/src/dircolors.rs | 2 --
 src/uu/dirname/src/dirname.rs     | 2 --
 src/uu/du/src/du.rs               | 2 --
 src/uu/echo/src/echo.rs           | 1 -
 src/uu/expr/src/expr.rs           | 2 --
 src/uu/logname/src/logname.rs     | 2 --
 src/uu/mkfifo/src/mkfifo.rs       | 2 --
 src/uu/mknod/src/mknod.rs         | 1 -
 src/uu/mktemp/src/mktemp.rs       | 6 +++---
 src/uu/more/src/more.rs           | 1 -
 src/uu/nl/src/nl.rs               | 2 --
 src/uu/nohup/src/nohup.rs         | 2 --
 src/uu/pathchk/src/pathchk.rs     | 2 --
 src/uu/pinky/src/pinky.rs         | 2 --
 src/uu/printf/src/printf.rs       | 1 -
 src/uu/ptx/src/ptx.rs             | 2 --
 src/uu/shred/src/shred.rs         | 2 --
 src/uu/shuf/src/shuf.rs           | 2 --
 src/uu/sort/src/sort.rs           | 1 -
 src/uu/stdbuf/src/stdbuf.rs       | 2 --
 src/uu/stty/src/stty.rs           | 2 --
 src/uu/sum/src/sum.rs             | 2 --
 src/uu/tac/src/tac.rs             | 2 --
 src/uu/timeout/src/timeout.rs     | 2 --
 src/uu/tr/src/tr.rs               | 2 --
 src/uu/tsort/src/tsort.rs         | 2 --
 src/uu/who/src/who.rs             | 2 --
 34 files changed, 4 insertions(+), 64 deletions(-)

diff --git a/src/uu/base32/src/base_common.rs b/src/uu/base32/src/base_common.rs
index 74c3dc80879..2112a40ead7 100644
--- a/src/uu/base32/src/base_common.rs
+++ b/src/uu/base32/src/base_common.rs
@@ -87,8 +87,7 @@ pub fn parse_base_cmd_args(
     usage: &str,
 ) -> UResult<Config> {
     let command = base_app(about, usage);
-    let arg_list = args.collect_lossy();
-    Config::from(&command.try_get_matches_from(arg_list)?)
+    Config::from(&command.try_get_matches_from(args)?)
 }
 
 pub fn base_app(about: &'static str, usage: &str) -> Command {
diff --git a/src/uu/cat/src/cat.rs b/src/uu/cat/src/cat.rs
index 34eb265129d..8aaecb8c175 100644
--- a/src/uu/cat/src/cat.rs
+++ b/src/uu/cat/src/cat.rs
@@ -174,8 +174,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let number_mode = if matches.get_flag(options::NUMBER_NONBLANK) {
diff --git a/src/uu/chroot/src/chroot.rs b/src/uu/chroot/src/chroot.rs
index 6366775c36d..9ea861d46d1 100644
--- a/src/uu/chroot/src/chroot.rs
+++ b/src/uu/chroot/src/chroot.rs
@@ -33,8 +33,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().try_get_matches_from(args).with_exit_code(125)?;
 
     let default_shell: &'static str = "/bin/sh";
diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index 629bb457fd8..24576040937 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -221,8 +221,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let algo_name: &str = match matches.get_one::<String>(options::ALGORITHM) {
diff --git a/src/uu/comm/src/comm.rs b/src/uu/comm/src/comm.rs
index e6977142ef5..dd49ef53b02 100644
--- a/src/uu/comm/src/comm.rs
+++ b/src/uu/comm/src/comm.rs
@@ -145,8 +145,6 @@ fn open_file(name: &str, line_ending: LineEnding) -> io::Result<LineReader> {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().try_get_matches_from(args)?;
     let line_ending = LineEnding::from_zero_flag(matches.get_flag(options::ZERO_TERMINATED));
     let filename1 = matches.get_one::<String>(options::FILE_1).unwrap();
diff --git a/src/uu/csplit/src/csplit.rs b/src/uu/csplit/src/csplit.rs
index d33be1a5d54..00bebbf4dcb 100644
--- a/src/uu/csplit/src/csplit.rs
+++ b/src/uu/csplit/src/csplit.rs
@@ -552,8 +552,6 @@ where
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     // get the file to split
diff --git a/src/uu/dd/src/dd.rs b/src/uu/dd/src/dd.rs
index b721d1d72ee..e849fcd2a2a 100644
--- a/src/uu/dd/src/dd.rs
+++ b/src/uu/dd/src/dd.rs
@@ -1267,8 +1267,6 @@ fn is_fifo(filename: &str) -> bool {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let settings: Settings = Parser::new().parse(
diff --git a/src/uu/dircolors/src/dircolors.rs b/src/uu/dircolors/src/dircolors.rs
index ecca9d16033..531c3ee474c 100644
--- a/src/uu/dircolors/src/dircolors.rs
+++ b/src/uu/dircolors/src/dircolors.rs
@@ -129,8 +129,6 @@ fn generate_ls_colors(fmt: &OutputFmt, sep: &str) -> String {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let files = matches
diff --git a/src/uu/dirname/src/dirname.rs b/src/uu/dirname/src/dirname.rs
index 51935cb7f23..a645b05fd72 100644
--- a/src/uu/dirname/src/dirname.rs
+++ b/src/uu/dirname/src/dirname.rs
@@ -21,8 +21,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().after_help(AFTER_HELP).try_get_matches_from(args)?;
 
     let line_ending = LineEnding::from_zero_flag(matches.get_flag(options::ZERO));
diff --git a/src/uu/du/src/du.rs b/src/uu/du/src/du.rs
index 7114ccc2668..1213e004f15 100644
--- a/src/uu/du/src/du.rs
+++ b/src/uu/du/src/du.rs
@@ -590,8 +590,6 @@ pub fn div_ceil(a: u64, b: u64) -> u64 {
 #[uucore::main]
 #[allow(clippy::cognitive_complexity)]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let summarize = matches.get_flag(options::SUMMARIZE);
diff --git a/src/uu/echo/src/echo.rs b/src/uu/echo/src/echo.rs
index b3707b6f898..522cb0c9457 100644
--- a/src/uu/echo/src/echo.rs
+++ b/src/uu/echo/src/echo.rs
@@ -118,7 +118,6 @@ fn print_escaped(input: &str, mut output: impl Write) -> io::Result<ControlFlow<
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
     let matches = uu_app().get_matches_from(args);
 
     let no_newline = matches.get_flag(options::NO_NEWLINE);
diff --git a/src/uu/expr/src/expr.rs b/src/uu/expr/src/expr.rs
index c271f0935fd..1e19b6e12dc 100644
--- a/src/uu/expr/src/expr.rs
+++ b/src/uu/expr/src/expr.rs
@@ -98,8 +98,6 @@ pub fn uu_app() -> Command {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     // For expr utility we do not want getopts.
     // The following usage should work without escaping hyphens: `expr -15 = 1 +  2 \* \( 3 - -4 \)`
     let matches = uu_app().try_get_matches_from(args)?;
diff --git a/src/uu/logname/src/logname.rs b/src/uu/logname/src/logname.rs
index 55d4fec75ee..02a78cf4c3c 100644
--- a/src/uu/logname/src/logname.rs
+++ b/src/uu/logname/src/logname.rs
@@ -30,8 +30,6 @@ const USAGE: &str = help_usage!("logname.md");
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let _ = uu_app().try_get_matches_from(args)?;
 
     match get_userlogin() {
diff --git a/src/uu/mkfifo/src/mkfifo.rs b/src/uu/mkfifo/src/mkfifo.rs
index 39d1127394e..9320f76ed04 100644
--- a/src/uu/mkfifo/src/mkfifo.rs
+++ b/src/uu/mkfifo/src/mkfifo.rs
@@ -22,8 +22,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     if matches.contains_id(options::CONTEXT) {
diff --git a/src/uu/mknod/src/mknod.rs b/src/uu/mknod/src/mknod.rs
index ceafd235b01..15a0fdacdb8 100644
--- a/src/uu/mknod/src/mknod.rs
+++ b/src/uu/mknod/src/mknod.rs
@@ -68,7 +68,6 @@ fn _mknod(file_name: &str, mode: mode_t, dev: dev_t) -> i32 {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
     // Linux-specific options, not implemented
     // opts.optflag("Z", "", "set the SELinux security context to default type");
     // opts.optopt("", "context", "like -Z, or if CTX is specified then set the SELinux or SMACK security context to CTX");
diff --git a/src/uu/mktemp/src/mktemp.rs b/src/uu/mktemp/src/mktemp.rs
index d52351a8948..ae44225c9a6 100644
--- a/src/uu/mktemp/src/mktemp.rs
+++ b/src/uu/mktemp/src/mktemp.rs
@@ -12,6 +12,7 @@ use uucore::{format_usage, help_about, help_usage};
 
 use std::env;
 use std::error::Error;
+use std::ffi::OsStr;
 use std::fmt::Display;
 use std::io::ErrorKind;
 use std::iter;
@@ -308,8 +309,7 @@ impl Params {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
+    let args: Vec<_> = args.collect();
     let matches = match uu_app().try_get_matches_from(&args) {
         Ok(m) => m,
         Err(e) => {
@@ -333,7 +333,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         // If POSIXLY_CORRECT was set, template MUST be the last argument.
         if matches.contains_id(ARG_TEMPLATE) {
             // Template argument was provided, check if was the last one.
-            if args.last().unwrap() != &options.template {
+            if args.last().unwrap() != OsStr::new(&options.template) {
                 return Err(Box::new(MkTempError::TooManyTemplates));
             }
         }
diff --git a/src/uu/more/src/more.rs b/src/uu/more/src/more.rs
index b21b2ab1f35..f651a033b54 100644
--- a/src/uu/more/src/more.rs
+++ b/src/uu/more/src/more.rs
@@ -87,7 +87,6 @@ impl Options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
     let matches = match uu_app().try_get_matches_from(args) {
         Ok(m) => m,
         Err(e) => return Err(e.into()),
diff --git a/src/uu/nl/src/nl.rs b/src/uu/nl/src/nl.rs
index eaf27f3b6f4..7d7688650aa 100644
--- a/src/uu/nl/src/nl.rs
+++ b/src/uu/nl/src/nl.rs
@@ -178,8 +178,6 @@ pub mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let mut settings = Settings::default();
diff --git a/src/uu/nohup/src/nohup.rs b/src/uu/nohup/src/nohup.rs
index c64f7bf71ba..602cb7ca70f 100644
--- a/src/uu/nohup/src/nohup.rs
+++ b/src/uu/nohup/src/nohup.rs
@@ -74,8 +74,6 @@ impl Display for NohupError {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().try_get_matches_from(args).with_exit_code(125)?;
 
     replace_fds()?;
diff --git a/src/uu/pathchk/src/pathchk.rs b/src/uu/pathchk/src/pathchk.rs
index 81c35208864..ffb214e2ebf 100644
--- a/src/uu/pathchk/src/pathchk.rs
+++ b/src/uu/pathchk/src/pathchk.rs
@@ -36,8 +36,6 @@ const POSIX_NAME_MAX: usize = 14;
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     // set working mode
diff --git a/src/uu/pinky/src/pinky.rs b/src/uu/pinky/src/pinky.rs
index 8ac8f6c8446..02161cb364a 100644
--- a/src/uu/pinky/src/pinky.rs
+++ b/src/uu/pinky/src/pinky.rs
@@ -47,8 +47,6 @@ fn get_long_usage() -> String {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app()
         .after_help(get_long_usage())
         .try_get_matches_from(args)?;
diff --git a/src/uu/printf/src/printf.rs b/src/uu/printf/src/printf.rs
index 663411b8952..ad42e38941f 100644
--- a/src/uu/printf/src/printf.rs
+++ b/src/uu/printf/src/printf.rs
@@ -27,7 +27,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
     let matches = uu_app().get_matches_from(args);
 
     let format_string = matches
diff --git a/src/uu/ptx/src/ptx.rs b/src/uu/ptx/src/ptx.rs
index 6dd2b2992e0..7caa8f4a5d4 100644
--- a/src/uu/ptx/src/ptx.rs
+++ b/src/uu/ptx/src/ptx.rs
@@ -715,8 +715,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let mut input_files: Vec<String> = match &matches.get_many::<String>(options::FILE) {
diff --git a/src/uu/shred/src/shred.rs b/src/uu/shred/src/shred.rs
index 711fd0485cc..d4209aa3a97 100644
--- a/src/uu/shred/src/shred.rs
+++ b/src/uu/shred/src/shred.rs
@@ -200,8 +200,6 @@ impl BytesWriter {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     if !matches.contains_id(options::FILE) {
diff --git a/src/uu/shuf/src/shuf.rs b/src/uu/shuf/src/shuf.rs
index 8c636f1cb1d..de302435cb6 100644
--- a/src/uu/shuf/src/shuf.rs
+++ b/src/uu/shuf/src/shuf.rs
@@ -47,8 +47,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let mode = if let Some(args) = matches.get_many::<String>(options::ECHO) {
diff --git a/src/uu/sort/src/sort.rs b/src/uu/sort/src/sort.rs
index 4e6e841874b..bc331915b14 100644
--- a/src/uu/sort/src/sort.rs
+++ b/src/uu/sort/src/sort.rs
@@ -1029,7 +1029,6 @@ fn make_sort_mode_arg(mode: &'static str, short: char, help: &'static str) -> Ar
 #[uucore::main]
 #[allow(clippy::cognitive_complexity)]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
     let mut settings = GlobalSettings::default();
 
     let matches = match uu_app().try_get_matches_from(args) {
diff --git a/src/uu/stdbuf/src/stdbuf.rs b/src/uu/stdbuf/src/stdbuf.rs
index 38c4451ca50..2436274e7f8 100644
--- a/src/uu/stdbuf/src/stdbuf.rs
+++ b/src/uu/stdbuf/src/stdbuf.rs
@@ -141,8 +141,6 @@ fn get_preload_env(tmp_dir: &TempDir) -> UResult<(String, PathBuf)> {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let options = ProgramOptions::try_from(&matches).map_err(|e| UUsageError::new(125, e.0))?;
diff --git a/src/uu/stty/src/stty.rs b/src/uu/stty/src/stty.rs
index 669285750b4..5a5c31f5e60 100644
--- a/src/uu/stty/src/stty.rs
+++ b/src/uu/stty/src/stty.rs
@@ -176,8 +176,6 @@ ioctl_write_ptr_bad!(
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let opts = Options::from(&matches)?;
diff --git a/src/uu/sum/src/sum.rs b/src/uu/sum/src/sum.rs
index 38ad3964ec8..d1f383351aa 100644
--- a/src/uu/sum/src/sum.rs
+++ b/src/uu/sum/src/sum.rs
@@ -102,8 +102,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let files: Vec<String> = match matches.get_many::<String>(options::FILE) {
diff --git a/src/uu/tac/src/tac.rs b/src/uu/tac/src/tac.rs
index b8cb61029da..3865c61ae48 100644
--- a/src/uu/tac/src/tac.rs
+++ b/src/uu/tac/src/tac.rs
@@ -33,8 +33,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let before = matches.get_flag(options::BEFORE);
diff --git a/src/uu/timeout/src/timeout.rs b/src/uu/timeout/src/timeout.rs
index 5e73fe2ab50..958bc647e10 100644
--- a/src/uu/timeout/src/timeout.rs
+++ b/src/uu/timeout/src/timeout.rs
@@ -107,8 +107,6 @@ impl Config {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().try_get_matches_from(args).with_exit_code(125)?;
 
     let config = Config::from(&matches)?;
diff --git a/src/uu/tr/src/tr.rs b/src/uu/tr/src/tr.rs
index 9c6e7a7da58..010228260ed 100644
--- a/src/uu/tr/src/tr.rs
+++ b/src/uu/tr/src/tr.rs
@@ -33,8 +33,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().after_help(AFTER_HELP).try_get_matches_from(args)?;
 
     let delete_flag = matches.get_flag(options::DELETE);
diff --git a/src/uu/tsort/src/tsort.rs b/src/uu/tsort/src/tsort.rs
index e71710847ea..3ae4f4f97e6 100644
--- a/src/uu/tsort/src/tsort.rs
+++ b/src/uu/tsort/src/tsort.rs
@@ -20,8 +20,6 @@ mod options {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_lossy();
-
     let matches = uu_app().try_get_matches_from(args)?;
 
     let input = matches
diff --git a/src/uu/who/src/who.rs b/src/uu/who/src/who.rs
index 5d952efffb2..788368aaf8c 100644
--- a/src/uu/who/src/who.rs
+++ b/src/uu/who/src/who.rs
@@ -54,8 +54,6 @@ fn get_long_usage() -> String {
 
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app()
         .after_help(get_long_usage())
         .try_get_matches_from(args)?;

From 92692c815dc1d44f8af548589cec98eccf91527e Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 15 Dec 2023 15:02:46 +0100
Subject: [PATCH 190/429] docs: add winget installer (#5648)

* docs: add winget installer

* docs: add "winget" to spell-checker:ignore

---------

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 docs/src/installation.md | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/docs/src/installation.md b/docs/src/installation.md
index 54b1e23f3f6..9eba96b55e7 100644
--- a/docs/src/installation.md
+++ b/docs/src/installation.md
@@ -1,4 +1,4 @@
-<!-- spell-checker:ignore pacman pamac nixpkgs openmandriva conda -->
+<!-- spell-checker:ignore pacman pamac nixpkgs openmandriva conda winget -->
 
 # Installation
 
@@ -131,6 +131,12 @@ pkg install rust-coreutils
 
 ## Windows
 
+### Winget
+
+```shell
+winget install uutils.coreutils
+```
+
 ### Scoop
 
 [![Scoop package](https://repology.org/badge/version-for-repo/scoop/uutils-coreutils.svg)](https://scoop.sh/#/apps?q=uutils-coreutils&s=0&d=1&o=true)

From 8ce6fdc1950d0be2e59f23f46d987912f655e779 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 15 Dec 2023 15:35:22 +0100
Subject: [PATCH 191/429] docs: remove scoop badge, adapt links to repos

---
 docs/src/installation.md | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/docs/src/installation.md b/docs/src/installation.md
index 9eba96b55e7..dadc6e58e1a 100644
--- a/docs/src/installation.md
+++ b/docs/src/installation.md
@@ -12,7 +12,7 @@ You can also [build uutils from source](build.md).
 
 ## Cargo
 
-[![crates.io package](https://repology.org/badge/version-for-repo/crates_io/uutils-coreutils.svg)](https://repology.org/project/uutils-coreutils/versions)
+[![crates.io package](https://repology.org/badge/version-for-repo/crates_io/uutils-coreutils.svg)](https://crates.io/crates/coreutils)
 
 ```shell
 # Linux
@@ -65,9 +65,9 @@ emerge -pv sys-apps/uutils-coreutils
 
 ### Manjaro
 
-![Manjaro Stable package](https://repology.org/badge/version-for-repo/manjaro_stable/uutils-coreutils.svg)
-[![Manjaro Testing package](https://repology.org/badge/version-for-repo/manjaro_testing/uutils-coreutils.svg)](https://repology.org/project/uutils-coreutils/versions)
-[![Manjaro Unstable package](https://repology.org/badge/version-for-repo/manjaro_unstable/uutils-coreutils.svg)](https://repology.org/project/uutils-coreutils/versions)
+[![Manjaro Stable package](https://repology.org/badge/version-for-repo/manjaro_stable/uutils-coreutils.svg)](https://packages.manjaro.org/?query=uutils-coreutils)
+[![Manjaro Testing package](https://repology.org/badge/version-for-repo/manjaro_testing/uutils-coreutils.svg)](https://packages.manjaro.org/?query=uutils-coreutils)
+[![Manjaro Unstable package](https://repology.org/badge/version-for-repo/manjaro_unstable/uutils-coreutils.svg)](https://packages.manjaro.org/?query=uutils-coreutils)
 
 ```shell
 pacman -S uutils-coreutils
@@ -77,7 +77,7 @@ pamac install uutils-coreutils
 
 ### NixOS
 
-[![nixpkgs unstable package](https://repology.org/badge/version-for-repo/nix_unstable/uutils-coreutils.svg)](https://repology.org/project/uutils-coreutils/versions)
+[![nixpkgs unstable package](https://repology.org/badge/version-for-repo/nix_unstable/uutils-coreutils.svg)](https://search.nixos.org/packages?query=uutils-coreutils)
 
 ```shell
 nix-env -iA nixos.uutils-coreutils
@@ -139,7 +139,7 @@ winget install uutils.coreutils
 
 ### Scoop
 
-[![Scoop package](https://repology.org/badge/version-for-repo/scoop/uutils-coreutils.svg)](https://scoop.sh/#/apps?q=uutils-coreutils&s=0&d=1&o=true)
+[Scoop package](https://scoop.sh/#/apps?q=uutils-coreutils&s=0&d=1&o=true)
 
 ```shell
 scoop install uutils-coreutils
@@ -152,7 +152,7 @@ scoop install uutils-coreutils
 [Conda package](https://anaconda.org/conda-forge/uutils-coreutils)
 
 ```
-conda install -c conda-forge uutils-coreutils 
+conda install -c conda-forge uutils-coreutils
 ```
 
 ## Non-standard packages

From 30c27c143c988b947cb00111b3d09e97ef4ae74d Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Fri, 15 Dec 2023 15:56:41 +0100
Subject: [PATCH 192/429] mknod: remove parsemode.rs

This file was entirely unused, so it's probably safe to remove it
---
 src/uu/mknod/src/parsemode.rs | 57 -----------------------------------
 1 file changed, 57 deletions(-)
 delete mode 100644 src/uu/mknod/src/parsemode.rs

diff --git a/src/uu/mknod/src/parsemode.rs b/src/uu/mknod/src/parsemode.rs
deleted file mode 100644
index c38800bcb0d..00000000000
--- a/src/uu/mknod/src/parsemode.rs
+++ /dev/null
@@ -1,57 +0,0 @@
-// This file is part of the uutils coreutils package.
-//
-// For the full copyright and license information, please view the LICENSE
-// file that was distributed with this source code.
-// spell-checker:ignore (path) osrelease
-
-use libc::{mode_t, S_IRGRP, S_IROTH, S_IRUSR, S_IWGRP, S_IWOTH, S_IWUSR};
-
-use uucore::mode;
-
-pub const MODE_RW_UGO: mode_t = S_IRUSR | S_IWUSR | S_IRGRP | S_IWGRP | S_IROTH | S_IWOTH;
-
-pub fn parse_mode(mode: &str) -> Result<mode_t, String> {
-    let result = if mode.chars().any(|c| c.is_ascii_digit()) {
-        mode::parse_numeric(MODE_RW_UGO as u32, mode)
-    } else {
-        mode::parse_symbolic(MODE_RW_UGO as u32, mode, true)
-    };
-    result.map(|mode| mode as mode_t)
-}
-
-#[cfg(test)]
-mod test {
-    /// Test if the program is running under WSL
-    // ref: <https://github.com/microsoft/WSL/issues/4555> @@ <https://archive.is/dP0bz>
-    // ToDO: test on WSL2 which likely doesn't need special handling; plan change to `is_wsl_1()` if WSL2 is less needy
-    pub fn is_wsl() -> bool {
-        #[cfg(target_os = "linux")]
-        {
-            if let Ok(b) = std::fs::read("/proc/sys/kernel/osrelease") {
-                if let Ok(s) = std::str::from_utf8(&b) {
-                    let a = s.to_ascii_lowercase();
-                    return a.contains("microsoft") || a.contains("wsl");
-                }
-            }
-        }
-        false
-    }
-
-    #[test]
-    fn symbolic_modes() {
-        assert_eq!(super::parse_mode("u+x").unwrap(), 0o766);
-        assert_eq!(
-            super::parse_mode("+x").unwrap(),
-            if is_wsl() { 0o776 } else { 0o777 }
-        );
-        assert_eq!(super::parse_mode("a-w").unwrap(), 0o444);
-        assert_eq!(super::parse_mode("g-r").unwrap(), 0o626);
-    }
-
-    #[test]
-    fn numeric_modes() {
-        assert_eq!(super::parse_mode("644").unwrap(), 0o644);
-        assert_eq!(super::parse_mode("+100").unwrap(), 0o766);
-        assert_eq!(super::parse_mode("-4").unwrap(), 0o662);
-    }
-}

From c2276f4f6b62ffc2a21c6156bb299b5ceae9c5cb Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 15 Dec 2023 17:10:24 +0100
Subject: [PATCH 193/429] ci: rename test summary names for busybox & toybox

---
 .github/workflows/CICD.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index 965e2606271..4e01799088e 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -791,7 +791,7 @@ jobs:
     - name: Reserve test results summary
       uses: actions/upload-artifact@v4
       with:
-        name: test-summary
+        name: busybox-test-summary
         path: "${{ steps.vars.outputs.TEST_SUMMARY_FILE }}"
     - name: Upload json results
       uses: actions/upload-artifact@v4
@@ -879,7 +879,7 @@ jobs:
     - name: Reserve test results summary
       uses: actions/upload-artifact@v4
       with:
-        name: test-summary
+        name: toybox-test-summary
         path: "${{ steps.vars.outputs.TEST_SUMMARY_FILE }}"
     - name: Upload json results
       uses: actions/upload-artifact@v4

From cc0a0fdb201eb30783c2dbdb5c67bdcbc383577f Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 16 Dec 2023 09:17:29 +0100
Subject: [PATCH 194/429] ignore-intermittent.txt: adjust the renamed test name

---
 .github/workflows/ignore-intermittent.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/ignore-intermittent.txt b/.github/workflows/ignore-intermittent.txt
index 759bd96eb8a..e163202a2ca 100644
--- a/.github/workflows/ignore-intermittent.txt
+++ b/.github/workflows/ignore-intermittent.txt
@@ -1,3 +1,3 @@
-tests/tail-2/inotify-dir-recreate
+tests/tail/inotify-dir-recreate
 tests/misc/timeout
 tests/rm/rm1

From 01000a37a3316927a0ce3a0cd8411fc5c3363178 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 16 Dec 2023 09:40:38 +0100
Subject: [PATCH 195/429] fix two minor clippy warnings

---
 src/uu/dd/src/dd.rs | 2 +-
 src/uu/tr/src/tr.rs | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/uu/dd/src/dd.rs b/src/uu/dd/src/dd.rs
index e849fcd2a2a..07a754deb51 100644
--- a/src/uu/dd/src/dd.rs
+++ b/src/uu/dd/src/dd.rs
@@ -1181,7 +1181,7 @@ fn calc_loop_bsize(
             cmp::min(ideal_bsize as u64, rremain * ibs as u64) as usize
         }
         Some(Num::Bytes(bmax)) => {
-            let bmax: u128 = (*bmax).try_into().unwrap();
+            let bmax: u128 = (*bmax).into();
             let bremain: u128 = bmax - wstat.bytes_total;
             cmp::min(ideal_bsize as u128, bremain) as usize
         }
diff --git a/src/uu/tr/src/tr.rs b/src/uu/tr/src/tr.rs
index 010228260ed..628a0efa84b 100644
--- a/src/uu/tr/src/tr.rs
+++ b/src/uu/tr/src/tr.rs
@@ -61,7 +61,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         ));
     }
 
-    if let Some(first) = sets.get(0) {
+    if let Some(first) = sets.first() {
         if first.ends_with('\\') {
             show!(USimpleError::new(
                 0,

From f6d3f9afbfb47ad9752c0cfe6ee21c459b56c615 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Fri, 15 Dec 2023 22:49:35 +0100
Subject: [PATCH 196/429] ls: manages the COLOR and COLORTERM variables

Should fix GNU tests/ls/color-term.sh
---
 src/uu/ls/src/ls.rs      | 33 +++++++++++++++++++++-
 tests/by-util/test_ls.rs | 61 +++++++++++++++++++++++++++++++++++++++-
 2 files changed, 92 insertions(+), 2 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 1fceefe17fb..424ef8cc12e 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3,7 +3,7 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-// spell-checker:ignore (ToDO) somegroup nlink tabsize dired subdired dtype
+// spell-checker:ignore (ToDO) somegroup nlink tabsize dired subdired dtype colorterm
 
 use clap::{
     builder::{NonEmptyStringValueParser, ValueParser},
@@ -553,12 +553,43 @@ fn extract_time(options: &clap::ArgMatches) -> Time {
     }
 }
 
+// Some env variables can be passed
+// For now, we are only verifying if empty or not and known for TERM
+fn is_color_compatible_term() -> bool {
+    let is_term_set = std::env::var("TERM").is_ok();
+    let is_colorterm_set = std::env::var("COLORTERM").is_ok();
+
+    let term = std::env::var("TERM").unwrap_or_default();
+    let colorterm = std::env::var("COLORTERM").unwrap_or_default();
+
+    // Search function to manage the "*" into the data structure
+    let term_matches = |term: &str| -> bool {
+        uucore::colors::TERMS.iter().any(|&pattern| {
+            term == pattern
+                || (pattern.ends_with('*') && term.starts_with(&pattern[..pattern.len() - 1]))
+        })
+    };
+
+    if is_term_set && colorterm.is_empty() && is_colorterm_set && term.is_empty() {
+        return false;
+    }
+
+    if !term.is_empty() && !term_matches(&term) {
+        return false;
+    }
+    true
+}
+
 /// Extracts the color option to use based on the options provided.
 ///
 /// # Returns
 ///
 /// A boolean representing whether or not to use color.
 fn extract_color(options: &clap::ArgMatches) -> bool {
+    if !is_color_compatible_term() {
+        return false;
+    }
+
     match options.get_one::<String>(options::COLOR) {
         None => options.contains_id(options::COLOR),
         Some(val) => match val.as_str() {
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index c3460633a22..ca1da8b7ece 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -2,7 +2,7 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
-// spell-checker:ignore (words) READMECAREFULLY birthtime doesntexist oneline somebackup lrwx somefile somegroup somehiddenbackup somehiddenfile tabsize aaaaaaaa bbbb cccc dddddddd ncccc neee naaaaa nbcdef nfffff dired subdired tmpfs mdir
+// spell-checker:ignore (words) READMECAREFULLY birthtime doesntexist oneline somebackup lrwx somefile somegroup somehiddenbackup somehiddenfile tabsize aaaaaaaa bbbb cccc dddddddd ncccc neee naaaaa nbcdef nfffff dired subdired tmpfs mdir COLORTERM mexe
 
 #[cfg(any(unix, feature = "feat_selinux"))]
 use crate::common::util::expected_result;
@@ -3988,3 +3988,62 @@ fn test_ls_color_do_not_reset() {
         "\\u{1b}[0m\\u{1b}[01;34ma\\u{1b}[0m\\n\\u{1b}[01;34mb\\u{1b}[0m\\n"
     );
 }
+
+#[cfg(all(unix, feature = "chmod"))]
+#[test]
+fn test_term_colorterm() {
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+    at.touch("exe");
+    scene.ccmd("chmod").arg("+x").arg("exe").succeeds();
+
+    // Should show colors
+    let result = scene
+        .ucmd()
+        .arg("--color=always")
+        .env("LS_COLORS", "")
+        .env("TERM", "")
+        .succeeds();
+    assert_eq!(
+        result.stdout_str().trim().escape_default().to_string(),
+        "\\u{1b}[0m\\u{1b}[01;32mexe\\u{1b}[0m"
+    );
+
+    // Should show colors
+    let result = scene
+        .ucmd()
+        .arg("--color=always")
+        .env("LS_COLORS", "")
+        .env("COLORTERM", "")
+        .succeeds();
+    assert_eq!(
+        result.stdout_str().trim().escape_default().to_string(),
+        "\\u{1b}[0m\\u{1b}[01;32mexe\\u{1b}[0m"
+    );
+
+    // No colors
+    let result = scene
+        .ucmd()
+        .arg("--color=always")
+        .env("LS_COLORS", "")
+        .env("TERM", "")
+        .env("COLORTERM", "")
+        .succeeds();
+    assert_eq!(
+        result.stdout_str().trim().escape_default().to_string(),
+        "exe"
+    );
+
+    // No colors
+    let result = scene
+        .ucmd()
+        .arg("--color=always")
+        .env("LS_COLORS", "")
+        .env("TERM", "dumb")
+        .env("COLORTERM", "")
+        .succeeds();
+    assert_eq!(
+        result.stdout_str().trim().escape_default().to_string(),
+        "exe"
+    );
+}

From 6621a1d6d677f2d9744f4fc94e9711622e96980b Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 16 Dec 2023 10:30:17 +0100
Subject: [PATCH 197/429] Apply the change from
 c32e730a1f0f0625158571dd528cde7519515f81 too

---
 src/uu/pinky/src/platform/unix.rs | 2 --
 1 file changed, 2 deletions(-)

diff --git a/src/uu/pinky/src/platform/unix.rs b/src/uu/pinky/src/platform/unix.rs
index 381acacd2f6..ecea2b9f29e 100644
--- a/src/uu/pinky/src/platform/unix.rs
+++ b/src/uu/pinky/src/platform/unix.rs
@@ -31,8 +31,6 @@ fn get_long_usage() -> String {
 }
 
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app()
         .after_help(get_long_usage())
         .try_get_matches_from(args)?;

From afc6ac81145ee61294504d123768d3e9843d0685 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 16 Dec 2023 10:30:47 +0100
Subject: [PATCH 198/429] Apply change from
 c32e730a1f0f0625158571dd528cde7519515f81

---
 src/uu/who/src/platform/unix.rs | 2 --
 1 file changed, 2 deletions(-)

diff --git a/src/uu/who/src/platform/unix.rs b/src/uu/who/src/platform/unix.rs
index 17eaa9af961..b59b73a5703 100644
--- a/src/uu/who/src/platform/unix.rs
+++ b/src/uu/who/src/platform/unix.rs
@@ -28,8 +28,6 @@ fn get_long_usage() -> String {
 }
 
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
-    let args = args.collect_ignore();
-
     let matches = uu_app()
         .after_help(get_long_usage())
         .try_get_matches_from(args)?;

From 5c37df6e46822246c9bb54620d9395ac2afd5137 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sat, 16 Dec 2023 14:31:41 +0100
Subject: [PATCH 199/429] docs: remove two notes

---
 docs/src/installation.md | 4 ----
 1 file changed, 4 deletions(-)

diff --git a/docs/src/installation.md b/docs/src/installation.md
index dadc6e58e1a..238a4db9b61 100644
--- a/docs/src/installation.md
+++ b/docs/src/installation.md
@@ -53,8 +53,6 @@ apt install rust-coreutils
 export PATH=/usr/lib/cargo/bin/coreutils:$PATH
 ```
 
-> **Note**: Only available from Bookworm (Debian 12)
-
 ### Gentoo
 
 [![Gentoo package](https://repology.org/badge/version-for-repo/gentoo/uutils-coreutils.svg)](https://packages.gentoo.org/packages/sys-apps/uutils-coreutils)
@@ -101,8 +99,6 @@ apt install rust-coreutils
 export PATH=/usr/lib/cargo/bin/coreutils:$PATH
 ```
 
-> **Note**: Only available from Kinetic (Ubuntu 22.10)
-
 ## MacOS
 
 ### Homebrew

From ba0c89fc5e3ce04192e7558278437eb26d668f93 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 16 Dec 2023 15:06:58 +0100
Subject: [PATCH 200/429] build-gnu.sh: build in debug by default. Easier for
 local dev

---
 .github/workflows/GnuTests.yml |  4 ++--
 DEVELOPMENT.md                 |  4 ++--
 util/build-gnu.sh              | 17 +++++++++++++----
 3 files changed, 17 insertions(+), 8 deletions(-)

diff --git a/.github/workflows/GnuTests.yml b/.github/workflows/GnuTests.yml
index 5215ab24f83..3ce6e8be27b 100644
--- a/.github/workflows/GnuTests.yml
+++ b/.github/workflows/GnuTests.yml
@@ -116,7 +116,7 @@ jobs:
       run: |
         ## Build binaries
         cd '${{ steps.vars.outputs.path_UUTILS }}'
-        bash util/build-gnu.sh
+        bash util/build-gnu.sh --release-build
     - name: Run GNU tests
       shell: bash
       run: |
@@ -354,7 +354,7 @@ jobs:
       run: |
         ## Build binaries
         cd uutils
-        UU_MAKE_PROFILE=debug bash util/build-gnu.sh
+        bash util/build-gnu.sh
     - name: Run GNU tests
       run: bash uutils/util/run-gnu-test.sh
     - name: Generate coverage data (via `grcov`)
diff --git a/DEVELOPMENT.md b/DEVELOPMENT.md
index 67b201e9cc3..29cfe2b2a3c 100644
--- a/DEVELOPMENT.md
+++ b/DEVELOPMENT.md
@@ -226,8 +226,8 @@ To run uutils against the GNU test suite locally, run the following commands:
 
 ```shell
 bash util/build-gnu.sh
-# Build uutils without release optimizations
-UU_MAKE_PROFILE=debug bash util/build-gnu.sh
+# Build uutils with release optimizations
+bash util/build-gnu.sh --release-build
 bash util/run-gnu-test.sh
 # To run a single test:
 bash util/run-gnu-test.sh tests/touch/not-owner.sh # for example
diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 7c0691c0697..4a14f3f6c4d 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -1,7 +1,6 @@
 #!/bin/bash
 # `build-gnu.bash` ~ builds GNU coreutils (from supplied sources)
 #
-# UU_MAKE_PROFILE == 'debug' | 'release' ## build profile for *uutils* build; may be supplied by caller, defaults to 'release'
 
 # spell-checker:ignore (paths) abmon deref discrim eacces getlimits getopt ginstall inacc infloop inotify reflink ; (misc) INT_OFLOW OFLOW baddecode submodules ; (vars/env) SRCDIR vdir rcexp xpart dired
 
@@ -11,6 +10,19 @@ ME="${0}"
 ME_dir="$(dirname -- "$(readlink -fm -- "${ME}")")"
 REPO_main_dir="$(dirname -- "${ME_dir}")"
 
+# Default profile is 'debug'
+UU_MAKE_PROFILE='debug'
+
+for arg in "$@"
+do
+    if [ "$arg" == "--release-build" ]; then
+        UU_MAKE_PROFILE='release'
+        break
+    fi
+done
+
+echo "UU_MAKE_PROFILE='${UU_MAKE_PROFILE}'"
+
 ### * config (from environment with fallback defaults); note: GNU is expected to be a sibling repo directory
 
 path_UUTILS=${path_UUTILS:-${REPO_main_dir}}
@@ -56,9 +68,6 @@ echo "path_GNU='${path_GNU}'"
 
 ###
 
-UU_MAKE_PROFILE=${UU_MAKE_PROFILE:-release}
-echo "UU_MAKE_PROFILE='${UU_MAKE_PROFILE}'"
-
 UU_BUILD_DIR="${path_UUTILS}/target/${UU_MAKE_PROFILE}"
 echo "UU_BUILD_DIR='${UU_BUILD_DIR}'"
 

From 9167a843586d9a27402eb380ebe195df507c9161 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sat, 16 Dec 2023 17:17:44 +0100
Subject: [PATCH 201/429] ls: enable "colors" feature

---
 src/uu/ls/Cargo.toml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/src/uu/ls/Cargo.toml b/src/uu/ls/Cargo.toml
index a82a1f37e07..d11eeb27ce3 100644
--- a/src/uu/ls/Cargo.toml
+++ b/src/uu/ls/Cargo.toml
@@ -24,6 +24,7 @@ terminal_size = { workspace = true }
 glob = { workspace = true }
 lscolors = { workspace = true }
 uucore = { workspace = true, features = [
+  "colors",
   "entries",
   "fs",
   "quoting-style",

From 052f38f14d5e9f7e100aa8f1c40feefbcc5e3418 Mon Sep 17 00:00:00 2001
From: Akmal <xkmxlfirdxus@gmail.com>
Date: Sun, 17 Dec 2023 17:43:00 +0200
Subject: [PATCH 202/429]  unexpand: remove crash! macro (#5588)

* unexpand_macro_fixed

* unexpand

* Remove crash

* Passed local test case

* Small changes

* unexpand: remove #[allow(clippy::cognitive_complexity)]

---------

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 src/uu/unexpand/src/unexpand.rs | 192 ++++++++++++++++----------------
 1 file changed, 95 insertions(+), 97 deletions(-)

diff --git a/src/uu/unexpand/src/unexpand.rs b/src/uu/unexpand/src/unexpand.rs
index 11ad43060a6..66d9a0187b6 100644
--- a/src/uu/unexpand/src/unexpand.rs
+++ b/src/uu/unexpand/src/unexpand.rs
@@ -14,8 +14,8 @@ use std::num::IntErrorKind;
 use std::str::from_utf8;
 use unicode_width::UnicodeWidthChar;
 use uucore::display::Quotable;
-use uucore::error::{FromIo, UError, UResult};
-use uucore::{crash, crash_if_err, format_usage, help_about, help_usage};
+use uucore::error::{FromIo, UError, UResult, USimpleError};
+use uucore::{crash_if_err, format_usage, help_about, help_usage};
 
 const USAGE: &str = help_usage!("unexpand.md");
 const ABOUT: &str = help_about!("unexpand.md");
@@ -161,7 +161,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     let matches = uu_app().try_get_matches_from(expand_shortcuts(&args))?;
 
-    unexpand(&Options::new(&matches)?).map_err_context(String::new)
+    unexpand(&Options::new(&matches)?)
 }
 
 pub fn uu_app() -> Command {
@@ -209,16 +209,13 @@ pub fn uu_app() -> Command {
         )
 }
 
-fn open(path: &str) -> BufReader<Box<dyn Read + 'static>> {
+fn open(path: &str) -> UResult<BufReader<Box<dyn Read + 'static>>> {
     let file_buf;
     if path == "-" {
-        BufReader::new(Box::new(stdin()) as Box<dyn Read>)
+        Ok(BufReader::new(Box::new(stdin()) as Box<dyn Read>))
     } else {
-        file_buf = match File::open(path) {
-            Ok(a) => a,
-            Err(e) => crash!(1, "{}: {}", path.maybe_quote(), e),
-        };
-        BufReader::new(Box::new(file_buf) as Box<dyn Read>)
+        file_buf = File::open(path).map_err_context(|| path.to_string())?;
+        Ok(BufReader::new(Box::new(file_buf) as Box<dyn Read>))
     }
 }
 
@@ -315,106 +312,107 @@ fn next_char_info(uflag: bool, buf: &[u8], byte: usize) -> (CharType, usize, usi
 }
 
 #[allow(clippy::cognitive_complexity)]
-fn unexpand(options: &Options) -> std::io::Result<()> {
+fn unexpand_line(
+    buf: &mut Vec<u8>,
+    output: &mut BufWriter<std::io::Stdout>,
+    options: &Options,
+    lastcol: usize,
+    ts: &[usize],
+) -> std::io::Result<()> {
+    let mut byte = 0; // offset into the buffer
+    let mut col = 0; // the current column
+    let mut scol = 0; // the start col for the current span, i.e., the already-printed width
+    let mut init = true; // are we at the start of the line?
+    let mut pctype = CharType::Other;
+
+    while byte < buf.len() {
+        // when we have a finite number of columns, never convert past the last column
+        if lastcol > 0 && col >= lastcol {
+            write_tabs(output, ts, scol, col, pctype == CharType::Tab, init, true);
+            output.write_all(&buf[byte..])?;
+            scol = col;
+            break;
+        }
+
+        // figure out how big the next char is, if it's UTF-8
+        let (ctype, cwidth, nbytes) = next_char_info(options.uflag, buf, byte);
+
+        // now figure out how many columns this char takes up, and maybe print it
+        let tabs_buffered = init || options.aflag;
+        match ctype {
+            CharType::Space | CharType::Tab => {
+                // compute next col, but only write space or tab chars if not buffering
+                col += if ctype == CharType::Space {
+                    1
+                } else {
+                    next_tabstop(ts, col).unwrap_or(1)
+                };
+
+                if !tabs_buffered {
+                    output.write_all(&buf[byte..byte + nbytes])?;
+                    scol = col; // now printed up to this column
+                }
+            }
+            CharType::Other | CharType::Backspace => {
+                // always
+                write_tabs(
+                    output,
+                    ts,
+                    scol,
+                    col,
+                    pctype == CharType::Tab,
+                    init,
+                    options.aflag,
+                );
+                init = false; // no longer at the start of a line
+                col = if ctype == CharType::Other {
+                    // use computed width
+                    col + cwidth
+                } else if col > 0 {
+                    // Backspace case, but only if col > 0
+                    col - 1
+                } else {
+                    0
+                };
+                output.write_all(&buf[byte..byte + nbytes])?;
+                scol = col; // we've now printed up to this column
+            }
+        }
+
+        byte += nbytes; // move on to next char
+        pctype = ctype; // save the previous type
+    }
+
+    // write out anything remaining
+    write_tabs(output, ts, scol, col, pctype == CharType::Tab, init, true);
+    output.flush()?;
+    buf.truncate(0); // clear out the buffer
+
+    Ok(())
+}
+
+fn unexpand(options: &Options) -> UResult<()> {
     let mut output = BufWriter::new(stdout());
     let ts = &options.tabstops[..];
     let mut buf = Vec::new();
     let lastcol = if ts.len() > 1 { *ts.last().unwrap() } else { 0 };
 
     for file in &options.files {
-        let mut fh = open(file);
+        let mut fh = match open(file) {
+            Ok(reader) => reader,
+            Err(err) => {
+                return Err(USimpleError::new(1, err.to_string()));
+            }
+        };
 
         while match fh.read_until(b'\n', &mut buf) {
             Ok(s) => s > 0,
             Err(_) => !buf.is_empty(),
         } {
-            let mut byte = 0; // offset into the buffer
-            let mut col = 0; // the current column
-            let mut scol = 0; // the start col for the current span, i.e., the already-printed width
-            let mut init = true; // are we at the start of the line?
-            let mut pctype = CharType::Other;
-
-            while byte < buf.len() {
-                // when we have a finite number of columns, never convert past the last column
-                if lastcol > 0 && col >= lastcol {
-                    write_tabs(
-                        &mut output,
-                        ts,
-                        scol,
-                        col,
-                        pctype == CharType::Tab,
-                        init,
-                        true,
-                    );
-                    output.write_all(&buf[byte..])?;
-                    scol = col;
-                    break;
-                }
-
-                // figure out how big the next char is, if it's UTF-8
-                let (ctype, cwidth, nbytes) = next_char_info(options.uflag, &buf, byte);
-
-                // now figure out how many columns this char takes up, and maybe print it
-                let tabs_buffered = init || options.aflag;
-                match ctype {
-                    CharType::Space | CharType::Tab => {
-                        // compute next col, but only write space or tab chars if not buffering
-                        col += if ctype == CharType::Space {
-                            1
-                        } else {
-                            next_tabstop(ts, col).unwrap_or(1)
-                        };
-
-                        if !tabs_buffered {
-                            output.write_all(&buf[byte..byte + nbytes])?;
-                            scol = col; // now printed up to this column
-                        }
-                    }
-                    CharType::Other | CharType::Backspace => {
-                        // always
-                        write_tabs(
-                            &mut output,
-                            ts,
-                            scol,
-                            col,
-                            pctype == CharType::Tab,
-                            init,
-                            options.aflag,
-                        );
-                        init = false; // no longer at the start of a line
-                        col = if ctype == CharType::Other {
-                            // use computed width
-                            col + cwidth
-                        } else if col > 0 {
-                            // Backspace case, but only if col > 0
-                            col - 1
-                        } else {
-                            0
-                        };
-                        output.write_all(&buf[byte..byte + nbytes])?;
-                        scol = col; // we've now printed up to this column
-                    }
-                }
-
-                byte += nbytes; // move on to next char
-                pctype = ctype; // save the previous type
-            }
-
-            // write out anything remaining
-            write_tabs(
-                &mut output,
-                ts,
-                scol,
-                col,
-                pctype == CharType::Tab,
-                init,
-                true,
-            );
-            output.flush()?;
-            buf.truncate(0); // clear out the buffer
+            unexpand_line(&mut buf, &mut output, options, lastcol, ts)?;
         }
     }
-    output.flush()
+    Ok(())
 }
 
 #[cfg(test)]

From af2625c8ce64cd4ddd406b1d86c4b056d8f64ebb Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 17 Dec 2023 17:39:02 +0100
Subject: [PATCH 203/429] fix order

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 src/uu/ls/src/ls.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 424ef8cc12e..77f7913425d 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -570,7 +570,7 @@ fn is_color_compatible_term() -> bool {
         })
     };
 
-    if is_term_set && colorterm.is_empty() && is_colorterm_set && term.is_empty() {
+    if is_term_set && term.is_empty() && is_colorterm_set && colorterm.is_empty() {
         return false;
     }
 

From 5b451599961043de7e31c2e43f5bfe714416c218 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 17 Dec 2023 17:40:44 +0100
Subject: [PATCH 204/429] Improve the comment

---
 src/uu/ls/src/ls.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 77f7913425d..bfce1db7929 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -562,7 +562,7 @@ fn is_color_compatible_term() -> bool {
     let term = std::env::var("TERM").unwrap_or_default();
     let colorterm = std::env::var("COLORTERM").unwrap_or_default();
 
-    // Search function to manage the "*" into the data structure
+    // Search function in the TERM struct to manage the wildcards
     let term_matches = |term: &str| -> bool {
         uucore::colors::TERMS.iter().any(|&pattern| {
             term == pattern

From b2e26f2aec6268df23a4e2289aad6b9ec82ecd27 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 17 Dec 2023 17:57:21 +0100
Subject: [PATCH 205/429] fuzz: Simplify the compare_result function

---
 fuzz/fuzz_targets/fuzz_common.rs | 34 ++++++++++++++++++--------------
 fuzz/fuzz_targets/fuzz_echo.rs   |  8 ++------
 fuzz/fuzz_targets/fuzz_expr.rs   |  8 ++------
 fuzz/fuzz_targets/fuzz_printf.rs |  8 ++------
 fuzz/fuzz_targets/fuzz_seq.rs    |  8 ++------
 fuzz/fuzz_targets/fuzz_test.rs   |  8 ++------
 6 files changed, 29 insertions(+), 45 deletions(-)

diff --git a/fuzz/fuzz_targets/fuzz_common.rs b/fuzz/fuzz_targets/fuzz_common.rs
index 2adbb3dd677..89c82fba25e 100644
--- a/fuzz/fuzz_targets/fuzz_common.rs
+++ b/fuzz/fuzz_targets/fuzz_common.rs
@@ -222,15 +222,19 @@ pub fn run_gnu_cmd(
     }
 }
 
+/// Compare results from two different implementations of a command.
+///
+/// # Arguments
+/// * `test_type` - The command.
+/// * `input` - The input provided to the command.
+/// * `rust_result` - The result of running the command with the Rust implementation.
+/// * `gnu_result` - The result of running the command with the GNU implementation.
+/// * `fail_on_stderr_diff` - Whether to fail the test if there is a difference in stderr output.
 pub fn compare_result(
     test_type: &str,
     input: &str,
-    rust_stdout: &str,
-    gnu_stdout: &str,
-    rust_stderr: &str,
-    gnu_stderr: &str,
-    rust_exit_code: i32,
-    gnu_exit_code: i32,
+    rust_result: &CommandResult,
+    gnu_result: &CommandResult,
     fail_on_stderr_diff: bool,
 ) {
     println!("Test Type: {}", test_type);
@@ -239,24 +243,24 @@ pub fn compare_result(
     let mut discrepancies = Vec::new();
     let mut should_panic = false;
 
-    if rust_stdout.trim() != gnu_stdout.trim() {
+    if rust_result.stdout.trim() != gnu_result.stdout.trim() {
         discrepancies.push("stdout differs");
-        println!("Rust stdout: {}", rust_stdout);
-        println!("GNU stdout: {}", gnu_stdout);
+        println!("Rust stdout: {}", rust_result.stdout);
+        println!("GNU stdout: {}", gnu_result.stdout);
         should_panic = true;
     }
-    if rust_stderr.trim() != gnu_stderr.trim() {
+    if rust_result.stderr.trim() != gnu_result.stderr.trim() {
         discrepancies.push("stderr differs");
-        println!("Rust stderr: {}", rust_stderr);
-        println!("GNU stderr: {}", gnu_stderr);
+        println!("Rust stderr: {}", rust_result.stderr);
+        println!("GNU stderr: {}", gnu_result.stderr);
         if fail_on_stderr_diff {
             should_panic = true;
         }
     }
-    if rust_exit_code != gnu_exit_code {
+    if rust_result.exit_code != gnu_result.exit_code {
         discrepancies.push("exit code differs");
-        println!("Rust exit code: {}", rust_exit_code);
-        println!("GNU exit code: {}", gnu_exit_code);
+        println!("Rust exit code: {}", rust_result.exit_code);
+        println!("GNU exit code: {}", gnu_result.exit_code);
         should_panic = true;
     }
 
diff --git a/fuzz/fuzz_targets/fuzz_echo.rs b/fuzz/fuzz_targets/fuzz_echo.rs
index fda7fd7276f..bc391bd3e05 100644
--- a/fuzz/fuzz_targets/fuzz_echo.rs
+++ b/fuzz/fuzz_targets/fuzz_echo.rs
@@ -78,12 +78,8 @@ fuzz_target!(|_data: &[u8]| {
     compare_result(
         "echo",
         &format!("{:?}", &args[1..]),
-        &rust_result.stdout,
-        &gnu_result.stdout,
-        &rust_result.stderr,
-        &gnu_result.stderr,
-        rust_result.exit_code,
-        gnu_result.exit_code,
+        &rust_result,
+        &gnu_result,
         true,
     );
 });
diff --git a/fuzz/fuzz_targets/fuzz_expr.rs b/fuzz/fuzz_targets/fuzz_expr.rs
index 8d1848545ff..ce5535b16e1 100644
--- a/fuzz/fuzz_targets/fuzz_expr.rs
+++ b/fuzz/fuzz_targets/fuzz_expr.rs
@@ -86,12 +86,8 @@ fuzz_target!(|_data: &[u8]| {
     compare_result(
         "expr",
         &format!("{:?}", &args[1..]),
-        &rust_result.stdout,
-        &gnu_result.stdout,
-        &rust_result.stderr,
-        &gnu_result.stderr,
-        rust_result.exit_code,
-        gnu_result.exit_code,
+        &rust_result,
+        &gnu_result,
         false, // Set to true if you want to fail on stderr diff
     );
 });
diff --git a/fuzz/fuzz_targets/fuzz_printf.rs b/fuzz/fuzz_targets/fuzz_printf.rs
index 78bb3e3ce3b..25cf58c8e1b 100644
--- a/fuzz/fuzz_targets/fuzz_printf.rs
+++ b/fuzz/fuzz_targets/fuzz_printf.rs
@@ -99,12 +99,8 @@ fuzz_target!(|_data: &[u8]| {
     compare_result(
         "printf",
         &format!("{:?}", &args[1..]),
-        &rust_result.stdout,
-        &gnu_result.stdout,
-        &rust_result.stderr,
-        &gnu_result.stderr,
-        rust_result.exit_code,
-        gnu_result.exit_code,
+        &rust_result,
+        &gnu_result,
         false, // Set to true if you want to fail on stderr diff
     );
 });
diff --git a/fuzz/fuzz_targets/fuzz_seq.rs b/fuzz/fuzz_targets/fuzz_seq.rs
index 2e4ff1a4662..fdeaed16dc3 100644
--- a/fuzz/fuzz_targets/fuzz_seq.rs
+++ b/fuzz/fuzz_targets/fuzz_seq.rs
@@ -67,12 +67,8 @@ fuzz_target!(|_data: &[u8]| {
     compare_result(
         "seq",
         &format!("{:?}", &args[1..]),
-        &rust_result.stdout,
-        &gnu_result.stdout,
-        &rust_result.stderr,
-        &gnu_result.stderr,
-        rust_result.exit_code,
-        gnu_result.exit_code,
+        &rust_result,
+        &gnu_result,
         false, // Set to true if you want to fail on stderr diff
     );
 });
diff --git a/fuzz/fuzz_targets/fuzz_test.rs b/fuzz/fuzz_targets/fuzz_test.rs
index 38cd691b389..eeee2dc3e2c 100644
--- a/fuzz/fuzz_targets/fuzz_test.rs
+++ b/fuzz/fuzz_targets/fuzz_test.rs
@@ -203,12 +203,8 @@ fuzz_target!(|_data: &[u8]| {
     compare_result(
         "test",
         &format!("{:?}", &args[1..]),
-        &rust_result.stdout,
-        &gnu_result.stdout,
-        &rust_result.stderr,
-        &gnu_result.stderr,
-        rust_result.exit_code,
-        gnu_result.exit_code,
+        &rust_result,
+        &gnu_result,
         false, // Set to true if you want to fail on stderr diff
     );
 });

From d8d555dd66d02e6448f212814f1e1703f4fd51c1 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 18 Dec 2023 08:22:25 +0100
Subject: [PATCH 206/429] ci: fix warnings from "cargo tree"

---
 .github/workflows/CICD.yml  | 4 ++--
 .github/workflows/FixPR.yml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index 5c242d65f34..8a7ff3f0624 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -208,7 +208,7 @@ jobs:
         echo "## dependency list"
         ## * using the 'stable' toolchain is necessary to avoid "unexpected '--filter-platform'" errors
         RUSTUP_TOOLCHAIN=stable cargo fetch --locked --quiet
-        RUSTUP_TOOLCHAIN=stable cargo tree --all --locked --no-dev-dependencies --no-indent ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }} | grep -vE "$PWD" | sort --unique
+        RUSTUP_TOOLCHAIN=stable cargo tree --no-dedupe --locked -e=no-dev --prefix=none ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }} | grep -vE "$PWD" | sort --unique
     - name: Test
       run: cargo nextest run --hide-progress-bar --profile ci ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }} -p uucore -p coreutils
       env:
@@ -670,7 +670,7 @@ jobs:
         # dependencies
         echo "## dependency list"
         cargo fetch --locked --quiet
-        cargo tree --locked --target=${{ matrix.job.target }} ${{ matrix.job.cargo-options }} ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }} --all --no-dev-dependencies --no-indent | grep -vE "$PWD" | sort --unique
+        cargo tree --locked --target=${{ matrix.job.target }} ${{ matrix.job.cargo-options }} ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }} --no-dedupe -e=no-dev --prefix=none | grep -vE "$PWD" | sort --unique
     - name: Build
       shell: bash
       run: |
diff --git a/.github/workflows/FixPR.yml b/.github/workflows/FixPR.yml
index 7f5e5234d8b..e837b354687 100644
--- a/.github/workflows/FixPR.yml
+++ b/.github/workflows/FixPR.yml
@@ -63,7 +63,7 @@ jobs:
         echo "## dependency list"
         cargo fetch --locked --quiet
         ## * using the 'stable' toolchain is necessary to avoid "unexpected '--filter-platform'" errors
-        RUSTUP_TOOLCHAIN=stable cargo tree --locked --all --no-dev-dependencies --no-indent --features ${{ matrix.job.features }} | grep -vE "$PWD" | sort --unique
+        RUSTUP_TOOLCHAIN=stable cargo tree --locked --no-dedupe -e=no-dev --prefix=none --features ${{ matrix.job.features }} | grep -vE "$PWD" | sort --unique
     - name: Commit any changes (to '${{ env.BRANCH_TARGET }}')
       uses: EndBug/add-and-commit@v9
       with:

From bd22aba03b5617c4dec93dd5950fd75fe47ff780 Mon Sep 17 00:00:00 2001
From: Yykz <yykz@proton.me>
Date: Mon, 18 Dec 2023 12:47:37 +0100
Subject: [PATCH 207/429] make args of wc overriding

---
 src/uu/wc/src/wc.rs | 1 +
 1 file changed, 1 insertion(+)

diff --git a/src/uu/wc/src/wc.rs b/src/uu/wc/src/wc.rs
index 83081124d1b..d69647c3804 100644
--- a/src/uu/wc/src/wc.rs
+++ b/src/uu/wc/src/wc.rs
@@ -395,6 +395,7 @@ pub fn uu_app() -> Command {
         .about(ABOUT)
         .override_usage(format_usage(USAGE))
         .infer_long_args(true)
+        .args_override_self(true)
         .arg(
             Arg::new(options::BYTES)
                 .short('c')

From cae113c23757665262c7853c0fe8f0772b132203 Mon Sep 17 00:00:00 2001
From: Yykz <yykz@proton.me>
Date: Mon, 18 Dec 2023 14:12:59 +0100
Subject: [PATCH 208/429] Added tests

---
 tests/by-util/test_wc.rs | 13 +++++++++++++
 1 file changed, 13 insertions(+)

diff --git a/tests/by-util/test_wc.rs b/tests/by-util/test_wc.rs
index 9c55bd3bca5..df2551555b3 100644
--- a/tests/by-util/test_wc.rs
+++ b/tests/by-util/test_wc.rs
@@ -725,3 +725,16 @@ fn files0_from_dir() {
         .fails()
         .stderr_only(dir_err!("-"));
 }
+
+#[test]
+fn test_args_override() {
+    new_ucmd!()
+        .args(&["-ll", "-l", "alice_in_wonderland.txt"])
+        .run()
+        .stdout_is("5 alice_in_wonderland.txt\n");
+
+    new_ucmd!()
+        .args(&["--total=always", "--total=never", "alice_in_wonderland.txt"])
+        .run()
+        .stdout_is("  5  57 302 alice_in_wonderland.txt\n");
+}
\ No newline at end of file

From 8c6463c5258bb6a3d7f27ac5a2003e723eac4fd1 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 18 Dec 2023 14:24:19 +0100
Subject: [PATCH 209/429] ls: extract "create_hyperlink" function

---
 src/uu/ls/src/ls.rs | 54 ++++++++++++++++++++++++---------------------
 1 file changed, 29 insertions(+), 25 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index a802a2d609f..59018d0d27e 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3047,31 +3047,7 @@ fn display_file_name(
     let mut width = name.width();
 
     if config.hyperlink {
-        let hostname = hostname::get().unwrap_or(OsString::from(""));
-        let hostname = hostname.to_string_lossy();
-
-        let absolute_path = fs::canonicalize(&path.p_buf).unwrap_or_default();
-        let absolute_path = absolute_path.to_string_lossy();
-
-        #[cfg(not(target_os = "windows"))]
-        let unencoded_chars = "_-.:~/";
-        #[cfg(target_os = "windows")]
-        let unencoded_chars = "_-.:~/\\";
-
-        // percentage encoding of path
-        let absolute_path: String = absolute_path
-            .chars()
-            .map(|c| {
-                if c.is_alphanumeric() || unencoded_chars.contains(c) {
-                    c.to_string()
-                } else {
-                    format!("%{:02x}", c as u8)
-                }
-            })
-            .collect();
-
-        // \x1b = ESC, \x07 = BEL
-        name = format!("\x1b]8;;file://{hostname}{absolute_path}\x07{name}\x1b]8;;\x07");
+        name = create_hyperlink(&name, path);
     }
 
     if let Some(ls_colors) = &config.color {
@@ -3208,6 +3184,34 @@ fn display_file_name(
     }
 }
 
+fn create_hyperlink(name: &str, path: &PathData) -> String {
+    let hostname = hostname::get().unwrap_or(OsString::from(""));
+    let hostname = hostname.to_string_lossy();
+
+    let absolute_path = fs::canonicalize(&path.p_buf).unwrap_or_default();
+    let absolute_path = absolute_path.to_string_lossy();
+
+    #[cfg(not(target_os = "windows"))]
+    let unencoded_chars = "_-.:~/";
+    #[cfg(target_os = "windows")]
+    let unencoded_chars = "_-.:~/\\";
+
+    // percentage encoding of path
+    let absolute_path: String = absolute_path
+        .chars()
+        .map(|c| {
+            if c.is_alphanumeric() || unencoded_chars.contains(c) {
+                c.to_string()
+            } else {
+                format!("%{:02x}", c as u8)
+            }
+        })
+        .collect();
+
+    // \x1b = ESC, \x07 = BEL
+    format!("\x1b]8;;file://{hostname}{absolute_path}\x07{name}\x1b]8;;\x07")
+}
+
 /// We need this struct to be able to store the previous style.
 /// This because we need to check the previous value in case we don't need
 /// the reset

From 917c6a4743ebd9ea3e7c471198b710f1dcb7ad40 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 18 Dec 2023 15:09:07 +0100
Subject: [PATCH 210/429] ls: support hyperlinks for dir names

---
 src/uu/ls/src/ls.rs      | 16 +++++++++++-----
 tests/by-util/test_ls.rs | 36 ++++++++++++++++++++++++++++++++++++
 2 files changed, 47 insertions(+), 5 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 59018d0d27e..8d1ecdbc630 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -1926,8 +1926,14 @@ impl PathData {
     }
 }
 
-fn show_dir_name(dir: &Path, out: &mut BufWriter<Stdout>) {
-    write!(out, "{}:", dir.display()).unwrap();
+fn show_dir_name(path_data: &PathData, out: &mut BufWriter<Stdout>, config: &Config) {
+    if config.hyperlink {
+        let name = escape_name(&path_data.display_name, &config.quoting_style);
+        let hyperlink = create_hyperlink(&name, path_data);
+        write!(out, "{}:", hyperlink).unwrap();
+    } else {
+        write!(out, "{}:", path_data.p_buf.display()).unwrap();
+    }
 }
 
 #[allow(clippy::cognitive_complexity)]
@@ -1995,7 +2001,7 @@ pub fn list(locs: Vec<&Path>, config: &Config) -> UResult<()> {
                 if config.dired {
                     dired::indent(&mut out)?;
                 }
-                show_dir_name(&path_data.p_buf, &mut out);
+                show_dir_name(path_data, &mut out, config);
                 writeln!(out)?;
                 if config.dired {
                     // First directory displayed
@@ -2007,7 +2013,7 @@ pub fn list(locs: Vec<&Path>, config: &Config) -> UResult<()> {
                 }
             } else {
                 writeln!(out)?;
-                show_dir_name(&path_data.p_buf, &mut out);
+                show_dir_name(path_data, &mut out, config);
                 writeln!(out)?;
             }
         }
@@ -2232,7 +2238,7 @@ fn enter_directory(
                             dired::add_dir_name(dired, dir_name_size);
                         }
 
-                        show_dir_name(&e.p_buf, out);
+                        show_dir_name(e, out, config);
                         writeln!(out)?;
                         enter_directory(
                             e,
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index c68f96e6cad..e503807d6fe 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -4001,6 +4001,42 @@ fn test_ls_hyperlink_encode_link() {
 }
 // spell-checker: enable
 
+#[test]
+fn test_ls_hyperlink_dirs() {
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+    let dir_a = "a";
+    let dir_b = "b";
+
+    at.mkdir(dir_a);
+    at.mkdir(dir_b);
+
+    let path = at.root_dir_resolved();
+    let separator = std::path::MAIN_SEPARATOR_STR;
+
+    let result = scene
+        .ucmd()
+        .arg("--hyperlink")
+        .arg(dir_a)
+        .arg(dir_b)
+        .succeeds();
+
+    assert!(result.stdout_str().contains("\x1b]8;;file://"));
+    assert!(result
+        .stdout_str()
+        .lines()
+        .nth(0)
+        .unwrap()
+        .contains(&format!("{path}{separator}{dir_a}\x07{dir_a}\x1b]8;;\x07:")));
+    assert_eq!(result.stdout_str().lines().nth(1).unwrap(), "");
+    assert!(result
+        .stdout_str()
+        .lines()
+        .nth(2)
+        .unwrap()
+        .contains(&format!("{path}{separator}{dir_b}\x07{dir_b}\x1b]8;;\x07:")));
+}
+
 #[test]
 fn test_ls_color_do_not_reset() {
     let scene: TestScenario = TestScenario::new(util_name!());

From 652e02fb59ba948cf35ab3bc04fa942fb643c83a Mon Sep 17 00:00:00 2001
From: Yykz <yykz@proton.me>
Date: Mon, 18 Dec 2023 15:34:51 +0100
Subject: [PATCH 211/429] cargo fmt

---
 tests/by-util/test_wc.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/by-util/test_wc.rs b/tests/by-util/test_wc.rs
index df2551555b3..77716e43af2 100644
--- a/tests/by-util/test_wc.rs
+++ b/tests/by-util/test_wc.rs
@@ -737,4 +737,4 @@ fn test_args_override() {
         .args(&["--total=always", "--total=never", "alice_in_wonderland.txt"])
         .run()
         .stdout_is("  5  57 302 alice_in_wonderland.txt\n");
-}
\ No newline at end of file
+}

From 00b9cbe09e7dd0ef68156f541c9dd462c4f4a3bb Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 18 Dec 2023 22:11:04 +0100
Subject: [PATCH 212/429] expr: coerce to string before comparing values

---
 src/uu/expr/src/syntax_tree.rs | 4 +++-
 tests/by-util/test_expr.rs     | 8 ++++++++
 2 files changed, 11 insertions(+), 1 deletion(-)

diff --git a/src/uu/expr/src/syntax_tree.rs b/src/uu/expr/src/syntax_tree.rs
index 28e4ff0bd65..5aa9c93986b 100644
--- a/src/uu/expr/src/syntax_tree.rs
+++ b/src/uu/expr/src/syntax_tree.rs
@@ -70,6 +70,8 @@ impl RelationOp {
             }
         } else {
             // These comparisons should be using locale settings
+            let a = a.eval_as_string();
+            let b = b.eval_as_string();
             match self {
                 Self::Lt => a < b,
                 Self::Leq => a <= b,
@@ -195,7 +197,7 @@ const PRECEDENCE: &[&[(&str, BinOp)]] = &[
     &[(":", BinOp::String(StringOp::Match))],
 ];
 
-#[derive(Debug, PartialEq, Eq, Ord, PartialOrd)]
+#[derive(Debug)]
 pub enum NumOrStr {
     Num(BigInt),
     Str(String),
diff --git a/tests/by-util/test_expr.rs b/tests/by-util/test_expr.rs
index ebc2c832feb..7c9290d6a49 100644
--- a/tests/by-util/test_expr.rs
+++ b/tests/by-util/test_expr.rs
@@ -362,3 +362,11 @@ fn test_invalid_syntax() {
             .stderr_contains("syntax error");
     }
 }
+
+#[test]
+fn test_num_str_comparison() {
+    new_ucmd!()
+        .args(&["1a", "<", "1", "+", "1"])
+        .succeeds()
+        .stdout_is("1\n");
+}

From a5606613bde1b0391b78b27205a4353b9a06c53e Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 19 Dec 2023 09:32:32 +0100
Subject: [PATCH 213/429] ls: ignore invalid block size from env vars

---
 src/uu/ls/src/ls.rs      | 11 ++++++++---
 tests/by-util/test_ls.rs |  8 ++++++++
 2 files changed, 16 insertions(+), 3 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 8d1ecdbc630..8dbd9513688 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -840,9 +840,14 @@ impl Config {
             match parse_size_u64(&raw_block_size.to_string_lossy()) {
                 Ok(size) => Some(size),
                 Err(_) => {
-                    return Err(Box::new(LsError::BlockSizeParseError(
-                        opt_block_size.unwrap().clone(),
-                    )));
+                    // only fail if invalid block size was specified with --block-size,
+                    // ignore invalid block size from env vars
+                    if let Some(invalid_block_size) = opt_block_size {
+                        return Err(Box::new(LsError::BlockSizeParseError(
+                            invalid_block_size.clone(),
+                        )));
+                    }
+                    None
                 }
             }
         } else if env_var_posixly_correct.is_some() {
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index e503807d6fe..de62c659c0d 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -3874,6 +3874,14 @@ fn test_ls_invalid_block_size() {
         .stderr_is("ls: invalid --block-size argument 'invalid'\n");
 }
 
+// TODO ensure the correct block size is used when using -l because
+// the output of "ls -l" and "BLOCK_SIZE=invalid ls -l" is different
+#[test]
+fn test_ls_invalid_block_size_in_env_var() {
+    new_ucmd!().env("LS_BLOCK_SIZE", "invalid").succeeds();
+    new_ucmd!().env("BLOCK_SIZE", "invalid").succeeds();
+}
+
 #[cfg(all(unix, feature = "dd"))]
 #[test]
 fn test_ls_block_size_override() {

From ebfbd8b1fe19ec293cc102f07773d17ba29af747 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 19 Dec 2023 10:22:44 +0100
Subject: [PATCH 214/429] ls: rename display_file_name -> display_item_name

---
 src/uu/ls/src/ls.rs | 24 ++++++++++++------------
 1 file changed, 12 insertions(+), 12 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 8d1ecdbc630..53397a4b730 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -2413,7 +2413,7 @@ fn display_items(
 
         for i in items {
             let more_info = display_additional_leading_info(i, &padding, config, out)?;
-            let cell = display_file_name(i, config, prefix_context, more_info, out, style_manager);
+            let cell = display_item_name(i, config, prefix_context, more_info, out, style_manager);
             names_vec.push(cell);
         }
 
@@ -2544,11 +2544,11 @@ fn display_grid(
 /// * `author` ([`display_uname`], config-optional)
 /// * `size / rdev` ([`display_len_or_rdev`])
 /// * `system_time` ([`get_system_time`])
-/// * `file_name` ([`display_file_name`])
+/// * `item_name` ([`display_item_name`])
 ///
 /// This function needs to display information in columns:
 /// * permissions and system_time are already guaranteed to be pre-formatted in fixed length.
-/// * file_name is the last column and is left-aligned.
+/// * item_name is the last column and is left-aligned.
 /// * Everything else needs to be padded using [`pad_left`].
 ///
 /// That's why we have the parameters:
@@ -2661,17 +2661,17 @@ fn display_item_long(
 
         write!(output_display, " {} ", display_date(md, config)).unwrap();
 
-        let displayed_file =
-            display_file_name(item, config, None, String::new(), out, style_manager).contents;
+        let displayed_item =
+            display_item_name(item, config, None, String::new(), out, style_manager).contents;
         if config.dired {
             let (start, end) = dired::calculate_dired(
                 &dired.dired_positions,
                 output_display.len(),
-                displayed_file.len(),
+                displayed_item.len(),
             );
             dired::update_positions(dired, start, end);
         }
-        write!(output_display, "{}{}", displayed_file, config.line_ending).unwrap();
+        write!(output_display, "{}{}", displayed_item, config.line_ending).unwrap();
     } else {
         #[cfg(unix)]
         let leading_char = {
@@ -2744,8 +2744,8 @@ fn display_item_long(
             write!(output_display, " {}", pad_right("?", padding.uname)).unwrap();
         }
 
-        let displayed_file =
-            display_file_name(item, config, None, String::new(), out, style_manager).contents;
+        let displayed_item =
+            display_item_name(item, config, None, String::new(), out, style_manager).contents;
         let date_len = 12;
 
         write!(
@@ -2760,10 +2760,10 @@ fn display_item_long(
             dired::calculate_and_update_positions(
                 dired,
                 output_display.len(),
-                displayed_file.trim().len(),
+                displayed_item.trim().len(),
             );
         }
-        write!(output_display, "{}{}", displayed_file, config.line_ending).unwrap();
+        write!(output_display, "{}{}", displayed_item, config.line_ending).unwrap();
     }
     write!(out, "{}", output_display)?;
 
@@ -3037,7 +3037,7 @@ fn classify_file(path: &PathData, out: &mut BufWriter<Stdout>) -> Option<char> {
 /// Note that non-unicode sequences in symlink targets are dealt with using
 /// [`std::path::Path::to_string_lossy`].
 #[allow(clippy::cognitive_complexity)]
-fn display_file_name(
+fn display_item_name(
     path: &PathData,
     config: &Config,
     prefix_context: Option<usize>,

From d8f299eb48e4c2e39d5e996ed55be223e94aaac0 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 19 Dec 2023 10:26:23 +0100
Subject: [PATCH 215/429] ls: mention config.hyperlink in comment

---
 src/uu/ls/src/ls.rs | 1 +
 1 file changed, 1 insertion(+)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 53397a4b730..7f67a8cf7b1 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3033,6 +3033,7 @@ fn classify_file(path: &PathData, out: &mut BufWriter<Stdout>) -> Option<char> {
 /// * `config.format` to display symlink targets if `Format::Long`. This function is also
 ///   responsible for coloring symlink target names if `config.color` is specified.
 /// * `config.context` to prepend security context to `name` if compiled with `feat_selinux`.
+/// * `config.hyperlink` decides whether to hyperlink the item
 ///
 /// Note that non-unicode sequences in symlink targets are dealt with using
 /// [`std::path::Path::to_string_lossy`].

From b9d4f97e6df35dab4792cec1d2ffdddb57623cb1 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Tue, 19 Dec 2023 11:43:35 +0100
Subject: [PATCH 216/429] uucore: remove useless conversion for features/fs on
 OpenBSD

  - src/uucore/src/lib/features/fs.rs: in inode function, remove useless
    conversion for target_OS = OpenBSD

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 src/uucore/src/lib/features/fs.rs | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/src/uucore/src/lib/features/fs.rs b/src/uucore/src/lib/features/fs.rs
index 94ca82c8098..41437c55468 100644
--- a/src/uucore/src/lib/features/fs.rs
+++ b/src/uucore/src/lib/features/fs.rs
@@ -148,14 +148,13 @@ impl FileInformation {
     #[cfg(unix)]
     pub fn inode(&self) -> u64 {
         #[cfg(all(
-            not(any(target_os = "freebsd", target_os = "netbsd", target_os = "openbsd")),
+            not(any(target_os = "freebsd", target_os = "netbsd")),
             target_pointer_width = "64"
         ))]
         return self.0.st_ino;
         #[cfg(any(
             target_os = "freebsd",
             target_os = "netbsd",
-            target_os = "openbsd",
             not(target_pointer_width = "64")
         ))]
         return self.0.st_ino.into();

From 6bcf4e2cece5815eb7352e74f64af14b13ad5a4f Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Tue, 19 Dec 2023 13:26:39 +0100
Subject: [PATCH 217/429] tr: add 'boop' to the ignore spell check

---
 src/uu/tr/src/operation.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/tr/src/operation.rs b/src/uu/tr/src/operation.rs
index cd6a83de6c9..5565de6a16d 100644
--- a/src/uu/tr/src/operation.rs
+++ b/src/uu/tr/src/operation.rs
@@ -3,7 +3,7 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-// spell-checker:ignore (strings) anychar combinator Alnum Punct Xdigit alnum punct xdigit cntrl
+// spell-checker:ignore (strings) anychar combinator Alnum Punct Xdigit alnum punct xdigit cntrl boop
 
 use nom::{
     branch::alt,

From d8709d28391182d5116d27aff62be8733fbd4f31 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 19 Dec 2023 15:00:06 +0100
Subject: [PATCH 218/429] ls: recognize BLOCKSIZE env var

---
 src/uu/ls/src/ls.rs      | 11 +++++++----
 tests/by-util/test_ls.rs | 35 +++++++++++++++++++++++++++++++----
 2 files changed, 38 insertions(+), 8 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 81c90f14a94..6db8395cec7 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -810,10 +810,6 @@ impl Config {
             || options.get_flag(options::size::HUMAN_READABLE);
         let opt_kb = options.get_flag(options::size::KIBIBYTES);
 
-        let env_var_block_size = std::env::var_os("BLOCK_SIZE");
-        let env_var_ls_block_size = std::env::var_os("LS_BLOCK_SIZE");
-        let env_var_posixly_correct = std::env::var_os("POSIXLY_CORRECT");
-
         let size_format = if opt_si {
             SizeFormat::Decimal
         } else if opt_hr {
@@ -822,6 +818,11 @@ impl Config {
             SizeFormat::Bytes
         };
 
+        let env_var_blocksize = std::env::var_os("BLOCKSIZE");
+        let env_var_block_size = std::env::var_os("BLOCK_SIZE");
+        let env_var_ls_block_size = std::env::var_os("LS_BLOCK_SIZE");
+        let env_var_posixly_correct = std::env::var_os("POSIXLY_CORRECT");
+
         let raw_block_size = if let Some(opt_block_size) = opt_block_size {
             OsString::from(opt_block_size)
         } else if !opt_kb {
@@ -829,6 +830,8 @@ impl Config {
                 env_var_ls_block_size
             } else if let Some(env_var_block_size) = env_var_block_size {
                 env_var_block_size
+            } else if let Some(env_var_blocksize) = env_var_blocksize {
+                env_var_blocksize
             } else {
                 OsString::from("")
             }
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index de62c659c0d..8aeb762c79b 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -3839,7 +3839,7 @@ fn test_ls_cf_output_should_be_delimited_by_tab() {
 
 #[cfg(all(unix, feature = "dd"))]
 #[test]
-fn test_posixly_correct() {
+fn test_posixly_correct_and_block_size_env_vars() {
     let scene = TestScenario::new(util_name!());
 
     scene
@@ -3852,16 +3852,42 @@ fn test_posixly_correct() {
 
     scene
         .ucmd()
-        .arg("-s")
+        .arg("-l")
         .succeeds()
-        .stdout_contains_line("total 4");
+        .stdout_contains_line("total 4")
+        .stdout_contains(" 1024 ");
 
     scene
         .ucmd()
-        .arg("-s")
+        .arg("-l")
         .env("POSIXLY_CORRECT", "some_value")
         .succeeds()
         .stdout_contains_line("total 8");
+    //.stdout_contains(" 1024 "); // TODO needs second internal blocksize
+
+    scene
+        .ucmd()
+        .arg("-l")
+        .env("LS_BLOCK_SIZE", "512")
+        .succeeds()
+        .stdout_contains_line("total 8")
+        .stdout_contains(" 2 ");
+
+    scene
+        .ucmd()
+        .arg("-l")
+        .env("BLOCK_SIZE", "512")
+        .succeeds()
+        .stdout_contains_line("total 8")
+        .stdout_contains(" 2 ");
+
+    scene
+        .ucmd()
+        .arg("-l")
+        .env("BLOCKSIZE", "512")
+        .succeeds()
+        .stdout_contains_line("total 8");
+    //.stdout_contains(" 1024 "); // TODO needs second internal blocksize
 }
 
 #[test]
@@ -3880,6 +3906,7 @@ fn test_ls_invalid_block_size() {
 fn test_ls_invalid_block_size_in_env_var() {
     new_ucmd!().env("LS_BLOCK_SIZE", "invalid").succeeds();
     new_ucmd!().env("BLOCK_SIZE", "invalid").succeeds();
+    new_ucmd!().env("BLOCKSIZE", "invalid").succeeds();
 }
 
 #[cfg(all(unix, feature = "dd"))]

From ce2a5d5b9aa5a72bf9abc97e013630c5466d1cef Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 20 Dec 2023 15:15:20 +0100
Subject: [PATCH 219/429] expr fuzz: add missing ops. found thanks to oss fuzz
 coverage (#5557)

* expr fuzz: add missing ops. found thanks to oss fuzz coverage
https://storage.googleapis.com/oss-fuzz-coverage/rust-coreutils/reports/20231118/linux/src/rust-coreutils/src/uu/expr/src/syntax_tree.rs.html

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 fuzz/fuzz_targets/fuzz_expr.rs | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/fuzz/fuzz_targets/fuzz_expr.rs b/fuzz/fuzz_targets/fuzz_expr.rs
index ce5535b16e1..9f2d28603ab 100644
--- a/fuzz/fuzz_targets/fuzz_expr.rs
+++ b/fuzz/fuzz_targets/fuzz_expr.rs
@@ -21,7 +21,9 @@ static CMD_PATH: &str = "expr";
 
 fn generate_expr(max_depth: u32) -> String {
     let mut rng = rand::thread_rng();
-    let ops = ["+", "-", "*", "/", "%", "<", ">", "=", "&", "|"];
+    let ops = [
+        "+", "-", "*", "/", "%", "<", ">", "=", "&", "|", "!=", "<=", ">=", ":", "index", "length", "substr",
+    ];
 
     let mut expr = String::new();
     let mut depth = 0;

From d4a9d63ea2b589f28c476e16a20f06c2597ddde6 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Tue, 19 Dec 2023 19:46:13 +0100
Subject: [PATCH 220/429] uucore/fsext: refactor MountInfo construction

---
 src/uucore/src/lib/features/fsext.rs | 212 ++++++++++++++-------------
 1 file changed, 108 insertions(+), 104 deletions(-)

diff --git a/src/uucore/src/lib/features/fsext.rs b/src/uucore/src/lib/features/fsext.rs
index 9ee5e2464e5..1dd536d47cc 100644
--- a/src/uucore/src/lib/features/fsext.rs
+++ b/src/uucore/src/lib/features/fsext.rs
@@ -10,8 +10,6 @@
 use time::macros::format_description;
 use time::UtcOffset;
 
-pub use crate::*; // import macros from `../../macros.rs`
-
 #[cfg(any(target_os = "linux", target_os = "android"))]
 const LINUX_MTAB: &str = "/etc/mtab";
 #[cfg(any(target_os = "linux", target_os = "android"))]
@@ -61,7 +59,7 @@ use libc::{
     mode_t, strerror, S_IFBLK, S_IFCHR, S_IFDIR, S_IFIFO, S_IFLNK, S_IFMT, S_IFREG, S_IFSOCK,
 };
 use std::borrow::Cow;
-use std::convert::{AsRef, From};
+use std::convert::From;
 #[cfg(any(
     target_vendor = "apple",
     target_os = "freebsd",
@@ -145,63 +143,27 @@ impl BirthTime for Metadata {
 
 #[derive(Debug, Clone)]
 pub struct MountInfo {
-    // it stores `volume_name` in windows platform and `dev_id` in unix platform
+    /// Stores `volume_name` in windows platform and `dev_id` in unix platform
     pub dev_id: String,
     pub dev_name: String,
     pub fs_type: String,
-    pub mount_dir: String,
-    pub mount_option: String, // we only care "bind" option
     pub mount_root: String,
+    pub mount_dir: String,
+    /// We only care whether this field contains "bind"
+    pub mount_option: String,
     pub remote: bool,
     pub dummy: bool,
 }
 
 impl MountInfo {
-    fn set_missing_fields(&mut self) {
-        #[cfg(unix)]
-        {
-            use std::os::unix::fs::MetadataExt;
-            // We want to keep the dev_id on Windows
-            // but set dev_id
-            if let Ok(stat) = std::fs::metadata(&self.mount_dir) {
-                // Why do we cast this to i32?
-                self.dev_id = (stat.dev() as i32).to_string();
-            } else {
-                self.dev_id = String::new();
-            }
-        }
-        // set MountInfo::dummy
-        // spell-checker:disable
-        match self.fs_type.as_ref() {
-            "autofs" | "proc" | "subfs"
-            /* for Linux 2.6/3.x */
-            | "debugfs" | "devpts" | "fusectl" | "mqueue" | "rpc_pipefs" | "sysfs"
-            /* FreeBSD, Linux 2.4 */
-            | "devfs"
-            /* for NetBSD 3.0 */
-            | "kernfs"
-            /* for Irix 6.5 */
-            | "ignore" => self.dummy = true,
-            _ => self.dummy = self.fs_type == "none"
-                && !self.mount_option.contains(MOUNT_OPT_BIND)
-        }
-        // spell-checker:enable
-        // set MountInfo::remote
-        #[cfg(windows)]
-        {
-            self.remote = DRIVE_REMOTE == unsafe { GetDriveTypeW(String2LPWSTR!(self.mount_root)) };
-        }
-        #[cfg(unix)]
-        {
-            self.remote = self.dev_name.find(':').is_some()
-                || (self.dev_name.starts_with("//") && self.fs_type == "smbfs"
-                    || self.fs_type == "cifs")
-                || self.dev_name == "-hosts";
-        }
-    }
-
     #[cfg(any(target_os = "linux", target_os = "android"))]
     fn new(file_name: &str, raw: &[&str]) -> Option<Self> {
+        let dev_name;
+        let fs_type;
+        let mount_root;
+        let mount_dir;
+        let mount_option;
+
         match file_name {
             // spell-checker:ignore (word) noatime
             // Format: 36 35 98:0 /mnt1 /mnt2 rw,noatime master:1 - ext3 /dev/root rw,errors=continue
@@ -211,36 +173,38 @@ impl MountInfo {
                 let after_fields = raw[FIELDS_OFFSET..].iter().position(|c| *c == "-").unwrap()
                     + FIELDS_OFFSET
                     + 1;
-                let mut m = Self {
-                    dev_id: String::new(),
-                    dev_name: raw[after_fields + 1].to_string(),
-                    fs_type: raw[after_fields].to_string(),
-                    mount_root: raw[3].to_string(),
-                    mount_dir: raw[4].to_string(),
-                    mount_option: raw[5].to_string(),
-                    remote: false,
-                    dummy: false,
-                };
-                m.set_missing_fields();
-                Some(m)
+                dev_name = raw[after_fields + 1].to_string();
+                fs_type = raw[after_fields].to_string();
+                mount_root = raw[3].to_string();
+                mount_dir = raw[4].to_string();
+                mount_option = raw[5].to_string();
             }
             LINUX_MTAB => {
-                let mut m = Self {
-                    dev_id: String::new(),
-                    dev_name: raw[0].to_string(),
-                    fs_type: raw[2].to_string(),
-                    mount_root: String::new(),
-                    mount_dir: raw[1].to_string(),
-                    mount_option: raw[3].to_string(),
-                    remote: false,
-                    dummy: false,
-                };
-                m.set_missing_fields();
-                Some(m)
+                dev_name = raw[0].to_string();
+                fs_type = raw[2].to_string();
+                mount_root = String::new();
+                mount_dir = raw[1].to_string();
+                mount_option = raw[3].to_string();
             }
-            _ => None,
-        }
+            _ => return None,
+        };
+
+        let dev_id = mount_dev_id(&mount_dir);
+        let dummy = is_dummy_filesystem(&fs_type, &mount_option);
+        let remote = is_remote_filesystem(&dev_name, &fs_type);
+
+        Some(Self {
+            dev_id,
+            dev_name,
+            fs_type,
+            mount_dir,
+            mount_option,
+            mount_root,
+            remote,
+            dummy,
+        })
     }
+
     #[cfg(windows)]
     fn new(mut volume_name: String) -> Option<Self> {
         let mut dev_name_buf = [0u16; MAX_PATH];
@@ -293,18 +257,17 @@ impl MountInfo {
         } else {
             Some(LPWSTR2String(&fs_type_buf))
         };
-        let mut mn_info = Self {
+        let remote = DRIVE_REMOTE == unsafe { GetDriveTypeW(String2LPWSTR!(self.mount_root)) };
+        Some(Self {
             dev_id: volume_name,
             dev_name,
             fs_type: fs_type.unwrap_or_default(),
             mount_root,
             mount_dir: String::new(),
             mount_option: String::new(),
-            remote: false,
+            remote,
             dummy: false,
-        };
-        mn_info.set_missing_fields();
-        Some(mn_info)
+        })
     }
 }
 
@@ -316,33 +279,74 @@ impl MountInfo {
 ))]
 impl From<StatFs> for MountInfo {
     fn from(statfs: StatFs) -> Self {
-        let mut info = Self {
+        let dev_name = unsafe {
+            // spell-checker:disable-next-line
+            CStr::from_ptr(&statfs.f_mntfromname[0])
+                .to_string_lossy()
+                .into_owned()
+        };
+        let fs_type = unsafe {
+            // spell-checker:disable-next-line
+            CStr::from_ptr(&statfs.f_fstypename[0])
+                .to_string_lossy()
+                .into_owned()
+        };
+        let mount_dir = unsafe {
+            // spell-checker:disable-next-line
+            CStr::from_ptr(&statfs.f_mntonname[0])
+                .to_string_lossy()
+                .into_owned()
+        };
+
+        let dummy = is_dummy_filesystem(&fs_type, &mount_option);
+        let remote = is_remote_filesystem(&dev_name, &fs_type);
+
+        Self {
             dev_id: String::new(),
-            dev_name: unsafe {
-                // spell-checker:disable-next-line
-                CStr::from_ptr(&statfs.f_mntfromname[0])
-                    .to_string_lossy()
-                    .into_owned()
-            },
-            fs_type: unsafe {
-                // spell-checker:disable-next-line
-                CStr::from_ptr(&statfs.f_fstypename[0])
-                    .to_string_lossy()
-                    .into_owned()
-            },
-            mount_dir: unsafe {
-                // spell-checker:disable-next-line
-                CStr::from_ptr(&statfs.f_mntonname[0])
-                    .to_string_lossy()
-                    .into_owned()
-            },
+            dev_name,
+            fs_type,
+            mount_dir,
             mount_root: String::new(),
             mount_option: String::new(),
-            remote: false,
-            dummy: false,
-        };
-        info.set_missing_fields();
-        info
+            remote,
+            dummy,
+        }
+    }
+}
+
+#[cfg(unix)]
+fn is_dummy_filesystem(fs_type: &str, mount_option: &str) -> bool {
+    match fs_type {
+        "autofs" | "proc" | "subfs"
+        // for Linux 2.6/3.x
+        | "debugfs" | "devpts" | "fusectl" | "mqueue" | "rpc_pipefs" | "sysfs"
+        // FreeBSD, Linux 2.4
+        | "devfs"
+        // for NetBSD 3.0
+        | "kernfs"
+        // for Irix 6.5
+        | "ignore" => true,
+        _ => fs_type == "none"
+            && !mount_option.contains(MOUNT_OPT_BIND)
+    }
+}
+
+#[cfg(unix)]
+fn is_remote_filesystem(dev_name: &str, fs_type: &str) -> bool {
+    dev_name.find(':').is_some()
+        || (dev_name.starts_with("//") && fs_type == "smbfs" || fs_type == "cifs")
+        || dev_name == "-hosts"
+}
+
+#[cfg(unix)]
+fn mount_dev_id(mount_dir: &str) -> String {
+    use std::os::unix::fs::MetadataExt;
+
+    if let Ok(stat) = std::fs::metadata(&mount_dir) {
+        // Why do we cast this to i32?
+        (stat.dev() as i32).to_string()
+    } else {
+        String::new()
     }
 }
 

From cc15876bb792e0b33313a4e56960555a6df37db6 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Tue, 19 Dec 2023 22:16:03 +0100
Subject: [PATCH 221/429] uucore/fsext: merge some windows imports

---
 src/uucore/src/lib/features/fsext.rs | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/src/uucore/src/lib/features/fsext.rs b/src/uucore/src/lib/features/fsext.rs
index 1dd536d47cc..394d70b6ae9 100644
--- a/src/uucore/src/lib/features/fsext.rs
+++ b/src/uucore/src/lib/features/fsext.rs
@@ -25,11 +25,13 @@ use std::ffi::OsStr;
 #[cfg(windows)]
 use std::os::windows::ffi::OsStrExt;
 #[cfg(windows)]
-use windows_sys::Win32::Foundation::{ERROR_NO_MORE_FILES, INVALID_HANDLE_VALUE};
-#[cfg(windows)]
-use windows_sys::Win32::Storage::FileSystem::{
+use windows_sys::Win32::{
+    Foundation::{ERROR_NO_MORE_FILES, INVALID_HANDLE_VALUE},
+    Storage::FileSystem::{
     FindFirstVolumeW, FindNextVolumeW, FindVolumeClose, GetDiskFreeSpaceW, GetDriveTypeW,
     GetVolumeInformationW, GetVolumePathNamesForVolumeNameW, QueryDosDeviceW,
+    },
+    System::WindowsProgramming::DRIVE_REMOTE,
 };
 #[cfg(windows)]
 use windows_sys::Win32::System::WindowsProgramming::DRIVE_REMOTE;

From f90713278fb36ed9612a3b651a7e3c2e88274748 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Tue, 19 Dec 2023 22:27:48 +0100
Subject: [PATCH 222/429] uucore/fsext: do not use dangerous macro for nul
 terminated UTF16 strings

---
 src/uucore/src/lib/features/fsext.rs | 86 +++++++++++++++-------------
 1 file changed, 46 insertions(+), 40 deletions(-)

diff --git a/src/uucore/src/lib/features/fsext.rs b/src/uucore/src/lib/features/fsext.rs
index 394d70b6ae9..d02d74babbc 100644
--- a/src/uucore/src/lib/features/fsext.rs
+++ b/src/uucore/src/lib/features/fsext.rs
@@ -14,12 +14,24 @@ use time::UtcOffset;
 const LINUX_MTAB: &str = "/etc/mtab";
 #[cfg(any(target_os = "linux", target_os = "android"))]
 const LINUX_MOUNTINFO: &str = "/proc/self/mountinfo";
+#[cfg(unix)]
 static MOUNT_OPT_BIND: &str = "bind";
 #[cfg(windows)]
 const MAX_PATH: usize = 266;
-#[cfg(not(unix))]
+#[cfg(windows)]
 static EXIT_ERR: i32 = 1;
 
+#[cfg(any(
+    windows,
+    target_os = "freebsd",
+    target_vendor = "apple",
+    target_os = "netbsd",
+    target_os = "openbsd"
+))]
+use crate::crash;
+#[cfg(windows)]
+use crate::show_warning;
+
 #[cfg(windows)]
 use std::ffi::OsStr;
 #[cfg(windows)]
@@ -28,26 +40,11 @@ use std::os::windows::ffi::OsStrExt;
 use windows_sys::Win32::{
     Foundation::{ERROR_NO_MORE_FILES, INVALID_HANDLE_VALUE},
     Storage::FileSystem::{
-    FindFirstVolumeW, FindNextVolumeW, FindVolumeClose, GetDiskFreeSpaceW, GetDriveTypeW,
-    GetVolumeInformationW, GetVolumePathNamesForVolumeNameW, QueryDosDeviceW,
+        FindFirstVolumeW, FindNextVolumeW, FindVolumeClose, GetDiskFreeSpaceW, GetDriveTypeW,
+        GetVolumeInformationW, GetVolumePathNamesForVolumeNameW, QueryDosDeviceW,
     },
     System::WindowsProgramming::DRIVE_REMOTE,
 };
-#[cfg(windows)]
-use windows_sys::Win32::System::WindowsProgramming::DRIVE_REMOTE;
-
-// Warning: the pointer has to be used *immediately* or the Vec
-// it points to will be dropped!
-#[cfg(windows)]
-macro_rules! String2LPWSTR {
-    ($str: expr) => {
-        OsStr::new(&$str)
-            .encode_wide()
-            .chain(Some(0))
-            .collect::<Vec<u16>>()
-            .as_ptr()
-    };
-}
 
 #[cfg(windows)]
 #[allow(non_snake_case)]
@@ -56,30 +53,28 @@ fn LPWSTR2String(buf: &[u16]) -> String {
     String::from_utf16(&buf[..len]).unwrap()
 }
 
+#[cfg(windows)]
+fn to_nul_terminated_wide_string(s: impl AsRef<OsStr>) -> Vec<u16> {
+    s.as_ref()
+        .encode_wide()
+        .chain(Some(0))
+        .collect::<Vec<u16>>()
+}
+
 #[cfg(unix)]
 use libc::{
     mode_t, strerror, S_IFBLK, S_IFCHR, S_IFDIR, S_IFIFO, S_IFLNK, S_IFMT, S_IFREG, S_IFSOCK,
 };
 use std::borrow::Cow;
 use std::convert::From;
-#[cfg(any(
-    target_vendor = "apple",
-    target_os = "freebsd",
-    target_os = "netbsd",
-    target_os = "openbsd",
-    target_os = "linux",
-    target_os = "android",
-    target_os = "illumos",
-    target_os = "solaris",
-    target_os = "redox",
-))]
+#[cfg(unix)]
 use std::ffi::CStr;
-#[cfg(not(windows))]
+#[cfg(unix)]
 use std::ffi::CString;
 use std::io::Error as IOError;
 #[cfg(unix)]
 use std::mem;
-#[cfg(not(unix))]
+#[cfg(windows)]
 use std::path::Path;
 use std::time::UNIX_EPOCH;
 
@@ -228,8 +223,9 @@ impl MountInfo {
 
         let mut mount_root_buf = [0u16; MAX_PATH];
         let success = unsafe {
+            let volume_name = to_nul_terminated_wide_string(&volume_name);
             GetVolumePathNamesForVolumeNameW(
-                String2LPWSTR!(volume_name),
+                volume_name.as_ptr(),
                 mount_root_buf.as_mut_ptr(),
                 mount_root_buf.len() as u32,
                 ptr::null_mut(),
@@ -243,8 +239,9 @@ impl MountInfo {
 
         let mut fs_type_buf = [0u16; MAX_PATH];
         let success = unsafe {
+            let mount_root = to_nul_terminated_wide_string(&mount_root);
             GetVolumeInformationW(
-                String2LPWSTR!(mount_root),
+                mount_root.as_ptr(),
                 ptr::null_mut(),
                 0,
                 ptr::null_mut(),
@@ -259,7 +256,11 @@ impl MountInfo {
         } else {
             Some(LPWSTR2String(&fs_type_buf))
         };
-        let remote = DRIVE_REMOTE == unsafe { GetDriveTypeW(String2LPWSTR!(self.mount_root)) };
+        let remote = DRIVE_REMOTE
+            == unsafe {
+                let mount_root = to_nul_terminated_wide_string(&mount_root);
+                GetDriveTypeW(mount_root.as_ptr())
+            };
         Some(Self {
             dev_id: volume_name,
             dev_name,
@@ -300,11 +301,12 @@ impl From<StatFs> for MountInfo {
                 .into_owned()
         };
 
-        let dummy = is_dummy_filesystem(&fs_type, &mount_option);
+        let dev_id = mount_dev_id(&mount_dir);
+        let dummy = is_dummy_filesystem(&fs_type, "");
         let remote = is_remote_filesystem(&dev_name, &fs_type);
 
         Self {
-            dev_id: String::new(),
+            dev_id,
             dev_name,
             fs_type,
             mount_dir,
@@ -318,6 +320,7 @@ impl From<StatFs> for MountInfo {
 
 #[cfg(unix)]
 fn is_dummy_filesystem(fs_type: &str, mount_option: &str) -> bool {
+    // spell-checker:disable
     match fs_type {
         "autofs" | "proc" | "subfs"
         // for Linux 2.6/3.x
@@ -331,6 +334,7 @@ fn is_dummy_filesystem(fs_type: &str, mount_option: &str) -> bool {
         _ => fs_type == "none"
             && !mount_option.contains(MOUNT_OPT_BIND)
     }
+    // spell-checker:enable
 }
 
 #[cfg(unix)]
@@ -344,7 +348,7 @@ fn is_remote_filesystem(dev_name: &str, fs_type: &str) -> bool {
 fn mount_dev_id(mount_dir: &str) -> String {
     use std::os::unix::fs::MetadataExt;
 
-    if let Ok(stat) = std::fs::metadata(&mount_dir) {
+    if let Ok(stat) = std::fs::metadata(mount_dir) {
         // Why do we cast this to i32?
         (stat.dev() as i32).to_string()
     } else {
@@ -558,13 +562,14 @@ impl FsUsage {
             };
         }
     }
-    #[cfg(not(unix))]
+    #[cfg(windows)]
     pub fn new(path: &Path) -> Self {
         let mut root_path = [0u16; MAX_PATH];
         let success = unsafe {
+            let path = to_nul_terminated_wide_string(path);
             GetVolumePathNamesForVolumeNameW(
                 //path_utf8.as_ptr(),
-                String2LPWSTR!(path.as_os_str()),
+                path.as_ptr(),
                 root_path.as_mut_ptr(),
                 root_path.len() as u32,
                 ptr::null_mut(),
@@ -584,8 +589,9 @@ impl FsUsage {
         let mut total_number_of_clusters = 0;
 
         let success = unsafe {
+            let path = to_nul_terminated_wide_string(path);
             GetDiskFreeSpaceW(
-                String2LPWSTR!(path.as_os_str()),
+                path.as_ptr(),
                 &mut sectors_per_cluster,
                 &mut bytes_per_sector,
                 &mut number_of_free_clusters,

From b7bbec6d0f4710af7bd9bd6e17d1524b818c16d5 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Wed, 20 Dec 2023 17:09:27 +0000
Subject: [PATCH 223/429] chore(deps): update rust crate self_cell to 1.0.3

---
 Cargo.lock | 4 ++--
 Cargo.toml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 446b1724768..44d458ae319 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1870,9 +1870,9 @@ checksum = "d29ab0c6d3fc0ee92fe66e2d99f700eab17a8d57d1c1d3b748380fb20baa78cd"
 
 [[package]]
 name = "self_cell"
-version = "1.0.2"
+version = "1.0.3"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "e388332cd64eb80cd595a00941baf513caffae8dce9cfd0467fc9c66397dade6"
+checksum = "58bf37232d3bb9a2c4e641ca2a11d83b5062066f88df7fed36c28772046d65ba"
 
 [[package]]
 name = "selinux"
diff --git a/Cargo.toml b/Cargo.toml
index 332131bbe50..accfc2a0653 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -315,7 +315,7 @@ regex = "1.10.2"
 rstest = "0.18.2"
 rust-ini = "0.19.0"
 same-file = "1.0.6"
-self_cell = "1.0.2"
+self_cell = "1.0.3"
 selinux = "0.4"
 signal-hook = "0.3.17"
 smallvec = { version = "1.11", features = ["union"] }

From a6ba81db20d3807f390a5d4a988b4d17bbbcc5e5 Mon Sep 17 00:00:00 2001
From: Justin ! <just1602@riseup.net>
Date: Tue, 19 Dec 2023 21:33:06 -0500
Subject: [PATCH 224/429] sort: allow `-f` to be pass multiple time

Fix #5667
---
 src/uu/sort/src/sort.rs    | 1 +
 tests/by-util/test_sort.rs | 8 ++++++++
 2 files changed, 9 insertions(+)

diff --git a/src/uu/sort/src/sort.rs b/src/uu/sort/src/sort.rs
index bc331915b14..5fcfe2c82da 100644
--- a/src/uu/sort/src/sort.rs
+++ b/src/uu/sort/src/sort.rs
@@ -1280,6 +1280,7 @@ pub fn uu_app() -> Command {
         .infer_long_args(true)
         .disable_help_flag(true)
         .disable_version_flag(true)
+        .args_override_self(true)
         .arg(
             Arg::new(options::HELP)
                 .long(options::HELP)
diff --git a/tests/by-util/test_sort.rs b/tests/by-util/test_sort.rs
index 690623c1c96..d22bffae4d8 100644
--- a/tests/by-util/test_sort.rs
+++ b/tests/by-util/test_sort.rs
@@ -1181,3 +1181,11 @@ fn test_tmp_files_deleted_on_sigint() {
 fn test_same_sort_mode_twice() {
     new_ucmd!().args(&["-k", "2n,2n", "empty.txt"]).succeeds();
 }
+
+#[test]
+fn test_args_override() {
+    new_ucmd!()
+        .args(&["-f", "-f"])
+        .pipe_in("foo")
+        .succeeds();
+}

From 3e6187269e24a5222f456494bc70582d96d2ee0d Mon Sep 17 00:00:00 2001
From: allaboutevemirolive <xkmxlfirdxus@gmail.com>
Date: Wed, 20 Dec 2023 23:30:46 +0200
Subject: [PATCH 225/429] fix duplicate flags

---
 src/uu/expand/src/expand.rs                   |  1 +
 tests/by-util/test_expand.rs                  | 14 ++++++++++++++
 tests/fixtures/expand/alice_in_wonderland.txt |  5 +++++
 3 files changed, 20 insertions(+)
 create mode 100644 tests/fixtures/expand/alice_in_wonderland.txt

diff --git a/src/uu/expand/src/expand.rs b/src/uu/expand/src/expand.rs
index 99b9d6b815d..eb9766eb4f6 100644
--- a/src/uu/expand/src/expand.rs
+++ b/src/uu/expand/src/expand.rs
@@ -275,6 +275,7 @@ pub fn uu_app() -> Command {
         .after_help(LONG_HELP)
         .override_usage(format_usage(USAGE))
         .infer_long_args(true)
+        .args_override_self(true)
         .arg(
             Arg::new(options::INITIAL)
                 .long(options::INITIAL)
diff --git a/tests/by-util/test_expand.rs b/tests/by-util/test_expand.rs
index f6802358cc3..a1173c49617 100644
--- a/tests/by-util/test_expand.rs
+++ b/tests/by-util/test_expand.rs
@@ -392,3 +392,17 @@ fn test_comma_with_plus_4() {
         //          01234567890
         .stdout_is("a  b    c");
 }
+
+#[test]
+fn test_args_override() {
+    new_ucmd!()
+        .args(&["-i", "-i", "alice_in_wonderland.txt"])
+        .run()
+        .stdout_is(
+            "Alice was beginning to get very tired of sitting by\n\
+        her sister on the bank, and of having nothing to do: once or twice\n\
+        she had peeped into the book her sister was reading, but it had no\n\
+        pictures or conversations in it, \"and what is the use of a book,\"\n\
+        thought Alice \"without pictures or conversation?\"\n",
+        );
+}
diff --git a/tests/fixtures/expand/alice_in_wonderland.txt b/tests/fixtures/expand/alice_in_wonderland.txt
new file mode 100644
index 00000000000..a95562a1ce6
--- /dev/null
+++ b/tests/fixtures/expand/alice_in_wonderland.txt
@@ -0,0 +1,5 @@
+Alice was beginning to get very tired of sitting by
+her sister on the bank, and of having nothing to do: once or twice
+she had peeped into the book her sister was reading, but it had no
+pictures or conversations in it, "and what is the use of a book,"
+thought Alice "without pictures or conversation?"

From 07374a95888a2d58aae4e88217a7a1df32721631 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 20 Dec 2023 23:09:15 +0100
Subject: [PATCH 226/429] mv: dir2dir: adjust GNU tests - our error message is
 better

---
 util/build-gnu.sh | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 4a14f3f6c4d..4b682f4ada0 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -272,6 +272,9 @@ sed -i -Ez "s/\n([^\n#]*pad-3\.2[^\n]*)\n([^\n]*)\n([^\n]*)/\n# uutils\/numfmt s
 sed -i -e "s/\$prog: multiple field specifications/error: The argument '--field <FIELDS>' was provided more than once, but cannot be used multiple times\n\nUsage: numfmt [OPTION]... [NUMBER]...\n\n\nFor more information try '--help'/g" tests/misc/numfmt.pl
 sed -i -e "s/Try 'mv --help' for more information/For more information, try '--help'/g" -e "s/mv: missing file operand/error: the following required arguments were not provided:\n  <files>...\n\nUsage: mv [OPTION]... [-T] SOURCE DEST\n       mv [OPTION]... SOURCE... DIRECTORY\n       mv [OPTION]... -t DIRECTORY SOURCE...\n/g" -e "s/mv: missing destination file operand after 'no-file'/error: The argument '<files>...' requires at least 2 values, but only 1 was provided\n\nUsage: mv [OPTION]... [-T] SOURCE DEST\n       mv [OPTION]... SOURCE... DIRECTORY\n       mv [OPTION]... -t DIRECTORY SOURCE...\n/g" tests/mv/diag.sh
 
+# our error message is better
+sed -i -e "s|mv: cannot overwrite 'a/t': Directory not empty|mv: cannot move 'b/t' to 'a/t': Directory not empty|" tests/mv/dir2dir.sh
+
 # GNU doesn't support width > INT_MAX
 # disable these test cases
 sed -i -E "s|^([^#]*2_31.*)$|#\1|g" tests/printf/printf-cov.pl

From f16a4ae9c9e79337b3766a57ec58d7353287ec1f Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Thu, 21 Dec 2023 09:37:36 +0100
Subject: [PATCH 227/429] ls: remove condition with unreachable "else" block

---
 src/uu/ls/src/ls.rs | 10 +++-------
 1 file changed, 3 insertions(+), 7 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 6db8395cec7..f45f46b13a5 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -2480,14 +2480,10 @@ fn get_block_size(md: &Metadata, config: &Config) -> u64 {
         match config.size_format {
             SizeFormat::Binary | SizeFormat::Decimal => raw_blocks,
             SizeFormat::Bytes => {
-                if cfg!(unix) {
-                    if let Some(user_block_size) = config.block_size {
-                        raw_blocks / user_block_size
-                    } else {
-                        raw_blocks / DEFAULT_BLOCK_SIZE
-                    }
+                if let Some(user_block_size) = config.block_size {
+                    raw_blocks / user_block_size
                 } else {
-                    raw_blocks
+                    raw_blocks / DEFAULT_BLOCK_SIZE
                 }
             }
         }

From f874788b2c4900ce52f052b2ed6cf3a6e9acecb0 Mon Sep 17 00:00:00 2001
From: allaboutevemirolive <xkmxlfirdxus@gmail.com>
Date: Thu, 21 Dec 2023 10:48:58 +0200
Subject: [PATCH 228/429] Use better testcase

---
 tests/by-util/test_expand.rs                  | 15 +++++++++------
 tests/fixtures/expand/alice_in_wonderland.txt |  5 -----
 2 files changed, 9 insertions(+), 11 deletions(-)
 delete mode 100644 tests/fixtures/expand/alice_in_wonderland.txt

diff --git a/tests/by-util/test_expand.rs b/tests/by-util/test_expand.rs
index a1173c49617..1e26b32732c 100644
--- a/tests/by-util/test_expand.rs
+++ b/tests/by-util/test_expand.rs
@@ -396,13 +396,16 @@ fn test_comma_with_plus_4() {
 #[test]
 fn test_args_override() {
     new_ucmd!()
-        .args(&["-i", "-i", "alice_in_wonderland.txt"])
+        .args(&["-i", "-i", "with-trailing-tab.txt"])
         .run()
         .stdout_is(
-            "Alice was beginning to get very tired of sitting by\n\
-        her sister on the bank, and of having nothing to do: once or twice\n\
-        she had peeped into the book her sister was reading, but it had no\n\
-        pictures or conversations in it, \"and what is the use of a book,\"\n\
-        thought Alice \"without pictures or conversation?\"\n",
+            "// !note: file contains significant whitespace
+// * indentation uses <TAB> characters
+int main() {
+        // * next line has both a leading & trailing tab
+        // with tabs=>	
+        return 0;
+}
+",
         );
 }
diff --git a/tests/fixtures/expand/alice_in_wonderland.txt b/tests/fixtures/expand/alice_in_wonderland.txt
deleted file mode 100644
index a95562a1ce6..00000000000
--- a/tests/fixtures/expand/alice_in_wonderland.txt
+++ /dev/null
@@ -1,5 +0,0 @@
-Alice was beginning to get very tired of sitting by
-her sister on the bank, and of having nothing to do: once or twice
-she had peeped into the book her sister was reading, but it had no
-pictures or conversations in it, "and what is the use of a book,"
-thought Alice "without pictures or conversation?"

From 4b2577fc789559ffb3c7c954e812a69ed6432f65 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Thu, 21 Dec 2023 10:19:52 +0100
Subject: [PATCH 229/429] test/sort: run cargo fmt

---
 tests/by-util/test_sort.rs | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/tests/by-util/test_sort.rs b/tests/by-util/test_sort.rs
index d22bffae4d8..97c72c7b19b 100644
--- a/tests/by-util/test_sort.rs
+++ b/tests/by-util/test_sort.rs
@@ -1184,8 +1184,5 @@ fn test_same_sort_mode_twice() {
 
 #[test]
 fn test_args_override() {
-    new_ucmd!()
-        .args(&["-f", "-f"])
-        .pipe_in("foo")
-        .succeeds();
+    new_ucmd!().args(&["-f", "-f"]).pipe_in("foo").succeeds();
 }

From 0164934afecbfb035281e5b58191bdcec2ad2b0b Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 14 Nov 2023 17:41:19 +0100
Subject: [PATCH 230/429] df: fix rounding issue in test

Set block size to 1 so the returned values are the same values as
used for the calculation of the percentage values
---
 tests/by-util/test_df.rs | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/tests/by-util/test_df.rs b/tests/by-util/test_df.rs
index 227121ef4df..0276f18c3c1 100644
--- a/tests/by-util/test_df.rs
+++ b/tests/by-util/test_df.rs
@@ -422,7 +422,11 @@ fn test_total_label_in_correct_column() {
 #[test]
 fn test_use_percentage() {
     let output = new_ucmd!()
-        .args(&["--total", "--output=used,avail,pcent"])
+        // set block size = 1, otherwise the returned values for
+        // "used" and "avail" will be rounded. And using them to calculate
+        // the "percentage" values might lead to a mismatch with the returned
+        // "percentage" values.
+        .args(&["--total", "--output=used,avail,pcent", "--block-size=1"])
         .succeeds()
         .stdout_move_str();
 

From 546201bd00c913ead6f75d983c0dfabd2b921348 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 21 Dec 2023 16:18:00 +0100
Subject: [PATCH 231/429] fuzz: add the capability to pipe info into fuzz
 (#5668)

* fuzz: add the capability to pipe info into fuzz

* address the comments

* show the piped message if any
---
 fuzz/Cargo.toml                  |   1 +
 fuzz/fuzz_targets/fuzz_common.rs | 106 +++++++++++++++++++++++++------
 fuzz/fuzz_targets/fuzz_echo.rs   |   5 +-
 fuzz/fuzz_targets/fuzz_expr.rs   |   5 +-
 fuzz/fuzz_targets/fuzz_printf.rs |   5 +-
 fuzz/fuzz_targets/fuzz_seq.rs    |   5 +-
 fuzz/fuzz_targets/fuzz_test.rs   |   5 +-
 7 files changed, 101 insertions(+), 31 deletions(-)

diff --git a/fuzz/Cargo.toml b/fuzz/Cargo.toml
index c98f105ad19..3d5862c6970 100644
--- a/fuzz/Cargo.toml
+++ b/fuzz/Cargo.toml
@@ -10,6 +10,7 @@ cargo-fuzz = true
 [dependencies]
 libfuzzer-sys = "0.4"
 libc = "0.2"
+tempfile = "3"
 rand = { version = "0.8", features = ["small_rng"] }
 
 uucore = { path = "../src/uucore/" }
diff --git a/fuzz/fuzz_targets/fuzz_common.rs b/fuzz/fuzz_targets/fuzz_common.rs
index 89c82fba25e..11b75a2fa09 100644
--- a/fuzz/fuzz_targets/fuzz_common.rs
+++ b/fuzz/fuzz_targets/fuzz_common.rs
@@ -3,14 +3,15 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
+use libc::STDIN_FILENO;
 use libc::{close, dup, dup2, pipe, STDERR_FILENO, STDOUT_FILENO};
 use rand::prelude::SliceRandom;
 use rand::Rng;
 use std::ffi::OsString;
 use std::io;
-use std::io::Write;
-use std::os::fd::RawFd;
-use std::process::Command;
+use std::io::{Seek, SeekFrom, Write};
+use std::os::fd::{AsRawFd, RawFd};
+use std::process::{Command, Stdio};
 use std::sync::atomic::Ordering;
 use std::sync::{atomic::AtomicBool, Once};
 
@@ -49,7 +50,11 @@ pub fn is_gnu_cmd(cmd_path: &str) -> Result<(), std::io::Error> {
     }
 }
 
-pub fn generate_and_run_uumain<F>(args: &[OsString], uumain_function: F) -> CommandResult
+pub fn generate_and_run_uumain<F>(
+    args: &[OsString],
+    uumain_function: F,
+    pipe_input: Option<&str>,
+) -> CommandResult
 where
     F: FnOnce(std::vec::IntoIter<OsString>) -> i32,
 {
@@ -58,8 +63,8 @@ where
     let original_stderr_fd = unsafe { dup(STDERR_FILENO) };
     if original_stdout_fd == -1 || original_stderr_fd == -1 {
         return CommandResult {
-            stdout: "Failed to duplicate STDOUT_FILENO or STDERR_FILENO".to_string(),
-            stderr: "".to_string(),
+            stdout: "".to_string(),
+            stderr: "Failed to duplicate STDOUT_FILENO or STDERR_FILENO".to_string(),
             exit_code: -1,
         };
     }
@@ -72,8 +77,8 @@ where
         || unsafe { pipe(pipe_stderr_fds.as_mut_ptr()) } == -1
     {
         return CommandResult {
-            stdout: "Failed to create pipes".to_string(),
-            stderr: "".to_string(),
+            stdout: "".to_string(),
+            stderr: "Failed to create pipes".to_string(),
             exit_code: -1,
         };
     }
@@ -89,12 +94,32 @@ where
             close(pipe_stderr_fds[1]);
         }
         return CommandResult {
-            stdout: "Failed to redirect STDOUT_FILENO or STDERR_FILENO".to_string(),
-            stderr: "".to_string(),
+            stdout: "".to_string(),
+            stderr: "Failed to redirect STDOUT_FILENO or STDERR_FILENO".to_string(),
             exit_code: -1,
         };
     }
 
+    let original_stdin_fd = if let Some(input_str) = pipe_input {
+        // we have pipe input
+        let mut input_file = tempfile::tempfile().unwrap();
+        write!(input_file, "{}", input_str).unwrap();
+        input_file.seek(SeekFrom::Start(0)).unwrap();
+
+        // Redirect stdin to read from the in-memory file
+        let original_stdin_fd = unsafe { dup(STDIN_FILENO) };
+        if original_stdin_fd == -1 || unsafe { dup2(input_file.as_raw_fd(), STDIN_FILENO) } == -1 {
+            return CommandResult {
+                stdout: "".to_string(),
+                stderr: "Failed to set up stdin redirection".to_string(),
+                exit_code: -1,
+            };
+        }
+        Some(original_stdin_fd)
+    } else {
+        None
+    };
+
     let uumain_exit_status = uumain_function(args.to_owned().into_iter());
 
     io::stdout().flush().unwrap();
@@ -105,8 +130,8 @@ where
         || unsafe { dup2(original_stderr_fd, STDERR_FILENO) } == -1
     {
         return CommandResult {
-            stdout: "Failed to restore the original STDOUT_FILENO or STDERR_FILENO".to_string(),
-            stderr: "".to_string(),
+            stdout: "".to_string(),
+            stderr: "Failed to restore the original STDOUT_FILENO or STDERR_FILENO".to_string(),
             exit_code: -1,
         };
     }
@@ -118,6 +143,18 @@ where
         close(pipe_stderr_fds[1]);
     }
 
+    // Restore the original stdin if it was modified
+    if let Some(fd) = original_stdin_fd {
+        if unsafe { dup2(fd, STDIN_FILENO) } == -1 {
+            return CommandResult {
+                stdout: "".to_string(),
+                stderr: "Failed to restore the original STDIN".to_string(),
+                exit_code: -1,
+            };
+        }
+        unsafe { close(fd) };
+    }
+
     let captured_stdout = read_from_fd(pipe_stdout_fds[0]).trim().to_string();
     let captured_stderr = read_from_fd(pipe_stderr_fds[0]).to_string();
     let captured_stderr = captured_stderr
@@ -165,6 +202,7 @@ pub fn run_gnu_cmd(
     cmd_path: &str,
     args: &[OsString],
     check_gnu: bool,
+    pipe_input: Option<&str>,
 ) -> Result<CommandResult, CommandResult> {
     if check_gnu {
         match is_gnu_cmd(cmd_path) {
@@ -185,18 +223,40 @@ pub fn run_gnu_cmd(
         command.arg(arg);
     }
 
-    let output = match command.output() {
-        Ok(output) => output,
-        Err(e) => {
-            return Err(CommandResult {
-                stdout: String::new(),
-                stderr: e.to_string(),
-                exit_code: -1,
-            });
+    let output = if let Some(input_str) = pipe_input {
+        // We have an pipe input
+        command.stdin(Stdio::piped()).stdout(Stdio::piped());
+
+        let mut child = command.spawn().expect("Failed to execute command");
+        let child_stdin = child.stdin.as_mut().unwrap();
+        child_stdin
+            .write_all(input_str.as_bytes())
+            .expect("Failed to write to stdin");
+
+        match child.wait_with_output() {
+            Ok(output) => output,
+            Err(e) => {
+                return Err(CommandResult {
+                    stdout: String::new(),
+                    stderr: e.to_string(),
+                    exit_code: -1,
+                });
+            }
+        }
+    } else {
+        // Just run with args
+        match command.output() {
+            Ok(output) => output,
+            Err(e) => {
+                return Err(CommandResult {
+                    stdout: String::new(),
+                    stderr: e.to_string(),
+                    exit_code: -1,
+                });
+            }
         }
     };
     let exit_code = output.status.code().unwrap_or(-1);
-
     // Here we get stdout and stderr as Strings
     let stdout = String::from_utf8_lossy(&output.stdout).to_string();
     let stderr = String::from_utf8_lossy(&output.stderr).to_string();
@@ -233,12 +293,16 @@ pub fn run_gnu_cmd(
 pub fn compare_result(
     test_type: &str,
     input: &str,
+    pipe_input: Option<&str>,
     rust_result: &CommandResult,
     gnu_result: &CommandResult,
     fail_on_stderr_diff: bool,
 ) {
     println!("Test Type: {}", test_type);
     println!("Input: {}", input);
+    if let Some(pipe) = pipe_input {
+        println!("Pipe: {}", pipe);
+    }
 
     let mut discrepancies = Vec::new();
     let mut should_panic = false;
diff --git a/fuzz/fuzz_targets/fuzz_echo.rs b/fuzz/fuzz_targets/fuzz_echo.rs
index bc391bd3e05..3f15b257e6e 100644
--- a/fuzz/fuzz_targets/fuzz_echo.rs
+++ b/fuzz/fuzz_targets/fuzz_echo.rs
@@ -59,9 +59,9 @@ fuzz_target!(|_data: &[u8]| {
     let echo_input = generate_echo();
     let mut args = vec![OsString::from("echo")];
     args.extend(echo_input.split_whitespace().map(OsString::from));
-    let rust_result = generate_and_run_uumain(&args, uumain);
+    let rust_result = generate_and_run_uumain(&args, uumain, None);
 
-    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false) {
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false, None) {
         Ok(result) => result,
         Err(error_result) => {
             eprintln!("Failed to run GNU command:");
@@ -78,6 +78,7 @@ fuzz_target!(|_data: &[u8]| {
     compare_result(
         "echo",
         &format!("{:?}", &args[1..]),
+        None,
         &rust_result,
         &gnu_result,
         true,
diff --git a/fuzz/fuzz_targets/fuzz_expr.rs b/fuzz/fuzz_targets/fuzz_expr.rs
index 9f2d28603ab..8bc18fae47e 100644
--- a/fuzz/fuzz_targets/fuzz_expr.rs
+++ b/fuzz/fuzz_targets/fuzz_expr.rs
@@ -69,9 +69,9 @@ fuzz_target!(|_data: &[u8]| {
     // because uutils expr doesn't support localization yet
     // TODO remove once uutils expr supports localization
     env::set_var("LC_COLLATE", "C");
-    let rust_result = generate_and_run_uumain(&args, uumain);
+    let rust_result = generate_and_run_uumain(&args, uumain, None);
 
-    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false) {
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false, None) {
         Ok(result) => result,
         Err(error_result) => {
             eprintln!("Failed to run GNU command:");
@@ -88,6 +88,7 @@ fuzz_target!(|_data: &[u8]| {
     compare_result(
         "expr",
         &format!("{:?}", &args[1..]),
+        None,
         &rust_result,
         &gnu_result,
         false, // Set to true if you want to fail on stderr diff
diff --git a/fuzz/fuzz_targets/fuzz_printf.rs b/fuzz/fuzz_targets/fuzz_printf.rs
index 25cf58c8e1b..72fac540b17 100644
--- a/fuzz/fuzz_targets/fuzz_printf.rs
+++ b/fuzz/fuzz_targets/fuzz_printf.rs
@@ -80,9 +80,9 @@ fuzz_target!(|_data: &[u8]| {
     let printf_input = generate_printf();
     let mut args = vec![OsString::from("printf")];
     args.extend(printf_input.split_whitespace().map(OsString::from));
-    let rust_result = generate_and_run_uumain(&args, uumain);
+    let rust_result = generate_and_run_uumain(&args, uumain, None);
 
-    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false) {
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false, None) {
         Ok(result) => result,
         Err(error_result) => {
             eprintln!("Failed to run GNU command:");
@@ -99,6 +99,7 @@ fuzz_target!(|_data: &[u8]| {
     compare_result(
         "printf",
         &format!("{:?}", &args[1..]),
+        None,
         &rust_result,
         &gnu_result,
         false, // Set to true if you want to fail on stderr diff
diff --git a/fuzz/fuzz_targets/fuzz_seq.rs b/fuzz/fuzz_targets/fuzz_seq.rs
index fdeaed16dc3..7bb4f8af956 100644
--- a/fuzz/fuzz_targets/fuzz_seq.rs
+++ b/fuzz/fuzz_targets/fuzz_seq.rs
@@ -48,9 +48,9 @@ fuzz_target!(|_data: &[u8]| {
     let mut args = vec![OsString::from("seq")];
     args.extend(seq.split_whitespace().map(OsString::from));
 
-    let rust_result = generate_and_run_uumain(&args, uumain);
+    let rust_result = generate_and_run_uumain(&args, uumain, None);
 
-    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false) {
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false, None) {
         Ok(result) => result,
         Err(error_result) => {
             eprintln!("Failed to run GNU command:");
@@ -67,6 +67,7 @@ fuzz_target!(|_data: &[u8]| {
     compare_result(
         "seq",
         &format!("{:?}", &args[1..]),
+        None,
         &rust_result,
         &gnu_result,
         false, // Set to true if you want to fail on stderr diff
diff --git a/fuzz/fuzz_targets/fuzz_test.rs b/fuzz/fuzz_targets/fuzz_test.rs
index eeee2dc3e2c..bed7ca77088 100644
--- a/fuzz/fuzz_targets/fuzz_test.rs
+++ b/fuzz/fuzz_targets/fuzz_test.rs
@@ -184,9 +184,9 @@ fuzz_target!(|_data: &[u8]| {
         args.push(OsString::from(generate_test_arg()));
     }
 
-    let rust_result = generate_and_run_uumain(&args, uumain);
+    let rust_result = generate_and_run_uumain(&args, uumain, None);
 
-    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false) {
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false, None) {
         Ok(result) => result,
         Err(error_result) => {
             eprintln!("Failed to run GNU command:");
@@ -203,6 +203,7 @@ fuzz_target!(|_data: &[u8]| {
     compare_result(
         "test",
         &format!("{:?}", &args[1..]),
+        None,
         &rust_result,
         &gnu_result,
         false, // Set to true if you want to fail on stderr diff

From 311901de3a49d83194134dcfcd79a187c53c324e Mon Sep 17 00:00:00 2001
From: Malte Poll <1780588+malt3@users.noreply.github.com>
Date: Fri, 22 Dec 2023 10:49:39 +0100
Subject: [PATCH 232/429] ci: add aarch64-unknown-linux-musl release artifact

---
 .github/workflows/CICD.yml | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index 8a7ff3f0624..ea369e4ef6f 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -468,6 +468,7 @@ jobs:
           # - { os , target , cargo-options , features , use-cross , toolchain, skip-tests }
           - { os: ubuntu-latest  , target: arm-unknown-linux-gnueabihf, features: feat_os_unix_gnueabihf, use-cross: use-cross, }
           - { os: ubuntu-latest  , target: aarch64-unknown-linux-gnu   , features: feat_os_unix_gnueabihf , use-cross: use-cross }
+          - { os: ubuntu-latest  , target: aarch64-unknown-linux-musl  , features: feat_os_unix_musl      , use-cross: use-cross }
           # - { os: ubuntu-latest  , target: x86_64-unknown-linux-gnu    , features: feat_selinux           , use-cross: use-cross }
           - { os: ubuntu-latest  , target: i686-unknown-linux-gnu      , features: feat_os_unix           , use-cross: use-cross }
           - { os: ubuntu-latest  , target: i686-unknown-linux-musl     , features: feat_os_unix_musl      , use-cross: use-cross }
@@ -590,7 +591,7 @@ jobs:
         # * executable for `strip`?
         STRIP="strip"
         case ${{ matrix.job.target }} in
-          aarch64-*-linux-gnu) STRIP="aarch64-linux-gnu-strip" ;;
+          aarch64-*-linux-*) STRIP="aarch64-linux-gnu-strip" ;;
           arm-*-linux-gnueabihf) STRIP="arm-linux-gnueabihf-strip" ;;
           *-pc-windows-msvc) STRIP="" ;;
         esac;
@@ -612,7 +613,7 @@ jobs:
         ## Install/setup prerequisites
         case '${{ matrix.job.target }}' in
           arm-unknown-linux-gnueabihf) sudo apt-get -y update ; sudo apt-get -y install gcc-arm-linux-gnueabihf ;;
-          aarch64-unknown-linux-gnu) sudo apt-get -y update ; sudo apt-get -y install gcc-aarch64-linux-gnu ;;
+          aarch64-unknown-linux-*) sudo apt-get -y update ; sudo apt-get -y install gcc-aarch64-linux-gnu ;;
           *-redox*) sudo apt-get -y update ; sudo apt-get -y install fuse3 libfuse-dev ;;
         esac
         case '${{ matrix.job.os }}' in

From a8a5931cae17387a9c1f24ec54d18185c511a506 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 22 Dec 2023 11:15:01 +0100
Subject: [PATCH 233/429] ls: introduce 2nd blocksize & fix todos in tests

---
 src/uu/ls/src/ls.rs      | 70 +++++++++++++++++++++-------------------
 tests/by-util/test_ls.rs | 47 +++++++++++++++++++++------
 2 files changed, 74 insertions(+), 43 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index f45f46b13a5..7ad1704fc4e 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -161,8 +161,8 @@ pub mod options {
 
 const DEFAULT_TERM_WIDTH: u16 = 80;
 const POSIXLY_CORRECT_BLOCK_SIZE: u64 = 512;
-#[cfg(unix)]
 const DEFAULT_BLOCK_SIZE: u64 = 1024;
+const DEFAULT_FILE_SIZE_BLOCK_SIZE: u64 = 1;
 
 #[derive(Debug)]
 enum LsError {
@@ -409,7 +409,9 @@ pub struct Config {
     color: Option<LsColors>,
     long: LongFormat,
     alloc_size: bool,
-    block_size: Option<u64>,
+    file_size_block_size: u64,
+    #[allow(dead_code)]
+    block_size: u64, // is never read on Windows
     width: u16,
     // Dir and vdir needs access to this field
     pub quoting_style: QuotingStyle,
@@ -822,6 +824,7 @@ impl Config {
         let env_var_block_size = std::env::var_os("BLOCK_SIZE");
         let env_var_ls_block_size = std::env::var_os("LS_BLOCK_SIZE");
         let env_var_posixly_correct = std::env::var_os("POSIXLY_CORRECT");
+        let mut is_env_var_blocksize = false;
 
         let raw_block_size = if let Some(opt_block_size) = opt_block_size {
             OsString::from(opt_block_size)
@@ -831,6 +834,7 @@ impl Config {
             } else if let Some(env_var_block_size) = env_var_block_size {
                 env_var_block_size
             } else if let Some(env_var_blocksize) = env_var_blocksize {
+                is_env_var_blocksize = true;
                 env_var_blocksize
             } else {
                 OsString::from("")
@@ -839,9 +843,16 @@ impl Config {
             OsString::from("")
         };
 
-        let block_size: Option<u64> = if !opt_si && !opt_hr && !raw_block_size.is_empty() {
+        let (file_size_block_size, block_size) = if !opt_si && !opt_hr && !raw_block_size.is_empty()
+        {
             match parse_size_u64(&raw_block_size.to_string_lossy()) {
-                Ok(size) => Some(size),
+                Ok(size) => {
+                    if is_env_var_blocksize {
+                        (DEFAULT_FILE_SIZE_BLOCK_SIZE, size)
+                    } else {
+                        (size, size)
+                    }
+                }
                 Err(_) => {
                     // only fail if invalid block size was specified with --block-size,
                     // ignore invalid block size from env vars
@@ -850,13 +861,19 @@ impl Config {
                             invalid_block_size.clone(),
                         )));
                     }
-                    None
+                    if is_env_var_blocksize {
+                        (DEFAULT_FILE_SIZE_BLOCK_SIZE, DEFAULT_BLOCK_SIZE)
+                    } else {
+                        (DEFAULT_BLOCK_SIZE, DEFAULT_BLOCK_SIZE)
+                    }
                 }
             }
         } else if env_var_posixly_correct.is_some() {
-            Some(POSIXLY_CORRECT_BLOCK_SIZE)
+            (DEFAULT_FILE_SIZE_BLOCK_SIZE, POSIXLY_CORRECT_BLOCK_SIZE)
+        } else if opt_si {
+            (DEFAULT_FILE_SIZE_BLOCK_SIZE, 1000)
         } else {
-            None
+            (DEFAULT_FILE_SIZE_BLOCK_SIZE, DEFAULT_BLOCK_SIZE)
         };
 
         let long = {
@@ -1062,6 +1079,7 @@ impl Config {
             inode: options.get_flag(options::INODE),
             long,
             alloc_size: options.get_flag(options::size::ALLOCATION_SIZE),
+            file_size_block_size,
             block_size,
             width,
             quoting_style,
@@ -2479,13 +2497,7 @@ fn get_block_size(md: &Metadata, config: &Config) -> u64 {
         };
         match config.size_format {
             SizeFormat::Binary | SizeFormat::Decimal => raw_blocks,
-            SizeFormat::Bytes => {
-                if let Some(user_block_size) = config.block_size {
-                    raw_blocks / user_block_size
-                } else {
-                    raw_blocks / DEFAULT_BLOCK_SIZE
-                }
-            }
+            SizeFormat::Bytes => raw_blocks / config.block_size,
         }
     }
     #[cfg(not(unix))]
@@ -2955,26 +2967,16 @@ fn display_len_or_rdev(metadata: &Metadata, config: &Config) -> SizeOrDeviceId {
             return SizeOrDeviceId::Device(major.to_string(), minor.to_string());
         }
     }
-    // Reported file len only adjusted for block_size when block_size is set
-    if let Some(user_block_size) = config.block_size {
-        // ordinary division of unsigned integers rounds down,
-        // this is similar to the Rust API for division that rounds up,
-        // currently in nightly only, however once
-        // https://github.com/rust-lang/rust/pull/88582 : "div_ceil"
-        // is stable we should use that instead
-        let len_adjusted = {
-            let d = metadata.len() / user_block_size;
-            let r = metadata.len() % user_block_size;
-            if r == 0 {
-                d
-            } else {
-                d + 1
-            }
-        };
-        SizeOrDeviceId::Size(display_size(len_adjusted, config))
-    } else {
-        SizeOrDeviceId::Size(display_size(metadata.len(), config))
-    }
+    let len_adjusted = {
+        let d = metadata.len() / config.file_size_block_size;
+        let r = metadata.len() % config.file_size_block_size;
+        if r == 0 {
+            d
+        } else {
+            d + 1
+        }
+    };
+    SizeOrDeviceId::Size(display_size(len_adjusted, config))
 }
 
 fn display_size(size: u64, config: &Config) -> String {
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 8aeb762c79b..a7744063fa3 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -3862,8 +3862,8 @@ fn test_posixly_correct_and_block_size_env_vars() {
         .arg("-l")
         .env("POSIXLY_CORRECT", "some_value")
         .succeeds()
-        .stdout_contains_line("total 8");
-    //.stdout_contains(" 1024 "); // TODO needs second internal blocksize
+        .stdout_contains_line("total 8")
+        .stdout_contains(" 1024 ");
 
     scene
         .ucmd()
@@ -3886,8 +3886,8 @@ fn test_posixly_correct_and_block_size_env_vars() {
         .arg("-l")
         .env("BLOCKSIZE", "512")
         .succeeds()
-        .stdout_contains_line("total 8");
-    //.stdout_contains(" 1024 "); // TODO needs second internal blocksize
+        .stdout_contains_line("total 8")
+        .stdout_contains(" 1024 ");
 }
 
 #[test]
@@ -3900,13 +3900,42 @@ fn test_ls_invalid_block_size() {
         .stderr_is("ls: invalid --block-size argument 'invalid'\n");
 }
 
-// TODO ensure the correct block size is used when using -l because
-// the output of "ls -l" and "BLOCK_SIZE=invalid ls -l" is different
+#[cfg(all(unix, feature = "dd"))]
 #[test]
 fn test_ls_invalid_block_size_in_env_var() {
-    new_ucmd!().env("LS_BLOCK_SIZE", "invalid").succeeds();
-    new_ucmd!().env("BLOCK_SIZE", "invalid").succeeds();
-    new_ucmd!().env("BLOCKSIZE", "invalid").succeeds();
+    let scene = TestScenario::new(util_name!());
+
+    scene
+        .ccmd("dd")
+        .arg("if=/dev/zero")
+        .arg("of=file")
+        .arg("bs=1024")
+        .arg("count=1")
+        .succeeds();
+
+    scene
+        .ucmd()
+        .arg("-og")
+        .env("LS_BLOCK_SIZE", "invalid")
+        .succeeds()
+        .stdout_contains_line("total 4")
+        .stdout_contains(" 1 1 "); // hardlink count + file size
+
+    scene
+        .ucmd()
+        .arg("-og")
+        .env("BLOCK_SIZE", "invalid")
+        .succeeds()
+        .stdout_contains_line("total 4")
+        .stdout_contains(" 1 1 "); // hardlink count + file size
+
+    scene
+        .ucmd()
+        .arg("-og")
+        .env("BLOCKSIZE", "invalid")
+        .succeeds()
+        .stdout_contains_line("total 4")
+        .stdout_contains(" 1024 ");
 }
 
 #[cfg(all(unix, feature = "dd"))]

From 1c6317af76afbef7f2e8a02987bccb9a66339f1c Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 22 Dec 2023 17:03:59 +0100
Subject: [PATCH 234/429] mv: allow dest with slash when using --update

---
 src/uu/mv/src/mv.rs      |  6 +++++-
 tests/by-util/test_mv.rs | 14 ++++++++++++++
 2 files changed, 19 insertions(+), 1 deletion(-)

diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index a042acb87a1..dec6d3ad3a7 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -341,7 +341,11 @@ fn handle_two_paths(source: &Path, target: &Path, opts: &Options) -> UResult<()>
 
     let target_is_dir = target.is_dir();
 
-    if path_ends_with_terminator(target) && !target_is_dir && !opts.no_target_dir {
+    if path_ends_with_terminator(target)
+        && !target_is_dir
+        && !opts.no_target_dir
+        && opts.update != UpdateMode::ReplaceIfOlder
+    {
         return Err(MvError::FailedToAccessNotADirectory(target.quote().to_string()).into());
     }
 
diff --git a/tests/by-util/test_mv.rs b/tests/by-util/test_mv.rs
index 3fb002dc3e0..75500ac63d9 100644
--- a/tests/by-util/test_mv.rs
+++ b/tests/by-util/test_mv.rs
@@ -905,6 +905,20 @@ fn test_mv_update_option() {
     assert!(!at.file_exists(file_b));
 }
 
+#[test]
+fn test_mv_update_with_dest_ending_with_slash() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    let source = "source";
+    let dest = "destination/";
+
+    at.mkdir("source");
+
+    ucmd.arg("--update").arg(source).arg(dest).succeeds();
+
+    assert!(!at.dir_exists(source));
+    assert!(at.dir_exists(dest));
+}
+
 #[test]
 fn test_mv_arg_update_none() {
     let (at, mut ucmd) = at_and_ucmd!();

From 9ca7c3e107c8af9b5330da26c28298c7e3f5e05b Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 21 Dec 2023 00:17:49 +0100
Subject: [PATCH 235/429] install: with -t, check if we aren't passed a file

Should pass tests/install/basic-1
---
 src/uu/install/src/install.rs | 11 +++++++++++
 tests/by-util/test_install.rs | 24 ++++++++++++++++++++++++
 2 files changed, 35 insertions(+)

diff --git a/src/uu/install/src/install.rs b/src/uu/install/src/install.rs
index 43925a7f8e4..7cb305a25c4 100644
--- a/src/uu/install/src/install.rs
+++ b/src/uu/install/src/install.rs
@@ -66,6 +66,7 @@ enum InstallError {
     InvalidUser(String),
     InvalidGroup(String),
     OmittingDirectory(PathBuf),
+    NotADirectory(PathBuf),
 }
 
 impl UError for InstallError {
@@ -120,6 +121,9 @@ impl Display for InstallError {
             Self::InvalidUser(user) => write!(f, "invalid user: {}", user.quote()),
             Self::InvalidGroup(group) => write!(f, "invalid group: {}", group.quote()),
             Self::OmittingDirectory(dir) => write!(f, "omitting directory {}", dir.quote()),
+            Self::NotADirectory(dir) => {
+                write!(f, "failed to access {}: Not a directory", dir.quote())
+            }
         }
     }
 }
@@ -583,6 +587,13 @@ fn standard(mut paths: Vec<String>, b: &Behavior) -> UResult<()> {
                 }
             }
         }
+        if b.target_dir.is_some() {
+            let p = to_create.unwrap();
+
+            if !p.exists() || !p.is_dir() {
+                return Err(InstallError::NotADirectory(p.to_path_buf()).into());
+            }
+        }
     }
 
     if sources.len() > 1 || is_potential_directory_path(&target) {
diff --git a/tests/by-util/test_install.rs b/tests/by-util/test_install.rs
index 7387748c619..9c8f929f483 100644
--- a/tests/by-util/test_install.rs
+++ b/tests/by-util/test_install.rs
@@ -1538,3 +1538,27 @@ fn test_install_compare_option() {
         .code_is(1)
         .stderr_contains("Options --compare and --strip are mutually exclusive");
 }
+
+#[test]
+// Matches part of tests/install/basic-1
+fn test_t_exist_dir() {
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+
+    let source1 = "file";
+    let target_dir = "sub4/";
+    let target_file = "sub4/file_exists";
+
+    at.touch(source1);
+    at.mkdir(target_dir);
+    at.touch(target_file);
+
+    scene
+        .ucmd()
+        .arg("-t")
+        .arg(target_file)
+        .arg("-Dv")
+        .arg(source1)
+        .fails()
+        .stderr_contains("failed to access 'sub4/file_exists': Not a directory");
+}

From 837640bc0235533f498aace9fc5c9541638ad88f Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 23 Dec 2023 11:53:25 +0100
Subject: [PATCH 236/429] cp: manages the 'seen' file list before copying

Should help with tests/mv/childproof.sh
---
 src/uu/cp/src/cp.rs      | 46 ++++++++++++++++++++++++++++++----------
 tests/by-util/test_cp.rs | 19 +++++++++++++++++
 2 files changed, 54 insertions(+), 11 deletions(-)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index de01a5ef38c..d7aeea1b99d 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -1171,6 +1171,9 @@ pub fn copy(sources: &[PathBuf], target: &Path, options: &Options) -> CopyResult
     //
     // key is the source file's information and the value is the destination filepath.
     let mut copied_files: HashMap<FileInformation, PathBuf> = HashMap::with_capacity(sources.len());
+    // remember the copied destinations for further usage.
+    // we can't use copied_files as it is because the key is the source file's information.
+    let mut copied_destinations: HashSet<PathBuf> = HashSet::with_capacity(sources.len());
 
     let progress_bar = if options.progress_bar {
         let pb = ProgressBar::new(disk_usage(sources, options.recursive)?)
@@ -1191,17 +1194,38 @@ pub fn copy(sources: &[PathBuf], target: &Path, options: &Options) -> CopyResult
         if seen_sources.contains(source) {
             // FIXME: compare sources by the actual file they point to, not their path. (e.g. dir/file == dir/../dir/file in most cases)
             show_warning!("source {} specified more than once", source.quote());
-        } else if let Err(error) = copy_source(
-            &progress_bar,
-            source,
-            target,
-            target_type,
-            options,
-            &mut symlinked_files,
-            &mut copied_files,
-        ) {
-            show_error_if_needed(&error);
-            non_fatal_errors = true;
+        } else {
+            // We need to compute the destination path
+
+            let dest = construct_dest_path(source, target, target_type, options)
+                .unwrap_or_else(|_| target.to_path_buf());
+
+            if fs::metadata(&dest).is_ok() && !fs::symlink_metadata(&dest)?.file_type().is_symlink()
+            {
+                // There is already a file and it isn't a symlink (managed in a different place)
+                if copied_destinations.contains(&dest) {
+                    // If the target file was already created in this cp call, do not overwrite
+                    return Err(Error::Error(format!(
+                        "will not overwrite just-created '{}' with '{}'",
+                        dest.display(),
+                        source.display()
+                    )));
+                }
+            }
+
+            if let Err(error) = copy_source(
+                &progress_bar,
+                source,
+                target,
+                target_type,
+                options,
+                &mut symlinked_files,
+                &mut copied_files,
+            ) {
+                show_error_if_needed(&error);
+                non_fatal_errors = true;
+            }
+            copied_destinations.insert(dest.clone());
         }
         seen_sources.insert(source);
     }
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index 37bec522238..5227f01944d 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -3559,3 +3559,22 @@ fn test_cp_attributes_only() {
     assert_eq!(mode_a, at.metadata(a).mode());
     assert_eq!(mode_b, at.metadata(b).mode());
 }
+
+#[test]
+fn test_cp_seen_file() {
+    let (at, mut ucmd) = at_and_ucmd!();
+
+    at.mkdir("a");
+    at.mkdir("b");
+    at.mkdir("c");
+    at.write("a/f", "a");
+    at.write("b/f", "b");
+
+    ucmd.arg("a/f")
+        .arg("b/f")
+        .arg("c")
+        .fails()
+        .stderr_contains("will not overwrite just-created 'c/f' with 'b/f'");
+
+    assert!(at.plus("c").join("f").exists());
+}

From 06c98fbdd33e28110e8442dd4e6b261c3b6a1e22 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 23 Dec 2023 12:48:38 +0100
Subject: [PATCH 237/429] cp: don't fail when --backup=numbered is passed

---
 src/uu/cp/src/cp.rs      |  4 +++-
 tests/by-util/test_cp.rs | 15 +++++++++++++--
 2 files changed, 16 insertions(+), 3 deletions(-)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index d7aeea1b99d..4d002359f93 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -1203,7 +1203,9 @@ pub fn copy(sources: &[PathBuf], target: &Path, options: &Options) -> CopyResult
             if fs::metadata(&dest).is_ok() && !fs::symlink_metadata(&dest)?.file_type().is_symlink()
             {
                 // There is already a file and it isn't a symlink (managed in a different place)
-                if copied_destinations.contains(&dest) {
+                if copied_destinations.contains(&dest)
+                    && options.backup != BackupMode::NumberedBackup
+                {
                     // If the target file was already created in this cp call, do not overwrite
                     return Err(Error::Error(format!(
                         "will not overwrite just-created '{}' with '{}'",
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index 5227f01944d..eda5dd4c6e4 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -3562,7 +3562,8 @@ fn test_cp_attributes_only() {
 
 #[test]
 fn test_cp_seen_file() {
-    let (at, mut ucmd) = at_and_ucmd!();
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
 
     at.mkdir("a");
     at.mkdir("b");
@@ -3570,11 +3571,21 @@ fn test_cp_seen_file() {
     at.write("a/f", "a");
     at.write("b/f", "b");
 
-    ucmd.arg("a/f")
+    ts.ucmd()
+        .arg("a/f")
         .arg("b/f")
         .arg("c")
         .fails()
         .stderr_contains("will not overwrite just-created 'c/f' with 'b/f'");
 
     assert!(at.plus("c").join("f").exists());
+
+    ts.ucmd()
+        .arg("--backup=numbered")
+        .arg("a/f")
+        .arg("b/f")
+        .arg("c")
+        .succeeds();
+    assert!(at.plus("c").join("f").exists());
+    assert!(at.plus("c").join("f.~1~").exists());
 }

From 3af8ad0fe6b211c00df5f1c9c75fc83ba32aad1d Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 23 Dec 2023 13:04:48 +0100
Subject: [PATCH 238/429] mv: manages the 'seen' file list before moving

Should help with tests/mv/childproof.sh
---
 src/uu/mv/src/mv.rs      | 17 +++++++++++++++++
 tests/by-util/test_mv.rs | 26 ++++++++++++++++++++++++++
 2 files changed, 43 insertions(+)

diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index dec6d3ad3a7..75a295502c2 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -10,6 +10,7 @@ mod error;
 use clap::builder::ValueParser;
 use clap::{crate_version, error::ErrorKind, Arg, ArgAction, ArgMatches, Command};
 use indicatif::{MultiProgress, ProgressBar, ProgressStyle};
+use std::collections::HashSet;
 use std::env;
 use std::ffi::OsString;
 use std::fs;
@@ -434,6 +435,9 @@ pub fn mv(files: &[OsString], opts: &Options) -> UResult<()> {
 
 #[allow(clippy::cognitive_complexity)]
 fn move_files_into_dir(files: &[PathBuf], target_dir: &Path, opts: &Options) -> UResult<()> {
+    // remember the moved destinations for further usage
+    let mut moved_destinations: HashSet<PathBuf> = HashSet::with_capacity(files.len());
+
     if !target_dir.is_dir() {
         return Err(MvError::NotADirectory(target_dir.quote().to_string()).into());
     }
@@ -471,6 +475,18 @@ fn move_files_into_dir(files: &[PathBuf], target_dir: &Path, opts: &Options) ->
             }
         };
 
+        if moved_destinations.contains(&targetpath) && opts.backup != BackupMode::NumberedBackup {
+            // If the target file was already created in this mv call, do not overwrite
+            return Err(USimpleError::new(
+                1,
+                format!(
+                    "will not overwrite just-created '{}' with '{}'",
+                    targetpath.display(),
+                    sourcepath.display()
+                ),
+            ));
+        }
+
         // Check if we have mv dir1 dir2 dir2
         // And generate an error if this is the case
         if let Ok(canonicalized_source) = sourcepath.canonicalize() {
@@ -513,6 +529,7 @@ fn move_files_into_dir(files: &[PathBuf], target_dir: &Path, opts: &Options) ->
         if let Some(ref pb) = count_progress {
             pb.inc(1);
         }
+        moved_destinations.insert(targetpath.clone());
     }
     Ok(())
 }
diff --git a/tests/by-util/test_mv.rs b/tests/by-util/test_mv.rs
index 75500ac63d9..2e2dc3d81e6 100644
--- a/tests/by-util/test_mv.rs
+++ b/tests/by-util/test_mv.rs
@@ -1469,6 +1469,32 @@ fn test_mv_file_into_dir_where_both_are_files() {
         .stderr_contains("mv: failed to access 'b/': Not a directory");
 }
 
+#[test]
+fn test_mv_seen_file() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+
+    at.mkdir("a");
+    at.mkdir("b");
+    at.mkdir("c");
+    at.write("a/f", "a");
+    at.write("b/f", "b");
+
+    ts.ucmd()
+        .arg("a/f")
+        .arg("b/f")
+        .arg("c")
+        .fails()
+        .stderr_contains("will not overwrite just-created 'c/f' with 'b/f'");
+
+    // a/f has been moved into c/f
+    assert!(at.plus("c").join("f").exists());
+    // b/f still exists
+    assert!(at.plus("b").join("f").exists());
+    // a/f no longer exists
+    assert!(!at.plus("a").join("f").exists());
+}
+
 #[test]
 fn test_mv_dir_into_file_where_both_are_files() {
     let scene = TestScenario::new(util_name!());

From 9c7fd5e8cb1f5736235461ed521102b9182a538d Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 23 Dec 2023 13:05:52 +0100
Subject: [PATCH 239/429] mv: rename the variable to match the name in cp

---
 src/uu/mv/src/mv.rs | 9 +++++----
 1 file changed, 5 insertions(+), 4 deletions(-)

diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index 75a295502c2..058532851b0 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -434,7 +434,7 @@ pub fn mv(files: &[OsString], opts: &Options) -> UResult<()> {
 }
 
 #[allow(clippy::cognitive_complexity)]
-fn move_files_into_dir(files: &[PathBuf], target_dir: &Path, opts: &Options) -> UResult<()> {
+fn move_files_into_dir(files: &[PathBuf], target_dir: &Path, options: &Options) -> UResult<()> {
     // remember the moved destinations for further usage
     let mut moved_destinations: HashSet<PathBuf> = HashSet::with_capacity(files.len());
 
@@ -446,7 +446,7 @@ fn move_files_into_dir(files: &[PathBuf], target_dir: &Path, opts: &Options) ->
         .canonicalize()
         .unwrap_or_else(|_| target_dir.to_path_buf());
 
-    let multi_progress = opts.progress_bar.then(MultiProgress::new);
+    let multi_progress = options.progress_bar.then(MultiProgress::new);
 
     let count_progress = if let Some(ref multi_progress) = multi_progress {
         if files.len() > 1 {
@@ -475,7 +475,8 @@ fn move_files_into_dir(files: &[PathBuf], target_dir: &Path, opts: &Options) ->
             }
         };
 
-        if moved_destinations.contains(&targetpath) && opts.backup != BackupMode::NumberedBackup {
+        if moved_destinations.contains(&targetpath) && options.backup != BackupMode::NumberedBackup
+        {
             // If the target file was already created in this mv call, do not overwrite
             return Err(USimpleError::new(
                 1,
@@ -509,7 +510,7 @@ fn move_files_into_dir(files: &[PathBuf], target_dir: &Path, opts: &Options) ->
             }
         }
 
-        match rename(sourcepath, &targetpath, opts, multi_progress.as_ref()) {
+        match rename(sourcepath, &targetpath, options, multi_progress.as_ref()) {
             Err(e) if e.to_string().is_empty() => set_exit_code(1),
             Err(e) => {
                 let e = e.map_err_context(|| {

From c94773f522bdaa5f9c01b9242e912ad8af885605 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 23 Dec 2023 13:27:00 +0100
Subject: [PATCH 240/429] mv: make sure it continues when hiting an error

---
 src/uu/mv/src/mv.rs      |  3 ++-
 tests/by-util/test_mv.rs | 26 ++++++++++++++++++++++++++
 2 files changed, 28 insertions(+), 1 deletion(-)

diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index 058532851b0..ff5aaf93d58 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -478,7 +478,7 @@ fn move_files_into_dir(files: &[PathBuf], target_dir: &Path, options: &Options)
         if moved_destinations.contains(&targetpath) && options.backup != BackupMode::NumberedBackup
         {
             // If the target file was already created in this mv call, do not overwrite
-            return Err(USimpleError::new(
+            show!(USimpleError::new(
                 1,
                 format!(
                     "will not overwrite just-created '{}' with '{}'",
@@ -486,6 +486,7 @@ fn move_files_into_dir(files: &[PathBuf], target_dir: &Path, options: &Options)
                     sourcepath.display()
                 ),
             ));
+            continue;
         }
 
         // Check if we have mv dir1 dir2 dir2
diff --git a/tests/by-util/test_mv.rs b/tests/by-util/test_mv.rs
index 2e2dc3d81e6..bc75ada3fae 100644
--- a/tests/by-util/test_mv.rs
+++ b/tests/by-util/test_mv.rs
@@ -1495,6 +1495,32 @@ fn test_mv_seen_file() {
     assert!(!at.plus("a").join("f").exists());
 }
 
+#[test]
+fn test_mv_seen_multiple_files_to_directory() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+
+    at.mkdir("a");
+    at.mkdir("b");
+    at.mkdir("c");
+    at.write("a/f", "a");
+    at.write("b/f", "b");
+    at.write("b/g", "g");
+
+    ts.ucmd()
+        .arg("a/f")
+        .arg("b/f")
+        .arg("b/g")
+        .arg("c")
+        .fails()
+        .stderr_contains("will not overwrite just-created 'c/f' with 'b/f'");
+    assert!(!at.plus("a").join("f").exists());
+    assert!(at.plus("b").join("f").exists());
+    assert!(!at.plus("b").join("g").exists());
+    assert!(at.plus("c").join("f").exists());
+    assert!(at.plus("c").join("g").exists());
+}
+
 #[test]
 fn test_mv_dir_into_file_where_both_are_files() {
     let scene = TestScenario::new(util_name!());

From ceecac110c6a6db324a0766fc0909b4586b5b3ad Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 23 Dec 2023 13:43:11 +0100
Subject: [PATCH 241/429] ln: manages the 'seen' file list before linking

Should help with tests/mv/childproof.sh
---
 src/uu/ln/src/ln.rs      | 15 +++++++++++++-
 tests/by-util/test_ln.rs | 43 ++++++++++++++++++++++++++++++++++++++++
 2 files changed, 57 insertions(+), 1 deletion(-)

diff --git a/src/uu/ln/src/ln.rs b/src/uu/ln/src/ln.rs
index 8b76aa73c0b..e53af03a243 100644
--- a/src/uu/ln/src/ln.rs
+++ b/src/uu/ln/src/ln.rs
@@ -12,6 +12,7 @@ use uucore::fs::{make_path_relative_to, paths_refer_to_same_file};
 use uucore::{format_usage, help_about, help_section, help_usage, prompt_yes, show_error};
 
 use std::borrow::Cow;
+use std::collections::HashSet;
 use std::error::Error;
 use std::ffi::OsString;
 use std::fmt::Display;
@@ -295,6 +296,8 @@ fn link_files_in_dir(files: &[PathBuf], target_dir: &Path, settings: &Settings)
     if !target_dir.is_dir() {
         return Err(LnError::TargetIsDirectory(target_dir.to_owned()).into());
     }
+    // remember the linked destinations for further usage
+    let mut linked_destinations: HashSet<PathBuf> = HashSet::with_capacity(files.len());
 
     let mut all_successful = true;
     for srcpath in files {
@@ -338,10 +341,20 @@ fn link_files_in_dir(files: &[PathBuf], target_dir: &Path, settings: &Settings)
                 }
             };
 
-        if let Err(e) = link(srcpath, &targetpath, settings) {
+        if linked_destinations.contains(&targetpath) {
+            // If the target file was already created in this linked call, do not overwrite
+            show_error!(
+                "will not overwrite just-created '{}' with '{}'",
+                targetpath.display(),
+                srcpath.display()
+            );
+            all_successful = false;
+        } else if let Err(e) = link(srcpath, &targetpath, settings) {
             show_error!("{}", e);
             all_successful = false;
         }
+
+        linked_destinations.insert(targetpath.clone());
     }
     if all_successful {
         Ok(())
diff --git a/tests/by-util/test_ln.rs b/tests/by-util/test_ln.rs
index dc31f726116..b6453bf4376 100644
--- a/tests/by-util/test_ln.rs
+++ b/tests/by-util/test_ln.rs
@@ -3,6 +3,8 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 use crate::common::util::TestScenario;
+#[cfg(unix)]
+use std::os::unix::fs::MetadataExt;
 use std::path::PathBuf;
 
 #[test]
@@ -719,3 +721,44 @@ fn test_symlink_remove_existing_same_src_and_dest() {
     assert!(at.file_exists("a") && !at.symlink_exists("a"));
     assert_eq!(at.read("a"), "sample");
 }
+
+#[test]
+fn test_ln_seen_file() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+
+    at.mkdir("a");
+    at.mkdir("b");
+    at.mkdir("c");
+    at.write("a/f", "a");
+    at.write("b/f", "b");
+
+    ts.ucmd()
+        .arg("a/f")
+        .arg("b/f")
+        .arg("c")
+        .fails()
+        .stderr_contains("will not overwrite just-created 'c/f' with 'b/f'");
+
+    assert!(at.plus("c").join("f").exists());
+    // b/f still exists
+    assert!(at.plus("b").join("f").exists());
+    // a/f no longer exists
+    assert!(at.plus("a").join("f").exists());
+    #[cfg(unix)]
+    {
+        // Check inode numbers
+        let inode_a_f = at.plus("a").join("f").metadata().unwrap().ino();
+        let inode_b_f = at.plus("b").join("f").metadata().unwrap().ino();
+        let inode_c_f = at.plus("c").join("f").metadata().unwrap().ino();
+
+        assert_eq!(
+            inode_a_f, inode_c_f,
+            "Inode numbers of a/f and c/f should be equal"
+        );
+        assert_ne!(
+            inode_b_f, inode_c_f,
+            "Inode numbers of b/f and c/f should not be equal"
+        );
+    }
+}

From 283269405667da4ec4bd672e310bc702f0212f43 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 23 Dec 2023 15:29:32 +0100
Subject: [PATCH 242/429] install: support when a hyphen is passed (#5697)

* install: support when a hyphen is passed

Should fix: tests/install/strip-program.sh

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 src/uu/install/src/install.rs | 16 +++++++++++++++-
 tests/by-util/test_install.rs | 28 ++++++++++++++++++++++++++++
 2 files changed, 43 insertions(+), 1 deletion(-)

diff --git a/src/uu/install/src/install.rs b/src/uu/install/src/install.rs
index 43925a7f8e4..1154b32c187 100644
--- a/src/uu/install/src/install.rs
+++ b/src/uu/install/src/install.rs
@@ -749,7 +749,21 @@ fn copy_file(from: &Path, to: &Path) -> UResult<()> {
 /// Returns an empty Result or an error in case of failure.
 ///
 fn strip_file(to: &Path, b: &Behavior) -> UResult<()> {
-    match process::Command::new(&b.strip_program).arg(to).output() {
+    // Check if the filename starts with a hyphen and adjust the path
+    let to = if to
+        .file_name()
+        .unwrap_or_default()
+        .to_str()
+        .unwrap_or_default()
+        .starts_with('-')
+    {
+        let mut new_path = PathBuf::from(".");
+        new_path.push(to);
+        new_path
+    } else {
+        to.to_path_buf()
+    };
+    match process::Command::new(&b.strip_program).arg(&to).output() {
         Ok(o) => {
             if !o.status.success() {
                 // Follow GNU's behavior: if strip fails, removes the target
diff --git a/tests/by-util/test_install.rs b/tests/by-util/test_install.rs
index 7387748c619..3e61bc92b49 100644
--- a/tests/by-util/test_install.rs
+++ b/tests/by-util/test_install.rs
@@ -674,6 +674,34 @@ fn test_install_and_strip_with_program() {
     assert!(!stdout.contains(STRIP_SOURCE_FILE_SYMBOL));
 }
 
+#[cfg(all(unix, feature = "chmod"))]
+#[test]
+// FixME: Freebsd fails on 'No such file or directory'
+#[cfg(not(target_os = "freebsd"))]
+fn test_install_and_strip_with_program_hyphen() {
+    let scene = TestScenario::new(util_name!());
+
+    let at = &scene.fixtures;
+    let content = r#"#!/bin/sh
+    echo $1 &> /tmp/a.log
+    printf -- '%s\n' "$1" | grep '^[^-]'
+    "#;
+    at.write("no-hyphen", content);
+    scene.ccmd("chmod").arg("+x").arg("no-hyphen").succeeds();
+
+    at.touch("src");
+    scene
+        .ucmd()
+        .arg("-s")
+        .arg("--strip-program")
+        .arg("./no-hyphen")
+        .arg("--")
+        .arg("src")
+        .arg("-dest")
+        .succeeds()
+        .no_stderr();
+}
+
 #[test]
 #[cfg(not(windows))]
 fn test_install_and_strip_with_invalid_program() {

From 8685e05f4e9db68597ba164aba3dfcef518c4497 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 23 Dec 2023 17:58:05 +0100
Subject: [PATCH 243/429] cp: debug with --update=none should show 'skipped'

---
 src/uu/cp/src/cp.rs      |  8 +++++++-
 tests/by-util/test_cp.rs | 15 +++++++++++++++
 2 files changed, 22 insertions(+), 1 deletion(-)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index de01a5ef38c..359f2357209 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -1815,7 +1815,13 @@ fn copy_file(
                             symlinked_files,
                         )?;
                     }
-                    update_control::UpdateMode::ReplaceNone => return Ok(()),
+                    update_control::UpdateMode::ReplaceNone => {
+                        if options.debug {
+                            println!("skipped {}", dest.quote());
+                        }
+
+                        return Ok(());
+                    }
                     update_control::UpdateMode::ReplaceIfOlder => {
                         let dest_metadata = fs::symlink_metadata(dest)?;
 
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index 37bec522238..8a20443a4fc 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -3367,6 +3367,21 @@ fn test_cp_debug_sparse_reflink() {
     }
 }
 
+#[test]
+fn test_cp_debug_no_update() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+    at.touch("a");
+    at.touch("b");
+    ts.ucmd()
+        .arg("--debug")
+        .arg("--update=none")
+        .arg("a")
+        .arg("b")
+        .succeeds()
+        .stdout_contains("skipped 'b'");
+}
+
 #[test]
 #[cfg(target_os = "linux")]
 fn test_cp_debug_sparse_always() {

From 9b78016ac5ef019ca19557c5967484aebb9d6ba4 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 23 Dec 2023 23:03:13 +0100
Subject: [PATCH 244/429] runcon: remove trailing '.'

Upstream doesn't have in:
https://github.com/coreutils/coreutils/blob/master/tests/runcon/runcon-no-reorder.sh#L22
---
 src/uu/runcon/src/errors.rs | 1 -
 1 file changed, 1 deletion(-)

diff --git a/src/uu/runcon/src/errors.rs b/src/uu/runcon/src/errors.rs
index 382ab3bed36..b2bfcad9598 100644
--- a/src/uu/runcon/src/errors.rs
+++ b/src/uu/runcon/src/errors.rs
@@ -87,7 +87,6 @@ where
         err = source;
         write!(writer, ": {err}")?;
     }
-    write!(writer, ".")?;
     Ok(())
 }
 

From c5b08f1c4a226f5f6c3a377b282d51a4fb784318 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 24 Dec 2023 11:39:55 +0100
Subject: [PATCH 245/429] shred: improve some output to match GNU's

---
 src/uu/shred/src/shred.rs | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/uu/shred/src/shred.rs b/src/uu/shred/src/shred.rs
index d4209aa3a97..a77bfe5e134 100644
--- a/src/uu/shred/src/shred.rs
+++ b/src/uu/shred/src/shred.rs
@@ -435,7 +435,7 @@ fn wipe_file(
             let pass_name = pass_name(&pass_type);
             if total_passes < 10 {
                 show_error!(
-                    "{}: pass {}/{} ({})... ",
+                    "{}: pass {}/{} ({})...",
                     path.maybe_quote(),
                     i + 1,
                     total_passes,
@@ -443,7 +443,7 @@ fn wipe_file(
                 );
             } else {
                 show_error!(
-                    "{}: pass {:2.0}/{:2.0} ({})... ",
+                    "{}: pass {:2.0}/{:2.0} ({})...",
                     path.maybe_quote(),
                     i + 1,
                     total_passes,
@@ -522,7 +522,7 @@ fn wipe_name(orig_path: &Path, verbose: bool) -> Option<PathBuf> {
                         show_error!(
                             "{}: renamed to {}",
                             last_path.maybe_quote(),
-                            new_path.quote()
+                            new_path.display()
                         );
                     }
 

From 143705b1936458cf98acf0190fd1a609b75a492d Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sun, 24 Dec 2023 12:57:21 +0100
Subject: [PATCH 246/429] Bump crossbeam crates

crossbeam-channel from 0.5.8 to 0.5.10
crossbeam-deque from 0.8.2 to 0.8.4
crossbeam-epoch from 0.9.14 to 0.9.17
crossbeam-utils from 0.8.15 to 0.8.18
---
 Cargo.lock | 27 ++++++++-------------------
 1 file changed, 8 insertions(+), 19 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 44d458ae319..d92a288755c 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -590,9 +590,9 @@ dependencies = [
 
 [[package]]
 name = "crossbeam-channel"
-version = "0.5.8"
+version = "0.5.10"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "a33c2bf77f2df06183c3aa30d1e96c0695a313d4f9c453cc3762a6db39f99200"
+checksum = "82a9b73a36529d9c47029b9fb3a6f0ea3cc916a261195352ba19e770fc1748b2"
 dependencies = [
  "cfg-if",
  "crossbeam-utils",
@@ -600,9 +600,9 @@ dependencies = [
 
 [[package]]
 name = "crossbeam-deque"
-version = "0.8.2"
+version = "0.8.4"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "715e8152b692bba2d374b53d4875445368fdf21a94751410af607a5ac677d1fc"
+checksum = "fca89a0e215bab21874660c67903c5f143333cab1da83d041c7ded6053774751"
 dependencies = [
  "cfg-if",
  "crossbeam-epoch",
@@ -611,22 +611,20 @@ dependencies = [
 
 [[package]]
 name = "crossbeam-epoch"
-version = "0.9.14"
+version = "0.9.17"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "46bd5f3f85273295a9d14aedfb86f6aadbff6d8f5295c4a9edb08e819dcf5695"
+checksum = "0e3681d554572a651dda4186cd47240627c3d0114d45a95f6ad27f2f22e7548d"
 dependencies = [
  "autocfg",
  "cfg-if",
  "crossbeam-utils",
- "memoffset",
- "scopeguard",
 ]
 
 [[package]]
 name = "crossbeam-utils"
-version = "0.8.15"
+version = "0.8.18"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "3c063cd8cc95f5c377ed0d4b49a4b21f632396ff690e8470c29b3359b346984b"
+checksum = "c3a430a770ebd84726f584a90ee7f020d28db52c6d02138900f22341f866d39c"
 dependencies = [
  "cfg-if",
 ]
@@ -1278,15 +1276,6 @@ dependencies = [
  "libc",
 ]
 
-[[package]]
-name = "memoffset"
-version = "0.8.0"
-source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "d61c719bcfbcf5d62b3a09efa6088de8c54bc0bfcd3ea7ae39fcc186108b8de1"
-dependencies = [
- "autocfg",
-]
-
 [[package]]
 name = "minimal-lexical"
 version = "0.2.1"

From df492d34cbbc46bdd3325e3603daeeb53e5a46c6 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sun, 24 Dec 2023 13:20:57 +0100
Subject: [PATCH 247/429] wc: disable part of test on Android

---
 tests/by-util/test_wc.rs | 18 +++++++++++-------
 1 file changed, 11 insertions(+), 7 deletions(-)

diff --git a/tests/by-util/test_wc.rs b/tests/by-util/test_wc.rs
index 77716e43af2..c0a4a341319 100644
--- a/tests/by-util/test_wc.rs
+++ b/tests/by-util/test_wc.rs
@@ -428,13 +428,17 @@ fn test_files_from_pseudo_filesystem() {
     let result = new_ucmd!().arg("-c").arg("/proc/cpuinfo").succeeds();
     assert_ne!(result.stdout_str(), "0 /proc/cpuinfo\n");
 
-    let (at, mut ucmd) = at_and_ucmd!();
-    let result = ucmd.arg("-c").arg("/sys/kernel/profiling").succeeds();
-    let actual = at.read("/sys/kernel/profiling").len();
-    assert_eq!(
-        result.stdout_str(),
-        format!("{} /sys/kernel/profiling\n", actual)
-    );
+    // the following block fails on Android with a "Permission denied" error
+    #[cfg(target_os = "linux")]
+    {
+        let (at, mut ucmd) = at_and_ucmd!();
+        let result = ucmd.arg("-c").arg("/sys/kernel/profiling").succeeds();
+        let actual = at.read("/sys/kernel/profiling").len();
+        assert_eq!(
+            result.stdout_str(),
+            format!("{} /sys/kernel/profiling\n", actual)
+        );
+    }
 }
 
 #[test]

From 28d684b5ace7275666955b4466de0439eadcf025 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 16 Dec 2023 17:19:06 +0100
Subject: [PATCH 248/429] ls: add a comment

---
 src/uu/ls/src/ls.rs | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 7ad1704fc4e..23ceb1a5888 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -1812,6 +1812,7 @@ struct PathData {
     // Result<MetaData> got from symlink_metadata() or metadata() based on config
     md: OnceCell<Option<Metadata>>,
     ft: OnceCell<Option<FileType>>,
+    // can be used to avoid reading the metadata. Can be also called d_type
     de: Option<DirEntry>,
     // Name of the file - will be empty for . or ..
     display_name: OsString,
@@ -1911,6 +1912,7 @@ impl PathData {
         self.md
             .get_or_init(|| {
                 // check if we can use DirEntry metadata
+                // it will avoid a call to stat()
                 if !self.must_dereference {
                     if let Some(dir_entry) = &self.de {
                         return dir_entry.metadata().ok();

From c0c5ec25b6581739a647dd7494fb4c39e6a450f8 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 16 Dec 2023 17:19:28 +0100
Subject: [PATCH 249/429] ls: rename a function for something more explicit

---
 src/uu/ls/src/ls.rs | 36 +++++++++++++++++++-----------------
 1 file changed, 19 insertions(+), 17 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 23ceb1a5888..ce5c2fcba5e 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -1908,7 +1908,7 @@ impl PathData {
         }
     }
 
-    fn md(&self, out: &mut BufWriter<Stdout>) -> Option<&Metadata> {
+    fn get_metadata(&self, out: &mut BufWriter<Stdout>) -> Option<&Metadata> {
         self.md
             .get_or_init(|| {
                 // check if we can use DirEntry metadata
@@ -1949,7 +1949,7 @@ impl PathData {
 
     fn file_type(&self, out: &mut BufWriter<Stdout>) -> Option<&FileType> {
         self.ft
-            .get_or_init(|| self.md(out).map(|md| md.file_type()))
+            .get_or_init(|| self.get_metadata(out).map(|md| md.file_type()))
             .as_ref()
     }
 }
@@ -1982,7 +1982,7 @@ pub fn list(locs: Vec<&Path>, config: &Config) -> UResult<()> {
         // Proper GNU handling is don't show if dereferenced symlink DNE
         // but only for the base dir, for a child dir show, and print ?s
         // in long format
-        if path_data.md(&mut out).is_none() {
+        if path_data.get_metadata(&mut out).is_none() {
             continue;
         }
 
@@ -2070,12 +2070,14 @@ fn sort_entries(entries: &mut [PathData], config: &Config, out: &mut BufWriter<S
     match config.sort {
         Sort::Time => entries.sort_by_key(|k| {
             Reverse(
-                k.md(out)
+                k.get_metadata(out)
                     .and_then(|md| get_system_time(md, config))
                     .unwrap_or(UNIX_EPOCH),
             )
         }),
-        Sort::Size => entries.sort_by_key(|k| Reverse(k.md(out).map(|md| md.len()).unwrap_or(0))),
+        Sort::Size => {
+            entries.sort_by_key(|k| Reverse(k.get_metadata(out).map(|md| md.len()).unwrap_or(0)))
+        }
         // The default sort in GNU ls is case insensitive
         Sort::Name => entries.sort_by(|a, b| a.display_name.cmp(&b.display_name)),
         Sort::Version => entries.sort_by(|a, b| {
@@ -2305,7 +2307,7 @@ fn display_dir_entry_size(
     out: &mut BufWriter<std::io::Stdout>,
 ) -> (usize, usize, usize, usize, usize, usize) {
     // TODO: Cache/memorize the display_* results so we don't have to recalculate them.
-    if let Some(md) = entry.md(out) {
+    if let Some(md) = entry.get_metadata(out) {
         let (size_len, major_len, minor_len) = match display_len_or_rdev(md, config) {
             SizeOrDeviceId::Device(major, minor) => (
                 (major.len() + minor.len() + 2usize),
@@ -2343,7 +2345,7 @@ fn return_total(
     let mut total_size = 0;
     for item in items {
         total_size += item
-            .md(out)
+            .get_metadata(out)
             .as_ref()
             .map_or(0, |md| get_block_size(md, config));
     }
@@ -2367,7 +2369,7 @@ fn display_additional_leading_info(
     #[cfg(unix)]
     {
         if config.inode {
-            let i = if let Some(md) = item.md(out) {
+            let i = if let Some(md) = item.get_metadata(out) {
                 get_inode(md)
             } else {
                 "?".to_owned()
@@ -2377,7 +2379,7 @@ fn display_additional_leading_info(
     }
 
     if config.alloc_size {
-        let s = if let Some(md) = item.md(out) {
+        let s = if let Some(md) = item.get_metadata(out) {
             display_size(get_block_size(md, config), config)
         } else {
             "?".to_owned()
@@ -2592,7 +2594,7 @@ fn display_item_long(
     if config.dired {
         output_display += "  ";
     }
-    if let Some(md) = item.md(out) {
+    if let Some(md) = item.get_metadata(out) {
         write!(
             output_display,
             "{}{} {}",
@@ -3019,7 +3021,7 @@ fn classify_file(path: &PathData, out: &mut BufWriter<Stdout>) -> Option<char> {
             } else if file_type.is_file()
                 // Safe unwrapping if the file was removed between listing and display
                 // See https://github.com/uutils/coreutils/issues/5371
-                && path.md(out).map(file_is_executable).unwrap_or_default()
+                && path.get_metadata(out).map(file_is_executable).unwrap_or_default()
             {
                 Some('*')
             } else {
@@ -3066,7 +3068,7 @@ fn display_item_name(
     }
 
     if let Some(ls_colors) = &config.color {
-        let md = path.md(out);
+        let md = path.get_metadata(out);
         name = if md.is_some() {
             color_name(name, &path.p_buf, md, ls_colors, style_manager)
         } else {
@@ -3143,7 +3145,7 @@ fn display_item_name(
                     // Because we use an absolute path, we can assume this is guaranteed to exist.
                     // Otherwise, we use path.md(), which will guarantee we color to the same
                     // color of non-existent symlinks according to style_for_path_with_metadata.
-                    if path.md(out).is_none()
+                    if path.get_metadata(out).is_none()
                         && get_metadata(target_data.p_buf.as_path(), target_data.must_dereference)
                             .is_err()
                     {
@@ -3156,7 +3158,7 @@ fn display_item_name(
                             target_data.must_dereference,
                         ) {
                             Ok(md) => md,
-                            Err(_) => path.md(out).unwrap().clone(),
+                            Err(_) => path.get_metadata(out).unwrap().clone(),
                         };
 
                         name.push_str(&color_name(
@@ -3366,7 +3368,7 @@ fn calculate_padding_collection(
     for item in items {
         #[cfg(unix)]
         if config.inode {
-            let inode_len = if let Some(md) = item.md(out) {
+            let inode_len = if let Some(md) = item.get_metadata(out) {
                 display_inode(md).len()
             } else {
                 continue;
@@ -3375,7 +3377,7 @@ fn calculate_padding_collection(
         }
 
         if config.alloc_size {
-            if let Some(md) = item.md(out) {
+            if let Some(md) = item.get_metadata(out) {
                 let block_size_len = display_size(get_block_size(md, config), config).len();
                 padding_collections.block_size = block_size_len.max(padding_collections.block_size);
             }
@@ -3425,7 +3427,7 @@ fn calculate_padding_collection(
 
     for item in items {
         if config.alloc_size {
-            if let Some(md) = item.md(out) {
+            if let Some(md) = item.get_metadata(out) {
                 let block_size_len = display_size(get_block_size(md, config), config).len();
                 padding_collections.block_size = block_size_len.max(padding_collections.block_size);
             }

From 1bd8ce5ddf067137cb6fdf0c552b6402ebe8cd90 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 16 Dec 2023 17:31:39 +0100
Subject: [PATCH 250/429] ls/color_name: use PathData instead of a Path as we
 want to check for DirEntry

---
 src/uu/ls/src/ls.rs | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index ce5c2fcba5e..04b5a4ebc06 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3070,11 +3070,11 @@ fn display_item_name(
     if let Some(ls_colors) = &config.color {
         let md = path.get_metadata(out);
         name = if md.is_some() {
-            color_name(name, &path.p_buf, md, ls_colors, style_manager)
+            color_name(name, path, md, ls_colors, style_manager)
         } else {
             color_name(
                 name,
-                &path.p_buf,
+                path,
                 path.p_buf.symlink_metadata().ok().as_ref(),
                 ls_colors,
                 style_manager,
@@ -3163,7 +3163,7 @@ fn display_item_name(
 
                         name.push_str(&color_name(
                             escape_name(target.as_os_str(), &config.quoting_style),
-                            &target_data.p_buf,
+                            &target_data,
                             Some(&target_metadata),
                             ls_colors,
                             style_manager,
@@ -3266,12 +3266,12 @@ impl StyleManager {
 /// Colors the provided name based on the style determined for the given path.
 fn color_name(
     name: String,
-    path: &Path,
+    path: &PathData,
     md: Option<&Metadata>,
     ls_colors: &LsColors,
     style_manager: &mut StyleManager,
 ) -> String {
-    match ls_colors.style_for_path_with_metadata(path, md) {
+    match ls_colors.style_for_path_with_metadata(&path.p_buf, md) {
         Some(style) => style_manager.apply_style(style, &name),
         None => name,
     }

From 95fa81250efbced764ab1ad3abf7bc63dcd77ae5 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 16 Dec 2023 17:37:57 +0100
Subject: [PATCH 251/429] ls/color_name: use the DirEntry if available

---
 src/uu/ls/src/ls.rs | 11 +++++++++++
 1 file changed, 11 insertions(+)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 04b5a4ebc06..b91d44d7200 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3271,6 +3271,17 @@ fn color_name(
     ls_colors: &LsColors,
     style_manager: &mut StyleManager,
 ) -> String {
+    if !path.must_dereference {
+        // If we need to dereference (follow) a symlink, we will need to get the metadata
+        if let Some(de) = &path.de {
+            // There is a DirEntry, we don't need to get the metadata for the color
+            return match ls_colors.style_for(de) {
+                Some(style) => style_manager.apply_style(style, &name),
+                None => name,
+            };
+        }
+    }
+
     match ls_colors.style_for_path_with_metadata(&path.p_buf, md) {
         Some(style) => style_manager.apply_style(style, &name),
         None => name,

From 147721c24b9ddbba6d1451906231ac3d0318e3eb Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 16 Dec 2023 18:24:33 +0100
Subject: [PATCH 252/429] ls: Improve the access to metadata of the files
 Should fix tests/ls/stat-free-color.sh

---
 src/uu/ls/src/ls.rs | 79 +++++++++++++++++++++++++++------------------
 1 file changed, 47 insertions(+), 32 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index b91d44d7200..bdea5c7bf3f 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -2118,7 +2118,8 @@ fn sort_entries(entries: &mut [PathData], config: &Config, out: &mut BufWriter<S
             !match md {
                 None | Some(None) => {
                     // If it metadata cannot be determined, treat as a file.
-                    get_metadata(p.p_buf.as_path(), true).map_or_else(|_| false, |m| m.is_dir())
+                    get_metadata(p.p_buf.as_path(), true)
+                        .map_or_else(|_| false, |m| m.is_dir())
                 }
                 Some(Some(m)) => m.is_dir(),
             }
@@ -3068,18 +3069,7 @@ fn display_item_name(
     }
 
     if let Some(ls_colors) = &config.color {
-        let md = path.get_metadata(out);
-        name = if md.is_some() {
-            color_name(name, path, md, ls_colors, style_manager)
-        } else {
-            color_name(
-                name,
-                path,
-                path.p_buf.symlink_metadata().ok().as_ref(),
-                ls_colors,
-                style_manager,
-            )
-        };
+        name = color_name(name, path, ls_colors, style_manager, out, false, None);
     }
 
     if config.format != Format::Long && !more_info.is_empty() {
@@ -3146,27 +3136,22 @@ fn display_item_name(
                     // Otherwise, we use path.md(), which will guarantee we color to the same
                     // color of non-existent symlinks according to style_for_path_with_metadata.
                     if path.get_metadata(out).is_none()
-                        && get_metadata(target_data.p_buf.as_path(), target_data.must_dereference)
-                            .is_err()
+                        && get_metadata(
+                            target_data.p_buf.as_path(),
+                            target_data.must_dereference,
+                        )
+                        .is_err()
                     {
                         name.push_str(&path.p_buf.read_link().unwrap().to_string_lossy());
                     } else {
-                        // Use fn get_metadata instead of md() here and above because ls
-                        // should not exit with an err, if we are unable to obtain the target_metadata
-                        let target_metadata = match get_metadata(
-                            target_data.p_buf.as_path(),
-                            target_data.must_dereference,
-                        ) {
-                            Ok(md) => md,
-                            Err(_) => path.get_metadata(out).unwrap().clone(),
-                        };
-
                         name.push_str(&color_name(
                             escape_name(target.as_os_str(), &config.quoting_style),
-                            &target_data,
-                            Some(&target_metadata),
+                            path,
                             ls_colors,
                             style_manager,
+                            out,
+                            true,
+                            Some(&target_data),
                         ));
                     }
                 } else {
@@ -3263,13 +3248,18 @@ impl StyleManager {
     }
 }
 
-/// Colors the provided name based on the style determined for the given path.
+/// Colors the provided name based on the style determined for the given path
+/// This function is quite long because it tries to leverage DirEntry to avoid
+/// unnecessary calls to stat()
+/// and manages the symlink errors
 fn color_name(
     name: String,
     path: &PathData,
-    md: Option<&Metadata>,
     ls_colors: &LsColors,
     style_manager: &mut StyleManager,
+    out: &mut BufWriter<Stdout>,
+    check_for_deref: bool,
+    target_symlink: Option<&PathData>,
 ) -> String {
     if !path.must_dereference {
         // If we need to dereference (follow) a symlink, we will need to get the metadata
@@ -3282,9 +3272,34 @@ fn color_name(
         }
     }
 
-    match ls_colors.style_for_path_with_metadata(&path.p_buf, md) {
-        Some(style) => style_manager.apply_style(style, &name),
-        None => name,
+    if check_for_deref {
+        // use the optional target_symlink
+        // Use fn get_metadata instead of md() here and above because ls
+        // should not exit with an err, if we are unable to obtain the target_metadata
+
+        let target = target_symlink.unwrap_or(path);
+        let md = match get_metadata(target.p_buf.as_path(), path.must_dereference) {
+            Ok(md) => md,
+            Err(_) => target.get_metadata(out).unwrap().clone(),
+        };
+        return match ls_colors.style_for_path_with_metadata(&path.p_buf, Some(&md)) {
+            Some(style) => style_manager.apply_style(style, &name),
+            None => name,
+        };
+    } else {
+        let md_option = path.get_metadata(out);
+        let symlink_metadata = path.p_buf.symlink_metadata().ok();
+
+        let md = if md_option.is_some() {
+            md_option
+        } else {
+            symlink_metadata.as_ref()
+        };
+
+        return match ls_colors.style_for_path_with_metadata(&path.p_buf, md) {
+            Some(style) => style_manager.apply_style(style, &name),
+            None => name,
+        };
     }
 }
 

From 445d0af277c74e98d10c3d278e09c32e2524808e Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 16 Dec 2023 18:47:02 +0100
Subject: [PATCH 253/429] ls: rename get_metadata_with_deref_opt

---
 src/uu/ls/src/ls.rs | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index bdea5c7bf3f..318faea3152 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -1920,7 +1920,7 @@ impl PathData {
                 }
 
                 // if not, check if we can use Path metadata
-                match get_metadata(self.p_buf.as_path(), self.must_dereference) {
+                match get_metadata_with_deref_opt(self.p_buf.as_path(), self.must_dereference) {
                     Err(err) => {
                         // FIXME: A bit tricky to propagate the result here
                         out.flush().unwrap();
@@ -2118,7 +2118,7 @@ fn sort_entries(entries: &mut [PathData], config: &Config, out: &mut BufWriter<S
             !match md {
                 None | Some(None) => {
                     // If it metadata cannot be determined, treat as a file.
-                    get_metadata(p.p_buf.as_path(), true)
+                    get_metadata_with_deref_opt(p.p_buf.as_path(), true)
                         .map_or_else(|_| false, |m| m.is_dir())
                 }
                 Some(Some(m)) => m.is_dir(),
@@ -2294,7 +2294,7 @@ fn enter_directory(
     Ok(())
 }
 
-fn get_metadata(p_buf: &Path, dereference: bool) -> std::io::Result<Metadata> {
+fn get_metadata_with_deref_opt(p_buf: &Path, dereference: bool) -> std::io::Result<Metadata> {
     if dereference {
         p_buf.metadata()
     } else {
@@ -3136,7 +3136,7 @@ fn display_item_name(
                     // Otherwise, we use path.md(), which will guarantee we color to the same
                     // color of non-existent symlinks according to style_for_path_with_metadata.
                     if path.get_metadata(out).is_none()
-                        && get_metadata(
+                        && get_metadata_with_deref_opt(
                             target_data.p_buf.as_path(),
                             target_data.must_dereference,
                         )
@@ -3278,7 +3278,7 @@ fn color_name(
         // should not exit with an err, if we are unable to obtain the target_metadata
 
         let target = target_symlink.unwrap_or(path);
-        let md = match get_metadata(target.p_buf.as_path(), path.must_dereference) {
+        let md = match get_metadata_with_deref_opt(target.p_buf.as_path(), path.must_dereference) {
             Ok(md) => md,
             Err(_) => target.get_metadata(out).unwrap().clone(),
         };
@@ -3329,7 +3329,7 @@ fn get_security_context(config: &Config, p_buf: &Path, must_dereference: bool) -
     // does not support SELinux.
     // Conforms to the GNU coreutils where a dangling symlink results in exit code 1.
     if must_dereference {
-        match get_metadata(p_buf, must_dereference) {
+        match get_metadata_with_deref_opt(p_buf, must_dereference) {
             Err(err) => {
                 // The Path couldn't be dereferenced, so return early and set exit code 1
                 // to indicate a minor error

From 5120acb27a8ad81aa13000cdbb90e6585d137ebf Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 17 Dec 2023 09:46:07 +0100
Subject: [PATCH 254/429] fix a clippy warning

---
 src/uu/ls/src/ls.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 318faea3152..b8fb29f1985 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -2076,7 +2076,7 @@ fn sort_entries(entries: &mut [PathData], config: &Config, out: &mut BufWriter<S
             )
         }),
         Sort::Size => {
-            entries.sort_by_key(|k| Reverse(k.get_metadata(out).map(|md| md.len()).unwrap_or(0)))
+            entries.sort_by_key(|k| Reverse(k.get_metadata(out).map(|md| md.len()).unwrap_or(0)));
         }
         // The default sort in GNU ls is case insensitive
         Sort::Name => entries.sort_by(|a, b| a.display_name.cmp(&b.display_name)),

From 69f723a263c8da4a55c12f22ab683eb8e6190405 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 17 Dec 2023 10:02:16 +0100
Subject: [PATCH 255/429] ls: adjust the tests/ls/stat-free-color.sh as we have
 less syscall

---
 util/build-gnu.sh | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 4b682f4ada0..be09c7c20e8 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -294,3 +294,9 @@ ls: invalid --time-style argument 'XX'\nPossible values are: [\"full-iso\", \"lo
 # "hostid BEFORE --help" doesn't fail for GNU. we fail. we are probably doing better
 # "hostid BEFORE --help AFTER " same for this
 sed -i -e "s/env \$prog \$BEFORE \$opt > out2/env \$prog \$BEFORE \$opt > out2 #/" -e "s/env \$prog \$BEFORE \$opt AFTER > out3/env \$prog \$BEFORE \$opt AFTER > out3 #/" -e "s/compare exp out2/compare exp out2 #/" -e "s/compare exp out3/compare exp out3 #/" tests/help/help-version-getopt.sh
+
+# Add debug info + we have less syscall then GNU's. Adjust our check.
+sed -i -e '/test \$n_stat1 = \$n_stat2 \\/c\
+echo "n_stat1 = \$n_stat1"\n\
+echo "n_stat2 = \$n_stat2"\n\
+test \$n_stat1 -ge \$n_stat2 \\' tests/ls/stat-free-color.sh

From a3c7359056d90e74f604b1b97da731feddc5dbfc Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 17 Dec 2023 16:26:21 +0100
Subject: [PATCH 256/429] ls: refactor the code

---
 src/uu/ls/src/ls.rs | 38 +++++++++++++++++++-------------------
 1 file changed, 19 insertions(+), 19 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index b8fb29f1985..81167ae3402 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3248,6 +3248,19 @@ impl StyleManager {
     }
 }
 
+fn apply_style_based_on_metadata(
+    path: &PathData,
+    md_option: Option<&Metadata>,
+    ls_colors: &LsColors,
+    style_manager: &mut StyleManager,
+    name: &str,
+) -> String {
+    match ls_colors.style_for_path_with_metadata(&path.p_buf, md_option) {
+        Some(style) => style_manager.apply_style(style, name),
+        None => name.to_owned(),
+    }
+}
+
 /// Colors the provided name based on the style determined for the given path
 /// This function is quite long because it tries to leverage DirEntry to avoid
 /// unnecessary calls to stat()
@@ -3276,30 +3289,17 @@ fn color_name(
         // use the optional target_symlink
         // Use fn get_metadata instead of md() here and above because ls
         // should not exit with an err, if we are unable to obtain the target_metadata
-
         let target = target_symlink.unwrap_or(path);
-        let md = match get_metadata_with_deref_opt(target.p_buf.as_path(), path.must_dereference) {
-            Ok(md) => md,
-            Err(_) => target.get_metadata(out).unwrap().clone(),
-        };
-        return match ls_colors.style_for_path_with_metadata(&path.p_buf, Some(&md)) {
-            Some(style) => style_manager.apply_style(style, &name),
-            None => name,
-        };
+        let md = get_metadata_with_deref_opt(target.p_buf.as_path(), path.must_dereference)
+            .unwrap_or_else(|_| target.get_metadata(out).unwrap().clone());
+
+        apply_style_based_on_metadata(path, Some(&md), ls_colors, style_manager, &name)
     } else {
         let md_option = path.get_metadata(out);
         let symlink_metadata = path.p_buf.symlink_metadata().ok();
+        let md = md_option.or(symlink_metadata.as_ref());
 
-        let md = if md_option.is_some() {
-            md_option
-        } else {
-            symlink_metadata.as_ref()
-        };
-
-        return match ls_colors.style_for_path_with_metadata(&path.p_buf, md) {
-            Some(style) => style_manager.apply_style(style, &name),
-            None => name,
-        };
+        apply_style_based_on_metadata(path, md, ls_colors, style_manager, &name)
     }
 }
 

From 53b3c782ef0564384e196c3ed79740e56f4175e1 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 18 Dec 2023 09:40:25 +0100
Subject: [PATCH 257/429] add a link to d_type doc

---
 src/uu/ls/src/ls.rs | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 81167ae3402..d8fbde6e742 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -1812,7 +1812,8 @@ struct PathData {
     // Result<MetaData> got from symlink_metadata() or metadata() based on config
     md: OnceCell<Option<Metadata>>,
     ft: OnceCell<Option<FileType>>,
-    // can be used to avoid reading the metadata. Can be also called d_type
+    // can be used to avoid reading the metadata. Can be also called d_type:
+    // https://www.gnu.org/software/libc/manual/html_node/Directory-Entries.html
     de: Option<DirEntry>,
     // Name of the file - will be empty for . or ..
     display_name: OsString,

From 18035a5f82e9f30e2f8fb1e3b6778df61fcd9067 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 20 Dec 2023 15:45:34 +0100
Subject: [PATCH 258/429] update of the function names in the comment

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 src/uu/ls/src/ls.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index d8fbde6e742..70d05d95eb3 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3288,7 +3288,7 @@ fn color_name(
 
     if check_for_deref {
         // use the optional target_symlink
-        // Use fn get_metadata instead of md() here and above because ls
+        // Use fn get_metadata_with_deref_opt instead of get_metadata() here because ls
         // should not exit with an err, if we are unable to obtain the target_metadata
         let target = target_symlink.unwrap_or(path);
         let md = get_metadata_with_deref_opt(target.p_buf.as_path(), path.must_dereference)

From c5217b3136808a078225f94cd0d686b2a41a2dcb Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 24 Dec 2023 15:03:34 +0100
Subject: [PATCH 259/429] ls: remove unused arg check_for_deref

---
 src/uu/ls/src/ls.rs | 7 ++-----
 1 file changed, 2 insertions(+), 5 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 70d05d95eb3..163fc78e1a4 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3070,7 +3070,7 @@ fn display_item_name(
     }
 
     if let Some(ls_colors) = &config.color {
-        name = color_name(name, path, ls_colors, style_manager, out, false, None);
+        name = color_name(name, path, ls_colors, style_manager, out, None);
     }
 
     if config.format != Format::Long && !more_info.is_empty() {
@@ -3151,7 +3151,6 @@ fn display_item_name(
                             ls_colors,
                             style_manager,
                             out,
-                            true,
                             Some(&target_data),
                         ));
                     }
@@ -3272,7 +3271,6 @@ fn color_name(
     ls_colors: &LsColors,
     style_manager: &mut StyleManager,
     out: &mut BufWriter<Stdout>,
-    check_for_deref: bool,
     target_symlink: Option<&PathData>,
 ) -> String {
     if !path.must_dereference {
@@ -3286,11 +3284,10 @@ fn color_name(
         }
     }
 
-    if check_for_deref {
+    if let Some(target) = target_symlink {
         // use the optional target_symlink
         // Use fn get_metadata_with_deref_opt instead of get_metadata() here because ls
         // should not exit with an err, if we are unable to obtain the target_metadata
-        let target = target_symlink.unwrap_or(path);
         let md = get_metadata_with_deref_opt(target.p_buf.as_path(), path.must_dereference)
             .unwrap_or_else(|_| target.get_metadata(out).unwrap().clone());
 

From 15573579cc4d043d6505011becbf82966f5d52b0 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 24 Dec 2023 15:18:31 +0100
Subject: [PATCH 260/429] Fix the windows tests

---
 tests/by-util/test_cp.rs | 15 +++++++++------
 tests/by-util/test_ln.rs | 16 ++++++++++------
 tests/by-util/test_mv.rs | 33 ++++++++++++++++++++-------------
 3 files changed, 39 insertions(+), 25 deletions(-)

diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index eda5dd4c6e4..07b9620a637 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -3571,12 +3571,15 @@ fn test_cp_seen_file() {
     at.write("a/f", "a");
     at.write("b/f", "b");
 
-    ts.ucmd()
-        .arg("a/f")
-        .arg("b/f")
-        .arg("c")
-        .fails()
-        .stderr_contains("will not overwrite just-created 'c/f' with 'b/f'");
+    let result = ts.ucmd().arg("a/f").arg("b/f").arg("c").fails();
+    #[cfg(not(unix))]
+    assert!(result
+        .stderr_str()
+        .contains("will not overwrite just-created 'c\\f' with 'b/f'"));
+    #[cfg(unix)]
+    assert!(result
+        .stderr_str()
+        .contains("will not overwrite just-created 'c/f' with 'b/f'"));
 
     assert!(at.plus("c").join("f").exists());
 
diff --git a/tests/by-util/test_ln.rs b/tests/by-util/test_ln.rs
index b6453bf4376..e51d99732cd 100644
--- a/tests/by-util/test_ln.rs
+++ b/tests/by-util/test_ln.rs
@@ -733,12 +733,16 @@ fn test_ln_seen_file() {
     at.write("a/f", "a");
     at.write("b/f", "b");
 
-    ts.ucmd()
-        .arg("a/f")
-        .arg("b/f")
-        .arg("c")
-        .fails()
-        .stderr_contains("will not overwrite just-created 'c/f' with 'b/f'");
+    let result = ts.ucmd().arg("a/f").arg("b/f").arg("c").fails();
+
+    #[cfg(not(unix))]
+    assert!(result
+        .stderr_str()
+        .contains("will not overwrite just-created 'c\\f' with 'b/f'"));
+    #[cfg(unix)]
+    assert!(result
+        .stderr_str()
+        .contains("will not overwrite just-created 'c/f' with 'b/f'"));
 
     assert!(at.plus("c").join("f").exists());
     // b/f still exists
diff --git a/tests/by-util/test_mv.rs b/tests/by-util/test_mv.rs
index bc75ada3fae..61a4aebf657 100644
--- a/tests/by-util/test_mv.rs
+++ b/tests/by-util/test_mv.rs
@@ -1480,12 +1480,16 @@ fn test_mv_seen_file() {
     at.write("a/f", "a");
     at.write("b/f", "b");
 
-    ts.ucmd()
-        .arg("a/f")
-        .arg("b/f")
-        .arg("c")
-        .fails()
-        .stderr_contains("will not overwrite just-created 'c/f' with 'b/f'");
+    let result = ts.ucmd().arg("a/f").arg("b/f").arg("c").fails();
+
+    #[cfg(not(unix))]
+    assert!(result
+        .stderr_str()
+        .contains("will not overwrite just-created 'c\\f' with 'b/f'"));
+    #[cfg(unix)]
+    assert!(result
+        .stderr_str()
+        .contains("will not overwrite just-created 'c/f' with 'b/f'"));
 
     // a/f has been moved into c/f
     assert!(at.plus("c").join("f").exists());
@@ -1507,13 +1511,16 @@ fn test_mv_seen_multiple_files_to_directory() {
     at.write("b/f", "b");
     at.write("b/g", "g");
 
-    ts.ucmd()
-        .arg("a/f")
-        .arg("b/f")
-        .arg("b/g")
-        .arg("c")
-        .fails()
-        .stderr_contains("will not overwrite just-created 'c/f' with 'b/f'");
+    let result = ts.ucmd().arg("a/f").arg("b/f").arg("b/g").arg("c").fails();
+    #[cfg(not(unix))]
+    assert!(result
+        .stderr_str()
+        .contains("will not overwrite just-created 'c\\f' with 'b/f'"));
+    #[cfg(unix)]
+    assert!(result
+        .stderr_str()
+        .contains("will not overwrite just-created 'c/f' with 'b/f'"));
+
     assert!(!at.plus("a").join("f").exists());
     assert!(at.plus("b").join("f").exists());
     assert!(!at.plus("b").join("g").exists());

From 0220353c4cd9a3fb038b9bcf6d6dc21f31300718 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 24 Dec 2023 15:26:38 +0100
Subject: [PATCH 261/429] test_install.rs: Remove a debug artifact

---
 tests/by-util/test_install.rs | 1 -
 1 file changed, 1 deletion(-)

diff --git a/tests/by-util/test_install.rs b/tests/by-util/test_install.rs
index 5957e73dc47..85335285aae 100644
--- a/tests/by-util/test_install.rs
+++ b/tests/by-util/test_install.rs
@@ -683,7 +683,6 @@ fn test_install_and_strip_with_program_hyphen() {
 
     let at = &scene.fixtures;
     let content = r#"#!/bin/sh
-    echo $1 &> /tmp/a.log
     printf -- '%s\n' "$1" | grep '^[^-]'
     "#;
     at.write("no-hyphen", content);

From 270ac90cc13cf446cdccd884e3b9e4de4aec5842 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sat, 23 Dec 2023 17:24:54 +0100
Subject: [PATCH 262/429] ls: set correct block size when -k is provided

---
 src/uu/ls/src/ls.rs      | 42 ++++++++++++++++++---------------
 tests/by-util/test_ls.rs | 50 ++++++++++++++++++++++++++++++++++++++++
 2 files changed, 74 insertions(+), 18 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 7ad1704fc4e..ab8fbf04327 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -828,17 +828,13 @@ impl Config {
 
         let raw_block_size = if let Some(opt_block_size) = opt_block_size {
             OsString::from(opt_block_size)
-        } else if !opt_kb {
-            if let Some(env_var_ls_block_size) = env_var_ls_block_size {
-                env_var_ls_block_size
-            } else if let Some(env_var_block_size) = env_var_block_size {
-                env_var_block_size
-            } else if let Some(env_var_blocksize) = env_var_blocksize {
-                is_env_var_blocksize = true;
-                env_var_blocksize
-            } else {
-                OsString::from("")
-            }
+        } else if let Some(env_var_ls_block_size) = env_var_ls_block_size {
+            env_var_ls_block_size
+        } else if let Some(env_var_block_size) = env_var_block_size {
+            env_var_block_size
+        } else if let Some(env_var_blocksize) = env_var_blocksize {
+            is_env_var_blocksize = true;
+            env_var_blocksize
         } else {
             OsString::from("")
         };
@@ -846,13 +842,19 @@ impl Config {
         let (file_size_block_size, block_size) = if !opt_si && !opt_hr && !raw_block_size.is_empty()
         {
             match parse_size_u64(&raw_block_size.to_string_lossy()) {
-                Ok(size) => {
-                    if is_env_var_blocksize {
-                        (DEFAULT_FILE_SIZE_BLOCK_SIZE, size)
-                    } else {
-                        (size, size)
+                Ok(size) => match (is_env_var_blocksize, opt_kb) {
+                    (true, true) => (DEFAULT_FILE_SIZE_BLOCK_SIZE, DEFAULT_BLOCK_SIZE),
+                    (true, false) => (DEFAULT_FILE_SIZE_BLOCK_SIZE, size),
+                    (false, true) => {
+                        // --block-size overrides -k
+                        if opt_block_size.is_some() {
+                            (size, size)
+                        } else {
+                            (size, DEFAULT_BLOCK_SIZE)
+                        }
                     }
-                }
+                    (false, false) => (size, size),
+                },
                 Err(_) => {
                     // only fail if invalid block size was specified with --block-size,
                     // ignore invalid block size from env vars
@@ -869,7 +871,11 @@ impl Config {
                 }
             }
         } else if env_var_posixly_correct.is_some() {
-            (DEFAULT_FILE_SIZE_BLOCK_SIZE, POSIXLY_CORRECT_BLOCK_SIZE)
+            if opt_kb {
+                (DEFAULT_FILE_SIZE_BLOCK_SIZE, DEFAULT_BLOCK_SIZE)
+            } else {
+                (DEFAULT_FILE_SIZE_BLOCK_SIZE, POSIXLY_CORRECT_BLOCK_SIZE)
+            }
         } else if opt_si {
             (DEFAULT_FILE_SIZE_BLOCK_SIZE, 1000)
         } else {
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index a7744063fa3..5da8912e3f0 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -3890,6 +3890,56 @@ fn test_posixly_correct_and_block_size_env_vars() {
         .stdout_contains(" 1024 ");
 }
 
+#[cfg(all(unix, feature = "dd"))]
+#[test]
+fn test_posixly_correct_and_block_size_env_vars_with_k() {
+    let scene = TestScenario::new(util_name!());
+
+    scene
+        .ccmd("dd")
+        .arg("if=/dev/zero")
+        .arg("of=file")
+        .arg("bs=1024")
+        .arg("count=1")
+        .succeeds();
+
+    scene
+        .ucmd()
+        .arg("-l")
+        .arg("-k")
+        .env("POSIXLY_CORRECT", "some_value")
+        .succeeds()
+        .stdout_contains_line("total 4")
+        .stdout_contains(" 1024 ");
+
+    scene
+        .ucmd()
+        .arg("-l")
+        .arg("-k")
+        .env("LS_BLOCK_SIZE", "512")
+        .succeeds()
+        .stdout_contains_line("total 4")
+        .stdout_contains(" 2 ");
+
+    scene
+        .ucmd()
+        .arg("-l")
+        .arg("-k")
+        .env("BLOCK_SIZE", "512")
+        .succeeds()
+        .stdout_contains_line("total 4")
+        .stdout_contains(" 2 ");
+
+    scene
+        .ucmd()
+        .arg("-l")
+        .arg("-k")
+        .env("BLOCKSIZE", "512")
+        .succeeds()
+        .stdout_contains_line("total 4")
+        .stdout_contains(" 1024 ");
+}
+
 #[test]
 fn test_ls_invalid_block_size() {
     new_ucmd!()

From 3e892de4d53958922e8a0be71bf1aee80821d590 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 24 Dec 2023 16:37:43 +0100
Subject: [PATCH 263/429] gnu: Improve the diff when comparing diff

---
 util/build-gnu.sh | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 4b682f4ada0..0b6f984d9a8 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -115,6 +115,8 @@ else
     # Change the PATH in the Makefile to test the uutils coreutils instead of the GNU coreutils
     sed -i "s/^[[:blank:]]*PATH=.*/  PATH='${UU_BUILD_DIR//\//\\/}\$(PATH_SEPARATOR)'\"\$\$PATH\" \\\/" Makefile
     sed -i 's| tr | /usr/bin/tr |' tests/init.sh
+    # Use a better diff
+    sed -i 's|diff -c|diff -u|g' tests/Coreutils.pm
     make -j "$(nproc)"
     touch gnu-built
 fi

From 853f73b7c9b10074bbd39d2bff5f1a2e00ac3159 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 25 Dec 2023 11:05:55 +0100
Subject: [PATCH 264/429] tee test: fix a warning on not(linux) warning: unused
 import: `std::fmt::Write`

---
 tests/by-util/test_tee.rs | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/by-util/test_tee.rs b/tests/by-util/test_tee.rs
index 2b3fd2670ab..34076bbf9b1 100644
--- a/tests/by-util/test_tee.rs
+++ b/tests/by-util/test_tee.rs
@@ -3,6 +3,7 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 use crate::common::util::TestScenario;
+#[cfg(target_os = "linux")]
 use std::fmt::Write;
 
 // tests for basic tee functionality.

From f86e314f4686f912c91fa1cf4c4f95c7f856dd5c Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 25 Dec 2023 09:47:37 +0100
Subject: [PATCH 265/429] Fix some obvious comment

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 src/uu/cp/src/cp.rs      | 2 --
 src/uu/ln/src/ln.rs      | 2 +-
 tests/by-util/test_ln.rs | 2 +-
 3 files changed, 2 insertions(+), 4 deletions(-)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index 4d002359f93..72bfbf54e5b 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -1195,8 +1195,6 @@ pub fn copy(sources: &[PathBuf], target: &Path, options: &Options) -> CopyResult
             // FIXME: compare sources by the actual file they point to, not their path. (e.g. dir/file == dir/../dir/file in most cases)
             show_warning!("source {} specified more than once", source.quote());
         } else {
-            // We need to compute the destination path
-
             let dest = construct_dest_path(source, target, target_type, options)
                 .unwrap_or_else(|_| target.to_path_buf());
 
diff --git a/src/uu/ln/src/ln.rs b/src/uu/ln/src/ln.rs
index e53af03a243..a056ee256a1 100644
--- a/src/uu/ln/src/ln.rs
+++ b/src/uu/ln/src/ln.rs
@@ -342,7 +342,7 @@ fn link_files_in_dir(files: &[PathBuf], target_dir: &Path, settings: &Settings)
             };
 
         if linked_destinations.contains(&targetpath) {
-            // If the target file was already created in this linked call, do not overwrite
+            // If the target file was already created in this ln call, do not overwrite
             show_error!(
                 "will not overwrite just-created '{}' with '{}'",
                 targetpath.display(),
diff --git a/tests/by-util/test_ln.rs b/tests/by-util/test_ln.rs
index e51d99732cd..78978a06ead 100644
--- a/tests/by-util/test_ln.rs
+++ b/tests/by-util/test_ln.rs
@@ -747,7 +747,7 @@ fn test_ln_seen_file() {
     assert!(at.plus("c").join("f").exists());
     // b/f still exists
     assert!(at.plus("b").join("f").exists());
-    // a/f no longer exists
+    // a/f still exists
     assert!(at.plus("a").join("f").exists());
     #[cfg(unix)]
     {

From 60d71e3f2a855925fe526e3df0a36accf959774d Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 25 Dec 2023 11:22:04 +0100
Subject: [PATCH 266/429] ln: disable a test on android

---
 tests/by-util/test_ln.rs | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/by-util/test_ln.rs b/tests/by-util/test_ln.rs
index 78978a06ead..2501e9d362a 100644
--- a/tests/by-util/test_ln.rs
+++ b/tests/by-util/test_ln.rs
@@ -723,6 +723,7 @@ fn test_symlink_remove_existing_same_src_and_dest() {
 }
 
 #[test]
+#[cfg(not(target_os = "android"))]
 fn test_ln_seen_file() {
     let ts = TestScenario::new(util_name!());
     let at = &ts.fixtures;

From e232ec657e462e7eb790bae184cad0f4322585cc Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 25 Dec 2023 12:36:56 +0100
Subject: [PATCH 267/429] Disable fuzzing seq until the
 https://github.com/uutils/coreutils/issues/5724 is fixed

---
 .github/workflows/fuzzing.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/fuzzing.yml b/.github/workflows/fuzzing.yml
index c29294d4d6c..1945088442a 100644
--- a/.github/workflows/fuzzing.yml
+++ b/.github/workflows/fuzzing.yml
@@ -48,7 +48,7 @@ jobs:
           - { name: fuzz_expr, should_pass: true }
           - { name: fuzz_printf, should_pass: false }
           - { name: fuzz_echo, should_pass: true }
-          - { name: fuzz_seq, should_pass: false }
+          # - { name: fuzz_seq, should_pass: false }
           - { name: fuzz_parse_glob, should_pass: true }
           - { name: fuzz_parse_size, should_pass: true }
           - { name: fuzz_parse_time, should_pass: true }

From 4946478409a045733b33752485d295f0d9068249 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Wed, 1 Nov 2023 10:42:21 +0100
Subject: [PATCH 268/429] cp: -l don't fail if dest is hardlink to source

---
 src/uu/cp/src/cp.rs      |  6 ++++++
 tests/by-util/test_cp.rs | 19 +++++++++++++++++++
 2 files changed, 25 insertions(+)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index c03eb25a5c5..ebd865dc354 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -1682,6 +1682,12 @@ fn copy_file(
     }
 
     if file_or_link_exists(dest) {
+        if are_hardlinks_to_same_file(source, dest)
+            && !options.force()
+            && options.backup == BackupMode::NoBackup
+        {
+            return Ok(());
+        }
         handle_existing_dest(source, dest, options, source_in_command_line)?;
     }
 
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index dfd20c9c261..261057cf3a4 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -531,6 +531,25 @@ fn test_cp_arg_link() {
     assert_eq!(at.metadata(TEST_HELLO_WORLD_SOURCE).st_nlink(), 2);
 }
 
+#[test]
+#[cfg(target_os = "linux")]
+fn test_cp_arg_link_with_dest_hardlink_to_source() {
+    use std::os::linux::fs::MetadataExt;
+
+    let (at, mut ucmd) = at_and_ucmd!();
+    let file = "file";
+    let hardlink = "hardlink";
+
+    at.touch(file);
+    at.hard_link(file, hardlink);
+
+    ucmd.args(&["--link", file, hardlink]).succeeds();
+
+    assert_eq!(at.metadata(file).st_nlink(), 2);
+    assert!(at.file_exists(file));
+    assert!(at.file_exists(hardlink));
+}
+
 #[test]
 fn test_cp_arg_symlink() {
     let (at, mut ucmd) = at_and_ucmd!();

From 97a6df78a463604d30064fd476df7877f4be6d0e Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Fri, 15 Sep 2023 13:01:25 +0000
Subject: [PATCH 269/429] chore(deps): update dependency ubuntu to v22

---
 .github/workflows/GnuTests.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/GnuTests.yml b/.github/workflows/GnuTests.yml
index 3ce6e8be27b..0799b2e6c14 100644
--- a/.github/workflows/GnuTests.yml
+++ b/.github/workflows/GnuTests.yml
@@ -30,7 +30,7 @@ jobs:
       contents: read  # for actions/checkout to fetch code
       pull-requests: read  # for dawidd6/action-download-artifact to query commit hash
     name: Run GNU tests
-    runs-on: ubuntu-20.04
+    runs-on: ubuntu-22.04
     steps:
     - name: Initialize workflow variables
       id: vars
@@ -308,7 +308,7 @@ jobs:
 
   gnu_coverage:
     name: Run GNU tests with coverage
-    runs-on: ubuntu-20.04
+    runs-on: ubuntu-22.04
     steps:
     - name: Checkout code uutil
       uses: actions/checkout@v4

From 1915e3c438b8c096188eba3ba04b2276d2a4adc5 Mon Sep 17 00:00:00 2001
From: Nathan Houghton <nathan@brainwerk.org>
Date: Sun, 22 Oct 2023 10:22:36 -0700
Subject: [PATCH 270/429] tests/test: Ensure the test fixture files have the
 expected gid

On some platforms (mostly the BSDs) the test fixture files copied to the
/tmp directory will have a different gid than the current egid (due to
the sticky bit set on the /tmp directory). Fix this before running the
"test" command.
---
 tests/by-util/test_test.rs | 42 +++++++++++++++++++++++++++++++++-----
 1 file changed, 37 insertions(+), 5 deletions(-)

diff --git a/tests/by-util/test_test.rs b/tests/by-util/test_test.rs
index b91bc727d40..277e4622a69 100644
--- a/tests/by-util/test_test.rs
+++ b/tests/by-util/test_test.rs
@@ -667,7 +667,7 @@ fn test_nonexistent_file_not_owned_by_euid() {
 }
 
 #[test]
-#[cfg(all(not(windows), not(target_os = "freebsd")))]
+#[cfg(not(windows))]
 fn test_file_not_owned_by_euid() {
     new_ucmd!()
         .args(&["-f", "/bin/sh", "-a", "!", "-O", "/bin/sh"])
@@ -675,9 +675,32 @@ fn test_file_not_owned_by_euid() {
 }
 
 #[test]
-#[cfg(all(not(windows), not(target_os = "freebsd")))]
+#[cfg(not(windows))]
 fn test_file_owned_by_egid() {
-    new_ucmd!().args(&["-G", "regular_file"]).succeeds();
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+
+    // On some platforms (mostly the BSDs) the test fixture files copied to the
+    // /tmp directory will have a different gid than the current egid (due to
+    // the sticky bit set on the /tmp directory). Fix this before running the
+    // test command.
+    use std::ffi::CString;
+    use std::os::unix::ffi::OsStrExt;
+    use std::os::unix::fs::MetadataExt;
+    use uucore::process::getegid;
+
+    let metadata = at.metadata("regular_file");
+    let file_gid = metadata.gid();
+    let user_gid = getegid();
+
+    if user_gid != file_gid {
+        let file_uid = metadata.uid();
+        let path = CString::new(at.plus("regular_file").as_os_str().as_bytes()).expect("bad path");
+        let r = unsafe { libc::chown(path.as_ptr().into(), file_uid, user_gid) };
+        assert_ne!(r, -1);
+    }
+
+    scene.ucmd().args(&["-G", "regular_file"]).succeeds();
 }
 
 #[test]
@@ -690,10 +713,19 @@ fn test_nonexistent_file_not_owned_by_egid() {
 }
 
 #[test]
-#[cfg(all(not(windows), not(target_os = "freebsd")))]
+#[cfg(not(windows))]
 fn test_file_not_owned_by_egid() {
+    let target_file = if cfg!(target_os = "freebsd") {
+        // The coreutils test runner user has a primary group id of "wheel",
+        // which matches the gid of /bin/sh, so use /sbin/shutdown which has gid
+        // of "operator".
+        "/sbin/shutdown"
+    } else {
+        "/bin/sh"
+    };
+
     new_ucmd!()
-        .args(&["-f", "/bin/sh", "-a", "!", "-G", "/bin/sh"])
+        .args(&["-f", target_file, "-a", "!", "-G", target_file])
         .succeeds();
 }
 

From 03f1b8aa3a4a86b3bdefaf683cc175f8f24b73bc Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 31 Oct 2023 14:41:00 +0100
Subject: [PATCH 271/429] mv: fix subdir detection

---
 src/uu/mv/src/mv.rs      | 30 ++++++++----------------------
 tests/by-util/test_mv.rs | 14 ++++++++++++++
 2 files changed, 22 insertions(+), 22 deletions(-)

diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index dec6d3ad3a7..82550e9bd37 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -358,29 +358,15 @@ fn handle_two_paths(source: &Path, target: &Path, opts: &Options) -> UResult<()>
             } else {
                 Err(MvError::DirectoryToNonDirectory(target.quote().to_string()).into())
             }
+        // Check that source & target do not contain same subdir/dir when both exist
+        // mkdir dir1/dir2; mv dir1 dir1/dir2
+        } else if target.starts_with(source) {
+            Err(MvError::SelfTargetSubdirectory(
+                source.display().to_string(),
+                target.display().to_string(),
+            )
+            .into())
         } else {
-            // Check that source & target  do not contain same subdir/dir when both exist
-            // mkdir dir1/dir2; mv dir1 dir1/dir2
-            let target_contains_itself = target
-                .as_os_str()
-                .to_str()
-                .ok_or("not a valid unicode string")
-                .and_then(|t| {
-                    source
-                        .as_os_str()
-                        .to_str()
-                        .ok_or("not a valid unicode string")
-                        .map(|s| t.contains(s))
-                })
-                .unwrap();
-
-            if target_contains_itself {
-                return Err(MvError::SelfTargetSubdirectory(
-                    source.display().to_string(),
-                    target.display().to_string(),
-                )
-                .into());
-            }
             move_files_into_dir(&[source.to_path_buf()], target, opts)
         }
     } else if target.exists() && source.is_dir() {
diff --git a/tests/by-util/test_mv.rs b/tests/by-util/test_mv.rs
index 75500ac63d9..22548d831a6 100644
--- a/tests/by-util/test_mv.rs
+++ b/tests/by-util/test_mv.rs
@@ -1455,6 +1455,20 @@ fn test_mv_directory_into_subdirectory_of_itself_fails() {
         );
 }
 
+#[test]
+fn test_mv_dir_into_dir_with_source_name_a_prefix_of_target_name() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    let source = "test";
+    let target = "test2";
+
+    at.mkdir(source);
+    at.mkdir(target);
+
+    ucmd.arg(source).arg(target).succeeds().no_output();
+
+    assert!(at.dir_exists(&format!("{target}/{source}")));
+}
+
 #[test]
 fn test_mv_file_into_dir_where_both_are_files() {
     let scene = TestScenario::new(util_name!());

From 030fd3d4d2cb25b0b1ac340bf9416d023c115745 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 14 Nov 2023 14:24:12 +0100
Subject: [PATCH 272/429] du: test behavior with POSIXLY_CORRECT set

---
 tests/by-util/test_du.rs | 26 ++++++++++++++++++++++++++
 1 file changed, 26 insertions(+)

diff --git a/tests/by-util/test_du.rs b/tests/by-util/test_du.rs
index cb1341432a0..243ee53c443 100644
--- a/tests/by-util/test_du.rs
+++ b/tests/by-util/test_du.rs
@@ -118,6 +118,32 @@ fn test_du_invalid_size() {
     }
 }
 
+#[test]
+fn test_du_with_posixly_correct() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+    let dir = "a";
+
+    at.mkdir(dir);
+    at.write(&format!("{dir}/file"), "some content");
+
+    let expected = ts
+        .ucmd()
+        .arg(dir)
+        .arg("--block-size=512")
+        .succeeds()
+        .stdout_move_str();
+
+    let result = ts
+        .ucmd()
+        .arg(dir)
+        .env("POSIXLY_CORRECT", "1")
+        .succeeds()
+        .stdout_move_str();
+
+    assert_eq!(expected, result);
+}
+
 #[test]
 fn test_du_basics_bad_name() {
     new_ucmd!()

From da43183fc7263a37a1536d9077f0f168c004002d Mon Sep 17 00:00:00 2001
From: Paul  Houssel <paul.houssel@telecom-sudparis.eu>
Date: Tue, 26 Dec 2023 09:52:32 +0100
Subject: [PATCH 273/429] cat: address cognitive_complexity lint

Signed-off-by: Paul  Houssel <paul.houssel@telecom-sudparis.eu>
---
 src/uu/cat/src/cat.rs | 83 ++++++++++++++++++++++++++++---------------
 1 file changed, 55 insertions(+), 28 deletions(-)

diff --git a/src/uu/cat/src/cat.rs b/src/uu/cat/src/cat.rs
index 8aaecb8c175..af55442ca5e 100644
--- a/src/uu/cat/src/cat.rs
+++ b/src/uu/cat/src/cat.rs
@@ -463,7 +463,6 @@ fn write_fast<R: FdReadable>(handle: &mut InputHandle<R>) -> CatResult<()> {
 
 /// Outputs file contents to stdout in a line-by-line fashion,
 /// propagating any errors that might occur.
-#[allow(clippy::cognitive_complexity)]
 fn write_lines<R: FdReadable>(
     handle: &mut InputHandle<R>,
     options: &OutputOptions,
@@ -482,22 +481,7 @@ fn write_lines<R: FdReadable>(
         while pos < n {
             // skip empty line_number enumerating them if needed
             if in_buf[pos] == b'\n' {
-                // \r followed by \n is printed as ^M when show_ends is enabled, so that \r\n prints as ^M$
-                if state.skipped_carriage_return && options.show_ends {
-                    writer.write_all(b"^M")?;
-                    state.skipped_carriage_return = false;
-                }
-                if !state.at_line_start || !options.squeeze_blank || !state.one_blank_kept {
-                    state.one_blank_kept = true;
-                    if state.at_line_start && options.number == NumberingMode::All {
-                        write!(writer, "{0:6}\t", state.line_number)?;
-                        state.line_number += 1;
-                    }
-                    writer.write_all(options.end_of_line().as_bytes())?;
-                    if handle.is_interactive {
-                        writer.flush()?;
-                    }
-                }
+                write_new_line(&mut writer, options, state, handle.is_interactive)?;
                 state.at_line_start = true;
                 pos += 1;
                 continue;
@@ -514,13 +498,8 @@ fn write_lines<R: FdReadable>(
             }
 
             // print to end of line or end of buffer
-            let offset = if options.show_nonprint {
-                write_nonprint_to_end(&in_buf[pos..], &mut writer, options.tab().as_bytes())
-            } else if options.show_tabs {
-                write_tab_to_end(&in_buf[pos..], &mut writer)
-            } else {
-                write_to_end(&in_buf[pos..], &mut writer)
-            };
+            let offset = write_end(&mut writer, &in_buf[pos..], options);
+
             // end of buffer?
             if offset + pos == in_buf.len() {
                 state.at_line_start = false;
@@ -531,10 +510,11 @@ fn write_lines<R: FdReadable>(
             } else {
                 assert_eq!(in_buf[pos + offset], b'\n');
                 // print suitable end of line
-                writer.write_all(options.end_of_line().as_bytes())?;
-                if handle.is_interactive {
-                    writer.flush()?;
-                }
+                write_end_of_line(
+                    &mut writer,
+                    options.end_of_line().as_bytes(),
+                    handle.is_interactive,
+                )?;
                 state.at_line_start = true;
             }
             pos += offset + 1;
@@ -544,6 +524,41 @@ fn write_lines<R: FdReadable>(
     Ok(())
 }
 
+// \r followed by \n is printed as ^M when show_ends is enabled, so that \r\n prints as ^M$
+fn write_new_line<W: Write>(
+    writer: &mut W,
+    options: &OutputOptions,
+    state: &mut OutputState,
+    is_interactive: bool,
+) -> CatResult<()> {
+    if state.skipped_carriage_return && options.show_ends {
+        writer.write_all(b"^M")?;
+        state.skipped_carriage_return = false;
+    }
+    if !state.at_line_start || !options.squeeze_blank || !state.one_blank_kept {
+        state.one_blank_kept = true;
+        if state.at_line_start && options.number == NumberingMode::All {
+            write!(writer, "{0:6}\t", state.line_number)?;
+            state.line_number += 1;
+        }
+        writer.write_all(options.end_of_line().as_bytes())?;
+        if is_interactive {
+            writer.flush()?;
+        }
+    }
+    Ok(())
+}
+
+fn write_end<W: Write>(writer: &mut W, in_buf: &[u8], options: &OutputOptions) -> usize {
+    if options.show_nonprint {
+        write_nonprint_to_end(in_buf, writer, options.tab().as_bytes())
+    } else if options.show_tabs {
+        write_tab_to_end(in_buf, writer)
+    } else {
+        write_to_end(in_buf, writer)
+    }
+}
+
 // write***_to_end methods
 // Write all symbols till \n or \r or end of buffer is reached
 // We need to stop at \r because it may be written as ^M depending on the byte after and settings;
@@ -610,6 +625,18 @@ fn write_nonprint_to_end<W: Write>(in_buf: &[u8], writer: &mut W, tab: &[u8]) ->
     count
 }
 
+fn write_end_of_line<W: Write>(
+    writer: &mut W,
+    end_of_line: &[u8],
+    is_interactive: bool,
+) -> CatResult<()> {
+    writer.write_all(end_of_line)?;
+    if is_interactive {
+        writer.flush()?;
+    }
+    Ok(())
+}
+
 #[cfg(test)]
 mod tests {
     use std::io::{stdout, BufWriter};

From eb3dd521eece286db6b71187a15c35a3ed0e5b7b Mon Sep 17 00:00:00 2001
From: Paul  Houssel <paul.houssel@telecom-sudparis.eu>
Date: Tue, 26 Dec 2023 10:42:44 +0100
Subject: [PATCH 274/429] touch: address cognitive_complexity lint

Signed-off-by: Paul  Houssel <paul.houssel@telecom-sudparis.eu>
---
 src/uu/touch/src/touch.rs | 165 +++++++++++++++++++++-----------------
 1 file changed, 90 insertions(+), 75 deletions(-)

diff --git a/src/uu/touch/src/touch.rs b/src/uu/touch/src/touch.rs
index 51c09801b0a..ebdff8d2116 100644
--- a/src/uu/touch/src/touch.rs
+++ b/src/uu/touch/src/touch.rs
@@ -11,7 +11,7 @@ use chrono::{
     TimeZone, Timelike,
 };
 use clap::builder::ValueParser;
-use clap::{crate_version, Arg, ArgAction, ArgGroup, Command};
+use clap::{crate_version, Arg, ArgAction, ArgGroup, ArgMatches, Command};
 use filetime::{set_file_times, set_symlink_file_times, FileTime};
 use std::ffi::OsString;
 use std::fs::{self, File};
@@ -73,7 +73,6 @@ fn filetime_to_datetime(ft: &FileTime) -> Option<DateTime<Local>> {
 }
 
 #[uucore::main]
-#[allow(clippy::cognitive_complexity)]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let matches = uu_app().try_get_matches_from(args)?;
 
@@ -86,37 +85,8 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
             ),
         )
     })?;
-    let (mut atime, mut mtime) = match (
-        matches.get_one::<OsString>(options::sources::REFERENCE),
-        matches.get_one::<String>(options::sources::DATE),
-    ) {
-        (Some(reference), Some(date)) => {
-            let (atime, mtime) = stat(Path::new(reference), !matches.get_flag(options::NO_DEREF))?;
-            let atime = filetime_to_datetime(&atime).ok_or_else(|| {
-                USimpleError::new(1, "Could not process the reference access time")
-            })?;
-            let mtime = filetime_to_datetime(&mtime).ok_or_else(|| {
-                USimpleError::new(1, "Could not process the reference modification time")
-            })?;
-            (parse_date(atime, date)?, parse_date(mtime, date)?)
-        }
-        (Some(reference), None) => {
-            stat(Path::new(reference), !matches.get_flag(options::NO_DEREF))?
-        }
-        (None, Some(date)) => {
-            let timestamp = parse_date(Local::now(), date)?;
-            (timestamp, timestamp)
-        }
-        (None, None) => {
-            let timestamp = if let Some(ts) = matches.get_one::<String>(options::sources::TIMESTAMP)
-            {
-                parse_timestamp(ts)?
-            } else {
-                datetime_to_filetime(&Local::now())
-            };
-            (timestamp, timestamp)
-        }
-    };
+
+    let (atime, mtime) = determine_times(&matches)?;
 
     for filename in files {
         // FIXME: find a way to avoid having to clone the path
@@ -165,48 +135,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
             }
         }
 
-        // If changing "only" atime or mtime, grab the existing value of the other.
-        // Note that "-a" and "-m" may be passed together; this is not an xor.
-        if matches.get_flag(options::ACCESS)
-            || matches.get_flag(options::MODIFICATION)
-            || matches.contains_id(options::TIME)
-        {
-            let st = stat(path, !matches.get_flag(options::NO_DEREF))?;
-            let time = matches
-                .get_one::<String>(options::TIME)
-                .map(|s| s.as_str())
-                .unwrap_or("");
-
-            if !(matches.get_flag(options::ACCESS)
-                || time.contains(&"access".to_owned())
-                || time.contains(&"atime".to_owned())
-                || time.contains(&"use".to_owned()))
-            {
-                atime = st.0;
-            }
-
-            if !(matches.get_flag(options::MODIFICATION)
-                || time.contains(&"modify".to_owned())
-                || time.contains(&"mtime".to_owned()))
-            {
-                mtime = st.1;
-            }
-        }
-
-        // sets the file access and modification times for a file or a symbolic link.
-        // The filename, access time (atime), and modification time (mtime) are provided as inputs.
-
-        // If the filename is not "-", indicating a special case for touch -h -,
-        // the code checks if the NO_DEREF flag is set, which means the user wants to
-        // set the times for a symbolic link itself, rather than the file it points to.
-        if filename == "-" {
-            filetime::set_file_times(path, atime, mtime)
-        } else if matches.get_flag(options::NO_DEREF) {
-            set_symlink_file_times(path, atime, mtime)
-        } else {
-            set_file_times(path, atime, mtime)
-        }
-        .map_err_context(|| format!("setting times of {}", path.quote()))?;
+        update_times(&matches, path, atime, mtime, filename)?;
     }
     Ok(())
 }
@@ -307,6 +236,92 @@ pub fn uu_app() -> Command {
         )
 }
 
+// Determine the access and modification time
+fn determine_times(matches: &ArgMatches) -> UResult<(FileTime, FileTime)> {
+    match (
+        matches.get_one::<OsString>(options::sources::REFERENCE),
+        matches.get_one::<String>(options::sources::DATE),
+    ) {
+        (Some(reference), Some(date)) => {
+            let (atime, mtime) = stat(Path::new(&reference), !matches.get_flag(options::NO_DEREF))?;
+            let atime = filetime_to_datetime(&atime).ok_or_else(|| {
+                USimpleError::new(1, "Could not process the reference access time")
+            })?;
+            let mtime = filetime_to_datetime(&mtime).ok_or_else(|| {
+                USimpleError::new(1, "Could not process the reference modification time")
+            })?;
+            Ok((parse_date(atime, date)?, parse_date(mtime, date)?))
+        }
+        (Some(reference), None) => {
+            stat(Path::new(&reference), !matches.get_flag(options::NO_DEREF))
+        }
+        (None, Some(date)) => {
+            let timestamp = parse_date(Local::now(), date)?;
+            Ok((timestamp, timestamp))
+        }
+        (None, None) => {
+            let timestamp = if let Some(ts) = matches.get_one::<String>(options::sources::TIMESTAMP)
+            {
+                parse_timestamp(ts)?
+            } else {
+                datetime_to_filetime(&Local::now())
+            };
+            Ok((timestamp, timestamp))
+        }
+    }
+}
+
+// Updating file access and modification times based on user-specified options
+fn update_times(
+    matches: &ArgMatches,
+    path: &Path,
+    mut atime: FileTime,
+    mut mtime: FileTime,
+    filename: &OsString,
+) -> UResult<()> {
+    // If changing "only" atime or mtime, grab the existing value of the other.
+    // Note that "-a" and "-m" may be passed together; this is not an xor.
+    if matches.get_flag(options::ACCESS)
+        || matches.get_flag(options::MODIFICATION)
+        || matches.contains_id(options::TIME)
+    {
+        let st = stat(path, !matches.get_flag(options::NO_DEREF))?;
+        let time = matches
+            .get_one::<String>(options::TIME)
+            .map(|s| s.as_str())
+            .unwrap_or("");
+
+        if !(matches.get_flag(options::ACCESS)
+            || time.contains(&"access".to_owned())
+            || time.contains(&"atime".to_owned())
+            || time.contains(&"use".to_owned()))
+        {
+            atime = st.0;
+        }
+
+        if !(matches.get_flag(options::MODIFICATION)
+            || time.contains(&"modify".to_owned())
+            || time.contains(&"mtime".to_owned()))
+        {
+            mtime = st.1;
+        }
+    }
+
+    // sets the file access and modification times for a file or a symbolic link.
+    // The filename, access time (atime), and modification time (mtime) are provided as inputs.
+
+    // If the filename is not "-", indicating a special case for touch -h -,
+    // the code checks if the NO_DEREF flag is set, which means the user wants to
+    // set the times for a symbolic link itself, rather than the file it points to.
+    if filename == "-" {
+        filetime::set_file_times(path, atime, mtime)
+    } else if matches.get_flag(options::NO_DEREF) {
+        set_symlink_file_times(path, atime, mtime)
+    } else {
+        set_file_times(path, atime, mtime)
+    }
+    .map_err_context(|| format!("setting times of {}", path.quote()))
+}
 // Get metadata of the provided path
 // If `follow` is `true`, the function will try to follow symlinks
 // If `follow` is `false` or the symlink is broken, the function will return metadata of the symlink itself

From 30eb77ac798e3e47d00187c4f25d64ac6eb99cdf Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Tue, 26 Dec 2023 14:40:31 +0100
Subject: [PATCH 275/429] du: implement files0-from (#5721)

* du: implement files0-from

Should make tests/du/files0-from-dir pass

* du: prepare tests/du/files0-from.pl

* fix the build on Windows

* add testfile to the ignore list

* remove useless comment

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

* mkdir is enough

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

* address review comments

---------

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 src/uu/du/src/du.rs      | 81 ++++++++++++++++++++++++++++++++++++----
 tests/by-util/test_du.rs | 74 +++++++++++++++++++++++++++++++++++-
 util/build-gnu.sh        |  4 ++
 3 files changed, 150 insertions(+), 9 deletions(-)

diff --git a/src/uu/du/src/du.rs b/src/uu/du/src/du.rs
index 1213e004f15..e3f5a718654 100644
--- a/src/uu/du/src/du.rs
+++ b/src/uu/du/src/du.rs
@@ -65,6 +65,7 @@ mod options {
     pub const INODES: &str = "inodes";
     pub const EXCLUDE: &str = "exclude";
     pub const EXCLUDE_FROM: &str = "exclude-from";
+    pub const FILES0_FROM: &str = "files0-from";
     pub const VERBOSE: &str = "verbose";
     pub const FILE: &str = "FILE";
 }
@@ -587,6 +588,49 @@ pub fn div_ceil(a: u64, b: u64) -> u64 {
     (a + b - 1) / b
 }
 
+// Read file paths from the specified file, separated by null characters
+fn read_files_from(file_name: &str) -> Result<Vec<PathBuf>, std::io::Error> {
+    let reader: Box<dyn BufRead> = if file_name == "-" {
+        // Read from standard input
+        Box::new(BufReader::new(std::io::stdin()))
+    } else {
+        // First, check if the file_name is a directory
+        let path = PathBuf::from(file_name);
+        if path.is_dir() {
+            return Err(std::io::Error::new(
+                std::io::ErrorKind::Other,
+                format!("{}: read error: Is a directory", file_name),
+            ));
+        }
+
+        // Attempt to open the file and handle the error if it does not exist
+        match File::open(file_name) {
+            Ok(file) => Box::new(BufReader::new(file)),
+            Err(e) if e.kind() == std::io::ErrorKind::NotFound => {
+                return Err(std::io::Error::new(
+                    std::io::ErrorKind::Other,
+                    format!(
+                        "cannot open '{}' for reading: No such file or directory",
+                        file_name
+                    ),
+                ))
+            }
+            Err(e) => return Err(e),
+        }
+    };
+
+    let mut paths = Vec::new();
+
+    for line in reader.split(b'\0') {
+        let path = line?;
+        if !path.is_empty() {
+            paths.push(PathBuf::from(String::from_utf8_lossy(&path).to_string()));
+        }
+    }
+
+    Ok(paths)
+}
+
 #[uucore::main]
 #[allow(clippy::cognitive_complexity)]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
@@ -601,13 +645,28 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         summarize,
     )?;
 
-    let files = match matches.get_one::<String>(options::FILE) {
-        Some(_) => matches
-            .get_many::<String>(options::FILE)
-            .unwrap()
-            .map(PathBuf::from)
-            .collect(),
-        None => vec![PathBuf::from(".")],
+    let files = if let Some(file_from) = matches.get_one::<String>(options::FILES0_FROM) {
+        if file_from == "-" && matches.get_one::<String>(options::FILE).is_some() {
+            return Err(std::io::Error::new(
+                std::io::ErrorKind::Other,
+                format!(
+                    "extra operand {}\nfile operands cannot be combined with --files0-from",
+                    matches.get_one::<String>(options::FILE).unwrap().quote()
+                ),
+            )
+            .into());
+        }
+
+        read_files_from(file_from)?
+    } else {
+        match matches.get_one::<String>(options::FILE) {
+            Some(_) => matches
+                .get_many::<String>(options::FILE)
+                .unwrap()
+                .map(PathBuf::from)
+                .collect(),
+            None => vec![PathBuf::from(".")],
+        }
     };
 
     let time = matches.contains_id(options::TIME).then(|| {
@@ -954,6 +1013,14 @@ pub fn uu_app() -> Command {
                 .help("exclude files that match any pattern in FILE")
                 .action(ArgAction::Append)
         )
+        .arg(
+            Arg::new(options::FILES0_FROM)
+                .long("files0-from")
+                .value_name("FILE")
+                .value_hint(clap::ValueHint::FilePath)
+                .help("summarize device usage of the NUL-terminated file names specified in file F; if F is -, then read names from standard input")
+                .action(ArgAction::Append)
+        )
         .arg(
             Arg::new(options::TIME)
                 .long(options::TIME)
diff --git a/tests/by-util/test_du.rs b/tests/by-util/test_du.rs
index 72ffb22ffb5..27560cbdcca 100644
--- a/tests/by-util/test_du.rs
+++ b/tests/by-util/test_du.rs
@@ -3,10 +3,9 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-// spell-checker:ignore (paths) sublink subwords azerty azeaze xcwww azeaz amaz azea qzerty tazerty tsublink
+// spell-checker:ignore (paths) sublink subwords azerty azeaze xcwww azeaz amaz azea qzerty tazerty tsublink testfile1 testfile2 filelist testdir testfile
 #[cfg(not(windows))]
 use regex::Regex;
-#[cfg(not(windows))]
 use std::io::Write;
 
 #[cfg(any(target_os = "linux", target_os = "android"))]
@@ -991,3 +990,74 @@ fn test_du_symlink_multiple_fail() {
     assert_eq!(result.code(), 1);
     result.stdout_contains("4\tfile1\n");
 }
+
+#[test]
+// Disable on Windows because of different path separators and handling of null characters
+#[cfg(not(target_os = "windows"))]
+fn test_du_files0_from() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+
+    let mut file1 = at.make_file("testfile1");
+    file1.write_all(b"content1").unwrap();
+    let mut file2 = at.make_file("testfile2");
+    file2.write_all(b"content2").unwrap();
+
+    at.mkdir("testdir");
+    let mut file3 = at.make_file("testdir/testfile3");
+    file3.write_all(b"content3").unwrap();
+
+    let mut file_list = at.make_file("filelist");
+    write!(file_list, "testfile1\0testfile2\0testdir\0").unwrap();
+
+    ts.ucmd()
+        .arg("--files0-from=filelist")
+        .succeeds()
+        .stdout_contains("testfile1")
+        .stdout_contains("testfile2")
+        .stdout_contains("testdir");
+}
+
+#[test]
+fn test_du_files0_from_stdin() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+
+    let mut file1 = at.make_file("testfile1");
+    file1.write_all(b"content1").unwrap();
+    let mut file2 = at.make_file("testfile2");
+    file2.write_all(b"content2").unwrap();
+
+    let input = "testfile1\0testfile2\0";
+
+    ts.ucmd()
+        .arg("--files0-from=-")
+        .pipe_in(input)
+        .succeeds()
+        .stdout_contains("testfile1")
+        .stdout_contains("testfile2");
+}
+
+#[test]
+fn test_du_files0_from_dir() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+
+    at.mkdir("dir");
+
+    let result = ts.ucmd().arg("--files0-from=dir").fails();
+    assert_eq!(result.stderr_str(), "du: dir: read error: Is a directory\n");
+}
+
+#[test]
+fn test_du_files0_from_combined() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+
+    at.mkdir("dir");
+
+    let result = ts.ucmd().arg("--files0-from=-").arg("foo").fails();
+    let stderr = result.stderr_str();
+
+    assert!(stderr.contains("file operands cannot be combined with --files0-from"));
+}
diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index dbddc8a315e..18545dd4817 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -283,6 +283,10 @@ sed -i -E "s|^([^#]*2_31.*)$|#\1|g" tests/printf/printf-cov.pl
 
 sed -i -e "s/du: invalid -t argument/du: invalid --threshold argument/" -e "s/du: option requires an argument/error: a value is required for '--threshold <SIZE>' but none was supplied/" -e "/Try 'du --help' for more information./d" tests/du/threshold.sh
 
+# Remove the extra output check
+sed -i -e "s|Try '\$prog --help' for more information.\\\n||" tests/du/files0-from.pl
+sed -i -e "s|when reading file names from stdin, no file name of\"|-: No such file or directory\n\"|" -e "s| '-' allowed\\\n||" tests/du/files0-from.pl
+
 awk 'BEGIN {count=0} /compare exp out2/ && count < 6 {sub(/compare exp out2/, "grep -q \"cannot be used with\" out2"); count++} 1' tests/df/df-output.sh > tests/df/df-output.sh.tmp && mv tests/df/df-output.sh.tmp tests/df/df-output.sh
 
 # with ls --dired, in case of error, we have a slightly different error position

From 37c83ec480253bb62153dae8e595f5416c81669f Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 26 Dec 2023 15:15:02 +0100
Subject: [PATCH 276/429] du: simplify file creation in tests

---
 tests/by-util/test_du.rs | 38 +++++++++++++-------------------------
 1 file changed, 13 insertions(+), 25 deletions(-)

diff --git a/tests/by-util/test_du.rs b/tests/by-util/test_du.rs
index 27560cbdcca..db881291bde 100644
--- a/tests/by-util/test_du.rs
+++ b/tests/by-util/test_du.rs
@@ -6,7 +6,6 @@
 // spell-checker:ignore (paths) sublink subwords azerty azeaze xcwww azeaz amaz azea qzerty tazerty tsublink testfile1 testfile2 filelist testdir testfile
 #[cfg(not(windows))]
 use regex::Regex;
-use std::io::Write;
 
 #[cfg(any(target_os = "linux", target_os = "android"))]
 use crate::common::util::expected_result;
@@ -347,12 +346,10 @@ fn test_du_dereference_args() {
     let ts = TestScenario::new(util_name!());
     let at = &ts.fixtures;
 
-    at.mkdir_all("subdir");
-    let mut file1 = at.make_file("subdir/file-ignore1");
-    file1.write_all(b"azeaze").unwrap();
-    let mut file2 = at.make_file("subdir/file-ignore1");
-    file2.write_all(b"amaz?ng").unwrap();
-    at.symlink_dir("subdir", "sublink");
+    at.mkdir("dir");
+    at.write("dir/file-ignore1", "azeaze");
+    at.write("dir/file-ignore2", "amaz?ng");
+    at.symlink_dir("dir", "sublink");
 
     for arg in ["-D", "-H", "--dereference-args"] {
         let result = ts.ucmd().arg(arg).arg("-s").arg("sublink").succeeds();
@@ -848,10 +845,8 @@ fn test_du_exclude_mix() {
     let ts = TestScenario::new(util_name!());
     let at = &ts.fixtures;
 
-    let mut file1 = at.make_file("file-ignore1");
-    file1.write_all(b"azeaze").unwrap();
-    let mut file2 = at.make_file("file-ignore2");
-    file2.write_all(b"amaz?ng").unwrap();
+    at.write("file-ignore1", "azeaze");
+    at.write("file-ignore2", "amaz?ng");
 
     at.mkdir_all("azerty/xcwww/azeaze");
     at.mkdir_all("azerty/xcwww/qzerty");
@@ -983,8 +978,7 @@ fn test_du_symlink_multiple_fail() {
     let at = &ts.fixtures;
 
     at.symlink_file("non-existing.txt", "target.txt");
-    let mut file1 = at.make_file("file1");
-    file1.write_all(b"azeaze").unwrap();
+    at.write("file1", "azeaze");
 
     let result = ts.ucmd().arg("-L").arg("target.txt").arg("file1").fails();
     assert_eq!(result.code(), 1);
@@ -998,17 +992,13 @@ fn test_du_files0_from() {
     let ts = TestScenario::new(util_name!());
     let at = &ts.fixtures;
 
-    let mut file1 = at.make_file("testfile1");
-    file1.write_all(b"content1").unwrap();
-    let mut file2 = at.make_file("testfile2");
-    file2.write_all(b"content2").unwrap();
+    at.write("testfile1", "content1");
+    at.write("testfile2", "content2");
 
     at.mkdir("testdir");
-    let mut file3 = at.make_file("testdir/testfile3");
-    file3.write_all(b"content3").unwrap();
+    at.write("testdir/testfile3", "content3");
 
-    let mut file_list = at.make_file("filelist");
-    write!(file_list, "testfile1\0testfile2\0testdir\0").unwrap();
+    at.write("filelist", "testfile1\0testfile2\0testdir\0");
 
     ts.ucmd()
         .arg("--files0-from=filelist")
@@ -1023,10 +1013,8 @@ fn test_du_files0_from_stdin() {
     let ts = TestScenario::new(util_name!());
     let at = &ts.fixtures;
 
-    let mut file1 = at.make_file("testfile1");
-    file1.write_all(b"content1").unwrap();
-    let mut file2 = at.make_file("testfile2");
-    file2.write_all(b"content2").unwrap();
+    at.write("testfile1", "content1");
+    at.write("testfile2", "content2");
 
     let input = "testfile1\0testfile2\0";
 

From 2d260ded585ca2ab22b26df1d6adca4b9e0d78e0 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 26 Dec 2023 15:19:45 +0100
Subject: [PATCH 277/429] du: use concat! to improve readability in tests

---
 tests/by-util/test_du.rs | 26 ++++++++++++++------------
 1 file changed, 14 insertions(+), 12 deletions(-)

diff --git a/tests/by-util/test_du.rs b/tests/by-util/test_du.rs
index db881291bde..5c2efdc9865 100644
--- a/tests/by-util/test_du.rs
+++ b/tests/by-util/test_du.rs
@@ -452,12 +452,13 @@ fn test_du_inodes_basic() {
 fn _du_inodes_basic(s: &str) {
     assert_eq!(
         s,
-        "2\t.\\subdir\\deeper\\deeper_dir
-4\t.\\subdir\\deeper
-3\t.\\subdir\\links
-8\t.\\subdir
-11\t.
-"
+        concat!(
+            "2\t.\\subdir\\deeper\\deeper_dir\n",
+            "4\t.\\subdir\\deeper\n",
+            "3\t.\\subdir\\links\n",
+            "8\t.\\subdir\n",
+            "11\t.\n",
+        )
     );
 }
 
@@ -465,12 +466,13 @@ fn _du_inodes_basic(s: &str) {
 fn _du_inodes_basic(s: &str) {
     assert_eq!(
         s,
-        "2\t./subdir/deeper/deeper_dir
-4\t./subdir/deeper
-3\t./subdir/links
-8\t./subdir
-11\t.
-"
+        concat!(
+            "2\t./subdir/deeper/deeper_dir\n",
+            "4\t./subdir/deeper\n",
+            "3\t./subdir/links\n",
+            "8\t./subdir\n",
+            "11\t.\n",
+        )
     );
 }
 

From edbb7d5b02989d385f78817b434a0e973842c9a4 Mon Sep 17 00:00:00 2001
From: Darius <dariusvalere@gmail.com>
Date: Sat, 23 Dec 2023 14:20:45 +0900
Subject: [PATCH 278/429] join: fixed parameter basenc: fixed parameter cut:
 fixed parameter mkdir: fixed parameter nohup: fixed parameter pr: fixed
 parameter printenv: fixed parameter printf: added parameters runcon: fixed
 typo shuf: fixed typo sum: fixed typo uniq: fixed parameter unlink: fixed
 parameter

---
 src/uu/basenc/basenc.md     | 2 +-
 src/uu/cut/cut.md           | 2 +-
 src/uu/join/join.md         | 2 +-
 src/uu/mkdir/mkdir.md       | 2 +-
 src/uu/nohup/nohup.md       | 2 +-
 src/uu/pr/pr.md             | 2 +-
 src/uu/printenv/printenv.md | 2 +-
 src/uu/printf/printf.md     | 2 ++
 src/uu/runcon/runcon.md     | 2 +-
 src/uu/shuf/shuf.md         | 2 +-
 src/uu/sum/sum.md           | 2 +-
 src/uu/uniq/uniq.md         | 2 +-
 src/uu/unlink/unlink.md     | 1 +
 13 files changed, 14 insertions(+), 11 deletions(-)

diff --git a/src/uu/basenc/basenc.md b/src/uu/basenc/basenc.md
index 17916bd4ab8..001babe9e6b 100644
--- a/src/uu/basenc/basenc.md
+++ b/src/uu/basenc/basenc.md
@@ -1,7 +1,7 @@
 # basenc
 
 ```
-basenc [OPTION]... [FILE]"
+basenc [OPTION]... [FILE]
 ```
 
 Encode/decode data and print to standard output
diff --git a/src/uu/cut/cut.md b/src/uu/cut/cut.md
index 972fcb6322e..5c21d23dcf9 100644
--- a/src/uu/cut/cut.md
+++ b/src/uu/cut/cut.md
@@ -3,7 +3,7 @@
 <!-- spell-checker:ignore sourcefile sourcefiles -->
 
 ```
-cut [-d|-w] [-s] [-z] [--output-delimiter] ((-f|-b|-c) {{sequence}}) {{sourcefile}}+
+cut OPTION... [FILE]...
 ```
 
 Prints specified byte or field columns from each line of stdin or the input files
diff --git a/src/uu/join/join.md b/src/uu/join/join.md
index ec91950b8bc..04275342a6e 100644
--- a/src/uu/join/join.md
+++ b/src/uu/join/join.md
@@ -1,7 +1,7 @@
 # join
 
 ```
-join [OPTIONS] <FILE1> <FILE2>
+join [OPTION]... FILE1 FILE2
 ```
 
 For each pair of input lines with identical join fields, write a line to
diff --git a/src/uu/mkdir/mkdir.md b/src/uu/mkdir/mkdir.md
index 1698842cd9c..eea3d2eb063 100644
--- a/src/uu/mkdir/mkdir.md
+++ b/src/uu/mkdir/mkdir.md
@@ -3,7 +3,7 @@
 <!-- spell-checker:ignore ugoa -->
 
 ```
-mkdir [OPTION]... [USER]
+mkdir [OPTION]... DIRECTORY...
 ```
 
 Create the given DIRECTORY(ies) if they do not exist
diff --git a/src/uu/nohup/nohup.md b/src/uu/nohup/nohup.md
index cc35ef9f46c..65ffaec873d 100644
--- a/src/uu/nohup/nohup.md
+++ b/src/uu/nohup/nohup.md
@@ -2,7 +2,7 @@
 
 ```
 nohup COMMAND [ARG]...
-nohup FLAG
+nohup OPTION
 ```
 
 Run COMMAND ignoring hangup signals.
diff --git a/src/uu/pr/pr.md b/src/uu/pr/pr.md
index 2c246b25f1c..cd2f552f3de 100644
--- a/src/uu/pr/pr.md
+++ b/src/uu/pr/pr.md
@@ -1,7 +1,7 @@
 # pr
 
 ```
-pr [OPTIONS] [files]...
+pr [OPTION]... [FILE]...
 ```
 
 Write content of given file or standard input to standard output with pagination filter
diff --git a/src/uu/printenv/printenv.md b/src/uu/printenv/printenv.md
index 929da7947b5..f67d46a23dd 100644
--- a/src/uu/printenv/printenv.md
+++ b/src/uu/printenv/printenv.md
@@ -1,7 +1,7 @@
 # printenv
 
 ```
-printenv [VARIABLE]... [OPTION]...
+printenv [OPTION]... [VARIABLE]...
 ```
 
 Display the values of the specified environment VARIABLE(s), or (with no VARIABLE) display name and value pairs for them all.
diff --git a/src/uu/printf/printf.md b/src/uu/printf/printf.md
index 9ce2957701e..fad5d01e30b 100644
--- a/src/uu/printf/printf.md
+++ b/src/uu/printf/printf.md
@@ -4,6 +4,8 @@
 
 ```
 printf FORMATSTRING [ARGUMENT]...
+printf FORMAT [ARGUMENT]...
+printf OPTION
 ```
 
 Print output based off of the format string and proceeding arguments.
diff --git a/src/uu/runcon/runcon.md b/src/uu/runcon/runcon.md
index 1911c50447c..155ea7dc0f7 100644
--- a/src/uu/runcon/runcon.md
+++ b/src/uu/runcon/runcon.md
@@ -2,7 +2,7 @@
 
 ```
 runcon [CONTEXT COMMAND [ARG...]]
-runcon [-c] [-u USER] [-r ROLE] [-t TYPE] [-l RANGE] COMMAND [ARG...]";
+runcon [-c] [-u USER] [-r ROLE] [-t TYPE] [-l RANGE] COMMAND [ARG...]
 ```
 
 Run command with specified security context under SELinux enabled systems.
diff --git a/src/uu/shuf/shuf.md b/src/uu/shuf/shuf.md
index b59799c3378..7bc1e0a6d60 100644
--- a/src/uu/shuf/shuf.md
+++ b/src/uu/shuf/shuf.md
@@ -3,7 +3,7 @@
 ```
 shuf [OPTION]... [FILE]
 shuf -e [OPTION]... [ARG]...
-shuf -i LO-HI [OPTION]...;
+shuf -i LO-HI [OPTION]...
 ```
 
 Shuffle the input by outputting a random permutation of input lines.
diff --git a/src/uu/sum/sum.md b/src/uu/sum/sum.md
index ca3adb81f36..93dbdbf62d0 100644
--- a/src/uu/sum/sum.md
+++ b/src/uu/sum/sum.md
@@ -1,7 +1,7 @@
 # sum
 
 ```
-sum [OPTION]... [FILE]..."
+sum [OPTION]... [FILE]...
 ```
 
 Checksum and count the blocks in a file.
diff --git a/src/uu/uniq/uniq.md b/src/uu/uniq/uniq.md
index dea57081b77..20de52395ba 100644
--- a/src/uu/uniq/uniq.md
+++ b/src/uu/uniq/uniq.md
@@ -1,7 +1,7 @@
 # uniq
 
 ```
-uniq [OPTION]... [INPUT [OUTPUT]]...
+uniq [OPTION]... [INPUT [OUTPUT]]
 ```
 
 Report or omit repeated lines.
diff --git a/src/uu/unlink/unlink.md b/src/uu/unlink/unlink.md
index 4468fb20450..eebcd9ef31d 100644
--- a/src/uu/unlink/unlink.md
+++ b/src/uu/unlink/unlink.md
@@ -2,6 +2,7 @@
 
 ```
 unlink [FILE]
+unlink OPTION
 ```
 
 Unlink the file at `FILE`.

From 413638c78972e2af74b585f1b85b901bc41f493b Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 27 Dec 2023 08:46:33 +0100
Subject: [PATCH 279/429] Improve the GNU ci analysis: display the root test
 changes too (#5728)

* try to compare the root results too

* Add debug info in the logs

* rename the variable for something more explicit

* Improve intermittent doc
---
 .github/workflows/GnuTests.yml | 129 ++++++++++++++++++++-------------
 1 file changed, 77 insertions(+), 52 deletions(-)

diff --git a/.github/workflows/GnuTests.yml b/.github/workflows/GnuTests.yml
index 0799b2e6c14..89fa5a7da50 100644
--- a/.github/workflows/GnuTests.yml
+++ b/.github/workflows/GnuTests.yml
@@ -204,6 +204,7 @@ jobs:
         ## Compare test failures VS reference
         have_new_failures=""
         REF_LOG_FILE='${{ steps.vars.outputs.path_reference }}/test-logs/test-suite.log'
+        ROOT_REF_LOG_FILE='${{ steps.vars.outputs.path_reference }}/test-logs/test-suite-root.log'
         REF_SUMMARY_FILE='${{ steps.vars.outputs.path_reference }}/test-summary/gnu-result.json'
         REPO_DEFAULT_BRANCH='${{ steps.vars.outputs.repo_default_branch }}'
         path_UUTILS='${{ steps.vars.outputs.path_UUTILS }}'
@@ -223,68 +224,92 @@ jobs:
         rm -f ${COMMENT_LOG}
         touch ${COMMENT_LOG}
 
-        if test -f "${REF_LOG_FILE}"; then
-          echo "Reference SHA1/ID: $(sha1sum -- "${REF_SUMMARY_FILE}")"
-          REF_ERROR=$(sed -n "s/^ERROR: \([[:print:]]\+\).*/\1/p" "${REF_LOG_FILE}" | sort)
-          NEW_ERROR=$(sed -n "s/^ERROR: \([[:print:]]\+\).*/\1/p" '${{ steps.vars.outputs.path_GNU_tests }}/test-suite.log' | sort)
-          REF_FAILING=$(sed -n "s/^FAIL: \([[:print:]]\+\).*/\1/p" "${REF_LOG_FILE}" | sort)
-          NEW_FAILING=$(sed -n "s/^FAIL: \([[:print:]]\+\).*/\1/p" '${{ steps.vars.outputs.path_GNU_tests }}/test-suite.log' | sort)
-          for LINE in ${REF_FAILING}
-          do
-            if ! grep -Fxq ${LINE}<<<"${NEW_FAILING}"; then
-              if ! grep ${LINE} ${IGNORE_INTERMITTENT}
+        compare_tests() {
+          local new_log_file=$1
+          local ref_log_file=$2
+          local test_type=$3  # "standard" or "root"
+
+          if test -f "${ref_log_file}"; then
+            echo "Reference ${test_type} test log SHA1/ID: $(sha1sum -- "${ref_log_file}") - ${test_type}"
+            REF_ERROR=$(sed -n "s/^ERROR: \([[:print:]]\+\).*/\1/p" "${ref_log_file}"| sort)
+            CURRENT_RUN_ERROR=$(sed -n "s/^ERROR: \([[:print:]]\+\).*/\1/p" "${new_log_file}" | sort)
+            REF_FAILING=$(sed -n "s/^FAIL: \([[:print:]]\+\).*/\1/p" "${ref_log_file}"| sort)
+            CURRENT_RUN_FAILING=$(sed -n "s/^FAIL: \([[:print:]]\+\).*/\1/p" "${new_log_file}" | sort)
+            echo "Detailled information:"
+            echo "REF_ERROR = ${REF_ERROR}"
+            echo "CURRENT_RUN_ERROR = ${CURRENT_RUN_ERROR}"
+            echo "REF_FAILING = ${REF_FAILING}"
+            echo "CURRENT_RUN_FAILING = ${CURRENT_RUN_FAILING}"
+
+            # Compare failing and error tests
+            for LINE in ${CURRENT_RUN_FAILING}
+            do
+              if ! grep -Fxq ${LINE}<<<"${REF_FAILING}"
               then
-                MSG="Congrats! The gnu test ${LINE} is no longer failing!"
-                echo "::warning ::$MSG"
-                echo $MSG >> ${COMMENT_LOG}
-              else
-                MSG="Skipping an intermittent issue ${LINE}"
-                echo "::warning ::$MSG"
-                echo $MSG >> ${COMMENT_LOG}
-                echo ""
+                if ! grep ${LINE} ${IGNORE_INTERMITTENT}
+                then
+                  MSG="GNU test failed: ${LINE}. ${LINE} is passing on '${REPO_DEFAULT_BRANCH}'. Maybe you have to rebase?"
+                  echo "::error ::$MSG"
+                  echo $MSG >> ${COMMENT_LOG}
+                  have_new_failures="true"
+                else
+                  MSG="Skip an intermittent issue ${LINE} (fails in this run but passes in the 'main' branch)"
+                  echo "::warning ::$MSG"
+                  echo $MSG >> ${COMMENT_LOG}
+                  echo ""
+                fi
               fi
-            fi
-          done
-          for LINE in ${NEW_FAILING}
-          do
-            if ! grep -Fxq ${LINE}<<<"${REF_FAILING}"
-            then
-              if ! grep ${LINE} ${IGNORE_INTERMITTENT}
+            done
+
+            for LINE in ${REF_FAILING}
+            do
+              if ! grep -Fxq ${LINE}<<<"${CURRENT_RUN_FAILING}"
+              then
+                if ! grep ${LINE} ${IGNORE_INTERMITTENT}
+                then
+                  MSG="Congrats! The gnu test ${LINE} is no longer failing!"
+                  echo "::warning ::$MSG"
+                  echo $MSG >> ${COMMENT_LOG}
+                else
+                  MSG="Skipping an intermittent issue ${LINE} (passes in this run but fails in the 'main' branch)"
+                  echo "::warning ::$MSG"
+                  echo $MSG >> ${COMMENT_LOG}
+                  echo ""
+                fi
+              fi
+            done
+
+            for LINE in ${CURRENT_RUN_ERROR}
+            do
+              if ! grep -Fxq ${LINE}<<<"${REF_ERROR}"
               then
-                MSG="GNU test failed: ${LINE}. ${LINE} is passing on '${{ steps.vars.outputs.repo_default_branch }}'. Maybe you have to rebase?"
+                MSG="GNU test error: ${LINE}. ${LINE} is passing on '${REPO_DEFAULT_BRANCH}'. Maybe you have to rebase?"
                 echo "::error ::$MSG"
                 echo $MSG >> ${COMMENT_LOG}
                 have_new_failures="true"
-              else
-                MSG="Skip an intermittent issue ${LINE}"
+              fi
+            done
+
+            for LINE in ${REF_ERROR}
+            do
+              if ! grep -Fxq ${LINE}<<<"${CURRENT_RUN_ERROR}"
+              then
+                MSG="Congrats! The gnu test ${LINE} is no longer ERROR!"
                 echo "::warning ::$MSG"
                 echo $MSG >> ${COMMENT_LOG}
-                echo ""
               fi
-            fi
-          done
-          for LINE in ${REF_ERROR}
-          do
-            if ! grep -Fxq ${LINE}<<<"${NEW_ERROR}"; then
-              MSG="Congrats! The gnu test ${LINE} is no longer ERROR!"
-              echo "::warning ::$MSG"
-              echo $MSG >> ${COMMENT_LOG}
-            fi
-          done
-          for LINE in ${NEW_ERROR}
-          do
-            if ! grep -Fxq ${LINE}<<<"${REF_ERROR}"
-            then
-              MSG="GNU test error: ${LINE}. ${LINE} is passing on '${{ steps.vars.outputs.repo_default_branch }}'. Maybe you have to rebase?"
-              echo "::error ::$MSG"
-              echo $MSG >> ${COMMENT_LOG}
-              have_new_failures="true"
-            fi
-          done
+            done
+          else
+            echo "::warning ::Skipping ${test_type} test failure comparison; no prior reference test logs are available."
+          fi
+        }
+
+        # Compare standard tests
+        compare_tests '${{ steps.vars.outputs.path_GNU_tests }}/test-suite.log' "${REF_LOG_FILE}" "standard"
+
+        # Compare root tests
+        compare_tests '${{ steps.vars.outputs.path_GNU_tests }}/test-suite-root.log' "${ROOT_REF_LOG_FILE}" "root"
 
-        else
-          echo "::warning ::Skipping test failure comparison; no prior reference test logs are available."
-        fi
         if test -n "${have_new_failures}" ; then exit -1 ; fi
     - name: Upload comparison log (for GnuComment workflow)
       if: success() || failure() # run regardless of prior step success/failure

From bf26eda786b6714e51fa52aa59948ad9330e8c5b Mon Sep 17 00:00:00 2001
From: Matei Mantu <66641453+mtimaN@users.noreply.github.com>
Date: Wed, 27 Dec 2023 14:37:17 +0200
Subject: [PATCH 280/429] install: remove / from end of path if it exists so as
 not to mess with .exists() (#5730)

* remove / from end of path if it exists so as not to mess with .exists()

* install: fix / removal from path

* Fix clippy warnings

* Add test for install target ends with /
---
 src/uu/install/src/install.rs |  7 +++++++
 tests/by-util/test_install.rs | 24 ++++++++++++++++++++++++
 2 files changed, 31 insertions(+)

diff --git a/src/uu/install/src/install.rs b/src/uu/install/src/install.rs
index a930be99616..fb80b2f0ec2 100644
--- a/src/uu/install/src/install.rs
+++ b/src/uu/install/src/install.rs
@@ -569,6 +569,13 @@ fn standard(mut paths: Vec<String>, b: &Behavior) -> UResult<()> {
         };
 
         if let Some(to_create) = to_create {
+            // if the path ends in /, remove it
+            let to_create = if to_create.to_string_lossy().ends_with('/') {
+                Path::new(to_create.to_str().unwrap().trim_end_matches('/'))
+            } else {
+                to_create
+            };
+
             if !to_create.exists() {
                 if b.verbose {
                     let mut result = PathBuf::new();
diff --git a/tests/by-util/test_install.rs b/tests/by-util/test_install.rs
index 85335285aae..fb360533f11 100644
--- a/tests/by-util/test_install.rs
+++ b/tests/by-util/test_install.rs
@@ -1589,3 +1589,27 @@ fn test_t_exist_dir() {
         .fails()
         .stderr_contains("failed to access 'sub4/file_exists': Not a directory");
 }
+
+#[test]
+fn test_target_file_ends_with_slash() {
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+
+    let source = "source_file";
+    let target_dir = "dir";
+    let target_file = "dir/target_file";
+    let target_file_slash = format!("{}/", target_file);
+
+    at.touch(source);
+    at.mkdir(target_dir);
+    at.touch(target_file);
+
+    scene
+        .ucmd()
+        .arg("-t")
+        .arg(target_file_slash)
+        .arg("-D")
+        .arg(source)
+        .fails()
+        .stderr_contains("failed to access 'dir/target_file/': Not a directory");
+}

From 0701f535ac415b4b45d8e34e220a9e0c3c7e2e21 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Wed, 27 Dec 2023 15:39:54 +0100
Subject: [PATCH 281/429] cp: fix backup of destination symlink

---
 src/uu/cp/src/cp.rs      |  6 +++++-
 tests/by-util/test_cp.rs | 21 +++++++++++++++++++++
 2 files changed, 26 insertions(+), 1 deletion(-)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index 6e88dcbb37c..97afdee1e0f 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -1496,7 +1496,11 @@ fn context_for(src: &Path, dest: &Path) -> String {
 /// Implements a simple backup copy for the destination file.
 /// TODO: for the backup, should this function be replaced by `copy_file(...)`?
 fn backup_dest(dest: &Path, backup_path: &Path) -> CopyResult<PathBuf> {
-    fs::copy(dest, backup_path)?;
+    if dest.is_symlink() {
+        fs::rename(dest, backup_path)?;
+    } else {
+        fs::copy(dest, backup_path)?;
+    }
     Ok(backup_path.into())
 }
 
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index 16eed035aab..2636df28a3b 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -678,6 +678,27 @@ fn test_cp_arg_backup() {
     );
 }
 
+#[test]
+fn test_cp_arg_backup_with_dest_a_symlink() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    let source = "source";
+    let source_content = "content";
+    let symlink = "symlink";
+    let original = "original";
+    let backup = "symlink~";
+
+    at.write(source, source_content);
+    at.write(original, "original");
+    at.symlink_file(original, symlink);
+
+    ucmd.arg("-b").arg(source).arg(symlink).succeeds();
+
+    assert!(!at.symlink_exists(symlink));
+    assert_eq!(source_content, at.read(symlink));
+    assert!(at.symlink_exists(backup));
+    assert_eq!(original, at.resolve_link(backup));
+}
+
 #[test]
 fn test_cp_arg_backup_with_other_args() {
     let (at, mut ucmd) = at_and_ucmd!();

From c38a43210cb0ac7d58cb7732e14ac516fb7d19f1 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 27 Dec 2023 23:51:49 +0100
Subject: [PATCH 282/429] use our getegid & geteuid wrappers function instead
 of libc calls

---
 src/uu/install/src/install.rs      | 9 ++++-----
 src/uu/test/Cargo.toml             | 2 +-
 src/uu/test/src/test.rs            | 6 ++++--
 src/uu/whoami/src/platform/unix.rs | 5 ++---
 4 files changed, 11 insertions(+), 11 deletions(-)

diff --git a/src/uu/install/src/install.rs b/src/uu/install/src/install.rs
index fb80b2f0ec2..92910650da4 100644
--- a/src/uu/install/src/install.rs
+++ b/src/uu/install/src/install.rs
@@ -19,7 +19,6 @@ use uucore::mode::get_umask;
 use uucore::perms::{wrap_chown, Verbosity, VerbosityLevel};
 use uucore::{format_usage, help_about, help_usage, show, show_error, show_if_err, uio_error};
 
-use libc::{getegid, geteuid};
 use std::error::Error;
 use std::fmt::{Debug, Display};
 use std::fs;
@@ -29,6 +28,8 @@ use std::os::unix::fs::MetadataExt;
 use std::os::unix::prelude::OsStrExt;
 use std::path::{Path, PathBuf, MAIN_SEPARATOR};
 use std::process;
+#[cfg(not(target_os = "windows"))]
+use uucore::process::{getegid, geteuid};
 
 const DEFAULT_MODE: u32 = 0o755;
 const DEFAULT_STRIP_PROGRAM: &str = "strip";
@@ -959,10 +960,8 @@ fn need_copy(from: &Path, to: &Path, b: &Behavior) -> UResult<bool> {
         }
     } else {
         #[cfg(not(target_os = "windows"))]
-        unsafe {
-            if to_meta.uid() != geteuid() || to_meta.gid() != getegid() {
-                return Ok(true);
-            }
+        if to_meta.uid() != geteuid() || to_meta.gid() != getegid() {
+            return Ok(true);
         }
     }
 
diff --git a/src/uu/test/Cargo.toml b/src/uu/test/Cargo.toml
index bc27511867e..93a77b11d4a 100644
--- a/src/uu/test/Cargo.toml
+++ b/src/uu/test/Cargo.toml
@@ -17,7 +17,7 @@ path = "src/test.rs"
 [dependencies]
 clap = { workspace = true }
 libc = { workspace = true }
-uucore = { workspace = true }
+uucore = { workspace = true, features = ["process"] }
 
 [target.'cfg(target_os = "redox")'.dependencies]
 redox_syscall = { workspace = true }
diff --git a/src/uu/test/src/test.rs b/src/uu/test/src/test.rs
index 4f230a590df..a0d0f339592 100644
--- a/src/uu/test/src/test.rs
+++ b/src/uu/test/src/test.rs
@@ -17,6 +17,8 @@ use std::fs;
 use std::os::unix::fs::MetadataExt;
 use uucore::display::Quotable;
 use uucore::error::{UResult, USimpleError};
+#[cfg(not(windows))]
+use uucore::process::{getegid, geteuid};
 use uucore::{format_usage, help_about, help_section};
 
 const ABOUT: &str = help_about!("test.md");
@@ -276,7 +278,7 @@ fn path(path: &OsStr, condition: &PathCondition) -> bool {
 
     let geteuid = || {
         #[cfg(not(target_os = "redox"))]
-        let euid = unsafe { libc::geteuid() };
+        let euid = geteuid();
         #[cfg(target_os = "redox")]
         let euid = syscall::geteuid().unwrap() as u32;
 
@@ -285,7 +287,7 @@ fn path(path: &OsStr, condition: &PathCondition) -> bool {
 
     let getegid = || {
         #[cfg(not(target_os = "redox"))]
-        let egid = unsafe { libc::getegid() };
+        let egid = getegid();
         #[cfg(target_os = "redox")]
         let egid = syscall::getegid().unwrap() as u32;
 
diff --git a/src/uu/whoami/src/platform/unix.rs b/src/uu/whoami/src/platform/unix.rs
index 31ab16fba4c..9310a6de0a2 100644
--- a/src/uu/whoami/src/platform/unix.rs
+++ b/src/uu/whoami/src/platform/unix.rs
@@ -7,10 +7,9 @@ use std::ffi::OsString;
 use std::io;
 
 use uucore::entries::uid2usr;
+use uucore::process::geteuid;
 
 pub fn get_username() -> io::Result<OsString> {
-    // SAFETY: getuid() does nothing with memory and is always successful.
-    let uid = unsafe { libc::geteuid() };
     // uid2usr should arguably return an OsString but currently doesn't
-    uid2usr(uid).map(Into::into)
+    uid2usr(geteuid()).map(Into::into)
 }

From 764ea34c374fbfdc020d8a281d87bab24b650836 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 28 Dec 2023 00:42:36 +0100
Subject: [PATCH 283/429] dd/chroot: improve the skip message (not root)

---
 tests/by-util/test_chroot.rs | 2 +-
 tests/by-util/test_dd.rs     | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/by-util/test_chroot.rs b/tests/by-util/test_chroot.rs
index 1fc2231d57a..128d0b812c1 100644
--- a/tests/by-util/test_chroot.rs
+++ b/tests/by-util/test_chroot.rs
@@ -124,7 +124,7 @@ fn test_default_shell() {
     if let Ok(result) = run_ucmd_as_root(&ts, &[dir]) {
         result.stderr_contains(expected);
     } else {
-        print!("TEST SKIPPED");
+        print!("Test skipped; requires root user");
     }
 }
 
diff --git a/tests/by-util/test_dd.rs b/tests/by-util/test_dd.rs
index bd43ad077d3..93cfee06718 100644
--- a/tests/by-util/test_dd.rs
+++ b/tests/by-util/test_dd.rs
@@ -1565,7 +1565,7 @@ fn test_skip_past_dev() {
         result.stderr_contains("0+0 records out");
         result.code_is(1);
     } else {
-        print!("TEST SKIPPED");
+        print!("Test skipped; requires root user");
     }
 }
 
@@ -1586,7 +1586,7 @@ fn test_seek_past_dev() {
         result.stderr_contains("0+0 records out");
         result.code_is(1);
     } else {
-        print!("TEST SKIPPED");
+        print!("Test skipped; requires root user");
     }
 }
 

From ad16313c59d589f42705080c8b488afa1fdc2a00 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 28 Dec 2023 07:15:01 +0100
Subject: [PATCH 284/429] head: -c allocate memory as needed (#5704)

* head: -c allocate memory as needed

Improve the execution of tests/head/head-c.sh

* simplify the code

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

---------

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 src/uu/head/src/head.rs | 54 ++++++++++++++++++-----------------------
 1 file changed, 24 insertions(+), 30 deletions(-)

diff --git a/src/uu/head/src/head.rs b/src/uu/head/src/head.rs
index 83bdd37390a..0f7a08d26f4 100644
--- a/src/uu/head/src/head.rs
+++ b/src/uu/head/src/head.rs
@@ -252,43 +252,37 @@ fn read_but_last_n_bytes(input: &mut impl std::io::BufRead, n: usize) -> std::io
     let stdout = std::io::stdout();
     let mut stdout = stdout.lock();
 
-    let mut ring_buffer = vec![0u8; n];
+    let mut ring_buffer = Vec::new();
 
-    // first we fill the ring buffer
-    if let Err(e) = input.read_exact(&mut ring_buffer) {
-        if e.kind() == ErrorKind::UnexpectedEof {
-            return Ok(());
-        } else {
-            return Err(e);
-        }
-    }
     let mut buffer = [0u8; BUF_SIZE];
+    let mut total_read = 0;
+
     loop {
-        let read = loop {
-            match input.read(&mut buffer) {
-                Ok(n) => break n,
-                Err(e) => match e.kind() {
-                    ErrorKind::Interrupted => {}
-                    _ => return Err(e),
-                },
-            }
+        let read = match input.read(&mut buffer) {
+            Ok(0) => break,
+            Ok(read) => read,
+            Err(e) => match e.kind() {
+                ErrorKind::Interrupted => continue,
+                _ => return Err(e),
+            },
         };
-        if read == 0 {
-            return Ok(());
-        } else if read >= n {
-            stdout.write_all(&ring_buffer)?;
-            stdout.write_all(&buffer[..read - n])?;
-            for i in 0..n {
-                ring_buffer[i] = buffer[read - n + i];
-            }
+
+        total_read += read;
+
+        if total_read <= n {
+            // Fill the ring buffer without exceeding n bytes
+            let overflow = total_read - n;
+            ring_buffer.extend_from_slice(&buffer[..read - overflow]);
         } else {
-            stdout.write_all(&ring_buffer[..read])?;
-            for i in 0..n - read {
-                ring_buffer[i] = ring_buffer[read + i];
-            }
-            ring_buffer[n - read..].copy_from_slice(&buffer[..read]);
+            // Write the ring buffer and the part of the buffer that exceeds n
+            stdout.write_all(&ring_buffer)?;
+            stdout.write_all(&buffer[..read - n + ring_buffer.len()])?;
+            ring_buffer.clear();
+            ring_buffer.extend_from_slice(&buffer[read - n + ring_buffer.len()..read]);
         }
     }
+
+    Ok(())
 }
 
 fn read_but_last_n_lines(

From ce18f8a2a107a2a8c575dfd6831280bd522e16dc Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 27 Dec 2023 23:34:44 +0100
Subject: [PATCH 285/429] install: split the need_copy check

---
 src/uu/install/src/install.rs | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/src/uu/install/src/install.rs b/src/uu/install/src/install.rs
index 92910650da4..d2586307942 100644
--- a/src/uu/install/src/install.rs
+++ b/src/uu/install/src/install.rs
@@ -954,7 +954,10 @@ fn need_copy(from: &Path, to: &Path, b: &Behavior) -> UResult<bool> {
         if owner_id != to_meta.uid() {
             return Ok(true);
         }
-    } else if let Some(group_id) = b.group_id {
+    }
+
+    // Check if the group ID is specified and differs from the destination file's group.
+    if let Some(group_id) = b.group_id {
         if group_id != to_meta.gid() {
             return Ok(true);
         }

From c0206c5ea41702918d5f669bd4f5116741a54c75 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 28 Dec 2023 10:04:41 +0100
Subject: [PATCH 286/429] install: document the need_copy function

---
 src/uu/install/src/install.rs | 19 ++++++++++++++++++-
 1 file changed, 18 insertions(+), 1 deletion(-)

diff --git a/src/uu/install/src/install.rs b/src/uu/install/src/install.rs
index d2586307942..7487c90bc94 100644
--- a/src/uu/install/src/install.rs
+++ b/src/uu/install/src/install.rs
@@ -869,6 +869,7 @@ fn preserve_timestamps(from: &Path, to: &Path) -> UResult<()> {
 ///
 fn copy(from: &Path, to: &Path, b: &Behavior) -> UResult<()> {
     if b.compare && !need_copy(from, to, b)? {
+        println!("no need to copy");
         return Ok(());
     }
     // Declare the path here as we may need it for the verbose output below.
@@ -916,40 +917,53 @@ fn copy(from: &Path, to: &Path, b: &Behavior) -> UResult<()> {
 /// Crashes the program if a nonexistent owner or group is specified in _b_.
 ///
 fn need_copy(from: &Path, to: &Path, b: &Behavior) -> UResult<bool> {
+    // Attempt to retrieve metadata for the source file.
+    // If this fails, assume the file needs to be copied.
     let from_meta = match fs::metadata(from) {
         Ok(meta) => meta,
         Err(_) => return Ok(true),
     };
+
+    // Attempt to retrieve metadata for the destination file.
+    // If this fails, assume the file needs to be copied.
     let to_meta = match fs::metadata(to) {
         Ok(meta) => meta,
         Err(_) => return Ok(true),
     };
 
-    // setuid || setgid || sticky
+    // Define special file mode bits (setuid, setgid, sticky).
     let extra_mode: u32 = 0o7000;
+    // Define all file mode bits (including permissions).
     // setuid || setgid || sticky || permissions
     let all_modes: u32 = 0o7777;
 
+    // Check if any special mode bits are set in the specified mode,
+    // source file mode, or destination file mode. If so, copy is needed.
     if b.specified_mode.unwrap_or(0) & extra_mode != 0
         || from_meta.mode() & extra_mode != 0
         || to_meta.mode() & extra_mode != 0
     {
         return Ok(true);
     }
+
+    // Check if the mode of the destination file differs from the specified mode.
     if b.mode() != to_meta.mode() & all_modes {
         return Ok(true);
     }
 
+    // Check if either the source or destination is not a file.
     if !from_meta.is_file() || !to_meta.is_file() {
         return Ok(true);
     }
 
+    // Check if the file sizes differ.
     if from_meta.len() != to_meta.len() {
         return Ok(true);
     }
 
     // TODO: if -P (#1809) and from/to contexts mismatch, return true.
 
+    // Check if the owner ID is specified and differs from the destination file's owner.
     if let Some(owner_id) = b.owner_id {
         if owner_id != to_meta.uid() {
             return Ok(true);
@@ -963,11 +977,14 @@ fn need_copy(from: &Path, to: &Path, b: &Behavior) -> UResult<bool> {
         }
     } else {
         #[cfg(not(target_os = "windows"))]
+        // Check if the destination file's owner or group
+        // differs from the effective user/group ID of the process.
         if to_meta.uid() != geteuid() || to_meta.gid() != getegid() {
             return Ok(true);
         }
     }
 
+    // Check if the contents of the source and destination files differ.
     if !diff(from.to_str().unwrap(), to.to_str().unwrap()) {
         return Ok(true);
     }

From 0fb3ffb8adb5ca8fde92fbb2d4dc4598d2ca8af2 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 27 Dec 2023 23:35:29 +0100
Subject: [PATCH 287/429] install: document the need_copy function

---
 src/uu/install/src/install.rs | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/src/uu/install/src/install.rs b/src/uu/install/src/install.rs
index 7487c90bc94..87980ac5bb1 100644
--- a/src/uu/install/src/install.rs
+++ b/src/uu/install/src/install.rs
@@ -869,7 +869,6 @@ fn preserve_timestamps(from: &Path, to: &Path) -> UResult<()> {
 ///
 fn copy(from: &Path, to: &Path, b: &Behavior) -> UResult<()> {
     if b.compare && !need_copy(from, to, b)? {
-        println!("no need to copy");
         return Ok(());
     }
     // Declare the path here as we may need it for the verbose output below.
@@ -938,7 +937,7 @@ fn need_copy(from: &Path, to: &Path, b: &Behavior) -> UResult<bool> {
     let all_modes: u32 = 0o7777;
 
     // Check if any special mode bits are set in the specified mode,
-    // source file mode, or destination file mode. If so, copy is needed.
+    // source file mode, or destination file mode.
     if b.specified_mode.unwrap_or(0) & extra_mode != 0
         || from_meta.mode() & extra_mode != 0
         || to_meta.mode() & extra_mode != 0

From 2c0f15be552160e8ca8dc3dd559a768aae4a9ba5 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 28 Dec 2023 01:06:57 +0100
Subject: [PATCH 288/429] install: if run as root, revert the uid & gid to root

---
 src/uu/install/src/install.rs | 57 ++++++++++++++++++++---------------
 1 file changed, 32 insertions(+), 25 deletions(-)

diff --git a/src/uu/install/src/install.rs b/src/uu/install/src/install.rs
index 87980ac5bb1..e568149acf6 100644
--- a/src/uu/install/src/install.rs
+++ b/src/uu/install/src/install.rs
@@ -10,15 +10,6 @@ mod mode;
 use clap::{crate_version, Arg, ArgAction, ArgMatches, Command};
 use file_diff::diff;
 use filetime::{set_file_times, FileTime};
-use uucore::backup_control::{self, BackupMode};
-use uucore::display::Quotable;
-use uucore::entries::{grp2gid, usr2uid};
-use uucore::error::{FromIo, UError, UIoError, UResult, UUsageError};
-use uucore::fs::dir_strip_dot_for_creation;
-use uucore::mode::get_umask;
-use uucore::perms::{wrap_chown, Verbosity, VerbosityLevel};
-use uucore::{format_usage, help_about, help_usage, show, show_error, show_if_err, uio_error};
-
 use std::error::Error;
 use std::fmt::{Debug, Display};
 use std::fs;
@@ -28,8 +19,15 @@ use std::os::unix::fs::MetadataExt;
 use std::os::unix::prelude::OsStrExt;
 use std::path::{Path, PathBuf, MAIN_SEPARATOR};
 use std::process;
-#[cfg(not(target_os = "windows"))]
+use uucore::backup_control::{self, BackupMode};
+use uucore::display::Quotable;
+use uucore::entries::{grp2gid, usr2uid};
+use uucore::error::{FromIo, UError, UIoError, UResult, UUsageError};
+use uucore::fs::dir_strip_dot_for_creation;
+use uucore::mode::get_umask;
+use uucore::perms::{wrap_chown, Verbosity, VerbosityLevel};
 use uucore::process::{getegid, geteuid};
+use uucore::{format_usage, help_about, help_usage, show, show_error, show_if_err, uio_error};
 
 const DEFAULT_MODE: u32 = 0o755;
 const DEFAULT_STRIP_PROGRAM: &str = "strip";
@@ -665,6 +663,7 @@ fn copy_files_into_dir(files: &[PathBuf], target_dir: &Path, b: &Behavior) -> UR
 /// Handle incomplete user/group parings for chown.
 ///
 /// Returns a Result type with the Err variant containing the error message.
+/// If the user is root, revert the uid & gid
 ///
 /// # Parameters
 ///
@@ -676,23 +675,31 @@ fn copy_files_into_dir(files: &[PathBuf], target_dir: &Path, b: &Behavior) -> UR
 /// return an empty error value.
 ///
 fn chown_optional_user_group(path: &Path, b: &Behavior) -> UResult<()> {
-    if b.owner_id.is_some() || b.group_id.is_some() {
-        let meta = match fs::metadata(path) {
-            Ok(meta) => meta,
-            Err(e) => return Err(InstallError::MetadataFailed(e).into()),
-        };
+    // GNU coreutils doesn't print chown operations during install with verbose flag.
+    let verbosity = Verbosity {
+        groups_only: b.owner_id.is_none(),
+        level: VerbosityLevel::Normal,
+    };
 
-        // GNU coreutils doesn't print chown operations during install with verbose flag.
-        let verbosity = Verbosity {
-            groups_only: b.owner_id.is_none(),
-            level: VerbosityLevel::Normal,
-        };
+    // Determine the owner and group IDs to be used for chown.
+    let (owner_id, group_id) = if b.owner_id.is_some() || b.group_id.is_some() {
+        (b.owner_id, b.group_id)
+    } else if geteuid() == 0 {
+        // Special case for root user.
+        (Some(0), Some(0))
+    } else {
+        // No chown operation needed.
+        return Ok(());
+    };
 
-        match wrap_chown(path, &meta, b.owner_id, b.group_id, false, verbosity) {
-            Ok(msg) if b.verbose && !msg.is_empty() => println!("chown: {msg}"),
-            Ok(_) => {}
-            Err(e) => return Err(InstallError::ChownFailed(path.to_path_buf(), e).into()),
-        }
+    let meta = match fs::metadata(path) {
+        Ok(meta) => meta,
+        Err(e) => return Err(InstallError::MetadataFailed(e).into()),
+    };
+    match wrap_chown(path, &meta, owner_id, group_id, false, verbosity) {
+        Ok(msg) if b.verbose && !msg.is_empty() => println!("chown: {msg}"),
+        Ok(_) => {}
+        Err(e) => return Err(InstallError::ChownFailed(path.to_path_buf(), e).into()),
     }
 
     Ok(())

From efa7f8b4f7a138d5852a8c21b1c3a15037f2fbe6 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Thu, 28 Dec 2023 15:03:19 +0000
Subject: [PATCH 289/429] chore(deps): update rust crate xattr to 1.2.0

---
 Cargo.lock | 4 ++--
 Cargo.toml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index d92a288755c..6c95a55a6f5 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -3574,9 +3574,9 @@ checksum = "dff9641d1cd4be8d1a070daf9e3773c5f67e78b4d9d42263020c057706765c04"
 
 [[package]]
 name = "xattr"
-version = "1.1.3"
+version = "1.2.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "a7dae5072fe1f8db8f8d29059189ac175196e410e40ba42d5d4684ae2f750995"
+checksum = "914566e6413e7fa959cc394fb30e563ba80f3541fbd40816d4c05a0fc3f2a0f1"
 dependencies = [
  "libc",
  "linux-raw-sys 0.4.12",
diff --git a/Cargo.toml b/Cargo.toml
index accfc2a0653..0a28175aded 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -331,7 +331,7 @@ utf-8 = "0.7.6"
 walkdir = "2.4"
 winapi-util = "0.1.6"
 windows-sys = { version = "0.48.0", default-features = false }
-xattr = "1.1.3"
+xattr = "1.2.0"
 zip = { version = "0.6.6", default-features = false, features = ["deflate"] }
 
 hex = "0.4.3"

From d82ee771aa82a982912a28a94bc3283267143793 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 28 Dec 2023 01:08:56 +0100
Subject: [PATCH 290/429] install: Add a test to cover recent changes

---
 tests/by-util/test_install.rs | 34 ++++++++++++++++++++++++++++++++--
 1 file changed, 32 insertions(+), 2 deletions(-)

diff --git a/tests/by-util/test_install.rs b/tests/by-util/test_install.rs
index fb360533f11..3db25c81fc2 100644
--- a/tests/by-util/test_install.rs
+++ b/tests/by-util/test_install.rs
@@ -4,9 +4,10 @@
 // file that was distributed with this source code.
 // spell-checker:ignore (words) helloworld nodir objdump n'source
 
-use crate::common::util::{is_ci, TestScenario};
+use crate::common::util::{is_ci, run_ucmd_as_root, TestScenario};
 use filetime::FileTime;
-use std::os::unix::fs::PermissionsExt;
+use std::fs;
+use std::os::unix::fs::{MetadataExt, PermissionsExt};
 #[cfg(not(any(windows, target_os = "freebsd")))]
 use std::process::Command;
 #[cfg(any(target_os = "linux", target_os = "android"))]
@@ -1613,3 +1614,32 @@ fn test_target_file_ends_with_slash() {
         .fails()
         .stderr_contains("failed to access 'dir/target_file/': Not a directory");
 }
+
+#[test]
+fn test_install_root_combined() {
+    let ts = TestScenario::new(util_name!());
+    let at = ts.fixtures.clone();
+    at.touch("a");
+    at.touch("c");
+
+    let run_and_check = |args: &[&str], target: &str, expected_uid: u32, expected_gid: u32| {
+        if let Ok(result) = run_ucmd_as_root(&ts, args) {
+            result.success();
+            assert!(at.file_exists(target));
+
+            let metadata = fs::metadata(at.plus(target)).unwrap();
+            assert_eq!(metadata.uid(), expected_uid);
+            assert_eq!(metadata.gid(), expected_gid);
+        } else {
+            print!("Test skipped; requires root user");
+        }
+    };
+
+    run_and_check(&["-Cv", "-o1", "-g1", "a", "b"], "b", 1, 1);
+    run_and_check(&["-Cv", "-o2", "-g1", "a", "b"], "b", 2, 1);
+    run_and_check(&["-Cv", "-o2", "-g2", "a", "b"], "b", 2, 2);
+
+    run_and_check(&["-Cv", "-o2", "c", "d"], "d", 2, 0);
+    run_and_check(&["-Cv", "c", "d"], "d", 0, 0);
+    run_and_check(&["-Cv", "c", "d"], "d", 0, 0);
+}

From 9bb725cefc63145c722025c2ff216fee63bc30c3 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Thu, 28 Dec 2023 17:44:23 +0100
Subject: [PATCH 291/429] clippy: fix warnings introduced by Rust 1.75

---
 src/uu/csplit/src/patterns.rs | 6 +++---
 src/uu/factor/src/factor.rs   | 1 +
 src/uu/kill/src/kill.rs       | 2 +-
 tests/by-util/test_ls.rs      | 2 +-
 tests/by-util/test_test.rs    | 2 +-
 5 files changed, 7 insertions(+), 6 deletions(-)

diff --git a/src/uu/csplit/src/patterns.rs b/src/uu/csplit/src/patterns.rs
index 8e7b76e6bb4..6e7483b7f9f 100644
--- a/src/uu/csplit/src/patterns.rs
+++ b/src/uu/csplit/src/patterns.rs
@@ -196,7 +196,7 @@ mod tests {
             .collect();
         let patterns = get_patterns(input.as_slice()).unwrap();
         assert_eq!(patterns.len(), 3);
-        match patterns.get(0) {
+        match patterns.first() {
             Some(Pattern::UpToLine(24, ExecutePattern::Times(1))) => (),
             _ => panic!("expected UpToLine pattern"),
         };
@@ -227,7 +227,7 @@ mod tests {
         .collect();
         let patterns = get_patterns(input.as_slice()).unwrap();
         assert_eq!(patterns.len(), 5);
-        match patterns.get(0) {
+        match patterns.first() {
             Some(Pattern::UpToMatch(reg, 0, ExecutePattern::Times(1))) => {
                 let parsed_reg = format!("{reg}");
                 assert_eq!(parsed_reg, "test1.*end$");
@@ -281,7 +281,7 @@ mod tests {
         .collect();
         let patterns = get_patterns(input.as_slice()).unwrap();
         assert_eq!(patterns.len(), 5);
-        match patterns.get(0) {
+        match patterns.first() {
             Some(Pattern::SkipToMatch(reg, 0, ExecutePattern::Times(1))) => {
                 let parsed_reg = format!("{reg}");
                 assert_eq!(parsed_reg, "test1.*end$");
diff --git a/src/uu/factor/src/factor.rs b/src/uu/factor/src/factor.rs
index a7e848bb883..d7899a7e6ee 100644
--- a/src/uu/factor/src/factor.rs
+++ b/src/uu/factor/src/factor.rs
@@ -3,6 +3,7 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
+#![allow(clippy::items_after_test_module)]
 use smallvec::SmallVec;
 use std::cell::RefCell;
 use std::fmt;
diff --git a/src/uu/kill/src/kill.rs b/src/uu/kill/src/kill.rs
index f353fd7cab3..87de0ff54d3 100644
--- a/src/uu/kill/src/kill.rs
+++ b/src/uu/kill/src/kill.rs
@@ -71,7 +71,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
             table();
             Ok(())
         }
-        Mode::List => list(pids_or_signals.get(0)),
+        Mode::List => list(pids_or_signals.first()),
     }
 }
 
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 5da8912e3f0..72a303ef3dc 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -4139,7 +4139,7 @@ fn test_ls_hyperlink_dirs() {
     assert!(result
         .stdout_str()
         .lines()
-        .nth(0)
+        .next()
         .unwrap()
         .contains(&format!("{path}{separator}{dir_a}\x07{dir_a}\x1b]8;;\x07:")));
     assert_eq!(result.stdout_str().lines().nth(1).unwrap(), "");
diff --git a/tests/by-util/test_test.rs b/tests/by-util/test_test.rs
index 277e4622a69..1999634efbc 100644
--- a/tests/by-util/test_test.rs
+++ b/tests/by-util/test_test.rs
@@ -696,7 +696,7 @@ fn test_file_owned_by_egid() {
     if user_gid != file_gid {
         let file_uid = metadata.uid();
         let path = CString::new(at.plus("regular_file").as_os_str().as_bytes()).expect("bad path");
-        let r = unsafe { libc::chown(path.as_ptr().into(), file_uid, user_gid) };
+        let r = unsafe { libc::chown(path.as_ptr(), file_uid, user_gid) };
         assert_ne!(r, -1);
     }
 

From 55de78037d9c9d9c4d83f404c831f7e41f31390f Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 28 Dec 2023 23:21:44 +0100
Subject: [PATCH 292/429] ls/gnu: ignore the libcap check

---
 util/build-gnu.sh | 1 +
 1 file changed, 1 insertion(+)

diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 18545dd4817..8a45e0a8d6e 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -179,6 +179,7 @@ sed -i 's|chmod |/usr/bin/chmod |' tests/du/inacc-dir.sh tests/tail/tail-n0f.sh
 sed -i 's|sort |/usr/bin/sort |' tests/ls/hyperlink.sh tests/test/test-N.sh
 sed -i 's|split |/usr/bin/split |' tests/factor/factor-parallel.sh
 sed -i 's|id -|/usr/bin/id -|' tests/runcon/runcon-no-reorder.sh
+sed -i "s|grep '^#define HAVE_CAP 1' \$CONFIG_HEADER > /dev/null|true|"  tests/ls/capability.sh
 # tests/ls/abmon-align.sh - https://github.com/uutils/coreutils/issues/3505
 sed -i 's|touch |/usr/bin/touch |' tests/cp/reflink-perm.sh tests/ls/block-size.sh tests/mv/update.sh tests/ls/ls-time.sh tests/stat/stat-nanoseconds.sh tests/misc/time-style.sh tests/test/test-N.sh tests/ls/abmon-align.sh
 sed -i 's|ln -|/usr/bin/ln -|' tests/cp/link-deref.sh

From 0ce73e1b02c902c24bb4f8437b0c58ae8ab7b1fb Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Thu, 28 Dec 2023 23:03:37 +0000
Subject: [PATCH 293/429] chore(deps): update rust crate bstr to 1.9

---
 Cargo.lock | 8 ++++----
 Cargo.toml | 2 +-
 2 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 6c95a55a6f5..ee403d92f92 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -188,9 +188,9 @@ dependencies = [
 
 [[package]]
 name = "bstr"
-version = "1.8.0"
+version = "1.9.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "542f33a8835a0884b006a0c3df3dadd99c0c3f296ed26c2fdc8028e01ad6230c"
+checksum = "c48f0051a4b4c5e0b6d365cd04af53aeaa209e3cc15ec2cdb69e73cc87fbd0dc"
 dependencies = [
  "memchr",
  "regex-automata",
@@ -1263,9 +1263,9 @@ dependencies = [
 
 [[package]]
 name = "memchr"
-version = "2.6.2"
+version = "2.7.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "5486aed0026218e61b8a01d5fbd5a0a134649abb71a0e53b7bc088529dced86e"
+checksum = "523dc4f511e55ab87b694dc30d0f820d60906ef06413f93d4d7a1385599cc149"
 
 [[package]]
 name = "memmap2"
diff --git a/Cargo.toml b/Cargo.toml
index 0a28175aded..3fc1e23cbe2 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -260,7 +260,7 @@ test = ["uu_test"]
 [workspace.dependencies]
 bigdecimal = "0.4"
 binary-heap-plus = "0.5.0"
-bstr = "1.8"
+bstr = "1.9"
 bytecount = "0.6.7"
 byteorder = "1.5.0"
 chrono = { version = "^0.4.31", default-features = false, features = [

From 702561932517267ea664e69eb8ac8527bb2d56c1 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Fri, 29 Dec 2023 10:24:08 +0100
Subject: [PATCH 294/429] cp: adapt warning if source is used more than once

---
 src/uu/cp/src/cp.rs      | 2 +-
 tests/by-util/test_cp.rs | 4 +++-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index 97afdee1e0f..30cb3f59ffe 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -1193,7 +1193,7 @@ pub fn copy(sources: &[PathBuf], target: &Path, options: &Options) -> CopyResult
     for source in sources {
         if seen_sources.contains(source) {
             // FIXME: compare sources by the actual file they point to, not their path. (e.g. dir/file == dir/../dir/file in most cases)
-            show_warning!("source {} specified more than once", source.quote());
+            show_warning!("source file {} specified more than once", source.quote());
         } else {
             let dest = construct_dest_path(source, target, target_type, options)
                 .unwrap_or_else(|_| target.to_path_buf());
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index 2636df28a3b..38d7e815dee 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -111,7 +111,9 @@ fn test_cp_duplicate_files() {
         .arg(TEST_HELLO_WORLD_SOURCE)
         .arg(TEST_COPY_TO_FOLDER)
         .succeeds()
-        .stderr_contains("specified more than once");
+        .stderr_contains(format!(
+            "source file '{TEST_HELLO_WORLD_SOURCE}' specified more than once"
+        ));
     assert_eq!(at.read(TEST_COPY_TO_FOLDER_FILE), "Hello, World!\n");
 }
 

From ce28ae5c02f1f2d30c549b92fb4a7220c761109b Mon Sep 17 00:00:00 2001
From: Alexandru-Constantin Atomei <atomeialexandru03@gmail.com>
Date: Thu, 28 Dec 2023 17:06:58 +0200
Subject: [PATCH 295/429] Fixed more and test docs

---
 src/uu/more/more.md | 2 +-
 src/uu/test/test.md | 3 ++-
 2 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/src/uu/more/more.md b/src/uu/more/more.md
index cb626060ec5..e63ca1a87fb 100644
--- a/src/uu/more/more.md
+++ b/src/uu/more/more.md
@@ -1,7 +1,7 @@
 # more
 
 ```
-more [OPTIONS] <FILE>...
+more [OPTIONS] FILE...
 ```
 
 Display the contents of a text file
diff --git a/src/uu/test/test.md b/src/uu/test/test.md
index e67eb1824ab..b198c220b24 100644
--- a/src/uu/test/test.md
+++ b/src/uu/test/test.md
@@ -2,10 +2,11 @@
 
 ```
 test EXPRESSION
-test
+[
 [ EXPRESSION ]
 [ ]
 [ OPTION
+]
 ```
 
 Check file types and compare values.

From e61318413e6cdf2c4c2c94be50870fdf1adc9866 Mon Sep 17 00:00:00 2001
From: Alexandru-Constantin Atomei <atomeialexandru03@gmail.com>
Date: Fri, 29 Dec 2023 14:51:23 +0200
Subject: [PATCH 296/429] Added documentation for the vdir command.

---
 src/uu/vdir/vdir.md | 10 ++++++++++
 1 file changed, 10 insertions(+)
 create mode 100644 src/uu/vdir/vdir.md

diff --git a/src/uu/vdir/vdir.md b/src/uu/vdir/vdir.md
new file mode 100644
index 00000000000..b2295339731
--- /dev/null
+++ b/src/uu/vdir/vdir.md
@@ -0,0 +1,10 @@
+# vdir
+
+```
+vdir [OPTION]... [FILE]...
+```
+
+List directory contents.
+Ignore files and directories starting with a '.' by default
+
+Mandatory  arguments  to  long  options are mandatory for short options too.

From 1e5244765dd48ba02715b22673e0aa6c271e2919 Mon Sep 17 00:00:00 2001
From: Alexandru-Constantin Atomei <atomeialexandru03@gmail.com>
Date: Fri, 29 Dec 2023 15:07:55 +0200
Subject: [PATCH 297/429] Made one more modification to test usage string.

---
 src/uu/test/src/test.rs | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/src/uu/test/src/test.rs b/src/uu/test/src/test.rs
index a0d0f339592..9d3c2b29031 100644
--- a/src/uu/test/src/test.rs
+++ b/src/uu/test/src/test.rs
@@ -29,10 +29,11 @@ const ABOUT: &str = help_about!("test.md");
 // So, we use test or [ instead of {} so that the usage string is correct.
 const USAGE: &str = "\
 test EXPRESSION
-test
+[
 [ EXPRESSION ]
 [ ]
-[ OPTION";
+[ OPTION
+]";
 
 // We use after_help so that this comes after the usage string (it would come before if we used about)
 const AFTER_HELP: &str = help_section!("after help", "test.md");

From d15981650a1298834284ea8269c6b51d5c32d3eb Mon Sep 17 00:00:00 2001
From: Alexandru-Constantin Atomei <atomeialexandru03@gmail.com>
Date: Fri, 29 Dec 2023 15:35:23 +0200
Subject: [PATCH 298/429] Fixed one typo

---
 src/uu/vdir/vdir.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/vdir/vdir.md b/src/uu/vdir/vdir.md
index b2295339731..ca3e1c5ce93 100644
--- a/src/uu/vdir/vdir.md
+++ b/src/uu/vdir/vdir.md
@@ -5,6 +5,6 @@ vdir [OPTION]... [FILE]...
 ```
 
 List directory contents.
-Ignore files and directories starting with a '.' by default
+Ignore files and directories starting with a '.' by default.
 
 Mandatory  arguments  to  long  options are mandatory for short options too.

From 21d09dd404075bbd719566eb01e1f377b999bb68 Mon Sep 17 00:00:00 2001
From: Matei Mantu <66641453+mtimaN@users.noreply.github.com>
Date: Fri, 29 Dec 2023 16:19:26 +0200
Subject: [PATCH 299/429] ls: unquoted names should be indented with a space if
 there is a quoted name (#5740)

* ls: change indentation when file names include quotes to match GNU's

* display_grid: Changed order of parameters because it made more sense

* ls -l: Add padding for unquoted filenames

* Fix checking for quoted filenames

* Simplify if
---
 src/uu/ls/src/ls.rs | 45 +++++++++++++++++++++++++++++++++++++++------
 1 file changed, 39 insertions(+), 6 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index a6ed73da324..952083d2ab1 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -2414,6 +2414,11 @@ fn display_items(
     // Display the SELinux security context or '?' if none is found. When used with the `-l`
     // option, print the security context to the left of the size column.
 
+    let quoted = items.iter().any(|item| {
+        let name = escape_name(&item.display_name, &config.quoting_style);
+        name.starts_with('\'')
+    });
+
     if config.format == Format::Long {
         let padding_collection = calculate_padding_collection(items, config, out);
 
@@ -2431,7 +2436,15 @@ fn display_items(
                     display_additional_leading_info(item, &padding_collection, config, out)?;
                 write!(out, "{more_info}")?;
             }
-            display_item_long(item, &padding_collection, config, out, dired, style_manager)?;
+            display_item_long(
+                item,
+                &padding_collection,
+                config,
+                out,
+                dired,
+                style_manager,
+                quoted,
+            )?;
         }
     } else {
         let mut longest_context_len = 1;
@@ -2448,7 +2461,6 @@ fn display_items(
         let padding = calculate_padding_collection(items, config, out);
 
         let mut names_vec = Vec::new();
-
         for i in items {
             let more_info = display_additional_leading_info(i, &padding, config, out)?;
             let cell = display_item_name(i, config, prefix_context, more_info, out, style_manager);
@@ -2458,8 +2470,12 @@ fn display_items(
         let names = names_vec.into_iter();
 
         match config.format {
-            Format::Columns => display_grid(names, config.width, Direction::TopToBottom, out)?,
-            Format::Across => display_grid(names, config.width, Direction::LeftToRight, out)?,
+            Format::Columns => {
+                display_grid(names, config.width, Direction::TopToBottom, out, quoted)?;
+            }
+            Format::Across => {
+                display_grid(names, config.width, Direction::LeftToRight, out, quoted)?;
+            }
             Format::Commas => {
                 let mut current_col = 0;
                 let mut names = names;
@@ -2524,6 +2540,7 @@ fn display_grid(
     width: u16,
     direction: Direction,
     out: &mut BufWriter<Stdout>,
+    quoted: bool,
 ) -> UResult<()> {
     if width == 0 {
         // If the width is 0 we print one single line
@@ -2545,7 +2562,15 @@ fn display_grid(
         let mut grid = Grid::new(GridOptions { filling, direction });
 
         for name in names {
-            grid.add(name);
+            let formatted_name = Cell {
+                contents: if quoted && !name.contents.starts_with('\'') {
+                    format!(" {}", name.contents)
+                } else {
+                    name.contents
+                },
+                width: name.width,
+            };
+            grid.add(formatted_name);
         }
 
         match grid.fit_into_width(width as usize) {
@@ -2597,6 +2622,7 @@ fn display_item_long(
     out: &mut BufWriter<Stdout>,
     dired: &mut DiredOutput,
     style_manager: &mut StyleManager,
+    quoted: bool,
 ) -> UResult<()> {
     let mut output_display: String = String::new();
     if config.dired {
@@ -2689,8 +2715,15 @@ fn display_item_long(
 
         write!(output_display, " {} ", display_date(md, config)).unwrap();
 
-        let displayed_item =
+        let item_name =
             display_item_name(item, config, None, String::new(), out, style_manager).contents;
+
+        let displayed_item = if quoted && !item_name.starts_with('\'') {
+            format!(" {}", item_name)
+        } else {
+            item_name
+        };
+
         if config.dired {
             let (start, end) = dired::calculate_dired(
                 &dired.dired_positions,

From 231987b10956ed775749d7609c0e607858e162df Mon Sep 17 00:00:00 2001
From: Vardhan Patil <hi@vardhanpatil.com>
Date: Sat, 30 Dec 2023 12:48:19 +0530
Subject: [PATCH 300/429] cksum: create initial implementation of the --length
 option

---
 src/uu/cksum/src/cksum.rs | 56 ++++++++++++++++++++++++++++++++++++---
 1 file changed, 52 insertions(+), 4 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index 24576040937..8e6f4f3af7c 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -4,7 +4,7 @@
 // file that was distributed with this source code.
 
 // spell-checker:ignore (ToDO) fname, algo
-use clap::{crate_version, Arg, ArgAction, Command};
+use clap::{crate_version, value_parser, Arg, ArgAction, Command};
 use hex::encode;
 use std::ffi::OsStr;
 use std::fs::File;
@@ -36,7 +36,12 @@ const ALGORITHM_OPTIONS_SHA512: &str = "sha512";
 const ALGORITHM_OPTIONS_BLAKE2B: &str = "blake2b";
 const ALGORITHM_OPTIONS_SM3: &str = "sm3";
 
-fn detect_algo(program: &str) -> (&'static str, Box<dyn Digest + 'static>, usize) {
+// enum CksumError
+
+fn detect_algo(
+    program: &str,
+    length: Option<usize>,
+) -> (&'static str, Box<dyn Digest + 'static>, usize) {
     match program {
         ALGORITHM_OPTIONS_SYSV => (
             ALGORITHM_OPTIONS_SYSV,
@@ -85,7 +90,11 @@ fn detect_algo(program: &str) -> (&'static str, Box<dyn Digest + 'static>, usize
         ),
         ALGORITHM_OPTIONS_BLAKE2B => (
             ALGORITHM_OPTIONS_BLAKE2B,
-            Box::new(Blake2b::new()) as Box<dyn Digest>,
+            Box::new(if let Some(length) = length {
+                Blake2b::with_output_bytes(length)
+            } else {
+                Blake2b::new()
+            }) as Box<dyn Digest>,
             512,
         ),
         ALGORITHM_OPTIONS_SM3 => (
@@ -115,6 +124,10 @@ fn cksum<'a, I>(mut options: Options, files: I) -> UResult<()>
 where
     I: Iterator<Item = &'a OsStr>,
 {
+    // if options.length != None && options.algo_name != ALGORITHM_OPTIONS_BLAKE2B {
+    //     return UError;
+    // }
+
     for filename in files {
         let filename = Path::new(filename);
         let stdin_buf;
@@ -217,6 +230,7 @@ mod options {
     pub const ALGORITHM: &str = "algorithm";
     pub const FILE: &str = "file";
     pub const UNTAGGED: &str = "untagged";
+    pub const LENGTH: &str = "length";
 }
 
 #[uucore::main]
@@ -228,7 +242,33 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         None => ALGORITHM_OPTIONS_CRC,
     };
 
-    let (name, algo, bits) = detect_algo(algo_name);
+    let input_length = matches.get_one::<usize>(options::LENGTH);
+    let length = if let Some(length) = input_length {
+        if algo_name != ALGORITHM_OPTIONS_BLAKE2B {
+            return Err(io::Error::new(
+                io::ErrorKind::InvalidInput,
+                "--length is only supported with --algorithm=blake2b",
+            )
+            .into());
+        }
+
+        if length % 8 != 0 {
+            return Err(io::Error::new(
+                io::ErrorKind::InvalidInput,
+                // TODO: Fix formatting for this error message
+                // GNU has the executable path/name on both lines
+                format!("invalid length {length}\nlength is not a multiple of 8"),
+            )
+            .into());
+        }
+
+        Some(length / 8)
+    } else {
+        None
+    };
+
+    let (name, algo, bits) = detect_algo(algo_name, length);
+
     let opts = Options {
         algo_name: name,
         digest: algo,
@@ -282,5 +322,13 @@ pub fn uu_app() -> Command {
                 .help("create a reversed style checksum, without digest type")
                 .action(ArgAction::SetTrue),
         )
+        .arg(
+            Arg::new(options::LENGTH)
+                .long(options::LENGTH)
+                .value_parser(value_parser!(usize))
+                .short('l')
+                .help("digest length in bits; must not exceed the max for the blake2 algorithm and must be a multiple of 8")
+                .action(ArgAction::Set),
+        )
         .after_help(AFTER_HELP)
 }

From 138b11efbdc6c34144376ec3f92d6de5eddef634 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 30 Dec 2023 09:53:32 +0100
Subject: [PATCH 301/429] remove extra spaces

---
 src/uu/vdir/vdir.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/vdir/vdir.md b/src/uu/vdir/vdir.md
index ca3e1c5ce93..c7a0cae3643 100644
--- a/src/uu/vdir/vdir.md
+++ b/src/uu/vdir/vdir.md
@@ -7,4 +7,4 @@ vdir [OPTION]... [FILE]...
 List directory contents.
 Ignore files and directories starting with a '.' by default.
 
-Mandatory  arguments  to  long  options are mandatory for short options too.
+Mandatory arguments to long options are mandatory for short options too.

From 037073d852c1af1100d1931418fd921fcf2073b5 Mon Sep 17 00:00:00 2001
From: Vardhan Patil <hi@vardhanpatil.com>
Date: Sat, 30 Dec 2023 15:59:29 +0530
Subject: [PATCH 302/429] cksum: make the output formatting match GNU

---
 src/uu/cksum/src/cksum.rs | 37 ++++++++++++++++++++++++-------------
 1 file changed, 24 insertions(+), 13 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index 8e6f4f3af7c..ed9f3573f90 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -111,6 +111,7 @@ struct Options {
     digest: Box<dyn Digest + 'static>,
     output_bits: usize,
     untagged: bool,
+    length: Option<usize>,
 }
 
 /// Calculate checksum
@@ -174,7 +175,12 @@ where
             (ALGORITHM_OPTIONS_CRC, true) => println!("{sum} {sz}"),
             (ALGORITHM_OPTIONS_CRC, false) => println!("{sum} {sz} {}", filename.display()),
             (ALGORITHM_OPTIONS_BLAKE2B, _) if !options.untagged => {
-                println!("BLAKE2b ({}) = {sum}", filename.display());
+                if let Some(length) = options.length {
+                    // Multiply by 8 here, as we want to print the length in bits.
+                    println!("BLAKE2b-{} ({}) = {sum}", length * 8, filename.display());
+                } else {
+                    println!("BLAKE2b ({}) = {sum}", filename.display());
+                }
             }
             _ => {
                 if options.untagged {
@@ -244,24 +250,28 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     let input_length = matches.get_one::<usize>(options::LENGTH);
     let length = if let Some(length) = input_length {
-        if algo_name != ALGORITHM_OPTIONS_BLAKE2B {
-            return Err(io::Error::new(
-                io::ErrorKind::InvalidInput,
-                "--length is only supported with --algorithm=blake2b",
-            )
-            .into());
-        }
-
+        
         if length % 8 != 0 {
+            // GNU's implementation seem to use these quotation marks
+            // in their error messages, so we do the same.
+            uucore::show_error!("invalid length: \u{2018}{length}\u{2019}");
             return Err(io::Error::new(
                 io::ErrorKind::InvalidInput,
-                // TODO: Fix formatting for this error message
-                // GNU has the executable path/name on both lines
-                format!("invalid length {length}\nlength is not a multiple of 8"),
+                "length is not a multiple of 8",
             )
             .into());
-        }
+    }
+
+    if algo_name != ALGORITHM_OPTIONS_BLAKE2B {
+        return Err(io::Error::new(
+            io::ErrorKind::InvalidInput,
+            "--length is only supported with --algorithm=blake2b",
+        )
+        .into());
+    }
 
+        // Divide by 8, as our blake2b implementation expects bytes
+        // instead of bits.
         Some(length / 8)
     } else {
         None
@@ -273,6 +283,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         algo_name: name,
         digest: algo,
         output_bits: bits,
+        length,
         untagged: matches.get_flag(options::UNTAGGED),
     };
 

From 09ef150085f34b5e260b6a75d15e8da4a9721681 Mon Sep 17 00:00:00 2001
From: Vardhan Patil <hi@vardhanpatil.com>
Date: Sat, 30 Dec 2023 16:01:22 +0530
Subject: [PATCH 303/429] tests/cksum: add tests for the length argument

---
 tests/by-util/test_cksum.rs                   | 34 +++++++++++++++++++
 .../fixtures/cksum/supported_length.expected  |  2 ++
 .../cksum/unsupported_length.expected         |  2 ++
 3 files changed, 38 insertions(+)
 create mode 100644 tests/fixtures/cksum/supported_length.expected
 create mode 100644 tests/fixtures/cksum/unsupported_length.expected

diff --git a/tests/by-util/test_cksum.rs b/tests/by-util/test_cksum.rs
index a9d9b272b4c..dbf7264e813 100644
--- a/tests/by-util/test_cksum.rs
+++ b/tests/by-util/test_cksum.rs
@@ -228,3 +228,37 @@ fn test_untagged_algorithm_stdin() {
             .stdout_is_fixture(format!("untagged/{algo}_stdin.expected"));
     }
 }
+
+#[test]
+fn test_length_with_wrong_algorithm() {
+    new_ucmd!()
+        .arg("--length=16")
+        .arg("--algorithm=md5")
+        .arg("lorem_ipsum.txt")
+        .fails()
+        .no_stdout()
+        .stderr_contains("cksum: --length is only supported with --algorithm=blake2b")
+        .code_is(1);
+}
+
+#[test]
+fn test_length_not_supported() {
+    new_ucmd!()
+        .arg("--length=15")
+        .arg("lorem_ipsum.txt")
+        .fails()
+        .no_stdout()
+        .stderr_is_fixture("unsupported_length.expected")
+        .code_is(1);
+}
+
+#[test]
+fn test_length() {
+    new_ucmd!()
+        .arg("--length=16")
+        .arg("--algorithm=blake2b")
+        .arg("lorem_ipsum.txt")
+        .arg("alice_in_wonderland.txt")
+        .succeeds()
+        .stdout_is_fixture("supported_length.expected");
+}
diff --git a/tests/fixtures/cksum/supported_length.expected b/tests/fixtures/cksum/supported_length.expected
new file mode 100644
index 00000000000..a2edb23e9ee
--- /dev/null
+++ b/tests/fixtures/cksum/supported_length.expected
@@ -0,0 +1,2 @@
+BLAKE2b-16 (lorem_ipsum.txt) = 7e2f
+BLAKE2b-16 (alice_in_wonderland.txt) = a546
diff --git a/tests/fixtures/cksum/unsupported_length.expected b/tests/fixtures/cksum/unsupported_length.expected
new file mode 100644
index 00000000000..c2a05fec7be
--- /dev/null
+++ b/tests/fixtures/cksum/unsupported_length.expected
@@ -0,0 +1,2 @@
+cksum: invalid length: ‘15’
+cksum: length is not a multiple of 8

From 7caa0bcdea3dcee68d954c19f4a4961a61843571 Mon Sep 17 00:00:00 2001
From: Vardhan Patil <hi@vardhanpatil.com>
Date: Sat, 30 Dec 2023 16:02:10 +0530
Subject: [PATCH 304/429] cksum: fix formatting in cksum.rs

---
 src/uu/cksum/src/cksum.rs | 17 ++++++++---------
 1 file changed, 8 insertions(+), 9 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index ed9f3573f90..2a4b539f9b8 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -250,7 +250,6 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     let input_length = matches.get_one::<usize>(options::LENGTH);
     let length = if let Some(length) = input_length {
-        
         if length % 8 != 0 {
             // GNU's implementation seem to use these quotation marks
             // in their error messages, so we do the same.
@@ -260,15 +259,15 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
                 "length is not a multiple of 8",
             )
             .into());
-    }
+        }
 
-    if algo_name != ALGORITHM_OPTIONS_BLAKE2B {
-        return Err(io::Error::new(
-            io::ErrorKind::InvalidInput,
-            "--length is only supported with --algorithm=blake2b",
-        )
-        .into());
-    }
+        if algo_name != ALGORITHM_OPTIONS_BLAKE2B {
+            return Err(io::Error::new(
+                io::ErrorKind::InvalidInput,
+                "--length is only supported with --algorithm=blake2b",
+            )
+            .into());
+        }
 
         // Divide by 8, as our blake2b implementation expects bytes
         // instead of bits.

From aec0cfa6e3e0939c578835c5a526f81d4cea9cf6 Mon Sep 17 00:00:00 2001
From: Vardhan Patil <hi@vardhanpatil.com>
Date: Sat, 30 Dec 2023 16:05:20 +0530
Subject: [PATCH 305/429] cksum: remove commented code

---
 src/uu/cksum/src/cksum.rs | 6 ------
 1 file changed, 6 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index 2a4b539f9b8..029aff9987e 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -36,8 +36,6 @@ const ALGORITHM_OPTIONS_SHA512: &str = "sha512";
 const ALGORITHM_OPTIONS_BLAKE2B: &str = "blake2b";
 const ALGORITHM_OPTIONS_SM3: &str = "sm3";
 
-// enum CksumError
-
 fn detect_algo(
     program: &str,
     length: Option<usize>,
@@ -125,10 +123,6 @@ fn cksum<'a, I>(mut options: Options, files: I) -> UResult<()>
 where
     I: Iterator<Item = &'a OsStr>,
 {
-    // if options.length != None && options.algo_name != ALGORITHM_OPTIONS_BLAKE2B {
-    //     return UError;
-    // }
-
     for filename in files {
         let filename = Path::new(filename);
         let stdin_buf;

From e1863ac64e0bb501be8dc7ef3cd0f6c565e33d35 Mon Sep 17 00:00:00 2001
From: Vardhan Patil <hi@vardhanpatil.com>
Date: Sat, 30 Dec 2023 20:14:30 +0530
Subject: [PATCH 306/429] tests/cksum: test when the --length argument is 0 or
 >512

---
 tests/by-util/test_cksum.rs                   | 24 +++++++++++++++++++
 tests/fixtures/cksum/length_is_zero.expected  |  2 ++
 .../cksum/length_larger_than_512.expected     |  2 ++
 3 files changed, 28 insertions(+)
 create mode 100644 tests/fixtures/cksum/length_is_zero.expected
 create mode 100644 tests/fixtures/cksum/length_larger_than_512.expected

diff --git a/tests/by-util/test_cksum.rs b/tests/by-util/test_cksum.rs
index dbf7264e813..0e1aec38dec 100644
--- a/tests/by-util/test_cksum.rs
+++ b/tests/by-util/test_cksum.rs
@@ -262,3 +262,27 @@ fn test_length() {
         .succeeds()
         .stdout_is_fixture("supported_length.expected");
 }
+
+#[test]
+fn test_length_greater_than_512() {
+    new_ucmd!()
+        .arg("--length=1024")
+        .arg("--algorithm=blake2b")
+        .arg("lorem_ipsum.txt")
+        .arg("alice_in_wonderland.txt")
+        .fails()
+        .no_stdout()
+        .stderr_is_fixture("length_larger_than_512.expected");
+}
+
+#[test]
+fn test_length_is_zero() {
+    new_ucmd!()
+        .arg("--length=0")
+        .arg("--algorithm=blake2b")
+        .arg("lorem_ipsum.txt")
+        .arg("alice_in_wonderland.txt")
+        .succeeds()
+        .no_stderr()
+        .stdout_is_fixture("length_is_zero.expected");
+}
\ No newline at end of file
diff --git a/tests/fixtures/cksum/length_is_zero.expected b/tests/fixtures/cksum/length_is_zero.expected
new file mode 100644
index 00000000000..97d06eb6fea
--- /dev/null
+++ b/tests/fixtures/cksum/length_is_zero.expected
@@ -0,0 +1,2 @@
+BLAKE2b (lorem_ipsum.txt) = 0e97a09189e560c3789c0bff1f020166861ef857d1fbfe4574de1842e3c06cabb9575e4af6309a166158c2b408d3c038c1b49d828b35158142cdc0396d1195c3
+BLAKE2b (alice_in_wonderland.txt) = 91b8b0f0868e905ad18b8ac35e4a1dacd289857b19258ab5d1e071761af758b0134ec152d4f011fe1825ca889c80c2e072ca70eb50548c25fc49a98937515af4
diff --git a/tests/fixtures/cksum/length_larger_than_512.expected b/tests/fixtures/cksum/length_larger_than_512.expected
new file mode 100644
index 00000000000..312b6230e9a
--- /dev/null
+++ b/tests/fixtures/cksum/length_larger_than_512.expected
@@ -0,0 +1,2 @@
+cksum: invalid length: ‘1024’
+cksum: maximum digest length for ‘BLAKE2b’ is 512 bits

From e7cb4e9ff0e685a14f10323fc5f0a0fff8f1b889 Mon Sep 17 00:00:00 2001
From: Vardhan Patil <hi@vardhanpatil.com>
Date: Sat, 30 Dec 2023 20:28:03 +0530
Subject: [PATCH 307/429] cksum: properly handle cases where --lenghth is 0 or
 >512

---
 src/uu/cksum/src/cksum.rs | 53 ++++++++++++++++++++++++---------------
 1 file changed, 33 insertions(+), 20 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index 029aff9987e..5e21b387643 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -244,28 +244,41 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     let input_length = matches.get_one::<usize>(options::LENGTH);
     let length = if let Some(length) = input_length {
-        if length % 8 != 0 {
-            // GNU's implementation seem to use these quotation marks
-            // in their error messages, so we do the same.
-            uucore::show_error!("invalid length: \u{2018}{length}\u{2019}");
-            return Err(io::Error::new(
-                io::ErrorKind::InvalidInput,
-                "length is not a multiple of 8",
-            )
-            .into());
-        }
+        match length.to_owned() {
+            n if n == 0 => None,
+            n if n % 8 != 0 => {
+                // GNU's implementation seem to use these quotation marks
+                // in their error messages, so we do the same.
+                uucore::show_error!("invalid length: \u{2018}{length}\u{2019}");
+                return Err(io::Error::new(
+                    io::ErrorKind::InvalidInput,
+                    "length is not a multiple of 8",
+                )
+                .into());
+            }
+            n if n > 512 => {
+                uucore::show_error!("invalid length: \u{2018}{length}\u{2019}");
 
-        if algo_name != ALGORITHM_OPTIONS_BLAKE2B {
-            return Err(io::Error::new(
-                io::ErrorKind::InvalidInput,
-                "--length is only supported with --algorithm=blake2b",
-            )
-            .into());
-        }
+                return Err(io::Error::new(
+                    io::ErrorKind::InvalidInput,
+                    "maximum digest length for \u{2018}BLAKE2b\u{2019} is 512 bits",
+                )
+                .into());
+            }
+            n => {
+                if algo_name != ALGORITHM_OPTIONS_BLAKE2B {
+                    return Err(io::Error::new(
+                        io::ErrorKind::InvalidInput,
+                        "--length is only supported with --algorithm=blake2b",
+                    )
+                    .into());
+                }
 
-        // Divide by 8, as our blake2b implementation expects bytes
-        // instead of bits.
-        Some(length / 8)
+                // Divide by 8, as our blake2b implementation expects bytes
+                // instead of bits.
+                Some(n / 8)
+            }
+        }
     } else {
         None
     };

From 1fc6a760f3e31f80c8eef080a21ae4f073a8e242 Mon Sep 17 00:00:00 2001
From: Vardhan Patil <hi@vardhanpatil.com>
Date: Sat, 30 Dec 2023 20:31:52 +0530
Subject: [PATCH 308/429] tests/cksum: fix formatting

---
 tests/by-util/test_cksum.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/by-util/test_cksum.rs b/tests/by-util/test_cksum.rs
index 0e1aec38dec..00c768164d5 100644
--- a/tests/by-util/test_cksum.rs
+++ b/tests/by-util/test_cksum.rs
@@ -285,4 +285,4 @@ fn test_length_is_zero() {
         .succeeds()
         .no_stderr()
         .stdout_is_fixture("length_is_zero.expected");
-}
\ No newline at end of file
+}

From d99002157208a3514ab0df3fb4411ceeec32d5e4 Mon Sep 17 00:00:00 2001
From: Vardhan Patil <hi@vardhanpatil.com>
Date: Sat, 30 Dec 2023 20:39:09 +0530
Subject: [PATCH 309/429] cksum: remove redundant guard

---
 src/uu/cksum/src/cksum.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index 5e21b387643..e8d7da60e41 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -245,7 +245,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let input_length = matches.get_one::<usize>(options::LENGTH);
     let length = if let Some(length) = input_length {
         match length.to_owned() {
-            n if n == 0 => None,
+            0 => None,
             n if n % 8 != 0 => {
                 // GNU's implementation seem to use these quotation marks
                 // in their error messages, so we do the same.

From 193bcf86b7c541663e4496b80b54b0ed8f3d8e23 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 30 Dec 2023 17:00:44 +0100
Subject: [PATCH 310/429] cp: Disable a test failing on freebsd

---
 tests/by-util/test_cp.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index 38d7e815dee..a1638584b8c 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -481,7 +481,7 @@ fn test_cp_arg_interactive() {
 }
 
 #[test]
-#[cfg(not(target_os = "android"))]
+#[cfg(not(any(target_os = "android", target_os = "freebsd")))]
 fn test_cp_arg_interactive_update() {
     // -u -i won't show the prompt to validate the override or not
     // Therefore, the error code will be 0

From b07ea957d326386337550bcefb10dbaabaa94696 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 31 Dec 2023 12:03:42 +0100
Subject: [PATCH 311/429] rm: improve the code a tiny bit

---
 src/uu/rm/src/rm.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/rm/src/rm.rs b/src/uu/rm/src/rm.rs
index 4fc37a1300f..a89ba6db67f 100644
--- a/src/uu/rm/src/rm.rs
+++ b/src/uu/rm/src/rm.rs
@@ -334,7 +334,7 @@ fn handle_dir(path: &Path, options: &Options) -> bool {
                 // remove_dir_all failed. maybe it is because of the permissions
                 // but if the directory is empty, remove_dir might work.
                 // So, let's try that before failing for real
-                if let Err(_e) = fs::remove_dir(path) {
+                if fs::remove_dir(path).is_err() {
                     had_err = true;
                     if e.kind() == std::io::ErrorKind::PermissionDenied {
                         // GNU compatibility (rm/fail-eacces.sh)

From f23902ff7a185f34d9a84218f129d1aba4bca041 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 31 Dec 2023 13:07:27 +0100
Subject: [PATCH 312/429] gnu-built: remove the useless sed

It will avoid a rebuilding when doing:
bash util/build-gnu.sh && bash util/run-gnu-test.sh   ../gnu/tests/rm/empty-inacc.sh
---
 util/build-gnu.sh | 2 --
 1 file changed, 2 deletions(-)

diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 8a45e0a8d6e..19ef4792c6b 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -102,8 +102,6 @@ for binary in $(./build-aux/gen-lists-of-programs.sh --list-progs); do
 done
 
 if test -f gnu-built; then
-    # Change the PATH in the Makefile to test the uutils coreutils instead of the GNU coreutils
-    sed -i "s/^[[:blank:]]*PATH=.*/  PATH='${UU_BUILD_DIR//\//\\/}\$(PATH_SEPARATOR)'\"\$\$PATH\" \\\/" Makefile
     echo "GNU build already found. Skip"
     echo "'rm -f $(pwd)/gnu-built' to force the build"
     echo "Note: the customization of the tests will still happen"

From 3560ec68119ebfc1f24d17bd64387b778dbd16f9 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 31 Dec 2023 13:07:47 +0100
Subject: [PATCH 313/429] gnu-built: disable some options in the GNU build

---
 util/build-gnu.sh | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 19ef4792c6b..8ade25e8874 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -107,7 +107,7 @@ if test -f gnu-built; then
     echo "Note: the customization of the tests will still happen"
 else
     ./bootstrap --skip-po
-    ./configure --quiet --disable-gcc-warnings
+    ./configure --quiet --disable-gcc-warnings --disable-nls --disable-dependency-tracking --disable-bold-man-page-references
     #Add timeout to to protect against hangs
     sed -i 's|^"\$@|'"${SYSTEM_TIMEOUT}"' 600 "\$@|' build-aux/test-driver
     # Change the PATH in the Makefile to test the uutils coreutils instead of the GNU coreutils

From 2c42623b6e3bf4e53d3aae3034d75351d63b6712 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Thu, 28 Dec 2023 10:59:33 +0100
Subject: [PATCH 314/429] cp: backup dest symlink linking to source

---
 src/uu/cp/src/cp.rs      |  1 +
 tests/by-util/test_cp.rs | 19 +++++++++++++++++++
 2 files changed, 20 insertions(+)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index 30cb3f59ffe..a5fb66d2926 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -1521,6 +1521,7 @@ fn is_forbidden_copy_to_same_file(
         options.dereference(source_in_command_line) || !source.is_symlink();
     paths_refer_to_same_file(source, dest, dereference_to_compare)
         && !(options.force() && options.backup != BackupMode::NoBackup)
+        && !(dest.is_symlink() && options.backup != BackupMode::NoBackup)
 }
 
 /// Back up, remove, or leave intact the destination file, depending on the options.
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index a1638584b8c..63cfa2155fa 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -701,6 +701,25 @@ fn test_cp_arg_backup_with_dest_a_symlink() {
     assert_eq!(original, at.resolve_link(backup));
 }
 
+#[test]
+fn test_cp_arg_backup_with_dest_a_symlink_to_source() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    let source = "source";
+    let source_content = "content";
+    let symlink = "symlink";
+    let backup = "symlink~";
+
+    at.write(source, source_content);
+    at.symlink_file(source, symlink);
+
+    ucmd.arg("-b").arg(source).arg(symlink).succeeds();
+
+    assert!(!at.symlink_exists(symlink));
+    assert_eq!(source_content, at.read(symlink));
+    assert!(at.symlink_exists(backup));
+    assert_eq!(source, at.resolve_link(backup));
+}
+
 #[test]
 fn test_cp_arg_backup_with_other_args() {
     let (at, mut ucmd) = at_and_ucmd!();

From 902a128ea8a3cce5b520afef3c7c357728b93a97 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sun, 31 Dec 2023 14:17:16 +0100
Subject: [PATCH 315/429] cp: rename function

 is_forbidden_copy_to_same_file -> is_forbidden_to_copy_to_same_file
---
 src/uu/cp/src/cp.rs | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index a5fb66d2926..91507f31958 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -1509,7 +1509,7 @@ fn backup_dest(dest: &Path, backup_path: &Path) -> CopyResult<PathBuf> {
 ///
 /// Copying to the same file is only allowed if both `--backup` and
 /// `--force` are specified and the file is a regular file.
-fn is_forbidden_copy_to_same_file(
+fn is_forbidden_to_copy_to_same_file(
     source: &Path,
     dest: &Path,
     options: &Options,
@@ -1533,7 +1533,7 @@ fn handle_existing_dest(
 ) -> CopyResult<()> {
     // Disallow copying a file to itself, unless `--force` and
     // `--backup` are both specified.
-    if is_forbidden_copy_to_same_file(source, dest, options, source_in_command_line) {
+    if is_forbidden_to_copy_to_same_file(source, dest, options, source_in_command_line) {
         return Err(format!("{} and {} are the same file", source.quote(), dest.quote()).into());
     }
 

From 5673f32c6305e9545ac4e1e8e0ebdf3050f300f7 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sun, 31 Dec 2023 16:01:34 +0100
Subject: [PATCH 316/429] cp: show error if source & dest are same file

---
 src/uu/cp/src/cp.rs      |  1 +
 tests/by-util/test_cp.rs | 14 ++++++++++++++
 2 files changed, 15 insertions(+)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index 30cb3f59ffe..332bb578512 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -1713,6 +1713,7 @@ fn copy_file(
         if are_hardlinks_to_same_file(source, dest)
             && !options.force()
             && options.backup == BackupMode::NoBackup
+            && source != dest
         {
             return Ok(());
         }
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index a1638584b8c..d166243ed6e 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -117,6 +117,20 @@ fn test_cp_duplicate_files() {
     assert_eq!(at.read(TEST_COPY_TO_FOLDER_FILE), "Hello, World!\n");
 }
 
+#[test]
+fn test_cp_same_file() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    let file = "a";
+
+    at.touch(file);
+
+    ucmd.arg(file)
+        .arg(file)
+        .fails()
+        .code_is(1)
+        .stderr_contains(format!("'{file}' and '{file}' are the same file"));
+}
+
 #[test]
 fn test_cp_multiple_files_target_is_file() {
     new_ucmd!()

From cdd3492532a108b4e2ca518c44ea755ee49529e4 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 31 Dec 2023 16:28:21 +0100
Subject: [PATCH 317/429] fuzz: use thread to bypass the limitation of output

Closes: #5724

many thanks to @samueltardieu
---
 fuzz/fuzz_targets/fuzz_common.rs | 46 ++++++++++++++++----------------
 1 file changed, 23 insertions(+), 23 deletions(-)

diff --git a/fuzz/fuzz_targets/fuzz_common.rs b/fuzz/fuzz_targets/fuzz_common.rs
index 11b75a2fa09..2a6cbdfded8 100644
--- a/fuzz/fuzz_targets/fuzz_common.rs
+++ b/fuzz/fuzz_targets/fuzz_common.rs
@@ -8,12 +8,12 @@ use libc::{close, dup, dup2, pipe, STDERR_FILENO, STDOUT_FILENO};
 use rand::prelude::SliceRandom;
 use rand::Rng;
 use std::ffi::OsString;
-use std::io;
 use std::io::{Seek, SeekFrom, Write};
 use std::os::fd::{AsRawFd, RawFd};
 use std::process::{Command, Stdio};
 use std::sync::atomic::Ordering;
 use std::sync::{atomic::AtomicBool, Once};
+use std::{io, thread};
 
 /// Represents the result of running a command, including its standard output,
 /// standard error, and exit code.
@@ -56,7 +56,7 @@ pub fn generate_and_run_uumain<F>(
     pipe_input: Option<&str>,
 ) -> CommandResult
 where
-    F: FnOnce(std::vec::IntoIter<OsString>) -> i32,
+    F: FnOnce(std::vec::IntoIter<OsString>) -> i32 + Send + 'static,
 {
     // Duplicate the stdout and stderr file descriptors
     let original_stdout_fd = unsafe { dup(STDOUT_FILENO) };
@@ -68,6 +68,7 @@ where
             exit_code: -1,
         };
     }
+
     println!("Running test {:?}", &args[0..]);
     let mut pipe_stdout_fds = [-1; 2];
     let mut pipe_stderr_fds = [-1; 2];
@@ -120,10 +121,20 @@ where
         None
     };
 
-    let uumain_exit_status = uumain_function(args.to_owned().into_iter());
-
-    io::stdout().flush().unwrap();
-    io::stderr().flush().unwrap();
+    let (uumain_exit_status, captured_stdout, captured_stderr) = thread::scope(|s| {
+        let out = s.spawn(|| read_from_fd(pipe_stdout_fds[0]));
+        let err = s.spawn(|| read_from_fd(pipe_stderr_fds[0]));
+        let status = uumain_function(args.to_owned().into_iter());
+        io::stdout().flush().unwrap();
+        io::stderr().flush().unwrap();
+        unsafe {
+            close(pipe_stdout_fds[1]);
+            close(pipe_stderr_fds[1]);
+            close(STDOUT_FILENO);
+            close(STDERR_FILENO);
+        }
+        (status, out.join().unwrap(), err.join().unwrap())
+    });
 
     // Restore the original stdout and stderr
     if unsafe { dup2(original_stdout_fd, STDOUT_FILENO) } == -1
@@ -135,13 +146,6 @@ where
             exit_code: -1,
         };
     }
-    unsafe {
-        close(original_stdout_fd);
-        close(original_stderr_fd);
-
-        close(pipe_stdout_fds[1]);
-        close(pipe_stderr_fds[1]);
-    }
 
     // Restore the original stdin if it was modified
     if let Some(fd) = original_stdin_fd {
@@ -155,18 +159,14 @@ where
         unsafe { close(fd) };
     }
 
-    let captured_stdout = read_from_fd(pipe_stdout_fds[0]).trim().to_string();
-    let captured_stderr = read_from_fd(pipe_stderr_fds[0]).to_string();
-    let captured_stderr = captured_stderr
-        .split_once(':')
-        .map(|x| x.1)
-        .unwrap_or("")
-        .trim()
-        .to_string();
-
     CommandResult {
         stdout: captured_stdout,
-        stderr: captured_stderr,
+        stderr: captured_stderr
+            .split_once(':')
+            .map(|x| x.1)
+            .unwrap_or("")
+            .trim()
+            .to_string(),
         exit_code: uumain_exit_status,
     }
 }

From 08f51558bfa82455837fcbdfadc8c263b561eb77 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 31 Dec 2023 16:29:50 +0100
Subject: [PATCH 318/429] fuzz: enable seq as the stalled issue is fixed

---
 .github/workflows/fuzzing.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/fuzzing.yml b/.github/workflows/fuzzing.yml
index 1945088442a..c29294d4d6c 100644
--- a/.github/workflows/fuzzing.yml
+++ b/.github/workflows/fuzzing.yml
@@ -48,7 +48,7 @@ jobs:
           - { name: fuzz_expr, should_pass: true }
           - { name: fuzz_printf, should_pass: false }
           - { name: fuzz_echo, should_pass: true }
-          # - { name: fuzz_seq, should_pass: false }
+          - { name: fuzz_seq, should_pass: false }
           - { name: fuzz_parse_glob, should_pass: true }
           - { name: fuzz_parse_size, should_pass: true }
           - { name: fuzz_parse_time, should_pass: true }

From 7ddeba4b98615dea328d2d3ab8dd2be8ad02bfe4 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 1 Jan 2024 14:30:27 +0100
Subject: [PATCH 319/429] cp: show no "same file" error for --link a a

---
 src/uu/cp/src/cp.rs      |  2 ++
 tests/by-util/test_cp.rs | 16 ++++++++++++++++
 2 files changed, 18 insertions(+)

diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index 332bb578512..d58eec13d2d 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -150,6 +150,7 @@ pub enum TargetType {
 }
 
 /// Copy action to perform
+#[derive(PartialEq)]
 pub enum CopyMode {
     Link,
     SymLink,
@@ -1714,6 +1715,7 @@ fn copy_file(
             && !options.force()
             && options.backup == BackupMode::NoBackup
             && source != dest
+            || (source == dest && options.copy_mode == CopyMode::Link)
         {
             return Ok(());
         }
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index d166243ed6e..884e71a3c6a 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -566,6 +566,22 @@ fn test_cp_arg_link_with_dest_hardlink_to_source() {
     assert!(at.file_exists(hardlink));
 }
 
+#[test]
+#[cfg(target_os = "linux")]
+fn test_cp_arg_link_with_same_file() {
+    use std::os::linux::fs::MetadataExt;
+
+    let (at, mut ucmd) = at_and_ucmd!();
+    let file = "file";
+
+    at.touch(file);
+
+    ucmd.args(&["--link", file, file]).succeeds();
+
+    assert_eq!(at.metadata(file).st_nlink(), 1);
+    assert!(at.file_exists(file));
+}
+
 #[test]
 fn test_cp_arg_symlink() {
     let (at, mut ucmd) = at_and_ucmd!();

From 62b101a6c5f4deeeb30a4539c96470c0d3004e15 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Mon, 1 Jan 2024 15:56:15 +0100
Subject: [PATCH 320/429] docs: fix URL for FreeBSD port

  - FreeBSD port name is rust-coreutils, fix URL for repology.org

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 docs/src/installation.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/src/installation.md b/docs/src/installation.md
index 238a4db9b61..dc631d240ca 100644
--- a/docs/src/installation.md
+++ b/docs/src/installation.md
@@ -119,7 +119,7 @@ port install coreutils-uutils
 
 ## FreeBSD
 
-[![FreeBSD port](https://repology.org/badge/version-for-repo/freebsd/uutils-coreutils.svg)](https://repology.org/project/uutils-coreutils/versions)
+[![FreeBSD port](https://repology.org/badge/version-for-repo/freebsd/rust-coreutils.svg)](https://repology.org/project/rust-coreutils/versions)
 
 ```sh
 pkg install rust-coreutils

From 01e12120c13807b49316f081ba6ad0e2607f46bc Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 1 Jan 2024 16:48:06 +0100
Subject: [PATCH 321/429] mv: simplify condition

---
 src/uu/mv/src/mv.rs | 20 +++++++-------------
 1 file changed, 7 insertions(+), 13 deletions(-)

diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index 72730778bf1..855afcc1fdf 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -128,13 +128,13 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let mut app = uu_app();
     let matches = app.try_get_matches_from_mut(args)?;
 
-    if !matches.contains_id(OPT_TARGET_DIRECTORY)
-        && matches
-            .get_many::<OsString>(ARG_FILES)
-            .map(|f| f.len())
-            .unwrap_or(0)
-            == 1
-    {
+    let files: Vec<OsString> = matches
+        .get_many::<OsString>(ARG_FILES)
+        .unwrap_or_default()
+        .cloned()
+        .collect();
+
+    if files.len() == 1 && !matches.contains_id(OPT_TARGET_DIRECTORY) {
         app.error(
             ErrorKind::TooFewValues,
             format!(
@@ -144,12 +144,6 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         .exit();
     }
 
-    let files: Vec<OsString> = matches
-        .get_many::<OsString>(ARG_FILES)
-        .unwrap_or_default()
-        .cloned()
-        .collect();
-
     let overwrite_mode = determine_overwrite_mode(&matches);
     let backup_mode = backup_control::determine_backup_mode(&matches)?;
     let update_mode = update_control::determine_update_mode(&matches);

From f53f9b64966645d7d740436a476271d1540dba1a Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 1 Jan 2024 16:57:47 +0100
Subject: [PATCH 322/429] handle the error when stdout is full Avoid panic when
 using seq 1 >/dev/full

Should move tests/csplit/csplit-io-err.sh from ERROR to SKIP
---
 src/uucore/src/lib/lib.rs | 12 +++++++++---
 1 file changed, 9 insertions(+), 3 deletions(-)

diff --git a/src/uucore/src/lib/lib.rs b/src/uucore/src/lib/lib.rs
index dcef26443ea..2fc0ae301b3 100644
--- a/src/uucore/src/lib/lib.rs
+++ b/src/uucore/src/lib/lib.rs
@@ -105,9 +105,15 @@ macro_rules! bin {
     ($util:ident) => {
         pub fn main() {
             use std::io::Write;
-            uucore::panic::mute_sigpipe_panic(); // suppress extraneous error output for SIGPIPE failures/panics
-            let code = $util::uumain(uucore::args_os()); // execute utility code
-            std::io::stdout().flush().expect("could not flush stdout"); // (defensively) flush stdout for utility prior to exit; see <https://github.com/rust-lang/rust/issues/23818>
+            // suppress extraneous error output for SIGPIPE failures/panics
+            uucore::panic::mute_sigpipe_panic();
+            // execute utility code
+            let code = $util::uumain(uucore::args_os());
+            // (defensively) flush stdout for utility prior to exit; see <https://github.com/rust-lang/rust/issues/23818>
+            if let Err(e) = std::io::stdout().flush() {
+                eprintln!("Error flushing stdout: {}", e);
+            }
+
             std::process::exit(code);
         }
     };

From 05d85618e3e6ac1606fc4c0ff0164d5db99049f1 Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Mon, 1 Jan 2024 17:45:20 +0100
Subject: [PATCH 323/429] test: use clearer expression for CI testing

`bool::is_ok_and()` is available in Rust 1.70.0 and above, which is compatible
with the current MSRV.
---
 tests/common/util.rs | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/tests/common/util.rs b/tests/common/util.rs
index 6f4e76d4228..5dac61f7eac 100644
--- a/tests/common/util.rs
+++ b/tests/common/util.rs
@@ -55,9 +55,7 @@ const DEFAULT_ENV: [(&str, &str); 2] = [("LC_ALL", "C"), ("TZ", "UTC")];
 
 /// Test if the program is running under CI
 pub fn is_ci() -> bool {
-    std::env::var("CI")
-        .unwrap_or_else(|_| String::from("false"))
-        .eq_ignore_ascii_case("true")
+    std::env::var("CI").is_ok_and(|s| s.eq_ignore_ascii_case("true"))
 }
 
 /// Read a test scenario fixture, returning its bytes

From d640e690f43daf030c635ef8b8624d2b6792e367 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Tue, 2 Jan 2024 00:13:20 +0100
Subject: [PATCH 324/429] Workaround
 https://github.com/uutils/coreutils/issues/5766 to transform an ERROR into
 FAIL

---
 util/build-gnu.sh | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 8ade25e8874..7e530ba5c82 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -181,6 +181,11 @@ sed -i "s|grep '^#define HAVE_CAP 1' \$CONFIG_HEADER > /dev/null|true|"  tests/l
 # tests/ls/abmon-align.sh - https://github.com/uutils/coreutils/issues/3505
 sed -i 's|touch |/usr/bin/touch |' tests/cp/reflink-perm.sh tests/ls/block-size.sh tests/mv/update.sh tests/ls/ls-time.sh tests/stat/stat-nanoseconds.sh tests/misc/time-style.sh tests/test/test-N.sh tests/ls/abmon-align.sh
 sed -i 's|ln -|/usr/bin/ln -|' tests/cp/link-deref.sh
+
+# Workaround https://github.com/uutils/coreutils/issues/5766
+# to transform an ERROR into FAIL
+sed -i 's|xargs mkdir )|xargs mkdir -p )|' tests/cp/link-heap.sh
+
 sed -i 's|cp |/usr/bin/cp |' tests/mv/hard-2.sh
 sed -i 's|paste |/usr/bin/paste |' tests/od/od-endian.sh
 sed -i 's|timeout |'"${SYSTEM_TIMEOUT}"' |' tests/tail/follow-stdin.sh

From 203600bb9ce9df8b369b9dc6f23318aa62e3cd5b Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Tue, 2 Jan 2024 00:42:52 +0100
Subject: [PATCH 325/429] tail: transform FAIL into ERROR for
 tests/tail/inotify-rotate-resources.sh

---
 util/build-gnu.sh | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 8ade25e8874..33f8b8aaae5 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -216,6 +216,9 @@ sed -i -e "s|rm: cannot remove 'rel': Permission denied|rm: cannot remove 'rel':
 # however there's a bug because `---dis` is an alias for: `---disable-inotify`
 sed -i -e "s|---dis ||g" tests/tail/overlay-headers.sh
 
+# Do not FAIL, just do a regular ERROR
+sed -i -e "s|framework_failure_ 'no inotify_add_watch';|fail=1;|" tests/tail/inotify-rotate-resources.sh
+
 test -f "${UU_BUILD_DIR}/getlimits" || cp src/getlimits "${UU_BUILD_DIR}"
 
 # pr produces very long log and this command isn't super interesting

From 239e5426e6275aeba271884a2047758b62dc10d1 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 2 Jan 2024 16:06:41 +0100
Subject: [PATCH 326/429] du: show error for nul names with --files0-from

---
 src/uu/du/src/du.rs      | 13 +++++++++----
 tests/by-util/test_du.rs | 29 +++++++++++++++++++++++++++++
 2 files changed, 38 insertions(+), 4 deletions(-)

diff --git a/src/uu/du/src/du.rs b/src/uu/du/src/du.rs
index e3f5a718654..3d590e1bf79 100644
--- a/src/uu/du/src/du.rs
+++ b/src/uu/du/src/du.rs
@@ -26,11 +26,11 @@ use std::sync::mpsc;
 use std::thread;
 use std::time::{Duration, UNIX_EPOCH};
 use uucore::display::{print_verbatim, Quotable};
-use uucore::error::{FromIo, UError, UResult, USimpleError};
+use uucore::error::{set_exit_code, FromIo, UError, UResult, USimpleError};
 use uucore::line_ending::LineEnding;
 use uucore::parse_glob;
 use uucore::parse_size::{parse_size_u64, ParseSizeError};
-use uucore::{format_usage, help_about, help_section, help_usage, show, show_warning};
+use uucore::{format_usage, help_about, help_section, help_usage, show, show_error, show_warning};
 #[cfg(windows)]
 use windows_sys::Win32::Foundation::HANDLE;
 #[cfg(windows)]
@@ -621,9 +621,14 @@ fn read_files_from(file_name: &str) -> Result<Vec<PathBuf>, std::io::Error> {
 
     let mut paths = Vec::new();
 
-    for line in reader.split(b'\0') {
+    for (i, line) in reader.split(b'\0').enumerate() {
         let path = line?;
-        if !path.is_empty() {
+
+        if path.is_empty() {
+            let line_number = i + 1;
+            show_error!("{file_name}:{line_number}: invalid zero-length file name");
+            set_exit_code(1);
+        } else {
             paths.push(PathBuf::from(String::from_utf8_lossy(&path).to_string()));
         }
     }
diff --git a/tests/by-util/test_du.rs b/tests/by-util/test_du.rs
index 5c2efdc9865..955759cb889 100644
--- a/tests/by-util/test_du.rs
+++ b/tests/by-util/test_du.rs
@@ -1010,6 +1010,24 @@ fn test_du_files0_from() {
         .stdout_contains("testdir");
 }
 
+#[test]
+fn test_du_files0_from_with_invalid_zero_length_file_names() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+
+    at.touch("testfile");
+
+    at.write("filelist", "\0testfile\0\0");
+
+    ts.ucmd()
+        .arg("--files0-from=filelist")
+        .fails()
+        .code_is(1)
+        .stdout_contains("testfile")
+        .stderr_contains("filelist:1: invalid zero-length file name")
+        .stderr_contains("filelist:3: invalid zero-length file name");
+}
+
 #[test]
 fn test_du_files0_from_stdin() {
     let ts = TestScenario::new(util_name!());
@@ -1028,6 +1046,17 @@ fn test_du_files0_from_stdin() {
         .stdout_contains("testfile2");
 }
 
+#[test]
+fn test_du_files0_from_stdin_with_invalid_zero_length_file_names() {
+    new_ucmd!()
+        .arg("--files0-from=-")
+        .pipe_in("\0\0")
+        .fails()
+        .code_is(1)
+        .stderr_contains("-:1: invalid zero-length file name")
+        .stderr_contains("-:2: invalid zero-length file name");
+}
+
 #[test]
 fn test_du_files0_from_dir() {
     let ts = TestScenario::new(util_name!());

From 4a28b1674ab0b2ac73c0d028a37342517d847e28 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Tue, 2 Jan 2024 20:33:05 +0100
Subject: [PATCH 327/429] remaining-gnu-error.py: shows when a test requires
 root

---
 util/remaining-gnu-error.py | 13 ++++++++++++-
 1 file changed, 12 insertions(+), 1 deletion(-)

diff --git a/util/remaining-gnu-error.py b/util/remaining-gnu-error.py
index 5fd47300ab2..7bd9b141adb 100755
--- a/util/remaining-gnu-error.py
+++ b/util/remaining-gnu-error.py
@@ -33,11 +33,22 @@ def show_list(l):
     tests = list(filter(lambda k: "factor" not in k, l))
 
     for f in reversed(tests):
-        print("%s: %s" % (f, os.stat(f).st_size))
+        if contains_require_root(f):
+            print("%s: %s / require_root" % (f, os.stat(f).st_size))
+        else:
+            print("%s: %s" % (f, os.stat(f).st_size))
     print("")
     print("%s tests remaining" % len(tests))
 
 
+def contains_require_root(file_path):
+    try:
+        with open(file_path, "r") as file:
+            return "require_root_" in file.read()
+    except IOError:
+        return False
+
+
 with open("result.json", "r") as json_file:
     data = json.load(json_file)
 

From 6d3345cfec4496afd75b8e8f9ed46c6ba4375c16 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Mon, 1 Jan 2024 15:11:58 +0100
Subject: [PATCH 328/429] util: use env to call bash in shell scripts

  - For shell scripts using bash, use #!/usr/bin/env bash instead of #!/bin/bash.
    On some OS, bash is not the default shell and is not installed as /bin/bash

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 util/analyze-gnu-results.sh | 2 +-
 util/android-commands.sh    | 2 +-
 util/build-gnu.sh           | 2 +-
 3 files changed, 3 insertions(+), 3 deletions(-)
 mode change 100644 => 100755 util/analyze-gnu-results.sh

diff --git a/util/analyze-gnu-results.sh b/util/analyze-gnu-results.sh
old mode 100644
new mode 100755
index 045e3b93dfb..76ade340f6b
--- a/util/analyze-gnu-results.sh
+++ b/util/analyze-gnu-results.sh
@@ -1,4 +1,4 @@
-#!/bin/bash
+#!/usr/bin/env bash
 # spell-checker:ignore xpass XPASS testsuite
 set -e
 
diff --git a/util/android-commands.sh b/util/android-commands.sh
index 4b504de5649..652e3d992bf 100755
--- a/util/android-commands.sh
+++ b/util/android-commands.sh
@@ -1,4 +1,4 @@
-#!/bin/bash
+#!/usr/bin/env bash
 # spell-checker:ignore termux keyevent sdcard binutils unmatch adb's dumpsys logcat pkill nextest logfile
 
 # There are three shells: the host's, adb, and termux. Only adb lets us run
diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 2d79bd71039..c8bd908b035 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -1,4 +1,4 @@
-#!/bin/bash
+#!/usr/bin/env bash
 # `build-gnu.bash` ~ builds GNU coreutils (from supplied sources)
 #
 

From 7aca1f932ab72ddea6ae2b0ea0288f6ebfcdb578 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Mon, 1 Jan 2024 20:31:47 +0100
Subject: [PATCH 329/429] build-gnu.sh: modify script to be compatible with BSD
 OS

  - Define variables for GNU version of make, nproc, readlink and sed and use them on BSD.
  - In specific cases (option -z not available on BSD and with command /c), use GNU sed instead of
    BSD sed.
  - For xargs, --no-run-if-empty option is a GNU extension. Replace it by -r to be compatible with
    FreeBSD and OpenBSD xargs command.

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 util/build-gnu.sh | 41 ++++++++++++++++++++++++++++++-----------
 1 file changed, 30 insertions(+), 11 deletions(-)

diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index c8bd908b035..5f851a9e231 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -2,12 +2,28 @@
 # `build-gnu.bash` ~ builds GNU coreutils (from supplied sources)
 #
 
-# spell-checker:ignore (paths) abmon deref discrim eacces getlimits getopt ginstall inacc infloop inotify reflink ; (misc) INT_OFLOW OFLOW baddecode submodules ; (vars/env) SRCDIR vdir rcexp xpart dired
+# spell-checker:ignore (paths) abmon deref discrim eacces getlimits getopt ginstall inacc infloop inotify reflink ; (misc) INT_OFLOW OFLOW baddecode submodules ; (vars/env) SRCDIR vdir rcexp xpart dired OSTYPE ; (utils) gnproc greadlink gsed
 
 set -e
 
+# Use GNU version for make, nproc, readlink and sed on *BSD
+case "$OSTYPE" in
+    *bsd*)
+        MAKE="gmake"
+        NPROC="gnproc"
+        READLINK="greadlink"
+        SED="gsed"
+        ;;
+    *)
+        MAKE="make"
+        NPROC="nproc"
+        READLINK="readlink"
+        SED="sed"
+        ;;
+esac
+
 ME="${0}"
-ME_dir="$(dirname -- "$(readlink -fm -- "${ME}")")"
+ME_dir="$(dirname -- "$("${READLINK}" -fm -- "${ME}")")"
 REPO_main_dir="$(dirname -- "${ME_dir}")"
 
 # Default profile is 'debug'
@@ -26,7 +42,7 @@ echo "UU_MAKE_PROFILE='${UU_MAKE_PROFILE}'"
 ### * config (from environment with fallback defaults); note: GNU is expected to be a sibling repo directory
 
 path_UUTILS=${path_UUTILS:-${REPO_main_dir}}
-path_GNU="$(readlink -fm -- "${path_GNU:-${path_UUTILS}/../gnu}")"
+path_GNU="$("${READLINK}" -fm -- "${path_GNU:-${path_UUTILS}/../gnu}")"
 
 ###
 
@@ -78,7 +94,7 @@ if [ "$(uname)" == "Linux" ]; then
     export SELINUX_ENABLED=1
 fi
 
-make PROFILE="${UU_MAKE_PROFILE}"
+"${MAKE}" PROFILE="${UU_MAKE_PROFILE}"
 
 cp "${UU_BUILD_DIR}/install" "${UU_BUILD_DIR}/ginstall" # The GNU tests rename this script before running, to avoid confusion with the make target
 # Create *sum binaries
@@ -115,7 +131,7 @@ else
     sed -i 's| tr | /usr/bin/tr |' tests/init.sh
     # Use a better diff
     sed -i 's|diff -c|diff -u|g' tests/Coreutils.pm
-    make -j "$(nproc)"
+    "${MAKE}" -j "$("${NPROC}")"
     touch gnu-built
 fi
 
@@ -135,7 +151,7 @@ t_max=36
 #         done
 #     )
 #     for i in ${seq}; do
-#         make "tests/factor/t${i}.sh"
+#         "${MAKE}" "tests/factor/t${i}.sh"
 #     done
 #     cat
 #     sed -i -e 's|^seq |/usr/bin/seq |' -e 's|sha1sum |/usr/bin/sha1sum |' tests/factor/t*.sh
@@ -194,8 +210,8 @@ sed -i 's|timeout |'"${SYSTEM_TIMEOUT}"' |' tests/tail/follow-stdin.sh
 sed -i 's|\(^\s*\)seq \$|\1'"${SYSTEM_TIMEOUT}"' 0.1 seq \$|' tests/seq/seq-precision.sh tests/seq/seq-long-double.sh
 
 # Remove dup of /usr/bin/ and /usr/local/bin/ when executed several times
-grep -rlE '/usr/bin/\s?/usr/bin' init.cfg tests/* | xargs --no-run-if-empty sed -Ei 's|/usr/bin/\s?/usr/bin/|/usr/bin/|g'
-grep -rlE '/usr/local/bin/\s?/usr/local/bin' init.cfg tests/* | xargs --no-run-if-empty sed -Ei 's|/usr/local/bin/\s?/usr/local/bin/|/usr/local/bin/|g'
+grep -rlE '/usr/bin/\s?/usr/bin' init.cfg tests/* | xargs -r sed -Ei 's|/usr/bin/\s?/usr/bin/|/usr/bin/|g'
+grep -rlE '/usr/local/bin/\s?/usr/local/bin' init.cfg tests/* | xargs -r sed -Ei 's|/usr/local/bin/\s?/usr/local/bin/|/usr/local/bin/|g'
 
 #### Adjust tests to make them work with Rust/coreutils
 # in some cases, what we are doing in rust/coreutils is good (or better)
@@ -275,7 +291,8 @@ sed -i -e "s/ginstall: creating directory/install: creating directory/g" tests/i
 
 # GNU doesn't support padding < -LONG_MAX
 # disable this test case
-sed -i -Ez "s/\n([^\n#]*pad-3\.2[^\n]*)\n([^\n]*)\n([^\n]*)/\n# uutils\/numfmt supports padding = LONG_MIN\n#\1\n#\2\n#\3/" tests/misc/numfmt.pl
+# Use GNU sed because option -z is not available on BSD sed
+"${SED}" -i -Ez "s/\n([^\n#]*pad-3\.2[^\n]*)\n([^\n]*)\n([^\n]*)/\n# uutils\/numfmt supports padding = LONG_MIN\n#\1\n#\2\n#\3/" tests/misc/numfmt.pl
 
 # Update the GNU error message to match the one generated by clap
 sed -i -e "s/\$prog: multiple field specifications/error: The argument '--field <FIELDS>' was provided more than once, but cannot be used multiple times\n\nUsage: numfmt [OPTION]... [NUMBER]...\n\n\nFor more information try '--help'/g" tests/misc/numfmt.pl
@@ -300,7 +317,8 @@ awk 'BEGIN {count=0} /compare exp out2/ && count < 6 {sub(/compare exp out2/, "g
 sed -i -e "s|44 45|48 49|" tests/ls/stat-failed.sh
 
 # small difference in the error message
-sed -i -e "/ls: invalid argument 'XX' for 'time style'/,/Try 'ls --help' for more information\./c\
+# Use GNU sed for /c command
+"${SED}" -i -e "/ls: invalid argument 'XX' for 'time style'/,/Try 'ls --help' for more information\./c\
 ls: invalid --time-style argument 'XX'\nPossible values are: [\"full-iso\", \"long-iso\", \"iso\", \"locale\", \"+FORMAT (e.g., +%H:%M) for a 'date'-style format\"]\n\nFor more information try --help" tests/ls/time-style-diag.sh
 
 # disable two kind of tests:
@@ -309,7 +327,8 @@ ls: invalid --time-style argument 'XX'\nPossible values are: [\"full-iso\", \"lo
 sed -i -e "s/env \$prog \$BEFORE \$opt > out2/env \$prog \$BEFORE \$opt > out2 #/" -e "s/env \$prog \$BEFORE \$opt AFTER > out3/env \$prog \$BEFORE \$opt AFTER > out3 #/" -e "s/compare exp out2/compare exp out2 #/" -e "s/compare exp out3/compare exp out3 #/" tests/help/help-version-getopt.sh
 
 # Add debug info + we have less syscall then GNU's. Adjust our check.
-sed -i -e '/test \$n_stat1 = \$n_stat2 \\/c\
+# Use GNU sed for /c command
+"${SED}" -i -e '/test \$n_stat1 = \$n_stat2 \\/c\
 echo "n_stat1 = \$n_stat1"\n\
 echo "n_stat2 = \$n_stat2"\n\
 test \$n_stat1 -ge \$n_stat2 \\' tests/ls/stat-free-color.sh

From d450d5a46342b3c50bccb1b61ff655f509db4538 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Mon, 1 Jan 2024 22:21:10 +0100
Subject: [PATCH 330/429] show-utils.sh: modify script to be compatible with
 BSD OS

  - Use /usr/bin/env bash instead of /bin/sh to define OSTYPE
  - Use GNU realpath on BSD OS (FreeBSD and OpenBSD)

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 util/show-utils.sh | 18 ++++++++++++++----
 1 file changed, 14 insertions(+), 4 deletions(-)

diff --git a/util/show-utils.sh b/util/show-utils.sh
index dda01abe2d2..f53a92cc817 100755
--- a/util/show-utils.sh
+++ b/util/show-utils.sh
@@ -1,13 +1,23 @@
-#!/bin/sh
+#!/usr/bin/env bash
 
-# spell-checker:ignore (utils) cksum coreutils dircolors hashsum mkdir mktemp printenv printf readlink realpath  rmdir shuf tsort unexpand
+# spell-checker:ignore (shell) OSTYPE
+# spell-checker:ignore (utils) cksum coreutils dircolors hashsum mkdir mktemp printenv printf readlink realpath grealpath rmdir shuf tsort unexpand
 # spell-checker:ignore (jq) deps startswith
 
+# Use GNU version for realpath on *BSD
+case "$OSTYPE" in
+    *bsd*)
+        REALPATH="grealpath"
+        ;;
+    *)
+        REALPATH="realpath"
+        ;;
+esac
+
 ME="${0}"
 ME_dir="$(dirname -- "${ME}")"
 ME_parent_dir="$(dirname -- "${ME_dir}")"
-# NOTE: On FreeBSD, `-mP` arguments are not available.
-ME_parent_dir_abs="$(realpath -mP -- "${ME_parent_dir}" || realpath -- "${ME_parent_dir}")"
+ME_parent_dir_abs="$("${REALPATH}" -mP -- "${ME_parent_dir}" || "${REALPATH}" -- "${ME_parent_dir}")"
 
 # refs: <https://forge.rust-lang.org/release/platform-support.html> , <https://docs.rs/platforms/0.2.1/platforms/platform/tier1/index.html>
 

From aef204461c93ae3de8a33d278d0e508643d9e1da Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Mon, 1 Jan 2024 23:44:10 +0100
Subject: [PATCH 331/429] util: modify scripts for code coverage to be
 compatible with BSD OS

  - Use /usr/bin/env bash instead of /bin/sh to use OSTYPE
  - Use readlink from GNU coreutils on BSD OS in util/build-code_coverage.sh and
    util/show-code_coverage.sh scripts

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 util/build-code_coverage.sh | 18 ++++++++++++++----
 util/show-code_coverage.sh  | 16 +++++++++++++---
 2 files changed, 27 insertions(+), 7 deletions(-)

diff --git a/util/build-code_coverage.sh b/util/build-code_coverage.sh
index 4082bc13dcf..bbe4abaab3f 100755
--- a/util/build-code_coverage.sh
+++ b/util/build-code_coverage.sh
@@ -1,15 +1,25 @@
-#!/bin/sh
+#!/usr/bin/env bash
 
 # spell-checker:ignore (abbrevs/acronyms) HTML gcno llvm
 # spell-checker:ignore (jargon) toolchain
 # spell-checker:ignore (rust) Ccodegen Cinline Coverflow Cpanic RUSTC RUSTDOCFLAGS RUSTFLAGS RUSTUP Zpanic
-# spell-checker:ignore (shell) OSID esac
-# spell-checker:ignore (utils) genhtml grcov lcov readlink sccache shellcheck uutils
+# spell-checker:ignore (shell) OSID OSTYPE esac
+# spell-checker:ignore (utils) genhtml grcov lcov greadlink readlink sccache shellcheck uutils
 
 FEATURES_OPTION="--features feat_os_unix"
 
+# Use GNU coreutils for readlink on *BSD
+case "$OSTYPE" in
+    *bsd*)
+        READLINK="greadlink"
+        ;;
+    *)
+        READLINK="readlink"
+        ;;
+esac
+
 ME="${0}"
-ME_dir="$(dirname -- "$(readlink -fm -- "${ME}")")"
+ME_dir="$(dirname -- "$("${READLINK}" -fm -- "${ME}")")"
 REPO_main_dir="$(dirname -- "${ME_dir}")"
 
 cd "${REPO_main_dir}" &&
diff --git a/util/show-code_coverage.sh b/util/show-code_coverage.sh
index 3f51462c904..8c6f5e20a67 100755
--- a/util/show-code_coverage.sh
+++ b/util/show-code_coverage.sh
@@ -1,9 +1,19 @@
-#!/bin/sh
+#!/usr/bin/env bash
 
-# spell-checker:ignore (vars) OSID binfmt
+# spell-checker:ignore (vars) OSID OSTYPE binfmt greadlink
+
+# Use GNU coreutils for readlink on *BSD
+case "$OSTYPE" in
+    *bsd*)
+        READLINK="greadlink"
+        ;;
+    *)
+        READLINK="readlink"
+        ;;
+esac
 
 ME="${0}"
-ME_dir="$(dirname -- "$(readlink -fm -- "${ME}")")"
+ME_dir="$(dirname -- "$("${READLINK}" -fm -- "${ME}")")"
 REPO_main_dir="$(dirname -- "${ME_dir}")"
 
 export COVERAGE_REPORT_DIR="${REPO_main_dir}/target/debug/coverage-nix"

From 13665da85ed1cbe06a76ae2673d8eac3f5891af8 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Tue, 2 Jan 2024 19:11:34 +0100
Subject: [PATCH 332/429] run-gnu-test.sh: modify script to be compatible with
 BSD OS

  - Use /usr/bin/env bash instead of /bin/sh to use OSTYPE
  - Define variables for GNU version of make, nproc, readlink and use them on BSD.

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 util/run-gnu-test.sh | 30 ++++++++++++++++++++++--------
 1 file changed, 22 insertions(+), 8 deletions(-)

diff --git a/util/run-gnu-test.sh b/util/run-gnu-test.sh
index 1abb476b72b..4148c3f96db 100755
--- a/util/run-gnu-test.sh
+++ b/util/run-gnu-test.sh
@@ -1,13 +1,27 @@
-#!/bin/sh
+#!/usr/bin/env bash
 # `run-gnu-test.bash [TEST]`
 # run GNU test (or all tests if TEST is missing/null)
 
-# spell-checker:ignore (env/vars) GNULIB SRCDIR SUBDIRS ; (utils) shellcheck
+# spell-checker:ignore (env/vars) GNULIB SRCDIR SUBDIRS OSTYPE ; (utils) shellcheck gnproc greadlink
 
 # ref: [How the GNU coreutils are tested](https://www.pixelbeat.org/docs/coreutils-testing.html) @@ <https://archive.is/p2ITW>
 # * note: to run a single test => `make check TESTS=PATH/TO/TEST/SCRIPT SUBDIRS=. VERBOSE=yes`
 
-ME_dir="$(dirname -- "$(readlink -fm -- "$0")")"
+# Use GNU version for make, nproc, readlink on *BSD
+case "$OSTYPE" in
+    *bsd*)
+        MAKE="gmake"
+        NPROC="gnproc"
+        READLINK="greadlink"
+        ;;
+    *)
+        MAKE="make"
+        NPROC="nproc"
+        READLINK="readlink"
+        ;;
+esac
+
+ME_dir="$(dirname -- "$("${READLINK}" -fm -- "$0")")"
 REPO_main_dir="$(dirname -- "${ME_dir}")"
 
 echo "ME_dir='${ME_dir}'"
@@ -18,7 +32,7 @@ set -e
 ### * config (from environment with fallback defaults); note: GNU and GNULIB are expected to be sibling repo directories
 
 path_UUTILS=${path_UUTILS:-${REPO_main_dir}}
-path_GNU="$(readlink -fm -- "${path_GNU:-${path_UUTILS}/../gnu}")"
+path_GNU="$("${READLINK}" -fm -- "${path_GNU:-${path_UUTILS}/../gnu}")"
 
 echo "path_UUTILS='${path_UUTILS}'"
 echo "path_GNU='${path_GNU}'"
@@ -47,7 +61,7 @@ if test "$1" != "run-root"; then
             fi
         done
         # trim it
-        SPECIFIC_TESTS=$(echo $SPECIFIC_TESTS | xargs)
+        SPECIFIC_TESTS=$(echo "$SPECIFIC_TESTS" | xargs)
         echo "Running specific tests: $SPECIFIC_TESTS"
     fi
 fi
@@ -60,16 +74,16 @@ fi
 if test "$1" != "run-root"; then
     # run the regular tests
     if test $# -ge 1; then
-        timeout -sKILL 4h make -j "$(nproc)" check TESTS="$SPECIFIC_TESTS" SUBDIRS=. RUN_EXPENSIVE_TESTS=yes RUN_VERY_EXPENSIVE_TESTS=yes VERBOSE=no gl_public_submodule_commit="" srcdir="${path_GNU}" || : # Kill after 4 hours in case something gets stuck in make
+        timeout -sKILL 4h "${MAKE}" -j "$("${NPROC}")" check TESTS="$SPECIFIC_TESTS" SUBDIRS=. RUN_EXPENSIVE_TESTS=yes RUN_VERY_EXPENSIVE_TESTS=yes VERBOSE=no gl_public_submodule_commit="" srcdir="${path_GNU}" || : # Kill after 4 hours in case something gets stuck in make
     else
-        timeout -sKILL 4h make -j "$(nproc)" check SUBDIRS=. RUN_EXPENSIVE_TESTS=yes RUN_VERY_EXPENSIVE_TESTS=yes VERBOSE=no gl_public_submodule_commit="" srcdir="${path_GNU}" || : # Kill after 4 hours in case something gets stuck in make
+        timeout -sKILL 4h "${MAKE}" -j "$("${NPROC}")" check SUBDIRS=. RUN_EXPENSIVE_TESTS=yes RUN_VERY_EXPENSIVE_TESTS=yes VERBOSE=no gl_public_submodule_commit="" srcdir="${path_GNU}" || : # Kill after 4 hours in case something gets stuck in make
     fi
 else
     # in case we would like to run tests requiring root
     if test -z "$1" -o "$1" == "run-root"; then
         if test -n "$CI"; then
             echo "Running check-root to run only root tests"
-            sudo make -j "$(nproc)" check-root SUBDIRS=. RUN_EXPENSIVE_TESTS=yes RUN_VERY_EXPENSIVE_TESTS=yes VERBOSE=no gl_public_submodule_commit="" srcdir="${path_GNU}" TEST_SUITE_LOG="tests/test-suite-root.log" || :
+            sudo "${MAKE}" -j "$("${NPROC}")" check-root SUBDIRS=. RUN_EXPENSIVE_TESTS=yes RUN_VERY_EXPENSIVE_TESTS=yes VERBOSE=no gl_public_submodule_commit="" srcdir="${path_GNU}" TEST_SUITE_LOG="tests/test-suite-root.log" || :
         fi
     fi
 fi

From 0bc70e3ba1535206ac1194d7a683f34c7ffd23bd Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Tue, 2 Jan 2024 19:28:28 +0100
Subject: [PATCH 333/429] CI: install GNU coreutils package for FreeBSD
 workflow

  - util/show-utils.sh script is used by FreeBSD workflow => use realpath
    command from GNU coreutils instead of FreeBSD realpath.
  - install GNU coreutils (FreeBSD package coreutils) in style job

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 .github/workflows/freebsd.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/freebsd.yml b/.github/workflows/freebsd.yml
index c4d441a5572..25655f0917f 100644
--- a/.github/workflows/freebsd.yml
+++ b/.github/workflows/freebsd.yml
@@ -44,8 +44,8 @@ jobs:
         usesh: true
         sync: rsync
         copyback: false
-        # We need jq to run show-utils.sh and bash to use inline shell string replacement
-        prepare: pkg install -y curl sudo jq bash
+        # We need jq and GNU coreutils to run show-utils.sh and bash to use inline shell string replacement
+        prepare: pkg install -y curl sudo jq coreutils bash
         run: |
           ## Prepare, build, and test
           # implementation modelled after ref: <https://github.com/rust-lang/rustup/pull/2783>

From be587980780cbed0a7ece95a61ed8f52d7a159e4 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Tue, 2 Jan 2024 20:31:41 +0100
Subject: [PATCH 334/429] DEVELOPMENT.md: on FreeBSD, install GNU coreutils
 package to build/run tests

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 DEVELOPMENT.md | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/DEVELOPMENT.md b/DEVELOPMENT.md
index 29cfe2b2a3c..6f1de3b5476 100644
--- a/DEVELOPMENT.md
+++ b/DEVELOPMENT.md
@@ -1,4 +1,4 @@
-<!-- spell-checker:ignore (flags) Ccodegen Coverflow Cpanic Zinstrument Zpanic reimplementing toybox RUNTEST CARGOFLAGS nextest prereq autopoint gettext texinfo automake findutils shellenv libexec gnubin toolchains -->
+<!-- spell-checker:ignore (flags) Ccodegen Coverflow Cpanic Zinstrument Zpanic reimplementing toybox RUNTEST CARGOFLAGS nextest prereq autopoint gettext texinfo automake findutils shellenv libexec gnubin toolchains gsed -->
 
 # Setting up your local development environment
 
@@ -241,6 +241,12 @@ DEBUG=1 bash util/run-gnu-test.sh tests/misc/sm3sum.pl
 
 Note that GNU test suite relies on individual utilities (not the multicall binary).
 
+On FreeBSD, you need to install packages for GNU coreutils and sed (used in shell scripts instead of system commands):
+
+```shell
+pkg install coreutils gsed
+```
+
 ## Code coverage report
 
 Code coverage report can be generated using [grcov](https://github.com/mozilla/grcov).

From e4fbc317141caaf4e4361bb0985f1878d794869d Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Wed, 3 Jan 2024 09:39:16 +0100
Subject: [PATCH 335/429] du: ignore duplicate names with --files0-from

---
 src/uu/du/src/du.rs      |  5 ++++-
 tests/by-util/test_du.rs | 32 ++++++++++++++++++++++++++++++++
 2 files changed, 36 insertions(+), 1 deletion(-)

diff --git a/src/uu/du/src/du.rs b/src/uu/du/src/du.rs
index 3d590e1bf79..62fcfceda01 100644
--- a/src/uu/du/src/du.rs
+++ b/src/uu/du/src/du.rs
@@ -629,7 +629,10 @@ fn read_files_from(file_name: &str) -> Result<Vec<PathBuf>, std::io::Error> {
             show_error!("{file_name}:{line_number}: invalid zero-length file name");
             set_exit_code(1);
         } else {
-            paths.push(PathBuf::from(String::from_utf8_lossy(&path).to_string()));
+            let p = PathBuf::from(String::from_utf8_lossy(&path).to_string());
+            if !paths.contains(&p) {
+                paths.push(p);
+            }
         }
     }
 
diff --git a/tests/by-util/test_du.rs b/tests/by-util/test_du.rs
index 955759cb889..9e4622c31a8 100644
--- a/tests/by-util/test_du.rs
+++ b/tests/by-util/test_du.rs
@@ -1010,6 +1010,21 @@ fn test_du_files0_from() {
         .stdout_contains("testdir");
 }
 
+#[test]
+fn test_du_files0_from_ignore_duplicate_file_names() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+    let file = "testfile";
+
+    at.touch(file);
+    at.write("filelist", &format!("{file}\0{file}\0"));
+
+    ts.ucmd()
+        .arg("--files0-from=filelist")
+        .succeeds()
+        .stdout_is(format!("0\t{file}\n"));
+}
+
 #[test]
 fn test_du_files0_from_with_invalid_zero_length_file_names() {
     let ts = TestScenario::new(util_name!());
@@ -1046,6 +1061,23 @@ fn test_du_files0_from_stdin() {
         .stdout_contains("testfile2");
 }
 
+#[test]
+fn test_du_files0_from_stdin_ignore_duplicate_file_names() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+    let file = "testfile";
+
+    at.touch(file);
+
+    let input = format!("{file}\0{file}");
+
+    ts.ucmd()
+        .arg("--files0-from=-")
+        .pipe_in(input)
+        .succeeds()
+        .stdout_is(format!("0\t{file}\n"));
+}
+
 #[test]
 fn test_du_files0_from_stdin_with_invalid_zero_length_file_names() {
     new_ucmd!()

From c9f796b69488a589f7e941cc54050af0cc9b19ed Mon Sep 17 00:00:00 2001
From: Tom <1955774+tdelmas@users.noreply.github.com>
Date: Wed, 3 Jan 2024 11:24:01 +0100
Subject: [PATCH 336/429] META bug: moved to project mgmt

https://github.com/uutils/coreutils/issues/3336#issuecomment-1206292911
---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index 4f341638b3f..c8ca0d8a316 100644
--- a/README.md
+++ b/README.md
@@ -305,7 +305,7 @@ Below is the evolution of how many GNU tests uutils passes. A more detailed
 breakdown of the GNU test results of the main branch can be found
 [in the user manual](https://uutils.github.io/coreutils/book/test_coverage.html).
 
-See <https://github.com/uutils/coreutils/issues/3336> for the main meta bugs
+See <https://github.com/orgs/uutils/projects/1> for the main meta bugs
 (many are missing).
 
 ![Evolution over time](https://github.com/uutils/coreutils-tracking/blob/main/gnu-results.png?raw=true)

From e30f191579c4fe1b5c64614cf9712feb9888dc66 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Dorian=20P=C3=A9ron?= <dorianperon.i@gmail.com>
Date: Wed, 3 Jan 2024 18:37:51 +0100
Subject: [PATCH 337/429] ls: Handle the use of QUOTING_STYLE variable

---
 src/uu/ls/src/ls.rs | 111 +++++++++++++++++++++++++++++---------------
 1 file changed, 73 insertions(+), 38 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 952083d2ab1..d56929be802 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -621,7 +621,52 @@ fn extract_hyperlink(options: &clap::ArgMatches) -> bool {
     }
 }
 
+/// Match the argument given to --quoting-style or the QUOTING_STYLE env variable.
+///
+/// # Arguments
+///
+/// * `style`: the actual argument string
+/// * `show_control` - A boolean value representing whether or not to show control characters.
+///
+/// # Returns
+///
+/// * An option with None if the style string is invalid, or a `QuotingStyle` wrapped in `Some`.
+fn match_quoting_style_name(style: &str, show_control: bool) -> Option<QuotingStyle> {
+    match style {
+        "literal" => Some(QuotingStyle::Literal { show_control }),
+        "shell" => Some(QuotingStyle::Shell {
+            escape: false,
+            always_quote: false,
+            show_control,
+        }),
+        "shell-always" => Some(QuotingStyle::Shell {
+            escape: false,
+            always_quote: true,
+            show_control,
+        }),
+        "shell-escape" => Some(QuotingStyle::Shell {
+            escape: true,
+            always_quote: false,
+            show_control,
+        }),
+        "shell-escape-always" => Some(QuotingStyle::Shell {
+            escape: true,
+            always_quote: true,
+            show_control,
+        }),
+        "c" => Some(QuotingStyle::C {
+            quotes: quoting_style::Quotes::Double,
+        }),
+        "escape" => Some(QuotingStyle::C {
+            quotes: quoting_style::Quotes::None,
+        }),
+        _ => None,
+    }
+}
+
 /// Extracts the quoting style to use based on the options provided.
+/// If no options are given, it looks if a default quoting style is provided
+/// through the QUOTING_STYLE environment variable.
 ///
 /// # Arguments
 ///
@@ -632,38 +677,12 @@ fn extract_hyperlink(options: &clap::ArgMatches) -> bool {
 ///
 /// A QuotingStyle variant representing the quoting style to use.
 fn extract_quoting_style(options: &clap::ArgMatches, show_control: bool) -> QuotingStyle {
-    let opt_quoting_style = options.get_one::<String>(options::QUOTING_STYLE).cloned();
+    let opt_quoting_style = options.get_one::<String>(options::QUOTING_STYLE);
 
     if let Some(style) = opt_quoting_style {
-        match style.as_str() {
-            "literal" => QuotingStyle::Literal { show_control },
-            "shell" => QuotingStyle::Shell {
-                escape: false,
-                always_quote: false,
-                show_control,
-            },
-            "shell-always" => QuotingStyle::Shell {
-                escape: false,
-                always_quote: true,
-                show_control,
-            },
-            "shell-escape" => QuotingStyle::Shell {
-                escape: true,
-                always_quote: false,
-                show_control,
-            },
-            "shell-escape-always" => QuotingStyle::Shell {
-                escape: true,
-                always_quote: true,
-                show_control,
-            },
-            "c" => QuotingStyle::C {
-                quotes: quoting_style::Quotes::Double,
-            },
-            "escape" => QuotingStyle::C {
-                quotes: quoting_style::Quotes::None,
-            },
-            _ => unreachable!("Should have been caught by Clap"),
+        match match_quoting_style_name(style, show_control) {
+            Some(qs) => qs,
+            None => unreachable!("Should have been caught by Clap"),
         }
     } else if options.get_flag(options::quoting::LITERAL) {
         QuotingStyle::Literal { show_control }
@@ -675,16 +694,32 @@ fn extract_quoting_style(options: &clap::ArgMatches, show_control: bool) -> Quot
         QuotingStyle::C {
             quotes: quoting_style::Quotes::Double,
         }
-    } else if options.get_flag(options::DIRED) || !std::io::stdout().is_terminal() {
-        // By default, `ls` uses Literal quoting when
-        // writing to a non-terminal file descriptor
+    } else if options.get_flag(options::DIRED) {
         QuotingStyle::Literal { show_control }
     } else {
-        // TODO: use environment variable if available
-        QuotingStyle::Shell {
-            escape: true,
-            always_quote: false,
-            show_control,
+        // If set, the QUOTING_STYLE environment variable specifies a default style.
+        if let Ok(style) = std::env::var("QUOTING_STYLE") {
+            match match_quoting_style_name(style.as_str(), show_control) {
+                Some(qs) => return qs,
+                None => eprintln!(
+                    "{}: Ignoring invalid value of environment variable QUOTING_STYLE: '{}'",
+                    std::env::args().next().unwrap_or("ls".to_string()),
+                    style
+                ),
+            }
+        }
+
+        // By default, `ls` uses Literal quoting when
+        // writing to a non-terminal file descriptor
+        if !std::io::stdout().is_terminal() {
+            QuotingStyle::Literal { show_control }
+        } else {
+            // TODO: use environment variable if available
+            QuotingStyle::Shell {
+                escape: true,
+                always_quote: false,
+                show_control,
+            }
         }
     }
 }

From 217aa3bd9d573043d3c8b6a5969618364f7f5ff4 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 3 Jan 2024 20:41:44 +0100
Subject: [PATCH 338/429] gnu compare: try to use a local copy if the download
 failed

---
 util/remaining-gnu-error.py | 19 +++++++++++++++----
 1 file changed, 15 insertions(+), 4 deletions(-)

diff --git a/util/remaining-gnu-error.py b/util/remaining-gnu-error.py
index 7bd9b141adb..20b3faee7fa 100755
--- a/util/remaining-gnu-error.py
+++ b/util/remaining-gnu-error.py
@@ -11,10 +11,21 @@
 import sys
 
 base = "../gnu/tests/"
-urllib.request.urlretrieve(
-    "https://raw.githubusercontent.com/uutils/coreutils-tracking/main/gnu-full-result.json",
-    "result.json",
-)
+
+# Try to download the file, use local copy if download fails
+result_json = "result.json"
+try:
+    urllib.request.urlretrieve(
+        "https://raw.githubusercontent.com/uutils/coreutils-tracking/main/gnu-full-result.json",
+        result_json
+    )
+except Exception as e:
+    print(f"Failed to download the file: {e}")
+    if not os.path.exists(result_json):
+        print(f"Local file '{result_json}' not found. Exiting.")
+        sys.exit(1)
+    else:
+        print(f"Using local file '{result_json}'.")
 
 types = ("/*/*.sh", "/*/*.pl", "/*/*.xpl")
 

From d07a2f0d86c963ba8d42e8171b3e92ffec055b97 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 4 Jan 2024 13:40:47 +0100
Subject: [PATCH 339/429] Add new fuzzers: cut, sort, split and wc  (#5760)

* fuzz: use thread to bypass the limitation of output

Closes: #5724

many thanks to @samueltardieu

* fuzz: enable seq as the stalled issue is fixed

* fuzz: add 4 more fuzzers

* fuzz: enable the 4 new fuzzers in the CI

* remove old import

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

* remove comment

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

* remove comment

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

* add more flags

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

* add space

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

* add a comment about sort local

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

* wrong copy/paste

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

* fuzz: import "std::env"

---------

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 .github/workflows/fuzzing.yml   |   4 ++
 fuzz/Cargo.toml                 |  28 +++++++++
 fuzz/fuzz_targets/fuzz_cut.rs   |  87 ++++++++++++++++++++++++++
 fuzz/fuzz_targets/fuzz_sort.rs  |  86 ++++++++++++++++++++++++++
 fuzz/fuzz_targets/fuzz_split.rs | 105 ++++++++++++++++++++++++++++++++
 fuzz/fuzz_targets/fuzz_wc.rs    |  99 ++++++++++++++++++++++++++++++
 6 files changed, 409 insertions(+)
 create mode 100644 fuzz/fuzz_targets/fuzz_cut.rs
 create mode 100644 fuzz/fuzz_targets/fuzz_sort.rs
 create mode 100644 fuzz/fuzz_targets/fuzz_split.rs
 create mode 100644 fuzz/fuzz_targets/fuzz_wc.rs

diff --git a/.github/workflows/fuzzing.yml b/.github/workflows/fuzzing.yml
index c29294d4d6c..b96f7e4ef22 100644
--- a/.github/workflows/fuzzing.yml
+++ b/.github/workflows/fuzzing.yml
@@ -49,6 +49,10 @@ jobs:
           - { name: fuzz_printf, should_pass: false }
           - { name: fuzz_echo, should_pass: true }
           - { name: fuzz_seq, should_pass: false }
+          - { name: fuzz_sort, should_pass: false }
+          - { name: fuzz_wc, should_pass: false }
+          - { name: fuzz_cut, should_pass: false }
+          - { name: fuzz_split, should_pass: false }
           - { name: fuzz_parse_glob, should_pass: true }
           - { name: fuzz_parse_size, should_pass: true }
           - { name: fuzz_parse_time, should_pass: true }
diff --git a/fuzz/Cargo.toml b/fuzz/Cargo.toml
index 3d5862c6970..076e274ec8a 100644
--- a/fuzz/Cargo.toml
+++ b/fuzz/Cargo.toml
@@ -20,6 +20,10 @@ uu_expr = { path = "../src/uu/expr/" }
 uu_printf = { path = "../src/uu/printf/" }
 uu_echo = { path = "../src/uu/echo/" }
 uu_seq = { path = "../src/uu/seq/" }
+uu_sort = { path = "../src/uu/sort/" }
+uu_wc = { path = "../src/uu/wc/" }
+uu_cut = { path = "../src/uu/cut/" }
+uu_split = { path = "../src/uu/split/" }
 
 # Prevent this from interfering with workspaces
 [workspace]
@@ -49,6 +53,30 @@ path = "fuzz_targets/fuzz_seq.rs"
 test = false
 doc = false
 
+[[bin]]
+name = "fuzz_sort"
+path = "fuzz_targets/fuzz_sort.rs"
+test = false
+doc = false
+
+[[bin]]
+name = "fuzz_split"
+path = "fuzz_targets/fuzz_split.rs"
+test = false
+doc = false
+
+[[bin]]
+name = "fuzz_cut"
+path = "fuzz_targets/fuzz_cut.rs"
+test = false
+doc = false
+
+[[bin]]
+name = "fuzz_wc"
+path = "fuzz_targets/fuzz_wc.rs"
+test = false
+doc = false
+
 [[bin]]
 name = "fuzz_expr"
 path = "fuzz_targets/fuzz_expr.rs"
diff --git a/fuzz/fuzz_targets/fuzz_cut.rs b/fuzz/fuzz_targets/fuzz_cut.rs
new file mode 100644
index 00000000000..fa5f8fcc472
--- /dev/null
+++ b/fuzz/fuzz_targets/fuzz_cut.rs
@@ -0,0 +1,87 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+// spell-checker:ignore parens
+
+#![no_main]
+use libfuzzer_sys::fuzz_target;
+use uu_cut::uumain;
+
+use rand::Rng;
+use std::ffi::OsString;
+
+mod fuzz_common;
+use crate::fuzz_common::{
+    compare_result, generate_and_run_uumain, generate_random_string, run_gnu_cmd, CommandResult,
+};
+static CMD_PATH: &str = "cut";
+
+fn generate_cut_args() -> String {
+    let mut rng = rand::thread_rng();
+    let arg_count = rng.gen_range(1..=6);
+    let mut args = Vec::new();
+
+    for _ in 0..arg_count {
+        if rng.gen_bool(0.1) {
+            args.push(generate_random_string(rng.gen_range(1..=20)));
+        } else {
+            match rng.gen_range(0..=4) {
+                0 => args.push(String::from("-b") + &rng.gen_range(1..=10).to_string()),
+                1 => args.push(String::from("-c") + &rng.gen_range(1..=10).to_string()),
+                2 => args.push(String::from("-d,") + &generate_random_string(1)), // Using a comma as a default delimiter
+                3 => args.push(String::from("-f") + &rng.gen_range(1..=5).to_string()),
+                _ => (),
+            }
+        }
+    }
+
+    args.join(" ")
+}
+
+fn generate_delimited_data(count: usize) -> String {
+    let mut rng = rand::thread_rng();
+    let mut lines = Vec::new();
+
+    for _ in 0..count {
+        let fields = (0..rng.gen_range(1..=5))
+            .map(|_| generate_random_string(rng.gen_range(1..=10)))
+            .collect::<Vec<_>>()
+            .join(",");
+        lines.push(fields);
+    }
+
+    lines.join("\n")
+}
+
+fuzz_target!(|_data: &[u8]| {
+    let cut_args = generate_cut_args();
+    let mut args = vec![OsString::from("cut")];
+    args.extend(cut_args.split_whitespace().map(OsString::from));
+
+    let input_lines = generate_delimited_data(10);
+
+    let rust_result = generate_and_run_uumain(&args, uumain, Some(&input_lines));
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false, Some(&input_lines)) {
+        Ok(result) => result,
+        Err(error_result) => {
+            eprintln!("Failed to run GNU command:");
+            eprintln!("Stderr: {}", error_result.stderr);
+            eprintln!("Exit Code: {}", error_result.exit_code);
+            CommandResult {
+                stdout: String::new(),
+                stderr: error_result.stderr,
+                exit_code: error_result.exit_code,
+            }
+        }
+    };
+
+    compare_result(
+        "cut",
+        &format!("{:?}", &args[1..]),
+        Some(&input_lines),
+        &rust_result,
+        &gnu_result,
+        false, // Set to true if you want to fail on stderr diff
+    );
+});
diff --git a/fuzz/fuzz_targets/fuzz_sort.rs b/fuzz/fuzz_targets/fuzz_sort.rs
new file mode 100644
index 00000000000..3520bbaefed
--- /dev/null
+++ b/fuzz/fuzz_targets/fuzz_sort.rs
@@ -0,0 +1,86 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+// spell-checker:ignore parens
+
+#![no_main]
+use libfuzzer_sys::fuzz_target;
+use uu_sort::uumain;
+
+use rand::Rng;
+use std::env;
+use std::ffi::OsString;
+
+mod fuzz_common;
+use crate::fuzz_common::CommandResult;
+use crate::fuzz_common::{
+    compare_result, generate_and_run_uumain, generate_random_string, run_gnu_cmd,
+};
+static CMD_PATH: &str = "sort";
+
+fn generate_sort_args() -> String {
+    let mut rng = rand::thread_rng();
+
+    let arg_count = rng.gen_range(1..=5);
+    let mut args = Vec::new();
+
+    for _ in 0..arg_count {
+        match rng.gen_range(0..=4) {
+            0 => args.push(String::from("-r")), // Reverse the result of comparisons
+            1 => args.push(String::from("-n")), // Compare according to string numerical value
+            2 => args.push(String::from("-f")), // Fold lower case to upper case characters
+            3 => args.push(generate_random_string(rng.gen_range(1..=10))), // Random string (to simulate file names)
+            _ => args.push(String::from("-k") + &rng.gen_range(1..=5).to_string()), // Sort via a specified field
+        }
+    }
+
+    args.join(" ")
+}
+
+fn generate_random_lines(count: usize) -> String {
+    let mut rng = rand::thread_rng();
+    let mut lines = Vec::new();
+
+    for _ in 0..count {
+        lines.push(generate_random_string(rng.gen_range(1..=20)));
+    }
+
+    lines.join("\n")
+}
+
+fuzz_target!(|_data: &[u8]| {
+    let sort_args = generate_sort_args();
+    let mut args = vec![OsString::from("sort")];
+    args.extend(sort_args.split_whitespace().map(OsString::from));
+
+    // Generate random lines to sort
+    let input_lines = generate_random_lines(10);
+
+    let rust_result = generate_and_run_uumain(&args, uumain, Some(&input_lines));
+
+    // TODO remove once uutils sort supports localization
+    env::set_var("LC_COLLATE", "C");
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false, Some(&input_lines)) {
+        Ok(result) => result,
+        Err(error_result) => {
+            eprintln!("Failed to run GNU command:");
+            eprintln!("Stderr: {}", error_result.stderr);
+            eprintln!("Exit Code: {}", error_result.exit_code);
+            CommandResult {
+                stdout: String::new(),
+                stderr: error_result.stderr,
+                exit_code: error_result.exit_code,
+            }
+        }
+    };
+
+    compare_result(
+        "sort",
+        &format!("{:?}", &args[1..]),
+        None,
+        &rust_result,
+        &gnu_result,
+        false, // Set to true if you want to fail on stderr diff
+    );
+});
diff --git a/fuzz/fuzz_targets/fuzz_split.rs b/fuzz/fuzz_targets/fuzz_split.rs
new file mode 100644
index 00000000000..876c8dd21d4
--- /dev/null
+++ b/fuzz/fuzz_targets/fuzz_split.rs
@@ -0,0 +1,105 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+// spell-checker:ignore parens
+
+#![no_main]
+use libfuzzer_sys::fuzz_target;
+use uu_split::uumain;
+
+use rand::Rng;
+use std::ffi::OsString;
+
+mod fuzz_common;
+use crate::fuzz_common::{
+    compare_result, generate_and_run_uumain, generate_random_string, run_gnu_cmd, CommandResult,
+};
+static CMD_PATH: &str = "split";
+
+fn generate_split_args() -> String {
+    let mut rng = rand::thread_rng();
+    let mut args = Vec::new();
+
+    match rng.gen_range(0..=9) {
+        0 => {
+            args.push(String::from("-a")); // Suffix length
+            args.push(rng.gen_range(1..=8).to_string());
+        }
+        1 => {
+            args.push(String::from("--additional-suffix"));
+            args.push(generate_random_string(5)); // Random suffix
+        }
+        2 => {
+            args.push(String::from("-b")); // Bytes per output file
+            args.push(rng.gen_range(1..=1024).to_string() + "K");
+        }
+        3 => {
+            args.push(String::from("-C")); // Line bytes
+            args.push(rng.gen_range(1..=1024).to_string());
+        }
+        4 => args.push(String::from("-d")), // Use numeric suffixes
+        5 => args.push(String::from("-x")), // Use hex suffixes
+        6 => {
+            args.push(String::from("-l")); // Number of lines per output file
+            args.push(rng.gen_range(1..=1000).to_string());
+        }
+        7 => {
+            args.push(String::from("--filter"));
+            args.push(String::from("cat > /dev/null")); // Example filter command
+        }
+        8 => {
+            args.push(String::from("-t")); // Separator
+            args.push(String::from("\n")); // Newline as separator
+        }
+        9 => args.push(String::from("--verbose")), // Verbose
+        _ => (),
+    }
+
+    args.join(" ")
+}
+
+// Function to generate a random string of lines
+fn generate_random_lines(count: usize) -> String {
+    let mut rng = rand::thread_rng();
+    let mut lines = Vec::new();
+
+    for _ in 0..count {
+        lines.push(generate_random_string(rng.gen_range(1..=20)));
+    }
+
+    lines.join("\n")
+}
+
+fuzz_target!(|_data: &[u8]| {
+    let split_args = generate_split_args();
+    let mut args = vec![OsString::from("split")];
+    args.extend(split_args.split_whitespace().map(OsString::from));
+
+    let input_lines = generate_random_lines(10);
+
+    let rust_result = generate_and_run_uumain(&args, uumain, Some(&input_lines));
+
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false, Some(&input_lines)) {
+        Ok(result) => result,
+        Err(error_result) => {
+            eprintln!("Failed to run GNU command:");
+            eprintln!("Stderr: {}", error_result.stderr);
+            eprintln!("Exit Code: {}", error_result.exit_code);
+            CommandResult {
+                stdout: String::new(),
+                stderr: error_result.stderr,
+                exit_code: error_result.exit_code,
+            }
+        }
+    };
+
+    compare_result(
+        "split",
+        &format!("{:?}", &args[1..]),
+        None,
+        &rust_result,
+        &gnu_result,
+        false, // Set to true if you want to fail on stderr diff
+    );
+});
diff --git a/fuzz/fuzz_targets/fuzz_wc.rs b/fuzz/fuzz_targets/fuzz_wc.rs
new file mode 100644
index 00000000000..dc85bbc3541
--- /dev/null
+++ b/fuzz/fuzz_targets/fuzz_wc.rs
@@ -0,0 +1,99 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+// spell-checker:ignore parens
+
+#![no_main]
+use libfuzzer_sys::fuzz_target;
+use uu_wc::uumain;
+
+use rand::Rng;
+use std::ffi::OsString;
+
+mod fuzz_common;
+use crate::fuzz_common::{
+    compare_result, generate_and_run_uumain, generate_random_string, run_gnu_cmd, CommandResult,
+};
+static CMD_PATH: &str = "wc";
+
+fn generate_wc_args() -> String {
+    let mut rng = rand::thread_rng();
+    let arg_count = rng.gen_range(1..=6);
+    let mut args = Vec::new();
+
+    for _ in 0..arg_count {
+        // Introduce a chance to add invalid arguments
+        if rng.gen_bool(0.1) {
+            args.push(generate_random_string(rng.gen_range(1..=20)));
+        } else {
+            match rng.gen_range(0..=5) {
+                0 => args.push(String::from("-c")),
+                1 => args.push(String::from("-m")),
+                2 => args.push(String::from("-l")),
+                3 => args.push(String::from("-L")),
+                4 => args.push(String::from("-w")),
+                // TODO
+                5 => {
+                    args.push(String::from("--files0-from"));
+                    if rng.gen_bool(0.5) {
+                        args.push(generate_random_string(50)); // Longer invalid file name
+                    } else {
+                        args.push(generate_random_string(5));
+                    }
+                }
+                _ => (),
+            }
+        }
+    }
+
+    args.join(" ")
+}
+
+// Function to generate a random string of lines, including invalid ones
+fn generate_random_lines(count: usize) -> String {
+    let mut rng = rand::thread_rng();
+    let mut lines = Vec::new();
+
+    for _ in 0..count {
+        if rng.gen_bool(0.1) {
+            lines.push(generate_random_string(rng.gen_range(1000..=5000))); // Very long invalid line
+        } else {
+            lines.push(generate_random_string(rng.gen_range(1..=20)));
+        }
+    }
+
+    lines.join("\n")
+}
+
+fuzz_target!(|_data: &[u8]| {
+    let wc_args = generate_wc_args();
+    let mut args = vec![OsString::from("wc")];
+    args.extend(wc_args.split_whitespace().map(OsString::from));
+
+    let input_lines = generate_random_lines(10);
+
+    let rust_result = generate_and_run_uumain(&args, uumain, Some(&input_lines));
+    let gnu_result = match run_gnu_cmd(CMD_PATH, &args[1..], false, Some(&input_lines)) {
+        Ok(result) => result,
+        Err(error_result) => {
+            eprintln!("Failed to run GNU command:");
+            eprintln!("Stderr: {}", error_result.stderr);
+            eprintln!("Exit Code: {}", error_result.exit_code);
+            CommandResult {
+                stdout: String::new(),
+                stderr: error_result.stderr,
+                exit_code: error_result.exit_code,
+            }
+        }
+    };
+
+    compare_result(
+        "wc",
+        &format!("{:?}", &args[1..]),
+        Some(&input_lines),
+        &rust_result,
+        &gnu_result,
+        false, // Set to true if you want to fail on stderr diff
+    );
+});

From 6760d63539cd2bb8ac1e5ec345baea84a1c902a3 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Dorian=20P=C3=A9ron?= <dorianperon.i@gmail.com>
Date: Thu, 4 Jan 2024 16:51:30 +0100
Subject: [PATCH 340/429] ls: Fix clippy warning

---
 src/uu/ls/src/ls.rs | 11 +++++------
 1 file changed, 5 insertions(+), 6 deletions(-)

diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index d56929be802..0e9b2572289 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -709,17 +709,16 @@ fn extract_quoting_style(options: &clap::ArgMatches, show_control: bool) -> Quot
             }
         }
 
-        // By default, `ls` uses Literal quoting when
-        // writing to a non-terminal file descriptor
-        if !std::io::stdout().is_terminal() {
-            QuotingStyle::Literal { show_control }
-        } else {
-            // TODO: use environment variable if available
+        // By default, `ls` uses Shell escape quoting style when writing to a terminal file
+        // descriptor and Literal otherwise.
+        if std::io::stdout().is_terminal() {
             QuotingStyle::Shell {
                 escape: true,
                 always_quote: false,
                 show_control,
             }
+        } else {
+            QuotingStyle::Literal { show_control }
         }
     }
 }

From c23dbd3166a7839162bc833491ae0b13ce8e1829 Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Thu, 4 Jan 2024 19:03:30 +0100
Subject: [PATCH 341/429] fuzz: reset the exit code global variable after every
 test

---
 fuzz/fuzz_targets/fuzz_common.rs | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/fuzz/fuzz_targets/fuzz_common.rs b/fuzz/fuzz_targets/fuzz_common.rs
index 2a6cbdfded8..0201ffd89c2 100644
--- a/fuzz/fuzz_targets/fuzz_common.rs
+++ b/fuzz/fuzz_targets/fuzz_common.rs
@@ -125,6 +125,9 @@ where
         let out = s.spawn(|| read_from_fd(pipe_stdout_fds[0]));
         let err = s.spawn(|| read_from_fd(pipe_stderr_fds[0]));
         let status = uumain_function(args.to_owned().into_iter());
+        // Reset the exit code global variable in case we run another test after this one
+        // See https://github.com/uutils/coreutils/issues/5777
+        uucore::error::set_exit_code(0);
         io::stdout().flush().unwrap();
         io::stderr().flush().unwrap();
         unsafe {

From 932ea96cb6a942fc5d56a18d4f62f262951b8c07 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Fri, 5 Jan 2024 00:03:12 +0100
Subject: [PATCH 342/429] Update a GNU test error check - 
 tests/cp/fail-perm.sh

---
 util/build-gnu.sh | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 5f851a9e231..4209b771015 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -198,6 +198,10 @@ sed -i "s|grep '^#define HAVE_CAP 1' \$CONFIG_HEADER > /dev/null|true|"  tests/l
 sed -i 's|touch |/usr/bin/touch |' tests/cp/reflink-perm.sh tests/ls/block-size.sh tests/mv/update.sh tests/ls/ls-time.sh tests/stat/stat-nanoseconds.sh tests/misc/time-style.sh tests/test/test-N.sh tests/ls/abmon-align.sh
 sed -i 's|ln -|/usr/bin/ln -|' tests/cp/link-deref.sh
 
+# our messages are better
+sed -i "s|cannot stat 'symlink': Permission denied|not writing through dangling symlink 'symlink'|" tests/cp/fail-perm.sh
+sed -i "s|cp: target directory 'symlink': Permission denied|cp: 'symlink' is not a directory|" tests/cp/fail-perm.sh
+
 # Workaround https://github.com/uutils/coreutils/issues/5766
 # to transform an ERROR into FAIL
 sed -i 's|xargs mkdir )|xargs mkdir -p )|' tests/cp/link-heap.sh

From 9b3cc5437c3de57c1f1f28a130d92fb1671ef45a Mon Sep 17 00:00:00 2001
From: cre4ture <creature05@arcor.de>
Date: Fri, 5 Jan 2024 00:25:59 +0100
Subject: [PATCH 343/429] head: head_backwards for non-seekable files like
 /proc/* or fifos (named pipes) (#5732)

* implement head_backwards for non-seekable files like /proc/* or pipes

Signed-off-by: Ulrich Hornung <hornunguli@gmx.de>
---
 src/uu/head/src/head.rs    | 165 +++++++++++++++++++++++++------------
 tests/by-util/test_head.rs |  60 +++++++++++++-
 2 files changed, 170 insertions(+), 55 deletions(-)

diff --git a/src/uu/head/src/head.rs b/src/uu/head/src/head.rs
index 0f7a08d26f4..3f6fd218507 100644
--- a/src/uu/head/src/head.rs
+++ b/src/uu/head/src/head.rs
@@ -7,7 +7,10 @@
 
 use clap::{crate_version, Arg, ArgAction, ArgMatches, Command};
 use std::ffi::OsString;
+use std::fs::Metadata;
 use std::io::{self, BufWriter, ErrorKind, Read, Seek, SeekFrom, Write};
+#[cfg(not(target_os = "windows"))]
+use std::os::unix::fs::MetadataExt;
 use uucore::display::Quotable;
 use uucore::error::{FromIo, UResult, USimpleError};
 use uucore::line_ending::LineEnding;
@@ -243,42 +246,57 @@ fn read_n_lines(input: &mut impl std::io::BufRead, n: u64, separator: u8) -> std
     Ok(())
 }
 
-fn read_but_last_n_bytes(input: &mut impl std::io::BufRead, n: usize) -> std::io::Result<()> {
+fn catch_too_large_numbers_in_backwards_bytes_or_lines(n: u64) -> Option<usize> {
+    match usize::try_from(n) {
+        Ok(value) => Some(value),
+        Err(e) => {
+            show!(USimpleError::new(
+                1,
+                format!("{e}: number of -bytes or -lines is too large")
+            ));
+            None
+        }
+    }
+}
+
+fn read_but_last_n_bytes(input: &mut impl std::io::BufRead, n: u64) -> std::io::Result<()> {
     if n == 0 {
         //prints everything
         return read_n_bytes(input, std::u64::MAX);
     }
 
-    let stdout = std::io::stdout();
-    let mut stdout = stdout.lock();
+    if let Some(n) = catch_too_large_numbers_in_backwards_bytes_or_lines(n) {
+        let stdout = std::io::stdout();
+        let mut stdout = stdout.lock();
 
-    let mut ring_buffer = Vec::new();
+        let mut ring_buffer = Vec::new();
 
-    let mut buffer = [0u8; BUF_SIZE];
-    let mut total_read = 0;
+        let mut buffer = [0u8; BUF_SIZE];
+        let mut total_read = 0;
 
-    loop {
-        let read = match input.read(&mut buffer) {
-            Ok(0) => break,
-            Ok(read) => read,
-            Err(e) => match e.kind() {
-                ErrorKind::Interrupted => continue,
-                _ => return Err(e),
-            },
-        };
+        loop {
+            let read = match input.read(&mut buffer) {
+                Ok(0) => break,
+                Ok(read) => read,
+                Err(e) => match e.kind() {
+                    ErrorKind::Interrupted => continue,
+                    _ => return Err(e),
+                },
+            };
 
-        total_read += read;
+            total_read += read;
 
-        if total_read <= n {
-            // Fill the ring buffer without exceeding n bytes
-            let overflow = total_read - n;
-            ring_buffer.extend_from_slice(&buffer[..read - overflow]);
-        } else {
-            // Write the ring buffer and the part of the buffer that exceeds n
-            stdout.write_all(&ring_buffer)?;
-            stdout.write_all(&buffer[..read - n + ring_buffer.len()])?;
-            ring_buffer.clear();
-            ring_buffer.extend_from_slice(&buffer[read - n + ring_buffer.len()..read]);
+            if total_read <= n {
+                // Fill the ring buffer without exceeding n bytes
+                let overflow = total_read - n;
+                ring_buffer.extend_from_slice(&buffer[..read - overflow]);
+            } else {
+                // Write the ring buffer and the part of the buffer that exceeds n
+                stdout.write_all(&ring_buffer)?;
+                stdout.write_all(&buffer[..read - n + ring_buffer.len()])?;
+                ring_buffer.clear();
+                ring_buffer.extend_from_slice(&buffer[read - n + ring_buffer.len()..read]);
+            }
         }
     }
 
@@ -287,13 +305,15 @@ fn read_but_last_n_bytes(input: &mut impl std::io::BufRead, n: usize) -> std::io
 
 fn read_but_last_n_lines(
     input: impl std::io::BufRead,
-    n: usize,
+    n: u64,
     separator: u8,
 ) -> std::io::Result<()> {
-    let stdout = std::io::stdout();
-    let mut stdout = stdout.lock();
-    for bytes in take_all_but(lines(input, separator), n) {
-        stdout.write_all(&bytes?)?;
+    if let Some(n) = catch_too_large_numbers_in_backwards_bytes_or_lines(n) {
+        let stdout = std::io::stdout();
+        let mut stdout = stdout.lock();
+        for bytes in take_all_but(lines(input, separator), n) {
+            stdout.write_all(&bytes?)?;
+        }
     }
     Ok(())
 }
@@ -374,7 +394,63 @@ where
     }
 }
 
+fn is_seekable(input: &mut std::fs::File) -> bool {
+    let current_pos = input.stream_position();
+    current_pos.is_ok()
+        && input.seek(SeekFrom::End(0)).is_ok()
+        && input.seek(SeekFrom::Start(current_pos.unwrap())).is_ok()
+}
+
+fn sanity_limited_blksize(_st: &Metadata) -> u64 {
+    #[cfg(not(target_os = "windows"))]
+    {
+        const DEFAULT: u64 = 512;
+        const MAX: u64 = usize::MAX as u64 / 8 + 1;
+
+        let st_blksize: u64 = _st.blksize();
+        match st_blksize {
+            0 => DEFAULT,
+            1..=MAX => st_blksize,
+            _ => DEFAULT,
+        }
+    }
+
+    #[cfg(target_os = "windows")]
+    {
+        512
+    }
+}
+
 fn head_backwards_file(input: &mut std::fs::File, options: &HeadOptions) -> std::io::Result<()> {
+    let st = input.metadata()?;
+    let seekable = is_seekable(input);
+    let blksize_limit = sanity_limited_blksize(&st);
+    if !seekable || st.len() <= blksize_limit {
+        return head_backwards_without_seek_file(input, options);
+    }
+
+    head_backwards_on_seekable_file(input, options)
+}
+
+fn head_backwards_without_seek_file(
+    input: &mut std::fs::File,
+    options: &HeadOptions,
+) -> std::io::Result<()> {
+    let reader = &mut std::io::BufReader::with_capacity(BUF_SIZE, &*input);
+
+    match options.mode {
+        Mode::AllButLastBytes(n) => read_but_last_n_bytes(reader, n)?,
+        Mode::AllButLastLines(n) => read_but_last_n_lines(reader, n, options.line_ending.into())?,
+        _ => unreachable!(),
+    }
+
+    Ok(())
+}
+
+fn head_backwards_on_seekable_file(
+    input: &mut std::fs::File,
+    options: &HeadOptions,
+) -> std::io::Result<()> {
     match options.mode {
         Mode::AllButLastBytes(n) => {
             let size = input.metadata()?.len();
@@ -428,32 +504,13 @@ fn uu_head(options: &HeadOptions) -> UResult<()> {
                 let stdin = std::io::stdin();
                 let mut stdin = stdin.lock();
 
-                // Outputting "all-but-last" requires us to use a ring buffer with size n, so n
-                // must be converted from u64 to usize to fit in memory. If such conversion fails,
-                // it means the platform doesn't have enough memory to hold the buffer, so we fail.
-                if let Mode::AllButLastLines(n) | Mode::AllButLastBytes(n) = options.mode {
-                    if let Err(e) = usize::try_from(n) {
-                        show!(USimpleError::new(
-                            1,
-                            format!("{e}: number of bytes is too large")
-                        ));
-                        continue;
-                    };
-                };
-
                 match options.mode {
                     Mode::FirstBytes(n) => read_n_bytes(&mut stdin, n),
-                    // unwrap is guaranteed to succeed because we checked the value of n above
-                    Mode::AllButLastBytes(n) => {
-                        read_but_last_n_bytes(&mut stdin, n.try_into().unwrap())
-                    }
+                    Mode::AllButLastBytes(n) => read_but_last_n_bytes(&mut stdin, n),
                     Mode::FirstLines(n) => read_n_lines(&mut stdin, n, options.line_ending.into()),
-                    // unwrap is guaranteed to succeed because we checked the value of n above
-                    Mode::AllButLastLines(n) => read_but_last_n_lines(
-                        &mut stdin,
-                        n.try_into().unwrap(),
-                        options.line_ending.into(),
-                    ),
+                    Mode::AllButLastLines(n) => {
+                        read_but_last_n_lines(&mut stdin, n, options.line_ending.into())
+                    }
                 }
             }
             (name, false) => {
diff --git a/tests/by-util/test_head.rs b/tests/by-util/test_head.rs
index f536b26ae08..9cc4c1770ec 100644
--- a/tests/by-util/test_head.rs
+++ b/tests/by-util/test_head.rs
@@ -330,7 +330,7 @@ fn test_head_invalid_num() {
             new_ucmd!()
                 .args(&["-c", size])
                 .fails()
-                .stderr_is("head: out of range integral type conversion attempted: number of bytes is too large\n");
+                .stderr_is("head: out of range integral type conversion attempted: number of -bytes or -lines is too large\n");
         }
     }
     new_ucmd!()
@@ -378,3 +378,61 @@ fn test_presume_input_pipe_5_chars() {
         .run()
         .stdout_is_fixture("lorem_ipsum_5_chars.expected");
 }
+
+#[cfg(all(
+    not(target_os = "windows"),
+    not(target_os = "macos"),
+    not(target_os = "freebsd")
+))]
+#[test]
+fn test_read_backwards_bytes_proc_fs_version() {
+    let ts = TestScenario::new(util_name!());
+
+    let args = ["-c", "-1", "/proc/version"];
+    let result = ts.ucmd().args(&args).succeeds();
+    assert!(result.stdout().len() > 0);
+}
+
+#[cfg(all(
+    not(target_os = "windows"),
+    not(target_os = "macos"),
+    not(target_os = "freebsd")
+))]
+#[test]
+fn test_read_backwards_bytes_proc_fs_modules() {
+    let ts = TestScenario::new(util_name!());
+
+    let args = ["-c", "-1", "/proc/modules"];
+    let result = ts.ucmd().args(&args).succeeds();
+    assert!(result.stdout().len() > 0);
+}
+
+#[cfg(all(
+    not(target_os = "windows"),
+    not(target_os = "macos"),
+    not(target_os = "freebsd")
+))]
+#[test]
+fn test_read_backwards_lines_proc_fs_modules() {
+    let ts = TestScenario::new(util_name!());
+
+    let args = ["--lines", "-1", "/proc/modules"];
+    let result = ts.ucmd().args(&args).succeeds();
+    assert!(result.stdout().len() > 0);
+}
+
+#[cfg(all(
+    not(target_os = "windows"),
+    not(target_os = "macos"),
+    not(target_os = "freebsd")
+))]
+#[test]
+fn test_read_backwards_bytes_sys_kernel_profiling() {
+    let ts = TestScenario::new(util_name!());
+
+    let args = ["-c", "-1", "/sys/kernel/profiling"];
+    let result = ts.ucmd().args(&args).succeeds();
+    let stdout_str = result.stdout_str();
+    assert_eq!(stdout_str.len(), 1);
+    assert!(stdout_str == "0" || stdout_str == "1");
+}

From c58575edaaa208622077f4c30cf80645e06e1c90 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Dorian=20P=C3=A9ron?= <dorianperon.i@gmail.com>
Date: Fri, 5 Jan 2024 02:07:09 +0100
Subject: [PATCH 344/429] tests/ls: Add tests to ensure env var is used as a
 last resort

---
 tests/by-util/test_ls.rs | 65 ++++++++++++++++++++++++++++++++++++++++
 1 file changed, 65 insertions(+)

diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 72a303ef3dc..476704660d4 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -2622,6 +2622,71 @@ fn test_ls_quoting_style() {
     }
 }
 
+#[test]
+fn test_ls_quoting_style_env_var_default() {
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+    at.touch(at.plus_as_string("foo-1"));
+    at.touch(at.plus_as_string("bar-2"));
+
+    // If no quoting style argument is provided, the QUOTING_STYLE environment variable
+    // shall be used.
+
+    let correct_c = "\"bar-2\"\n\"foo-1\"";
+    scene
+        .ucmd()
+        .env("QUOTING_STYLE", "c")
+        .succeeds()
+        .stdout_only(format!("{correct_c}\n"));
+}
+
+#[test]
+fn test_ls_quoting_style_arg_overrides_env_var() {
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+    at.touch(at.plus_as_string("foo-1"));
+    at.touch(at.plus_as_string("bar-2"));
+
+    // The quoting style given by the env variable should be
+    // overriden by any escape style provided by argument.
+    for (arg, correct) in [
+        ("--quoting-style=literal", "foo-1"),
+        ("-N", "foo-1"),
+        ("--quoting-style=escape", "foo-1"),
+        ("-b", "foo-1"),
+        ("--quoting-style=shell-escape", "foo-1"),
+        ("--quoting-style=shell-escape-always", "'foo-1'"),
+        ("--quoting-style=shell", "foo-1"),
+        ("--quoting-style=shell-always", "'foo-1'"),
+    ] {
+        scene
+            .ucmd()
+            .env("QUOTING_STYLE", "c")
+            .arg("--hide-control-chars")
+            .arg(arg)
+            .arg("foo-1")
+            .succeeds()
+            .stdout_only(format!("{correct}\n"));
+    }
+
+    // Another loop to check for the C quoting style that is used as a default above.
+    for (arg, correct) in [
+        ("--quoting-style=c", "\"foo-1\""),
+        ("-Q", "\"foo-1\""),
+        ("--quote-name", "\"foo-1\""),
+    ] {
+        scene
+            .ucmd()
+            .env("QUOTING_STYLE", "literal")
+            .arg("--hide-control-chars")
+            .arg(arg)
+            .arg("foo-1")
+            .succeeds()
+            .stdout_only(format!("{correct}\n"));
+    }
+
+}
+
 #[test]
 fn test_ls_quoting_and_color() {
     let scene = TestScenario::new(util_name!());

From 9dca071b69a95b1c445ddd9243c5f1428da30edc Mon Sep 17 00:00:00 2001
From: Ikko Eltociear Ashimine <eltociear@gmail.com>
Date: Fri, 5 Jan 2024 15:30:23 +0900
Subject: [PATCH 345/429] Fix typo in signals.rs (#5781)

* Fix typo in signals.rs

occured -> occurred

* Remove "occurred" from spell-checker:ignore

---------

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 src/uucore/src/lib/features/signals.rs | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/uucore/src/lib/features/signals.rs b/src/uucore/src/lib/features/signals.rs
index a4c85647ba4..0c3f968d975 100644
--- a/src/uucore/src/lib/features/signals.rs
+++ b/src/uucore/src/lib/features/signals.rs
@@ -3,7 +3,7 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-// spell-checker:ignore (vars/api) fcntl setrlimit setitimer rubout pollable occured sysconf
+// spell-checker:ignore (vars/api) fcntl setrlimit setitimer rubout pollable sysconf
 // spell-checker:ignore (vars/signals) ABRT ALRM CHLD SEGV SIGABRT SIGALRM SIGBUS SIGCHLD SIGCONT SIGEMT SIGFPE SIGHUP SIGILL SIGINFO SIGINT SIGIO SIGIOT SIGKILL SIGPIPE SIGPROF SIGPWR SIGQUIT SIGSEGV SIGSTOP SIGSYS SIGTERM SIGTRAP SIGTSTP SIGTHR SIGTTIN SIGTTOU SIGURG SIGUSR SIGVTALRM SIGWINCH SIGXCPU SIGXFSZ STKFLT PWR THR TSTP TTIN TTOU VTALRM XCPU XFSZ SIGCLD SIGPOLL SIGWAITING SIGAIOCANCEL SIGLWP SIGFREEZE SIGTHAW SIGCANCEL SIGLOST SIGXRES SIGJVM SIGRTMIN SIGRT SIGRTMAX AIOCANCEL XRES RTMIN RTMAX
 #[cfg(unix)]
 use nix::errno::Errno;
@@ -207,7 +207,7 @@ pub static ALL_SIGNALS: [&str; 33] = [
      SIGPWR       19      power-fail restart
      SIGWINCH     20      window size change
      SIGURG       21      urgent socket condition
-     SIGPOLL      22      pollable event occured
+     SIGPOLL      22      pollable event occurred
      SIGIO        SIGPOLL socket I/O possible (SIGPOLL alias)
      SIGSTOP      23      stop (cannot be caught or ignored)
      SIGTSTP      24      user stop requested from tty

From e56682893f99878e73b230c3bf8b1283d9fe8e8f Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Fri, 5 Jan 2024 10:09:04 +0100
Subject: [PATCH 346/429] uucore: fix style in tests

- `Path::new()` returns a `&Path` and does not need to be dereferenced
- Some types can be deduced from the context and are well visible
  already (`parse_size_u128()` or `from_bytes()`)
---
 src/uucore/src/lib/features/backup_control.rs    |  6 +++---
 src/uucore/src/lib/features/fs.rs                |  8 ++++----
 src/uucore/src/lib/parser/parse_size.rs          | 16 ++++++++--------
 .../src/lib/parser/shortcut_value_parser.rs      |  2 +-
 4 files changed, 16 insertions(+), 16 deletions(-)

diff --git a/src/uucore/src/lib/features/backup_control.rs b/src/uucore/src/lib/features/backup_control.rs
index 86c7cd72b1d..fedbb375cb7 100644
--- a/src/uucore/src/lib/features/backup_control.rs
+++ b/src/uucore/src/lib/features/backup_control.rs
@@ -662,7 +662,7 @@ mod tests {
         let target = Path::new("data.txt");
         let suffix = String::from(".bak");
 
-        assert!(source_is_target_backup(&source, &target, &suffix));
+        assert!(source_is_target_backup(source, target, &suffix));
     }
 
     #[test]
@@ -671,7 +671,7 @@ mod tests {
         let target = Path::new("backup.txt");
         let suffix = String::from(".bak");
 
-        assert!(!source_is_target_backup(&source, &target, &suffix));
+        assert!(!source_is_target_backup(source, target, &suffix));
     }
 
     #[test]
@@ -680,6 +680,6 @@ mod tests {
         let target = Path::new("example");
         let suffix = String::from("~");
 
-        assert!(source_is_target_backup(&source, &target, &suffix));
+        assert!(source_is_target_backup(source, target, &suffix));
     }
 }
diff --git a/src/uucore/src/lib/features/fs.rs b/src/uucore/src/lib/features/fs.rs
index 41437c55468..6eb809e6d32 100644
--- a/src/uucore/src/lib/features/fs.rs
+++ b/src/uucore/src/lib/features/fs.rs
@@ -878,7 +878,7 @@ mod tests {
         let path1 = temp_file.path();
         let path2 = temp_file.path();
 
-        assert!(are_hardlinks_to_same_file(&path1, &path2));
+        assert!(are_hardlinks_to_same_file(path1, path2));
     }
 
     #[cfg(unix)]
@@ -893,7 +893,7 @@ mod tests {
         let path1 = temp_file1.path();
         let path2 = temp_file2.path();
 
-        assert!(!are_hardlinks_to_same_file(&path1, &path2));
+        assert!(!are_hardlinks_to_same_file(path1, path2));
     }
 
     #[cfg(unix)]
@@ -904,9 +904,9 @@ mod tests {
         let path1 = temp_file.path();
 
         let path2 = temp_file.path().with_extension("hardlink");
-        fs::hard_link(&path1, &path2).unwrap();
+        fs::hard_link(path1, &path2).unwrap();
 
-        assert!(are_hardlinks_to_same_file(&path1, &path2));
+        assert!(are_hardlinks_to_same_file(path1, &path2));
     }
 
     #[cfg(unix)]
diff --git a/src/uucore/src/lib/parser/parse_size.rs b/src/uucore/src/lib/parser/parse_size.rs
index 0a46ce3271b..163c8942fb2 100644
--- a/src/uucore/src/lib/parser/parse_size.rs
+++ b/src/uucore/src/lib/parser/parse_size.rs
@@ -424,23 +424,23 @@ mod tests {
 
         for &(c, exp) in &suffixes {
             let s = format!("2{c}B"); // KB
-            assert_eq!(Ok((2 * (1000_u128).pow(exp)) as u128), parse_size_u128(&s));
+            assert_eq!(Ok(2 * (1000_u128).pow(exp)), parse_size_u128(&s));
             let s = format!("2{c}"); // K
-            assert_eq!(Ok((2 * (1024_u128).pow(exp)) as u128), parse_size_u128(&s));
+            assert_eq!(Ok(2 * (1024_u128).pow(exp)), parse_size_u128(&s));
             let s = format!("2{c}iB"); // KiB
-            assert_eq!(Ok((2 * (1024_u128).pow(exp)) as u128), parse_size_u128(&s));
+            assert_eq!(Ok(2 * (1024_u128).pow(exp)), parse_size_u128(&s));
             let s = format!("2{}iB", c.to_lowercase()); // kiB
-            assert_eq!(Ok((2 * (1024_u128).pow(exp)) as u128), parse_size_u128(&s));
+            assert_eq!(Ok(2 * (1024_u128).pow(exp)), parse_size_u128(&s));
 
             // suffix only
             let s = format!("{c}B"); // KB
-            assert_eq!(Ok(((1000_u128).pow(exp)) as u128), parse_size_u128(&s));
+            assert_eq!(Ok((1000_u128).pow(exp)), parse_size_u128(&s));
             let s = format!("{c}"); // K
-            assert_eq!(Ok(((1024_u128).pow(exp)) as u128), parse_size_u128(&s));
+            assert_eq!(Ok((1024_u128).pow(exp)), parse_size_u128(&s));
             let s = format!("{c}iB"); // KiB
-            assert_eq!(Ok(((1024_u128).pow(exp)) as u128), parse_size_u128(&s));
+            assert_eq!(Ok((1024_u128).pow(exp)), parse_size_u128(&s));
             let s = format!("{}iB", c.to_lowercase()); // kiB
-            assert_eq!(Ok(((1024_u128).pow(exp)) as u128), parse_size_u128(&s));
+            assert_eq!(Ok((1024_u128).pow(exp)), parse_size_u128(&s));
         }
     }
 
diff --git a/src/uucore/src/lib/parser/shortcut_value_parser.rs b/src/uucore/src/lib/parser/shortcut_value_parser.rs
index 49bb2b62b71..2b94f9b75bc 100644
--- a/src/uucore/src/lib/parser/shortcut_value_parser.rs
+++ b/src/uucore/src/lib/parser/shortcut_value_parser.rs
@@ -163,7 +163,7 @@ mod tests {
         let parser = ShortcutValueParser::new(["abcd"]);
         let cmd = Command::new("cmd");
 
-        let result = parser.parse_ref(&cmd, None, OsStr::from_bytes(&[0xc3 as u8, 0x28 as u8]));
+        let result = parser.parse_ref(&cmd, None, OsStr::from_bytes(&[0xc3, 0x28]));
         assert_eq!(ErrorKind::InvalidUtf8, result.unwrap_err().kind());
     }
 }

From 4343ba6695d9de47a055ae411983029d61b6ea3e Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Fri, 5 Jan 2024 11:04:16 +0100
Subject: [PATCH 347/429] fuzz: fix file descriptor leak

---
 fuzz/fuzz_targets/fuzz_common.rs | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/fuzz/fuzz_targets/fuzz_common.rs b/fuzz/fuzz_targets/fuzz_common.rs
index 0201ffd89c2..f0de0b6052f 100644
--- a/fuzz/fuzz_targets/fuzz_common.rs
+++ b/fuzz/fuzz_targets/fuzz_common.rs
@@ -149,6 +149,10 @@ where
             exit_code: -1,
         };
     }
+    unsafe {
+        close(original_stdout_fd);
+        close(original_stderr_fd);
+    }
 
     // Restore the original stdin if it was modified
     if let Some(fd) = original_stdin_fd {

From 4c698d58e09dc7d46dc47f5b88e1726374939e8c Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 3 Jan 2024 23:43:02 +0100
Subject: [PATCH 348/429] mv: support the case mkdir a && mv a e/

---
 src/uu/mv/src/mv.rs      |  5 +++--
 tests/by-util/test_mv.rs | 13 +++++++++++++
 2 files changed, 16 insertions(+), 2 deletions(-)

diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index 855afcc1fdf..19a7c274fbe 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -334,10 +334,11 @@ fn handle_two_paths(source: &Path, target: &Path, opts: &Options) -> UResult<()>
         }
     }
 
-    let target_is_dir = target.is_dir();
+    let target_is_dir: bool = target.is_dir();
+    let source_is_dir: bool = source.is_dir();
 
     if path_ends_with_terminator(target)
-        && !target_is_dir
+        && (!target_is_dir && !source_is_dir)
         && !opts.no_target_dir
         && opts.update != UpdateMode::ReplaceIfOlder
     {
diff --git a/tests/by-util/test_mv.rs b/tests/by-util/test_mv.rs
index 4b923767b84..175b91e7dab 100644
--- a/tests/by-util/test_mv.rs
+++ b/tests/by-util/test_mv.rs
@@ -1556,6 +1556,19 @@ fn test_mv_dir_into_file_where_both_are_files() {
         .stderr_contains("mv: cannot stat 'a/': Not a directory");
 }
 
+#[test]
+fn test_mv_dir_into_path_slash() {
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+    at.mkdir("a");
+    scene.ucmd().arg("a").arg("e/").succeeds();
+    assert!(at.dir_exists("e"));
+    at.mkdir("b");
+    at.mkdir("f");
+    scene.ucmd().arg("b").arg("f/").succeeds();
+    assert!(at.dir_exists("f/b"));
+}
+
 // Todo:
 
 // $ at.touch a b

From 108dc4a0cddcabae16e009d7d9c71fdc05a40aac Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 4 Jan 2024 00:24:08 +0100
Subject: [PATCH 349/429] Move path_ends_with_terminator from mv into uucore

---
 src/uu/mv/src/mv.rs               | 24 ++++--------------------
 src/uucore/src/lib/features/fs.rs | 19 +++++++++++++++++++
 2 files changed, 23 insertions(+), 20 deletions(-)

diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index 19a7c274fbe..c95e54028da 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -23,7 +23,10 @@ use std::path::{Path, PathBuf};
 use uucore::backup_control::{self, source_is_target_backup};
 use uucore::display::Quotable;
 use uucore::error::{set_exit_code, FromIo, UResult, USimpleError, UUsageError};
-use uucore::fs::{are_hardlinks_or_one_way_symlink_to_same_file, are_hardlinks_to_same_file};
+use uucore::fs::{
+    are_hardlinks_or_one_way_symlink_to_same_file, are_hardlinks_to_same_file,
+    path_ends_with_terminator,
+};
 use uucore::update_control;
 // These are exposed for projects (e.g. nushell) that want to create an `Options` value, which
 // requires these enums
@@ -104,25 +107,6 @@ static OPT_VERBOSE: &str = "verbose";
 static OPT_PROGRESS: &str = "progress";
 static ARG_FILES: &str = "files";
 
-/// Returns true if the passed `path` ends with a path terminator.
-#[cfg(unix)]
-fn path_ends_with_terminator(path: &Path) -> bool {
-    use std::os::unix::prelude::OsStrExt;
-    path.as_os_str()
-        .as_bytes()
-        .last()
-        .map_or(false, |&byte| byte == b'/' || byte == b'\\')
-}
-
-#[cfg(windows)]
-fn path_ends_with_terminator(path: &Path) -> bool {
-    use std::os::windows::prelude::OsStrExt;
-    path.as_os_str()
-        .encode_wide()
-        .last()
-        .map_or(false, |wide| wide == b'/'.into() || wide == b'\\'.into())
-}
-
 #[uucore::main]
 pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     let mut app = uu_app();
diff --git a/src/uucore/src/lib/features/fs.rs b/src/uucore/src/lib/features/fs.rs
index 6eb809e6d32..7033646b63b 100644
--- a/src/uucore/src/lib/features/fs.rs
+++ b/src/uucore/src/lib/features/fs.rs
@@ -714,6 +714,25 @@ pub fn are_hardlinks_or_one_way_symlink_to_same_file(source: &Path, target: &Pat
     source_metadata.ino() == target_metadata.ino() && source_metadata.dev() == target_metadata.dev()
 }
 
+/// Returns true if the passed `path` ends with a path terminator.
+#[cfg(unix)]
+pub fn path_ends_with_terminator(path: &Path) -> bool {
+    use std::os::unix::prelude::OsStrExt;
+    path.as_os_str()
+        .as_bytes()
+        .last()
+        .map_or(false, |&byte| byte == b'/' || byte == b'\\')
+}
+
+#[cfg(windows)]
+pub fn path_ends_with_terminator(path: &Path) -> bool {
+    use std::os::windows::prelude::OsStrExt;
+    path.as_os_str()
+        .encode_wide()
+        .last()
+        .map_or(false, |wide| wide == b'/'.into() || wide == b'\\'.into())
+}
+
 #[cfg(test)]
 mod tests {
     // Note this useful idiom: importing names from outer (for mod tests) scope.

From cb27b9c9c35c133f2aae11dd71123c99ba32ccb8 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 4 Jan 2024 00:27:44 +0100
Subject: [PATCH 350/429] path_ends_with_terminator: rustdoc + unittest

---
 src/uucore/src/lib/features/fs.rs | 29 +++++++++++++++++++++++++++++
 1 file changed, 29 insertions(+)

diff --git a/src/uucore/src/lib/features/fs.rs b/src/uucore/src/lib/features/fs.rs
index 7033646b63b..c9eaa1e016b 100644
--- a/src/uucore/src/lib/features/fs.rs
+++ b/src/uucore/src/lib/features/fs.rs
@@ -715,7 +715,16 @@ pub fn are_hardlinks_or_one_way_symlink_to_same_file(source: &Path, target: &Pat
 }
 
 /// Returns true if the passed `path` ends with a path terminator.
+///
+/// This function examines the last character of the path to determine
+/// if it is a directory separator. It supports both Unix-style (`/`)
+/// and Windows-style (`\`) separators.
+///
+/// # Arguments
+///
+/// * `path` - A reference to the path to be checked.
 #[cfg(unix)]
+
 pub fn path_ends_with_terminator(path: &Path) -> bool {
     use std::os::unix::prelude::OsStrExt;
     path.as_os_str()
@@ -940,4 +949,24 @@ mod tests {
         assert_eq!(get_file_display(S_IFSOCK | 0o600), 's');
         assert_eq!(get_file_display(0o777), '?');
     }
+
+    #[test]
+    fn test_path_ends_with_terminator() {
+        // Path ends with a forward slash
+        assert!(path_ends_with_terminator(Path::new("/some/path/")));
+
+        // Path ends with a backslash
+        assert!(path_ends_with_terminator(Path::new("C:\\some\\path\\")));
+
+        // Path does not end with a terminator
+        assert!(!path_ends_with_terminator(Path::new("/some/path")));
+        assert!(!path_ends_with_terminator(Path::new("C:\\some\\path")));
+
+        // Empty path
+        assert!(!path_ends_with_terminator(Path::new("")));
+
+        // Root path
+        assert!(path_ends_with_terminator(Path::new("/")));
+        assert!(path_ends_with_terminator(Path::new("C:\\")));
+    }
 }

From aabf5fa577fc6cdc9b08a5cc92c0083ee53367c6 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Thu, 4 Jan 2024 00:41:54 +0100
Subject: [PATCH 351/429] cp: manages target with trailing '/'

---
 src/uu/cp/src/copydir.rs | 13 +++++++++++--
 src/uu/cp/src/cp.rs      |  8 ++++++--
 tests/by-util/test_cp.rs | 20 ++++++++++++++++++++
 util/build-gnu.sh        |  3 +++
 4 files changed, 40 insertions(+), 4 deletions(-)

diff --git a/src/uu/cp/src/copydir.rs b/src/uu/cp/src/copydir.rs
index a903ed2aaff..dd3fced53de 100644
--- a/src/uu/cp/src/copydir.rs
+++ b/src/uu/cp/src/copydir.rs
@@ -17,7 +17,9 @@ use std::path::{Path, PathBuf, StripPrefixError};
 use indicatif::ProgressBar;
 use uucore::display::Quotable;
 use uucore::error::UIoError;
-use uucore::fs::{canonicalize, FileInformation, MissingHandling, ResolveMode};
+use uucore::fs::{
+    canonicalize, path_ends_with_terminator, FileInformation, MissingHandling, ResolveMode,
+};
 use uucore::show;
 use uucore::show_error;
 use uucore::uio_error;
@@ -170,7 +172,14 @@ impl Entry {
         let mut descendant =
             get_local_to_root_parent(&source_absolute, context.root_parent.as_deref())?;
         if no_target_dir {
-            descendant = descendant.strip_prefix(context.root)?.to_path_buf();
+            let source_is_dir: bool = direntry.path().is_dir();
+            if path_ends_with_terminator(context.target) && source_is_dir {
+                if let Err(e) = std::fs::create_dir_all(context.target) {
+                    eprintln!("Failed to create directory: {}", e);
+                }
+            } else {
+                descendant = descendant.strip_prefix(context.root)?.to_path_buf();
+            }
         }
 
         let local_to_target = context.target.join(descendant);
diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index 332bb578512..8a4c5623ade 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -32,8 +32,8 @@ use platform::copy_on_write;
 use uucore::display::Quotable;
 use uucore::error::{set_exit_code, UClapError, UError, UResult, UUsageError};
 use uucore::fs::{
-    are_hardlinks_to_same_file, canonicalize, is_symlink_loop, paths_refer_to_same_file,
-    FileInformation, MissingHandling, ResolveMode,
+    are_hardlinks_to_same_file, canonicalize, is_symlink_loop, path_ends_with_terminator,
+    paths_refer_to_same_file, FileInformation, MissingHandling, ResolveMode,
 };
 use uucore::{backup_control, update_control};
 // These are exposed for projects (e.g. nushell) that want to create an `Options` value, which
@@ -1994,6 +1994,10 @@ fn copy_helper(
         fs::create_dir_all(parent)?;
     }
 
+    if path_ends_with_terminator(dest) && !dest.is_dir() {
+        return Err(Error::NotADirectory(dest.to_path_buf()));
+    }
+
     if source.as_os_str() == "/dev/null" {
         /* workaround a limitation of fs::copy
          * https://github.com/rust-lang/rust/issues/79390
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index d166243ed6e..cb6b7a8dce7 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -3681,3 +3681,23 @@ fn test_cp_seen_file() {
     assert!(at.plus("c").join("f").exists());
     assert!(at.plus("c").join("f.~1~").exists());
 }
+
+#[test]
+fn test_cp_path_ends_with_terminator() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+    at.mkdir("a");
+    ts.ucmd().arg("-r").arg("-T").arg("a").arg("e/").succeeds();
+}
+
+#[test]
+fn test_cp_no_such() {
+    let ts = TestScenario::new(util_name!());
+    let at = &ts.fixtures;
+    at.touch("b");
+    ts.ucmd()
+        .arg("b")
+        .arg("no-such/")
+        .fails()
+        .stderr_is("cp: 'no-such/' is not a directory\n");
+}
diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 4209b771015..915577c5584 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -206,6 +206,9 @@ sed -i "s|cp: target directory 'symlink': Permission denied|cp: 'symlink' is not
 # to transform an ERROR into FAIL
 sed -i 's|xargs mkdir )|xargs mkdir -p )|' tests/cp/link-heap.sh
 
+# Our message is a bit better
+sed -i "s|cannot create regular file 'no-such/': Not a directory|'no-such/' is not a directory|" tests/mv/trailing-slash.sh
+
 sed -i 's|cp |/usr/bin/cp |' tests/mv/hard-2.sh
 sed -i 's|paste |/usr/bin/paste |' tests/od/od-endian.sh
 sed -i 's|timeout |'"${SYSTEM_TIMEOUT}"' |' tests/tail/follow-stdin.sh

From e64a0b4a2637a5b84165acf729f41da98b6bb8cf Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Fri, 5 Jan 2024 10:11:35 +0100
Subject: [PATCH 352/429] Various fixes

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 src/uu/cp/src/copydir.rs          | 2 +-
 src/uu/mv/src/mv.rs               | 4 ++--
 src/uucore/src/lib/features/fs.rs | 1 -
 3 files changed, 3 insertions(+), 4 deletions(-)

diff --git a/src/uu/cp/src/copydir.rs b/src/uu/cp/src/copydir.rs
index dd3fced53de..7a9d797e81c 100644
--- a/src/uu/cp/src/copydir.rs
+++ b/src/uu/cp/src/copydir.rs
@@ -172,7 +172,7 @@ impl Entry {
         let mut descendant =
             get_local_to_root_parent(&source_absolute, context.root_parent.as_deref())?;
         if no_target_dir {
-            let source_is_dir: bool = direntry.path().is_dir();
+            let source_is_dir = direntry.path().is_dir();
             if path_ends_with_terminator(context.target) && source_is_dir {
                 if let Err(e) = std::fs::create_dir_all(context.target) {
                     eprintln!("Failed to create directory: {}", e);
diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index c95e54028da..223ac9119b6 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -318,8 +318,8 @@ fn handle_two_paths(source: &Path, target: &Path, opts: &Options) -> UResult<()>
         }
     }
 
-    let target_is_dir: bool = target.is_dir();
-    let source_is_dir: bool = source.is_dir();
+    let target_is_dir = target.is_dir();
+    let source_is_dir = source.is_dir();
 
     if path_ends_with_terminator(target)
         && (!target_is_dir && !source_is_dir)
diff --git a/src/uucore/src/lib/features/fs.rs b/src/uucore/src/lib/features/fs.rs
index c9eaa1e016b..20cc9e13de3 100644
--- a/src/uucore/src/lib/features/fs.rs
+++ b/src/uucore/src/lib/features/fs.rs
@@ -724,7 +724,6 @@ pub fn are_hardlinks_or_one_way_symlink_to_same_file(source: &Path, target: &Pat
 ///
 /// * `path` - A reference to the path to be checked.
 #[cfg(unix)]
-
 pub fn path_ends_with_terminator(path: &Path) -> bool {
     use std::os::unix::prelude::OsStrExt;
     path.as_os_str()

From 4372908e8487416b93836ba5d926b5cc441cd11a Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Dorian=20P=C3=A9ron?= <dorianperon.i@gmail.com>
Date: Fri, 5 Jan 2024 13:51:28 +0100
Subject: [PATCH 353/429] fix: cargo fmt + fix spelling mistake

---
 tests/by-util/test_ls.rs | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 476704660d4..0162b017078 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -2648,7 +2648,7 @@ fn test_ls_quoting_style_arg_overrides_env_var() {
     at.touch(at.plus_as_string("bar-2"));
 
     // The quoting style given by the env variable should be
-    // overriden by any escape style provided by argument.
+    // overridden by any escape style provided by argument.
     for (arg, correct) in [
         ("--quoting-style=literal", "foo-1"),
         ("-N", "foo-1"),
@@ -2684,7 +2684,6 @@ fn test_ls_quoting_style_arg_overrides_env_var() {
             .succeeds()
             .stdout_only(format!("{correct}\n"));
     }
-
 }
 
 #[test]

From 4c5326ffa34b2026d5437b8b5b118f5f67467f0a Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Fri, 5 Jan 2024 14:40:45 +0100
Subject: [PATCH 354/429] uucore/num_format: the default precision for %g is 6

---
 src/uucore/src/lib/features/format/num_format.rs | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index 51f3336cf61..4e60015f64a 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -286,7 +286,13 @@ impl Formatter for Float {
 
         let precision = match precision {
             Some(CanAsterisk::Fixed(x)) => x,
-            None => 0,
+            None => {
+                if matches!(variant, FloatVariant::Shortest) {
+                    6
+                } else {
+                    0
+                }
+            }
             Some(CanAsterisk::Asterisk) => return Err(FormatError::WrongSpecType),
         };
 

From f5179290a6d571229c977b6b7eede92b1492f1aa Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Fri, 5 Jan 2024 14:44:09 +0100
Subject: [PATCH 355/429] uucore/num_format: replace saturating_sub by regular
 subtraction

Using `saturating_sub()` before converting to `usize` gives a wrong
feeling of security as it looks like it ensures that the value will
never go negative. However, since it is applied to `i32`, it can, and
converting it to `usize` would go horribly wrong anyway.

By following the code flow, `exponent` cannot be greater than
`precision`, or the `else` block would not have been taken.  A plain
subtraction will give the same result and will at least panic in debug
mode.
---
 src/uucore/src/lib/features/format/num_format.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index 4e60015f64a..dce39641d8c 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -425,7 +425,7 @@ fn format_float_shortest(
         //  - The precision works differently and specifies the total number
         //    of digits instead of the digits in the fractional part.
         //  - If we don't force the decimal, '0' and `.` are trimmed.
-        let decimal_places = (precision as i32).saturating_sub(exponent) as usize;
+        let decimal_places = (precision as i32 - exponent) as usize;
         let mut formatted = if decimal_places == 0 && force_decimal == ForceDecimal::Yes {
             format!("{f:.0}.")
         } else {

From 32f0256d7d974ba8b845d0dae3bc82e3437767a9 Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Fri, 5 Jan 2024 14:49:09 +0100
Subject: [PATCH 356/429] =?UTF-8?q?uucore/num=5Fformat:=20properly=20displ?=
 =?UTF-8?q?ay=2010=E1=B5=96=20where=20p=20is=20the=20precision?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`seq --format %.2g 10 10` would display `1` because the precision would
not allow room for the decimal point, and the `0` in `10` would be
trimmed as an insignificant trailing `0`.

This has been fixed by only trimming trailing `0` in the presence of a
decimal point.
---
 .../src/lib/features/format/num_format.rs     | 37 ++++++++++++++-----
 tests/by-util/test_seq.rs                     | 20 ++++++++++
 2 files changed, 48 insertions(+), 9 deletions(-)

diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index dce39641d8c..60a3a404a8e 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -411,7 +411,7 @@ fn format_float_shortest(
         let mut normalized = format!("{normalized:.*}", precision);
 
         if force_decimal == ForceDecimal::No {
-            strip_zeros_and_dot(&mut normalized);
+            strip_fractional_zeroes_and_dot(&mut normalized);
         }
 
         let exp_char = match case {
@@ -424,7 +424,8 @@ fn format_float_shortest(
         // Decimal-ish notation with a few differences:
         //  - The precision works differently and specifies the total number
         //    of digits instead of the digits in the fractional part.
-        //  - If we don't force the decimal, '0' and `.` are trimmed.
+        //  - If we don't force the decimal, `.` and trailing `0` in the fractional part
+        //    are trimmed.
         let decimal_places = (precision as i32 - exponent) as usize;
         let mut formatted = if decimal_places == 0 && force_decimal == ForceDecimal::Yes {
             format!("{f:.0}.")
@@ -433,7 +434,7 @@ fn format_float_shortest(
         };
 
         if force_decimal == ForceDecimal::No {
-            strip_zeros_and_dot(&mut formatted);
+            strip_fractional_zeroes_and_dot(&mut formatted);
         }
 
         formatted
@@ -469,12 +470,16 @@ fn format_float_hexadecimal(
     s
 }
 
-fn strip_zeros_and_dot(s: &mut String) {
-    while s.ends_with('0') {
-        s.pop();
-    }
-    if s.ends_with('.') {
-        s.pop();
+fn strip_fractional_zeroes_and_dot(s: &mut String) {
+    let mut trim_to = s.len();
+    for (pos, c) in s.char_indices().rev() {
+        if pos + c.len_utf8() == trim_to && (c == '0' || c == '.') {
+            trim_to = pos;
+        }
+        if c == '.' {
+            s.truncate(trim_to);
+            break;
+        }
     }
 }
 
@@ -580,4 +585,18 @@ mod test {
         assert_eq!(f(1000000.0), "1.e+06");
         assert_eq!(f(99999999.0), "1.e+08");
     }
+
+    #[test]
+    fn strip_insignificant_end() {
+        use super::strip_fractional_zeroes_and_dot;
+        let f = |s| {
+            let mut s = String::from(s);
+            strip_fractional_zeroes_and_dot(&mut s);
+            s
+        };
+        assert_eq!(&f("1000"), "1000");
+        assert_eq!(&f("1000."), "1000");
+        assert_eq!(&f("1000.02030"), "1000.0203");
+        assert_eq!(&f("1000.00000"), "1000");
+    }
 }
diff --git a/tests/by-util/test_seq.rs b/tests/by-util/test_seq.rs
index da28181eb61..4a3286960b9 100644
--- a/tests/by-util/test_seq.rs
+++ b/tests/by-util/test_seq.rs
@@ -766,3 +766,23 @@ fn test_invalid_zero_increment_value() {
         .no_stdout()
         .usage_error("invalid Zero increment value: '0'");
 }
+
+#[test]
+fn test_power_of_ten_display() {
+    new_ucmd!()
+        .args(&["-f", "%.2g", "10", "10"])
+        .succeeds()
+        .stdout_only("10\n");
+}
+
+#[test]
+fn test_default_g_precision() {
+    new_ucmd!()
+        .args(&["-f", "%010g", "1e5", "1e5"])
+        .succeeds()
+        .stdout_only("0000100000\n");
+    new_ucmd!()
+        .args(&["-f", "%010g", "1e6", "1e6"])
+        .succeeds()
+        .stdout_only("000001e+06\n");
+}

From 5de030f119791a873b5a6bfb990c8e1c049aa4d7 Mon Sep 17 00:00:00 2001
From: Michel Lind <salimma@fedoraproject.org>
Date: Fri, 5 Jan 2024 22:20:59 -0600
Subject: [PATCH 357/429] uuhelp_parser: add links to homepage and repo

When viewing the crate right now, apart from via looking at the dependencies
it's hard to find the associated project and repository.

Add the missing info.

Signed-off-by: Michel Lind <salimma@fedoraproject.org>
---
 src/uuhelp_parser/Cargo.toml | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/src/uuhelp_parser/Cargo.toml b/src/uuhelp_parser/Cargo.toml
index c07bce63160..cbf049f9dba 100644
--- a/src/uuhelp_parser/Cargo.toml
+++ b/src/uuhelp_parser/Cargo.toml
@@ -5,3 +5,6 @@ version = "0.0.23"
 edition = "2021"
 license = "MIT"
 description = "A collection of functions to parse the markdown code of help files"
+
+homepage = "https://github.com/uutils/coreutils"
+repository = "https://github.com/uutils/coreutils/tree/main/src/uuhelp_parser"

From 9f4330f94cc471d880df7d9089ee1105b27fd321 Mon Sep 17 00:00:00 2001
From: Fabrice Fontaine <fontaine.fabrice@gmail.com>
Date: Sat, 6 Jan 2024 10:26:54 +0100
Subject: [PATCH 358/429] uucore: add support for sparc64

Add support for sparc64 in uucore to avoid the following build failure
with nushell:

error[E0308]: mismatched types
   --> /home/autobuild/autobuild/instance-7/output-1/build/nushell-0.85.0/VENDOR/uucore/src/lib/features/fs.rs:121:16
    |
111 |     pub fn number_of_links(&self) -> u64 {
    |                                      --- expected `u64` because of return type
...
121 |         return self.0.st_nlink;
    |                ^^^^^^^^^^^^^^^ expected `u64`, found `u32`
    |
help: you can convert a `u32` to a `u64`
    |
121 |         return self.0.st_nlink.into();
    |                               +++++++

For more information about this error, try `rustc --explain E0308`.
error: could not compile `uucore` (lib) due to previous error

Fixes:
 - http://autobuild.buildroot.org/results/f9f0287a8e39c65895014ca513ed25071f020add

Signed-off-by: Fabrice Fontaine <fontaine.fabrice@gmail.com>
---
 src/uucore/src/lib/features/fs.rs | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/src/uucore/src/lib/features/fs.rs b/src/uucore/src/lib/features/fs.rs
index 20cc9e13de3..3b9170bc309 100644
--- a/src/uucore/src/lib/features/fs.rs
+++ b/src/uucore/src/lib/features/fs.rs
@@ -121,6 +121,7 @@ impl FileInformation {
             not(target_arch = "aarch64"),
             not(target_arch = "riscv64"),
             not(target_arch = "loongarch64"),
+            not(target_arch = "sparc64"),
             target_pointer_width = "64"
         ))]
         return self.0.st_nlink;
@@ -137,6 +138,7 @@ impl FileInformation {
                 target_arch = "aarch64",
                 target_arch = "riscv64",
                 target_arch = "loongarch64",
+                target_arch = "sparc64",
                 not(target_pointer_width = "64")
             )
         ))]

From 247f2e55bdd5a6da3d34604eb7033fbd7df69b66 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 6 Jan 2024 16:54:29 +0100
Subject: [PATCH 359/429] seq: adjust some error messages. GNU's are better
 (#5798)

* seq: adjust some error messages. GNU's are better
tested by tests/seq/seq.pl

* uucore: remove todo

---------

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 src/uucore/src/lib/features/format/mod.rs | 23 ++++++++++++++++-------
 tests/by-util/test_seq.rs                 | 14 ++++++++++++++
 2 files changed, 30 insertions(+), 7 deletions(-)

diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index d213d0359cf..4d30753d610 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -57,8 +57,8 @@ pub enum FormatError {
     IoError(std::io::Error),
     NoMoreArguments,
     InvalidArgument(FormatArgument),
-    TooManySpecs,
-    NeedAtLeastOneSpec,
+    TooManySpecs(Vec<u8>),
+    NeedAtLeastOneSpec(Vec<u8>),
     WrongSpecType,
 }
 
@@ -79,9 +79,16 @@ impl Display for FormatError {
                 "%{}: invalid conversion specification",
                 String::from_utf8_lossy(s)
             ),
-            // TODO: The next two should print the spec as well
-            Self::TooManySpecs => write!(f, "format has too many % directives"),
-            Self::NeedAtLeastOneSpec => write!(f, "format has no % directive"),
+            Self::TooManySpecs(s) => write!(
+                f,
+                "format '{}' has too many % directives",
+                String::from_utf8_lossy(s)
+            ),
+            Self::NeedAtLeastOneSpec(s) => write!(
+                f,
+                "format '{}' has no % directive",
+                String::from_utf8_lossy(s)
+            ),
             // TODO: Error message below needs some work
             Self::WrongSpecType => write!(f, "wrong % directive type was given"),
             Self::IoError(_) => write!(f, "io error"),
@@ -303,7 +310,9 @@ impl<F: Formatter> Format<F> {
         }
 
         let Some(spec) = spec else {
-            return Err(FormatError::NeedAtLeastOneSpec);
+            return Err(FormatError::NeedAtLeastOneSpec(
+                format_string.as_ref().to_vec(),
+            ));
         };
 
         let formatter = F::try_from_spec(spec)?;
@@ -312,7 +321,7 @@ impl<F: Formatter> Format<F> {
         for item in &mut iter {
             match item? {
                 FormatItem::Spec(_) => {
-                    return Err(FormatError::TooManySpecs);
+                    return Err(FormatError::TooManySpecs(format_string.as_ref().to_vec()));
                 }
                 FormatItem::Char(c) => suffix.push(c),
             }
diff --git a/tests/by-util/test_seq.rs b/tests/by-util/test_seq.rs
index da28181eb61..9b0f9acea6d 100644
--- a/tests/by-util/test_seq.rs
+++ b/tests/by-util/test_seq.rs
@@ -766,3 +766,17 @@ fn test_invalid_zero_increment_value() {
         .no_stdout()
         .usage_error("invalid Zero increment value: '0'");
 }
+
+#[test]
+fn test_invalid_format() {
+    new_ucmd!()
+        .args(&["-f", "%%g", "1"])
+        .fails()
+        .no_stdout()
+        .stderr_contains("format '%%g' has no % directive");
+    new_ucmd!()
+        .args(&["-f", "%g%g", "1"])
+        .fails()
+        .no_stdout()
+        .stderr_contains("format '%g%g' has too many % directives");
+}

From c867d6bfb1695721f1093ce967ebc21fbd847b74 Mon Sep 17 00:00:00 2001
From: Kostiantyn Hryshchuk <statheres@gmail.com>
Date: Sat, 6 Jan 2024 22:50:21 +0100
Subject: [PATCH 360/429] shred: implemented "--remove" arg (#5790)

---
 src/uu/shred/src/shred.rs   | 105 +++++++++++++++++++++++++++---------
 tests/by-util/test_shred.rs |  77 ++++++++++++++++++++++++++
 2 files changed, 158 insertions(+), 24 deletions(-)

diff --git a/src/uu/shred/src/shred.rs b/src/uu/shred/src/shred.rs
index a77bfe5e134..b142e2e94e0 100644
--- a/src/uu/shred/src/shred.rs
+++ b/src/uu/shred/src/shred.rs
@@ -28,10 +28,17 @@ pub mod options {
     pub const FILE: &str = "file";
     pub const ITERATIONS: &str = "iterations";
     pub const SIZE: &str = "size";
+    pub const WIPESYNC: &str = "u";
     pub const REMOVE: &str = "remove";
     pub const VERBOSE: &str = "verbose";
     pub const EXACT: &str = "exact";
     pub const ZERO: &str = "zero";
+
+    pub mod remove {
+        pub const UNLINK: &str = "unlink";
+        pub const WIPE: &str = "wipe";
+        pub const WIPESYNC: &str = "wipesync";
+    }
 }
 
 // This block size seems to match GNU (2^16 = 65536)
@@ -81,6 +88,14 @@ enum PassType {
     Random,
 }
 
+#[derive(PartialEq, Clone, Copy)]
+enum RemoveMethod {
+    None,     // Default method. Only obfuscate the file data
+    Unlink,   // The same as 'None' + unlink the file
+    Wipe,     // The same as 'Unlink' + obfuscate the file name before unlink
+    WipeSync, // The same as 'Wipe' sync the file name changes
+}
+
 /// Iterates over all possible filenames of a certain length using NAME_CHARSET as an alphabet
 struct FilenameIter {
     // Store the indices of the letters of our filename in NAME_CHARSET
@@ -219,17 +234,25 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         None => unreachable!(),
     };
 
-    // TODO: implement --remove HOW
-    //       The optional HOW parameter indicates how to remove a directory entry:
-    //         - 'unlink' => use a standard unlink call.
-    //         - 'wipe' => also first obfuscate bytes in the name.
-    //         - 'wipesync' => also sync each obfuscated byte to disk.
-    //       The default mode is 'wipesync', but note it can be expensive.
-
     // TODO: implement --random-source
 
+    let remove_method = if matches.get_flag(options::WIPESYNC) {
+        RemoveMethod::WipeSync
+    } else if matches.contains_id(options::REMOVE) {
+        match matches
+            .get_one::<String>(options::REMOVE)
+            .map(AsRef::as_ref)
+        {
+            Some(options::remove::UNLINK) => RemoveMethod::Unlink,
+            Some(options::remove::WIPE) => RemoveMethod::Wipe,
+            Some(options::remove::WIPESYNC) => RemoveMethod::WipeSync,
+            _ => unreachable!("should be caught by clap"),
+        }
+    } else {
+        RemoveMethod::None
+    };
+
     let force = matches.get_flag(options::FORCE);
-    let remove = matches.get_flag(options::REMOVE);
     let size_arg = matches
         .get_one::<String>(options::SIZE)
         .map(|s| s.to_string());
@@ -240,7 +263,14 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
 
     for path_str in matches.get_many::<String>(options::FILE).unwrap() {
         show_if_err!(wipe_file(
-            path_str, iterations, remove, size, exact, zero, verbose, force,
+            path_str,
+            iterations,
+            remove_method,
+            size,
+            exact,
+            zero,
+            verbose,
+            force,
         ));
     }
     Ok(())
@@ -276,12 +306,26 @@ pub fn uu_app() -> Command {
                 .help("shred this many bytes (suffixes like K, M, G accepted)"),
         )
         .arg(
-            Arg::new(options::REMOVE)
+            Arg::new(options::WIPESYNC)
                 .short('u')
-                .long(options::REMOVE)
-                .help("truncate and remove file after overwriting;  See below")
+                .help("deallocate and remove file after overwriting")
                 .action(ArgAction::SetTrue),
         )
+        .arg(
+            Arg::new(options::REMOVE)
+                .long(options::REMOVE)
+                .value_name("HOW")
+                .value_parser([
+                    options::remove::UNLINK,
+                    options::remove::WIPE,
+                    options::remove::WIPESYNC,
+                ])
+                .num_args(0..=1)
+                .require_equals(true)
+                .default_missing_value(options::remove::WIPESYNC)
+                .help("like -u but give control on HOW to delete;  See below")
+                .action(ArgAction::Set),
+        )
         .arg(
             Arg::new(options::VERBOSE)
                 .long(options::VERBOSE)
@@ -340,7 +384,7 @@ fn pass_name(pass_type: &PassType) -> String {
 fn wipe_file(
     path_str: &str,
     n_passes: usize,
-    remove: bool,
+    remove_method: RemoveMethod,
     size: Option<u64>,
     exact: bool,
     zero: bool,
@@ -457,8 +501,8 @@ fn wipe_file(
             .map_err_context(|| format!("{}: File write pass failed", path.maybe_quote())));
     }
 
-    if remove {
-        do_remove(path, path_str, verbose)
+    if remove_method != RemoveMethod::None {
+        do_remove(path, path_str, verbose, remove_method)
             .map_err_context(|| format!("{}: failed to remove file", path.maybe_quote()))?;
     }
     Ok(())
@@ -501,7 +545,7 @@ fn get_file_size(path: &Path) -> Result<u64, io::Error> {
 
 // Repeatedly renames the file with strings of decreasing length (most likely all 0s)
 // Return the path of the file after its last renaming or None if error
-fn wipe_name(orig_path: &Path, verbose: bool) -> Option<PathBuf> {
+fn wipe_name(orig_path: &Path, verbose: bool, remove_method: RemoveMethod) -> Option<PathBuf> {
     let file_name_len = orig_path.file_name().unwrap().to_str().unwrap().len();
 
     let mut last_path = PathBuf::from(orig_path);
@@ -526,12 +570,14 @@ fn wipe_name(orig_path: &Path, verbose: bool) -> Option<PathBuf> {
                         );
                     }
 
-                    // Sync every file rename
-                    let new_file = OpenOptions::new()
-                        .write(true)
-                        .open(new_path.clone())
-                        .expect("Failed to open renamed file for syncing");
-                    new_file.sync_all().expect("Failed to sync renamed file");
+                    if remove_method == RemoveMethod::WipeSync {
+                        // Sync every file rename
+                        let new_file = OpenOptions::new()
+                            .write(true)
+                            .open(new_path.clone())
+                            .expect("Failed to open renamed file for syncing");
+                        new_file.sync_all().expect("Failed to sync renamed file");
+                    }
 
                     last_path = new_path;
                     break;
@@ -552,12 +598,23 @@ fn wipe_name(orig_path: &Path, verbose: bool) -> Option<PathBuf> {
     Some(last_path)
 }
 
-fn do_remove(path: &Path, orig_filename: &str, verbose: bool) -> Result<(), io::Error> {
+fn do_remove(
+    path: &Path,
+    orig_filename: &str,
+    verbose: bool,
+    remove_method: RemoveMethod,
+) -> Result<(), io::Error> {
     if verbose {
         show_error!("{}: removing", orig_filename.maybe_quote());
     }
 
-    if let Some(rp) = wipe_name(path, verbose) {
+    let remove_path = if remove_method == RemoveMethod::Unlink {
+        Some(path.with_file_name(orig_filename))
+    } else {
+        wipe_name(path, verbose, remove_method)
+    };
+
+    if let Some(rp) = remove_path {
         fs::remove_file(rp)?;
     }
 
diff --git a/tests/by-util/test_shred.rs b/tests/by-util/test_shred.rs
index 83d2890ed0b..d5de7882f57 100644
--- a/tests/by-util/test_shred.rs
+++ b/tests/by-util/test_shred.rs
@@ -2,6 +2,9 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
+
+// spell-checker:ignore wipesync
+
 use crate::common::util::TestScenario;
 
 #[test]
@@ -9,8 +12,82 @@ fn test_invalid_arg() {
     new_ucmd!().arg("--definitely-invalid").fails().code_is(1);
 }
 
+#[test]
+fn test_invalid_remove_arg() {
+    new_ucmd!().arg("--remove=unknown").fails().code_is(1);
+}
+
+#[test]
+fn test_shred() {
+    let (at, mut ucmd) = at_and_ucmd!();
+
+    let file = "test_shred";
+    let file_original_content = "test_shred file content";
+
+    at.write(file, file_original_content);
+
+    ucmd.arg(file).succeeds();
+
+    // File exists
+    assert!(at.file_exists(file));
+    // File is obfuscated
+    assert!(at.read_bytes(file) != file_original_content.as_bytes());
+}
+
 #[test]
 fn test_shred_remove() {
+    let (at, mut ucmd) = at_and_ucmd!();
+
+    let file = "test_shred_remove";
+    at.touch(file);
+
+    ucmd.arg("--remove").arg(file).succeeds();
+
+    // File was deleted
+    assert!(!at.file_exists(file));
+}
+
+#[test]
+fn test_shred_remove_unlink() {
+    let (at, mut ucmd) = at_and_ucmd!();
+
+    let file = "test_shred_remove_unlink";
+    at.touch(file);
+
+    ucmd.arg("--remove=unlink").arg(file).succeeds();
+
+    // File was deleted
+    assert!(!at.file_exists(file));
+}
+
+#[test]
+fn test_shred_remove_wipe() {
+    let (at, mut ucmd) = at_and_ucmd!();
+
+    let file = "test_shred_remove_wipe";
+    at.touch(file);
+
+    ucmd.arg("--remove=wipe").arg(file).succeeds();
+
+    // File was deleted
+    assert!(!at.file_exists(file));
+}
+
+#[test]
+fn test_shred_remove_wipesync() {
+    let (at, mut ucmd) = at_and_ucmd!();
+
+    let file = "test_shred_remove_wipesync";
+    at.touch(file);
+
+    ucmd.arg("--remove=wipesync").arg(file).succeeds();
+
+    // File was deleted
+    assert!(!at.file_exists(file));
+}
+
+#[test]
+fn test_shred_u() {
     let scene = TestScenario::new(util_name!());
     let at = &scene.fixtures;
 

From 724305e64f56b2ef7f469eb99f7282d19fbd3c41 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 6 Jan 2024 22:57:48 +0100
Subject: [PATCH 361/429] Remove the tests/cp/link-heap.sh workaround

No longer needed since github.com/uutils/coreutils/pull/5789 landed
---
 util/build-gnu.sh | 4 ----
 1 file changed, 4 deletions(-)

diff --git a/util/build-gnu.sh b/util/build-gnu.sh
index 915577c5584..9fdb3079d9d 100755
--- a/util/build-gnu.sh
+++ b/util/build-gnu.sh
@@ -202,10 +202,6 @@ sed -i 's|ln -|/usr/bin/ln -|' tests/cp/link-deref.sh
 sed -i "s|cannot stat 'symlink': Permission denied|not writing through dangling symlink 'symlink'|" tests/cp/fail-perm.sh
 sed -i "s|cp: target directory 'symlink': Permission denied|cp: 'symlink' is not a directory|" tests/cp/fail-perm.sh
 
-# Workaround https://github.com/uutils/coreutils/issues/5766
-# to transform an ERROR into FAIL
-sed -i 's|xargs mkdir )|xargs mkdir -p )|' tests/cp/link-heap.sh
-
 # Our message is a bit better
 sed -i "s|cannot create regular file 'no-such/': Not a directory|'no-such/' is not a directory|" tests/mv/trailing-slash.sh
 

From f612546ff711784b551b4a2a43069cb14830035b Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Sun, 7 Jan 2024 15:21:27 +0000
Subject: [PATCH 362/429] chore(deps): update rust crate libc to 0.2.152

---
 Cargo.lock | 4 ++--
 Cargo.toml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index ee403d92f92..9190d1be352 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1185,9 +1185,9 @@ checksum = "830d08ce1d1d941e6b30645f1a0eb5643013d835ce3779a5fc208261dbe10f55"
 
 [[package]]
 name = "libc"
-version = "0.2.151"
+version = "0.2.152"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "302d7ab3130588088d277783b1e2d2e10c9e9e4a16dd9050e6ec93fb3e7048f4"
+checksum = "13e3bf6590cbc649f4d1a3eefc9d5d6eb746f5200ffb04e5e142700b8faa56e7"
 
 [[package]]
 name = "libloading"
diff --git a/Cargo.toml b/Cargo.toml
index 3fc1e23cbe2..f45d0b2f4e9 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -288,7 +288,7 @@ half = "2.3"
 hostname = "0.3"
 indicatif = "0.17"
 itertools = "0.12.0"
-libc = "0.2.151"
+libc = "0.2.152"
 lscolors = { version = "0.16.0", default-features = false, features = [
   "gnu_legacy",
 ] }

From 8c1fc8b28743090f06aff52b132dfeacf1f2339d Mon Sep 17 00:00:00 2001
From: D9nni <lungudaniel31@gmail.com>
Date: Sun, 7 Jan 2024 21:43:31 +0200
Subject: [PATCH 363/429] Added --raw argument, with error for multiple files

---
 src/uu/cksum/src/cksum.rs | 55 ++++++++++++++++++++++++++++++++++++---
 1 file changed, 51 insertions(+), 4 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index e8d7da60e41..df8fdb5ea09 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -8,11 +8,13 @@ use clap::{crate_version, value_parser, Arg, ArgAction, Command};
 use hex::encode;
 use std::ffi::OsStr;
 use std::fs::File;
-use std::io::{self, stdin, BufReader, Read};
+use std::io::{self, stdin, stdout, BufReader, Read, Write};
 use std::iter;
 use std::path::Path;
+use std::error::Error;
+use std::fmt::Display;
 use uucore::{
-    error::{FromIo, UResult},
+    error::{FromIo, UResult, UError},
     format_usage, help_about, help_section, help_usage,
     sum::{
         div_ceil, Blake2b, Digest, DigestWriter, Md5, Sha1, Sha224, Sha256, Sha384, Sha512, Sm3,
@@ -36,6 +38,32 @@ const ALGORITHM_OPTIONS_SHA512: &str = "sha512";
 const ALGORITHM_OPTIONS_BLAKE2B: &str = "blake2b";
 const ALGORITHM_OPTIONS_SM3: &str = "sm3";
 
+#[derive(Debug)]
+enum CkSumError {
+    RawMultipleFiles,
+}
+
+impl UError for CkSumError {
+    fn code(&self) -> i32 {
+        match self {
+            Self::RawMultipleFiles => 1,
+        }
+    }
+}
+
+impl Error for CkSumError {
+}
+
+impl Display for CkSumError {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        match self {
+            Self::RawMultipleFiles => {
+                write!(f, "the --raw option is not supported with multiple files")
+            }
+        }
+    }
+}
+
 fn detect_algo(
     program: &str,
     length: Option<usize>,
@@ -110,6 +138,7 @@ struct Options {
     output_bits: usize,
     untagged: bool,
     length: Option<usize>,
+    raw: bool,
 }
 
 /// Calculate checksum
@@ -123,7 +152,12 @@ fn cksum<'a, I>(mut options: Options, files: I) -> UResult<()>
 where
     I: Iterator<Item = &'a OsStr>,
 {
-    for filename in files {
+    let files_vec:Vec<_> = files.collect();
+    if options.raw && files_vec.len() > 1 {
+        return Err(Box::new(CkSumError::RawMultipleFiles));
+    }
+
+    for filename in files_vec {
         let filename = Path::new(filename);
         let stdin_buf;
         let file_buf;
@@ -140,7 +174,12 @@ where
         });
         let (sum, sz) = digest_read(&mut options.digest, &mut file, options.output_bits)
             .map_err_context(|| "failed to read input".to_string())?;
-
+        
+        if options.raw {
+            let bytes_str = sum.parse::<u32>().unwrap().to_be_bytes();
+            stdout().write_all(&bytes_str)?;
+            return Ok(());
+        }
         // The BSD checksum output is 5 digit integer
         let bsd_width = 5;
         match (options.algo_name, not_file) {
@@ -231,6 +270,7 @@ mod options {
     pub const FILE: &str = "file";
     pub const UNTAGGED: &str = "untagged";
     pub const LENGTH: &str = "length";
+    pub const RAW: &str = "raw";
 }
 
 #[uucore::main]
@@ -291,6 +331,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         output_bits: bits,
         length,
         untagged: matches.get_flag(options::UNTAGGED),
+        raw: matches.get_flag(options::RAW), 
     };
 
     match matches.get_many::<String>(options::FILE) {
@@ -346,6 +387,12 @@ pub fn uu_app() -> Command {
                 .short('l')
                 .help("digest length in bits; must not exceed the max for the blake2 algorithm and must be a multiple of 8")
                 .action(ArgAction::Set),
+        )       
+        .arg(
+            Arg::new(options::RAW)
+            .long(options::RAW)
+            .help("emit a raw binary digest, not hexadecimal")
+            .action(ArgAction::SetTrue),
         )
         .after_help(AFTER_HELP)
 }

From 288ad97878af53c220e65c0a0434a35a7be7c6dc Mon Sep 17 00:00:00 2001
From: Atomei Alexandru Constantin <atomeialexandru03@gmail.com>
Date: Sun, 7 Jan 2024 23:39:33 +0200
Subject: [PATCH 364/429] Made cksum to return an error if the algorithm
 blake2b is used on a directory

---
 src/uu/cksum/src/cksum.rs | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index e8d7da60e41..77f2749443c 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -169,6 +169,13 @@ where
             (ALGORITHM_OPTIONS_CRC, true) => println!("{sum} {sz}"),
             (ALGORITHM_OPTIONS_CRC, false) => println!("{sum} {sz} {}", filename.display()),
             (ALGORITHM_OPTIONS_BLAKE2B, _) if !options.untagged => {
+                if filename.is_dir() {
+                    return Err(io::Error::new(
+                        io::ErrorKind::InvalidInput,
+                        format!("{}: Is a directory", filename.display()),
+                    )
+                    .into());
+                }
                 if let Some(length) = options.length {
                     // Multiply by 8 here, as we want to print the length in bits.
                     println!("BLAKE2b-{} ({}) = {sum}", length * 8, filename.display());

From 0bfd4bbdf752f3a1cd28fb763d93652ab4395265 Mon Sep 17 00:00:00 2001
From: Atomei Alexandru Constantin <atomeialexandru03@gmail.com>
Date: Mon, 8 Jan 2024 00:08:24 +0200
Subject: [PATCH 365/429] Added test to validate that it now generates the
 error for an arbitrary directory

---
 tests/by-util/test_cksum.rs | 14 ++++++++++++++
 1 file changed, 14 insertions(+)

diff --git a/tests/by-util/test_cksum.rs b/tests/by-util/test_cksum.rs
index 00c768164d5..fd55a69e487 100644
--- a/tests/by-util/test_cksum.rs
+++ b/tests/by-util/test_cksum.rs
@@ -286,3 +286,17 @@ fn test_length_is_zero() {
         .no_stderr()
         .stdout_is_fixture("length_is_zero.expected");
 }
+
+#[test]
+fn test_blake2b_fail_on_directory() {
+    let (at, mut ucmd) = at_and_ucmd!();
+
+    let folder_name = "a_folder";
+    at.mkdir(folder_name);
+
+    ucmd.arg("--algorithm=blake2b")
+        .arg(folder_name)
+        .fails()
+        .no_stdout()
+        .stderr_contains(format!("cksum: {folder_name}: Is a directory"));
+}

From f03ef79bc86ee58f688e5d0d36a684993d5a769a Mon Sep 17 00:00:00 2001
From: D9nni <lungudaniel31@gmail.com>
Date: Mon, 8 Jan 2024 08:51:06 +0200
Subject: [PATCH 366/429] cksum: added tests for --raw and fixed fmt whitespace
 error

---
 src/uu/cksum/src/cksum.rs   | 17 ++++++++---------
 tests/by-util/test_cksum.rs | 22 ++++++++++++++++++++++
 2 files changed, 30 insertions(+), 9 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index df8fdb5ea09..e3fb78ec460 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -6,15 +6,15 @@
 // spell-checker:ignore (ToDO) fname, algo
 use clap::{crate_version, value_parser, Arg, ArgAction, Command};
 use hex::encode;
+use std::error::Error;
 use std::ffi::OsStr;
+use std::fmt::Display;
 use std::fs::File;
 use std::io::{self, stdin, stdout, BufReader, Read, Write};
 use std::iter;
 use std::path::Path;
-use std::error::Error;
-use std::fmt::Display;
 use uucore::{
-    error::{FromIo, UResult, UError},
+    error::{FromIo, UError, UResult},
     format_usage, help_about, help_section, help_usage,
     sum::{
         div_ceil, Blake2b, Digest, DigestWriter, Md5, Sha1, Sha224, Sha256, Sha384, Sha512, Sm3,
@@ -51,8 +51,7 @@ impl UError for CkSumError {
     }
 }
 
-impl Error for CkSumError {
-}
+impl Error for CkSumError {}
 
 impl Display for CkSumError {
     fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
@@ -152,7 +151,7 @@ fn cksum<'a, I>(mut options: Options, files: I) -> UResult<()>
 where
     I: Iterator<Item = &'a OsStr>,
 {
-    let files_vec:Vec<_> = files.collect();
+    let files_vec: Vec<_> = files.collect();
     if options.raw && files_vec.len() > 1 {
         return Err(Box::new(CkSumError::RawMultipleFiles));
     }
@@ -174,7 +173,7 @@ where
         });
         let (sum, sz) = digest_read(&mut options.digest, &mut file, options.output_bits)
             .map_err_context(|| "failed to read input".to_string())?;
-        
+
         if options.raw {
             let bytes_str = sum.parse::<u32>().unwrap().to_be_bytes();
             stdout().write_all(&bytes_str)?;
@@ -331,7 +330,7 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         output_bits: bits,
         length,
         untagged: matches.get_flag(options::UNTAGGED),
-        raw: matches.get_flag(options::RAW), 
+        raw: matches.get_flag(options::RAW),
     };
 
     match matches.get_many::<String>(options::FILE) {
@@ -387,7 +386,7 @@ pub fn uu_app() -> Command {
                 .short('l')
                 .help("digest length in bits; must not exceed the max for the blake2 algorithm and must be a multiple of 8")
                 .action(ArgAction::Set),
-        )       
+        )
         .arg(
             Arg::new(options::RAW)
             .long(options::RAW)
diff --git a/tests/by-util/test_cksum.rs b/tests/by-util/test_cksum.rs
index 00c768164d5..a4e877b1c6a 100644
--- a/tests/by-util/test_cksum.rs
+++ b/tests/by-util/test_cksum.rs
@@ -286,3 +286,25 @@ fn test_length_is_zero() {
         .no_stderr()
         .stdout_is_fixture("length_is_zero.expected");
 }
+
+#[test]
+fn test_raw_single_file() {
+    new_ucmd!()
+        .arg("--raw")
+        .arg("lorem_ipsum.txt")
+        .succeeds()
+        .no_stderr()
+        .stdout_is_fixture("raw_single_file.expected");
+}
+
+#[test]
+fn test_raw_multiple_files() {
+    new_ucmd!()
+        .arg("--raw")
+        .arg("lorem_ipsum.txt")
+        .arg("alice_in_wonderland.txt")
+        .fails()
+        .no_stdout()
+        .stderr_contains("cksum: the --raw option is not supported with multiple files")
+        .code_is(1);
+}

From 1c6bf6991c012e3fd391199e98a6feec27bbcba4 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 8 Jan 2024 10:49:16 +0100
Subject: [PATCH 367/429] nl: don't exit if input is directory

---
 src/uu/nl/src/nl.rs      | 16 +++++++++++-----
 tests/by-util/test_nl.rs | 17 +++++++++++++++++
 2 files changed, 28 insertions(+), 5 deletions(-)

diff --git a/src/uu/nl/src/nl.rs b/src/uu/nl/src/nl.rs
index 7d7688650aa..c7e72f6e2e2 100644
--- a/src/uu/nl/src/nl.rs
+++ b/src/uu/nl/src/nl.rs
@@ -7,8 +7,8 @@ use clap::{crate_version, Arg, ArgAction, Command};
 use std::fs::File;
 use std::io::{stdin, BufRead, BufReader, Read};
 use std::path::Path;
-use uucore::error::{FromIo, UResult, USimpleError};
-use uucore::{format_usage, help_about, help_section, help_usage};
+use uucore::error::{set_exit_code, FromIo, UResult, USimpleError};
+use uucore::{format_usage, help_about, help_section, help_usage, show_error};
 
 mod helper;
 
@@ -205,9 +205,15 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
             nl(&mut buffer, &mut stats, &settings)?;
         } else {
             let path = Path::new(file);
-            let reader = File::open(path).map_err_context(|| file.to_string())?;
-            let mut buffer = BufReader::new(reader);
-            nl(&mut buffer, &mut stats, &settings)?;
+
+            if path.is_dir() {
+                show_error!("{}: Is a directory", path.display());
+                set_exit_code(1);
+            } else {
+                let reader = File::open(path).map_err_context(|| file.to_string())?;
+                let mut buffer = BufReader::new(reader);
+                nl(&mut buffer, &mut stats, &settings)?;
+            }
         }
     }
 
diff --git a/tests/by-util/test_nl.rs b/tests/by-util/test_nl.rs
index 78c8975a849..a00e37a4767 100644
--- a/tests/by-util/test_nl.rs
+++ b/tests/by-util/test_nl.rs
@@ -634,3 +634,20 @@ fn test_empty_section_delimiter() {
             .stdout_is("     1\ta\n       \n     2\tb\n");
     }
 }
+
+#[test]
+fn test_directory_as_input() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    let dir = "dir";
+    let file = "file";
+    let content = "aaa";
+
+    at.mkdir(dir);
+    at.write(file, content);
+
+    ucmd.arg(dir)
+        .arg(file)
+        .fails()
+        .stderr_is(format!("nl: {dir}: Is a directory\n"))
+        .stdout_contains(content);
+}

From 28b5224725fe93f445c49a02d975ccdb4abf4812 Mon Sep 17 00:00:00 2001
From: D9nni <lungudaniel31@gmail.com>
Date: Mon, 8 Jan 2024 15:50:25 +0200
Subject: [PATCH 368/429] cksum: fixed test for --raw on single file

---
 tests/by-util/test_cksum.rs                   | 2 +-
 tests/fixtures/cksum/raw_single_file.expected | 1 +
 2 files changed, 2 insertions(+), 1 deletion(-)
 create mode 100644 tests/fixtures/cksum/raw_single_file.expected

diff --git a/tests/by-util/test_cksum.rs b/tests/by-util/test_cksum.rs
index 2d4fad923ed..52ac099111d 100644
--- a/tests/by-util/test_cksum.rs
+++ b/tests/by-util/test_cksum.rs
@@ -294,7 +294,7 @@ fn test_raw_single_file() {
         .arg("lorem_ipsum.txt")
         .succeeds()
         .no_stderr()
-        .stdout_is_fixture("raw_single_file.expected");
+        .stdout_is_fixture_bytes("raw_single_file.expected");
 }
 
 #[test]
diff --git a/tests/fixtures/cksum/raw_single_file.expected b/tests/fixtures/cksum/raw_single_file.expected
new file mode 100644
index 00000000000..de175b04582
--- /dev/null
+++ b/tests/fixtures/cksum/raw_single_file.expected
@@ -0,0 +1 @@
+�Ph
\ No newline at end of file

From 833c1a0d3fa3dfe4132de792ca11cabf0d5eedd5 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 8 Jan 2024 16:19:43 +0100
Subject: [PATCH 369/429] ci: set -no-window in Android workflow

---
 .github/workflows/android.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/android.yml b/.github/workflows/android.yml
index 69ca970c0fa..34dcf910d18 100644
--- a/.github/workflows/android.yml
+++ b/.github/workflows/android.yml
@@ -52,7 +52,7 @@ jobs:
         ram-size: 2048M
         disk-size: 7GB
         force-avd-creation: true
-        emulator-options: -no-snapshot-load -noaudio -no-boot-anim -camera-back none
+        emulator-options: -no-window -no-snapshot-load -noaudio -no-boot-anim -camera-back none
         script: |
           util/android-commands.sh init "${{ matrix.arch }}" "${{ matrix.api-level }}" "${{ env.TERMUX }}"
     - name: Save AVD cache
@@ -88,7 +88,7 @@ jobs:
         ram-size: 2048M
         disk-size: 7GB
         force-avd-creation: false
-        emulator-options: -no-snapshot-save -gpu swiftshader_indirect -noaudio -no-boot-anim -camera-back none -snapshot ${{ matrix.api-level }}-${{ matrix.arch }}+termux-${{ env.TERMUX }}
+        emulator-options: -no-window -no-snapshot-save -gpu swiftshader_indirect -noaudio -no-boot-anim -camera-back none -snapshot ${{ matrix.api-level }}-${{ matrix.arch }}+termux-${{ env.TERMUX }}
         # This is not a usual script. Every line is executed in a separate shell with `sh -c`. If
         # one of the lines returns with error the whole script is failed (like running a script with
         # set -e) and in consequences the other lines (shells) are not executed.

From 62dffc3250ce1c12077586146ddb6106679b30ab Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 8 Jan 2024 17:14:33 +0100
Subject: [PATCH 370/429] ln: fix "unused import" warning on Android

---
 tests/by-util/test_ln.rs | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/tests/by-util/test_ln.rs b/tests/by-util/test_ln.rs
index 2501e9d362a..b315630ce4e 100644
--- a/tests/by-util/test_ln.rs
+++ b/tests/by-util/test_ln.rs
@@ -3,8 +3,6 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 use crate::common::util::TestScenario;
-#[cfg(unix)]
-use std::os::unix::fs::MetadataExt;
 use std::path::PathBuf;
 
 #[test]
@@ -752,6 +750,7 @@ fn test_ln_seen_file() {
     assert!(at.plus("a").join("f").exists());
     #[cfg(unix)]
     {
+        use std::os::unix::fs::MetadataExt;
         // Check inode numbers
         let inode_a_f = at.plus("a").join("f").metadata().unwrap().ino();
         let inode_b_f = at.plus("b").join("f").metadata().unwrap().ino();

From e29afdc0df89ec35a655d1ebdcaf71eaf5375880 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 8 Jan 2024 17:29:34 +0100
Subject: [PATCH 371/429] head: disable some tests on Android

---
 tests/by-util/test_head.rs | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/tests/by-util/test_head.rs b/tests/by-util/test_head.rs
index 9cc4c1770ec..cc17cdf950a 100644
--- a/tests/by-util/test_head.rs
+++ b/tests/by-util/test_head.rs
@@ -382,6 +382,7 @@ fn test_presume_input_pipe_5_chars() {
 #[cfg(all(
     not(target_os = "windows"),
     not(target_os = "macos"),
+    not(target_os = "android"),
     not(target_os = "freebsd")
 ))]
 #[test]
@@ -396,6 +397,7 @@ fn test_read_backwards_bytes_proc_fs_version() {
 #[cfg(all(
     not(target_os = "windows"),
     not(target_os = "macos"),
+    not(target_os = "android"),
     not(target_os = "freebsd")
 ))]
 #[test]
@@ -410,6 +412,7 @@ fn test_read_backwards_bytes_proc_fs_modules() {
 #[cfg(all(
     not(target_os = "windows"),
     not(target_os = "macos"),
+    not(target_os = "android"),
     not(target_os = "freebsd")
 ))]
 #[test]
@@ -424,6 +427,7 @@ fn test_read_backwards_lines_proc_fs_modules() {
 #[cfg(all(
     not(target_os = "windows"),
     not(target_os = "macos"),
+    not(target_os = "android"),
     not(target_os = "freebsd")
 ))]
 #[test]

From 5dfeca9ff232d050e3669d675a6b9f290a5111ef Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Thu, 4 Jan 2024 19:33:47 +0100
Subject: [PATCH 372/429] format: %c prints the first character of a string

---
 src/uucore/src/lib/features/format/argument.rs | 9 +--------
 tests/by-util/test_printf.rs                   | 8 ++++++++
 2 files changed, 9 insertions(+), 8 deletions(-)

diff --git a/src/uucore/src/lib/features/format/argument.rs b/src/uucore/src/lib/features/format/argument.rs
index db18cf51890..6f66230cbe0 100644
--- a/src/uucore/src/lib/features/format/argument.rs
+++ b/src/uucore/src/lib/features/format/argument.rs
@@ -41,14 +41,7 @@ impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
         match next {
             FormatArgument::Char(c) => *c,
             FormatArgument::Unparsed(s) => {
-                let mut chars = s.chars();
-                let Some(c) = chars.next() else {
-                    return '\0';
-                };
-                let None = chars.next() else {
-                    return '\0';
-                };
-                c
+                s.chars().next().unwrap_or('\0')
             }
             _ => '\0',
         }
diff --git a/tests/by-util/test_printf.rs b/tests/by-util/test_printf.rs
index dfd13159043..c106e55129b 100644
--- a/tests/by-util/test_printf.rs
+++ b/tests/by-util/test_printf.rs
@@ -162,6 +162,14 @@ fn sub_char() {
         .stdout_only("the letter A");
 }
 
+#[test]
+fn sub_char_from_string() {
+    new_ucmd!()
+        .args(&["%c%c%c", "five", "%", "oval"])
+        .succeeds()
+        .stdout_only("f%o");
+}
+
 #[test]
 fn sub_num_int() {
     new_ucmd!()

From 9858fef20ec1e3d4acd16ed74b63452dfd7d9b18 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Mon, 8 Jan 2024 13:28:24 +0100
Subject: [PATCH 373/429] printf: use 0 instead of 0o as octal prefix

---
 .../src/lib/features/format/num_format.rs     | 33 ++++++++++++++++++-
 1 file changed, 32 insertions(+), 1 deletion(-)

diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index 60a3a404a8e..325da3ce6e3 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -141,7 +141,17 @@ impl Formatter for UnsignedInt {
         let mut s = match self.variant {
             UnsignedIntVariant::Decimal => format!("{x}"),
             UnsignedIntVariant::Octal(Prefix::No) => format!("{x:o}"),
-            UnsignedIntVariant::Octal(Prefix::Yes) => format!("{x:#o}"),
+            UnsignedIntVariant::Octal(Prefix::Yes) => {
+                // The prefix that rust uses is `0o`, but GNU uses `0`.
+                // We also need to take into account that 0 should not be 00
+                // Since this is an unsigned int, we do not need to take the minus
+                // sign into account.
+                if x != 0 {
+                    format!("0{x:o}")
+                } else {
+                    format!("{x:o}")
+                }
+            }
             UnsignedIntVariant::Hexadecimal(Case::Lowercase, Prefix::No) => {
                 format!("{x:x}")
             }
@@ -487,6 +497,27 @@ fn strip_fractional_zeroes_and_dot(s: &mut String) {
 mod test {
     use crate::format::num_format::{Case, ForceDecimal};
 
+    #[test]
+    fn unsigned_octal() {
+        use super::{Formatter, NumberAlignment, Prefix, UnsignedInt, UnsignedIntVariant};
+        let f = |x| {
+            let mut s = Vec::new();
+            UnsignedInt {
+                variant: UnsignedIntVariant::Octal(Prefix::Yes),
+                width: 0,
+                precision: 0,
+                alignment: NumberAlignment::Left,
+            }
+            .fmt(&mut s, x)
+            .unwrap();
+            String::from_utf8(s).unwrap()
+        };
+
+        assert_eq!(f(0), "0");
+        assert_eq!(f(5), "05");
+        assert_eq!(f(8), "010");
+    }
+
     #[test]
     fn decimal_float() {
         use super::format_float_decimal;

From 49154669a620df00c267fd0c520af6001bf73f79 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 9 Jan 2024 15:17:15 +0100
Subject: [PATCH 374/429] pathchk: simplify and rename test

---
 tests/by-util/test_pathchk.rs | 15 ++++++++-------
 1 file changed, 8 insertions(+), 7 deletions(-)

diff --git a/tests/by-util/test_pathchk.rs b/tests/by-util/test_pathchk.rs
index d66ecb9efb4..f5d84b5762a 100644
--- a/tests/by-util/test_pathchk.rs
+++ b/tests/by-util/test_pathchk.rs
@@ -4,6 +4,14 @@
 // file that was distributed with this source code.
 use crate::common::util::TestScenario;
 
+#[test]
+fn test_no_args() {
+    new_ucmd!()
+        .fails()
+        .no_stdout()
+        .stderr_contains("pathchk: missing operand");
+}
+
 #[test]
 fn test_invalid_arg() {
     new_ucmd!().arg("--definitely-invalid").fails().code_is(1);
@@ -164,10 +172,3 @@ fn test_posix_all() {
     // fail on empty path
     new_ucmd!().args(&["-p", "-P", ""]).fails().no_stdout();
 }
-
-#[test]
-fn test_args_parsing() {
-    // fail on no args
-    let empty_args: [String; 0] = [];
-    new_ucmd!().args(&empty_args).fails().no_stdout();
-}

From f400a07dc6e6fed71efb38a5b84d0d981e355cd9 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Tue, 9 Jan 2024 15:19:22 +0100
Subject: [PATCH 375/429] pathchk: remove useless comments

---
 tests/by-util/test_pathchk.rs | 8 --------
 1 file changed, 8 deletions(-)

diff --git a/tests/by-util/test_pathchk.rs b/tests/by-util/test_pathchk.rs
index f5d84b5762a..d09c8a2e1e4 100644
--- a/tests/by-util/test_pathchk.rs
+++ b/tests/by-util/test_pathchk.rs
@@ -19,8 +19,6 @@ fn test_invalid_arg() {
 
 #[test]
 fn test_default_mode() {
-    // test the default mode
-
     // accept some reasonable default
     new_ucmd!().args(&["dir/file"]).succeeds().no_stdout();
 
@@ -56,8 +54,6 @@ fn test_default_mode() {
 
 #[test]
 fn test_posix_mode() {
-    // test the posix mode
-
     // accept some reasonable default
     new_ucmd!().args(&["-p", "dir/file"]).succeeds().no_stdout();
 
@@ -82,8 +78,6 @@ fn test_posix_mode() {
 
 #[test]
 fn test_posix_special() {
-    // test the posix special mode
-
     // accept some reasonable default
     new_ucmd!().args(&["-P", "dir/file"]).succeeds().no_stdout();
 
@@ -123,8 +117,6 @@ fn test_posix_special() {
 
 #[test]
 fn test_posix_all() {
-    // test the posix special mode
-
     // accept some reasonable default
     new_ucmd!()
         .args(&["-p", "-P", "dir/file"])

From 96271ffa3cb9588c97dddddc186a28ef4bbcb43a Mon Sep 17 00:00:00 2001
From: D9nni <lungudaniel31@gmail.com>
Date: Tue, 9 Jan 2024 23:12:40 +0200
Subject: [PATCH 376/429] cksum: added tests for --raw with each algorithm, not
 working for crc, sysv, bsd

---
 src/uu/cksum/src/cksum.rs                     |  19 +++++++++++++-----
 tests/by-util/test_cksum.rs                   |  16 ++++++++-------
 .../cksum/raw/blake2b_single_file.expected    |   1 +
 .../cksum/raw/bsd_single_file.expected        |   1 +
 .../crc_single_file.expected}                 |   0
 .../cksum/raw/md5_single_file.expected        | Bin 0 -> 16 bytes
 .../cksum/raw/sha1_single_file.expected       |   1 +
 .../cksum/raw/sha224_single_file.expected     | Bin 0 -> 28 bytes
 .../cksum/raw/sha256_single_file.expected     |   1 +
 .../cksum/raw/sha384_single_file.expected     |   3 +++
 .../cksum/raw/sha512_single_file.expected     |   1 +
 .../cksum/raw/sm3_single_file.expected        |   1 +
 .../cksum/raw/sysv_single_file.expected       |   1 +
 13 files changed, 33 insertions(+), 12 deletions(-)
 create mode 100644 tests/fixtures/cksum/raw/blake2b_single_file.expected
 create mode 100644 tests/fixtures/cksum/raw/bsd_single_file.expected
 rename tests/fixtures/cksum/{raw_single_file.expected => raw/crc_single_file.expected} (100%)
 create mode 100644 tests/fixtures/cksum/raw/md5_single_file.expected
 create mode 100644 tests/fixtures/cksum/raw/sha1_single_file.expected
 create mode 100644 tests/fixtures/cksum/raw/sha224_single_file.expected
 create mode 100644 tests/fixtures/cksum/raw/sha256_single_file.expected
 create mode 100644 tests/fixtures/cksum/raw/sha384_single_file.expected
 create mode 100644 tests/fixtures/cksum/raw/sha512_single_file.expected
 create mode 100644 tests/fixtures/cksum/raw/sm3_single_file.expected
 create mode 100644 tests/fixtures/cksum/raw/sysv_single_file.expected

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index 40c06a38612..6f3de690de8 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -5,6 +5,7 @@
 
 // spell-checker:ignore (ToDO) fname, algo
 use clap::{crate_version, value_parser, Arg, ArgAction, Command};
+use hex::decode;
 use hex::encode;
 use std::error::Error;
 use std::ffi::OsStr;
@@ -151,12 +152,12 @@ fn cksum<'a, I>(mut options: Options, files: I) -> UResult<()>
 where
     I: Iterator<Item = &'a OsStr>,
 {
-    let files_vec: Vec<_> = files.collect();
-    if options.raw && files_vec.len() > 1 {
+    let files: Vec<_> = files.collect();
+    if options.raw && files.len() > 1 {
         return Err(Box::new(CkSumError::RawMultipleFiles));
     }
 
-    for filename in files_vec {
+    for filename in files {
         let filename = Path::new(filename);
         let stdin_buf;
         let file_buf;
@@ -175,8 +176,16 @@ where
             .map_err_context(|| "failed to read input".to_string())?;
 
         if options.raw {
-            let bytes_str = sum.parse::<u32>().unwrap().to_be_bytes();
-            stdout().write_all(&bytes_str)?;
+            match decode(sum.clone()) {
+                Ok(bytes) => {
+                    stdout().write_all(&bytes)?;
+                }
+                Err(_) => {
+                    //bsd, sysv and crc have output generated without encode()
+                    let bytes = sum.parse::<u32>().unwrap().to_be_bytes();
+                    stdout().write_all(&bytes)?;
+                }
+            }
             return Ok(());
         }
         // The BSD checksum output is 5 digit integer
diff --git a/tests/by-util/test_cksum.rs b/tests/by-util/test_cksum.rs
index 52ac099111d..b3db0bf0a02 100644
--- a/tests/by-util/test_cksum.rs
+++ b/tests/by-util/test_cksum.rs
@@ -289,14 +289,16 @@ fn test_length_is_zero() {
 
 #[test]
 fn test_raw_single_file() {
-    new_ucmd!()
-        .arg("--raw")
-        .arg("lorem_ipsum.txt")
-        .succeeds()
-        .no_stderr()
-        .stdout_is_fixture_bytes("raw_single_file.expected");
+    for algo in ALGOS {
+        new_ucmd!()
+            .arg("--raw")
+            .arg("lorem_ipsum.txt")
+            .arg(format!("--algorithm={algo}"))
+            .succeeds()
+            .no_stderr()
+            .stdout_is_fixture_bytes(format!("raw/{algo}_single_file.expected"));
+    }
 }
-
 #[test]
 fn test_raw_multiple_files() {
     new_ucmd!()
diff --git a/tests/fixtures/cksum/raw/blake2b_single_file.expected b/tests/fixtures/cksum/raw/blake2b_single_file.expected
new file mode 100644
index 00000000000..4955b2f990e
--- /dev/null
+++ b/tests/fixtures/cksum/raw/blake2b_single_file.expected
@@ -0,0 +1 @@
+�����`�x��f��W���Et�B��l��W^J�0�aX´��8�����5�B��9m��
\ No newline at end of file
diff --git a/tests/fixtures/cksum/raw/bsd_single_file.expected b/tests/fixtures/cksum/raw/bsd_single_file.expected
new file mode 100644
index 00000000000..538ab19f728
--- /dev/null
+++ b/tests/fixtures/cksum/raw/bsd_single_file.expected
@@ -0,0 +1 @@
+�
\ No newline at end of file
diff --git a/tests/fixtures/cksum/raw_single_file.expected b/tests/fixtures/cksum/raw/crc_single_file.expected
similarity index 100%
rename from tests/fixtures/cksum/raw_single_file.expected
rename to tests/fixtures/cksum/raw/crc_single_file.expected
diff --git a/tests/fixtures/cksum/raw/md5_single_file.expected b/tests/fixtures/cksum/raw/md5_single_file.expected
new file mode 100644
index 0000000000000000000000000000000000000000..e7b47aebbcba99b6dbaa03e825f0be3b5bfdb012
GIT binary patch
literal 16
YcmX?G<Tl~^oy79kUq=|0%j>KH08Ru5cmMzZ

literal 0
HcmV?d00001

diff --git a/tests/fixtures/cksum/raw/sha1_single_file.expected b/tests/fixtures/cksum/raw/sha1_single_file.expected
new file mode 100644
index 00000000000..0f634be4749
--- /dev/null
+++ b/tests/fixtures/cksum/raw/sha1_single_file.expected
@@ -0,0 +1 @@
+�к�؈:=�m毽(%,��
\ No newline at end of file
diff --git a/tests/fixtures/cksum/raw/sha224_single_file.expected b/tests/fixtures/cksum/raw/sha224_single_file.expected
new file mode 100644
index 0000000000000000000000000000000000000000..bc3fa6bf18f53f72894471200626992087ef971d
GIT binary patch
literal 28
kcmcD0mcM7MK%TV2YD?*-If0iL>Nfs77JA{!quGBL0mH`*$p8QV

literal 0
HcmV?d00001

diff --git a/tests/fixtures/cksum/raw/sha256_single_file.expected b/tests/fixtures/cksum/raw/sha256_single_file.expected
new file mode 100644
index 00000000000..b9ce06f39d9
--- /dev/null
+++ b/tests/fixtures/cksum/raw/sha256_single_file.expected
@@ -0,0 +1 @@
+�� PP�0�Pg�^�	�SkE���C[�+?
\ No newline at end of file
diff --git a/tests/fixtures/cksum/raw/sha384_single_file.expected b/tests/fixtures/cksum/raw/sha384_single_file.expected
new file mode 100644
index 00000000000..4b337f859ed
--- /dev/null
+++ b/tests/fixtures/cksum/raw/sha384_single_file.expected
@@ -0,0 +1,3 @@
+K�
+2�i���J��Mϸ��/g������LZ{WZ3S�
+��H�
\ No newline at end of file
diff --git a/tests/fixtures/cksum/raw/sha512_single_file.expected b/tests/fixtures/cksum/raw/sha512_single_file.expected
new file mode 100644
index 00000000000..79f78cf00cb
--- /dev/null
+++ b/tests/fixtures/cksum/raw/sha512_single_file.expected
@@ -0,0 +1 @@
+�Td�%V�Վ�sؚ�!�Yyu)���f���������|T,�Bn^Oऊ�Vg�D	k!=���
\ No newline at end of file
diff --git a/tests/fixtures/cksum/raw/sm3_single_file.expected b/tests/fixtures/cksum/raw/sm3_single_file.expected
new file mode 100644
index 00000000000..3506406dc42
--- /dev/null
+++ b/tests/fixtures/cksum/raw/sm3_single_file.expected
@@ -0,0 +1 @@
+m)k�]��(�0���CyM��g@�p��i��
\ No newline at end of file
diff --git a/tests/fixtures/cksum/raw/sysv_single_file.expected b/tests/fixtures/cksum/raw/sysv_single_file.expected
new file mode 100644
index 00000000000..b975da49c01
--- /dev/null
+++ b/tests/fixtures/cksum/raw/sysv_single_file.expected
@@ -0,0 +1 @@
+I
\ No newline at end of file

From 0fe5f39b74f338177853b2ba960e85eb10ce944c Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Wed, 10 Jan 2024 10:46:03 +0100
Subject: [PATCH 377/429] Bump console from 0.15.7 to 0.15.8

---
 Cargo.lock | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 9190d1be352..6f83430b68d 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -320,15 +320,15 @@ checksum = "120133d4db2ec47efe2e26502ee984747630c67f51974fca0b6c1340cf2368d3"
 
 [[package]]
 name = "console"
-version = "0.15.7"
+version = "0.15.8"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "c926e00cc70edefdc64d3a5ff31cc65bb97a3460097762bd23afb4d8145fccf8"
+checksum = "0e1f83fc076bd6dd27517eacdf25fef6c4dfe5f1d7448bafaaf3a26f13b5e4eb"
 dependencies = [
  "encode_unicode",
  "lazy_static",
  "libc",
  "unicode-width",
- "windows-sys 0.45.0",
+ "windows-sys 0.52.0",
 ]
 
 [[package]]

From d29adfcb095b6dc28d0b21574ff4df69f6e39d97 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Wed, 10 Jan 2024 10:47:20 +0100
Subject: [PATCH 378/429] Bump mio from 0.8.6 to 0.8.10

---
 Cargo.lock | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 6f83430b68d..0e4a271dfe0 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1293,14 +1293,14 @@ dependencies = [
 
 [[package]]
 name = "mio"
-version = "0.8.6"
+version = "0.8.10"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "5b9d9a46eff5b4ff64b45a9e316a6d1e0bc719ef429cbec4dc630684212bfdf9"
+checksum = "8f3d0b296e374a4e6f3c7b0a1f5a51d748a0d34c85e7dc48fc3fa9a87657fe09"
 dependencies = [
  "libc",
  "log",
  "wasi",
- "windows-sys 0.45.0",
+ "windows-sys 0.48.0",
 ]
 
 [[package]]

From 4754e071d40c27d91d42855753f86f507abb294d Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Wed, 10 Jan 2024 10:48:50 +0100
Subject: [PATCH 379/429] deny.toml: update comment for windows-sys

---
 deny.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/deny.toml b/deny.toml
index df970c2c6e8..986c2b26970 100644
--- a/deny.toml
+++ b/deny.toml
@@ -62,7 +62,7 @@ skip = [
   { name = "linux-raw-sys", version = "0.3.8" },
   # terminal_size
   { name = "rustix", version = "0.37.26" },
-  # various crates
+  # notify
   { name = "windows-sys", version = "0.45.0" },
   # various crates
   { name = "windows-sys", version = "0.48.0" },

From aafdf10dc82e6744ee7bd7fafcc19ec619b9c40d Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Wed, 10 Jan 2024 14:03:53 +0100
Subject: [PATCH 380/429] CI: test uucore with coreutils to run it with the
 proper features

---
 .github/workflows/CICD.yml | 10 +---------
 1 file changed, 1 insertion(+), 9 deletions(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index ea369e4ef6f..df1a5fa5005 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -994,16 +994,8 @@ jobs:
         UTILITY_LIST="$(./util/show-utils.sh ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }})"
         CARGO_UTILITY_LIST_OPTIONS="$(for u in ${UTILITY_LIST}; do echo -n "-puu_${u} "; done;)"
         outputs CARGO_UTILITY_LIST_OPTIONS
-    - name: Test uucore
-      run: cargo nextest run --profile ci --hide-progress-bar -p uucore
-      env:
-        RUSTC_WRAPPER: ""
-        RUSTFLAGS: "-Zprofile -Ccodegen-units=1 -Copt-level=0 -Clink-dead-code -Coverflow-checks=off -Zpanic_abort_tests -Cpanic=abort"
-        RUSTDOCFLAGS: "-Cpanic=abort"
-        RUST_BACKTRACE: "1"
-        # RUSTUP_TOOLCHAIN: ${{ steps.vars.outputs.TOOLCHAIN }}
     - name: Test
-      run: cargo nextest run --profile ci --hide-progress-bar ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }}
+      run: cargo nextest run --profile ci --hide-progress-bar ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }} -p uucore -p coreutils
       env:
         RUSTC_WRAPPER: ""
         RUSTFLAGS: "-Zprofile -Ccodegen-units=1 -Copt-level=0 -Clink-dead-code -Coverflow-checks=off -Zpanic_abort_tests -Cpanic=abort"

From c7b15ddce9d2af52267511ce06b84bb32b843d82 Mon Sep 17 00:00:00 2001
From: D9nni <lungudaniel31@gmail.com>
Date: Wed, 10 Jan 2024 15:04:19 +0200
Subject: [PATCH 381/429] cksum: fixed cksum --raw --algorithm

---
 src/uu/cksum/src/cksum.rs                     | 23 ++++++++++++++-----
 .../cksum/raw/blake2b_single_file.expected    |  2 +-
 2 files changed, 18 insertions(+), 7 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index 6f3de690de8..eeda3c08343 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -176,16 +176,27 @@ where
             .map_err_context(|| "failed to read input".to_string())?;
 
         if options.raw {
-            match decode(sum.clone()) {
-                Ok(bytes) => {
-                    stdout().write_all(&bytes)?;
-                }
-                Err(_) => {
-                    //bsd, sysv and crc have output generated without encode()
+            match options.algo_name  {
+                ALGORITHM_OPTIONS_CRC 
+                | ALGORITHM_OPTIONS_SYSV
+                | ALGORITHM_OPTIONS_BSD => {
                     let bytes = sum.parse::<u32>().unwrap().to_be_bytes();
+                    let mut first_nonzero = 0;
+                    for byte in bytes {
+                        if byte != 0 {
+                            break;
+                        }
+                        first_nonzero += 1;
+                    }
+                    stdout().write_all(&bytes[first_nonzero..])?;
+                }
+                _ =>{
+                    let bytes = decode(sum).unwrap();
                     stdout().write_all(&bytes)?;
                 }
+
             }
+
             return Ok(());
         }
         // The BSD checksum output is 5 digit integer
diff --git a/tests/fixtures/cksum/raw/blake2b_single_file.expected b/tests/fixtures/cksum/raw/blake2b_single_file.expected
index 4955b2f990e..19b3112206d 100644
--- a/tests/fixtures/cksum/raw/blake2b_single_file.expected
+++ b/tests/fixtures/cksum/raw/blake2b_single_file.expected
@@ -1 +1 @@
-�����`�x��f��W���Et�B��l��W^J�0�aX´��8�����5�B��9m��
\ No newline at end of file
+�����`�x��f��W���Et�B��l��W^J�0�aX´��8�����5�B��9m��
\ No newline at end of file

From 911df1d76cdc1d61f01b282b169dad246089b9f1 Mon Sep 17 00:00:00 2001
From: D9nni <lungudaniel31@gmail.com>
Date: Wed, 10 Jan 2024 15:15:23 +0200
Subject: [PATCH 382/429] cksum: code improvements for cksum --raw --algorithm

---
 src/uu/cksum/src/cksum.rs | 28 +++++++++++-----------------
 1 file changed, 11 insertions(+), 17 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index eeda3c08343..40694fac661 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -176,27 +176,21 @@ where
             .map_err_context(|| "failed to read input".to_string())?;
 
         if options.raw {
-            match options.algo_name  {
-                ALGORITHM_OPTIONS_CRC 
-                | ALGORITHM_OPTIONS_SYSV
-                | ALGORITHM_OPTIONS_BSD => {
+            let bytes = match options.algo_name {
+                ALGORITHM_OPTIONS_CRC => {
                     let bytes = sum.parse::<u32>().unwrap().to_be_bytes();
-                    let mut first_nonzero = 0;
-                    for byte in bytes {
-                        if byte != 0 {
-                            break;
-                        }
-                        first_nonzero += 1;
-                    }
-                    stdout().write_all(&bytes[first_nonzero..])?;
+                    bytes.to_vec()
                 }
-                _ =>{
+                ALGORITHM_OPTIONS_SYSV | ALGORITHM_OPTIONS_BSD => {
+                    let bytes = sum.parse::<u16>().unwrap().to_be_bytes();
+                    bytes.to_vec()
+                }
+                _ => {
                     let bytes = decode(sum).unwrap();
-                    stdout().write_all(&bytes)?;
+                    bytes
                 }
-
-            }
-
+            };
+            stdout().write_all(&bytes)?;
             return Ok(());
         }
         // The BSD checksum output is 5 digit integer

From 00cd6fa347a1bf147d0cfdc9e01f99c4cb7c2f6f Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Mon, 8 Jan 2024 15:02:12 +0100
Subject: [PATCH 383/429] format: new dedicated number parser

The parser can parse integral and floating point numbers as expected by
the coreutils `printf` command.
---
 src/uucore/src/lib/features/format/mod.rs     |   1 +
 .../src/lib/features/format/num_parser.rs     | 378 ++++++++++++++++++
 2 files changed, 379 insertions(+)
 create mode 100644 src/uucore/src/lib/features/format/num_parser.rs

diff --git a/src/uucore/src/lib/features/format/mod.rs b/src/uucore/src/lib/features/format/mod.rs
index 4d30753d610..8f662080dcb 100644
--- a/src/uucore/src/lib/features/format/mod.rs
+++ b/src/uucore/src/lib/features/format/mod.rs
@@ -33,6 +33,7 @@
 mod argument;
 mod escape;
 pub mod num_format;
+pub mod num_parser;
 mod spec;
 
 pub use argument::*;
diff --git a/src/uucore/src/lib/features/format/num_parser.rs b/src/uucore/src/lib/features/format/num_parser.rs
new file mode 100644
index 00000000000..0d65651d7e9
--- /dev/null
+++ b/src/uucore/src/lib/features/format/num_parser.rs
@@ -0,0 +1,378 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+//! Utilities for parsing numbers in various formats
+
+// spell-checker:ignore powf copysign prec inity
+
+#[derive(Clone, Copy, PartialEq)]
+pub enum Base {
+    Binary = 2,
+    Octal = 8,
+    Decimal = 10,
+    Hexadecimal = 16,
+}
+
+impl Base {
+    pub fn digit(&self, c: char) -> Option<u64> {
+        fn from_decimal(c: char) -> u64 {
+            u64::from(c) - u64::from('0')
+        }
+        match self {
+            Self::Binary => ('0'..='1').contains(&c).then(|| from_decimal(c)),
+            Self::Octal => ('0'..='7').contains(&c).then(|| from_decimal(c)),
+            Self::Decimal => c.is_ascii_digit().then(|| from_decimal(c)),
+            Self::Hexadecimal => match c.to_ascii_lowercase() {
+                '0'..='9' => Some(from_decimal(c)),
+                c @ 'a'..='f' => Some(u64::from(c) - u64::from('a') + 10),
+                _ => None,
+            },
+        }
+    }
+}
+
+/// Type returned if a number could not be parsed in its entirety
+#[derive(Debug, PartialEq)]
+pub enum ParseError<'a, T> {
+    /// The input as a whole makes no sense
+    NotNumeric,
+    /// The beginning of the input made sense and has been parsed,
+    /// while the remaining doesn't.
+    PartialMatch(T, &'a str),
+    /// The integral part has overflowed the requested type, or
+    /// has overflowed the `u64` internal storage when parsing the
+    /// integral part of a floating point number.
+    Overflow,
+}
+
+impl<'a, T> ParseError<'a, T> {
+    fn map<U>(self, f: impl FnOnce(T, &'a str) -> ParseError<'a, U>) -> ParseError<'a, U> {
+        match self {
+            Self::NotNumeric => ParseError::NotNumeric,
+            Self::Overflow => ParseError::Overflow,
+            Self::PartialMatch(v, s) => f(v, s),
+        }
+    }
+}
+
+/// A number parser for binary, octal, decimal, hexadecimal and single characters.
+///
+/// Internally, in order to get the maximum possible precision and cover the full
+/// range of u64 and i64 without losing precision for f64, the returned number is
+/// decomposed into:
+///   - A `base` value
+///   - A `neg` sign bit
+///   - A `integral` positive part
+///   - A `fractional` positive part
+///   - A `precision` representing the number of digits in the fractional part
+///
+/// If the fractional part cannot be represented on a `u64`, parsing continues
+/// silently by ignoring non-significant digits.
+pub struct ParsedNumber {
+    base: Base,
+    negative: bool,
+    integral: u64,
+    fractional: u64,
+    precision: usize,
+}
+
+impl ParsedNumber {
+    fn into_i64(self) -> Option<i64> {
+        if self.negative {
+            i64::try_from(-i128::from(self.integral)).ok()
+        } else {
+            i64::try_from(self.integral).ok()
+        }
+    }
+
+    /// Parse a number as i64. No fractional part is allowed.
+    pub fn parse_i64(input: &str) -> Result<i64, ParseError<'_, i64>> {
+        match Self::parse(input, true) {
+            Ok(v) => v.into_i64().ok_or(ParseError::Overflow),
+            Err(e) => Err(e.map(|v, rest| {
+                v.into_i64()
+                    .map(|v| ParseError::PartialMatch(v, rest))
+                    .unwrap_or(ParseError::Overflow)
+            })),
+        }
+    }
+
+    /// Parse a number as u64. No fractional part is allowed.
+    pub fn parse_u64(input: &str) -> Result<u64, ParseError<'_, u64>> {
+        match Self::parse(input, true) {
+            Ok(v) | Err(ParseError::PartialMatch(v, _)) if v.negative => {
+                Err(ParseError::NotNumeric)
+            }
+            Ok(v) => Ok(v.integral),
+            Err(e) => Err(e.map(|v, rest| ParseError::PartialMatch(v.integral, rest))),
+        }
+    }
+
+    fn into_f64(self) -> f64 {
+        let n = self.integral as f64
+            + (self.fractional as f64) / (self.base as u8 as f64).powf(self.precision as f64);
+        if self.negative {
+            -n
+        } else {
+            n
+        }
+    }
+
+    /// Parse a number as f64
+    pub fn parse_f64(input: &str) -> Result<f64, ParseError<'_, f64>> {
+        match Self::parse(input, false) {
+            Ok(v) => Ok(v.into_f64()),
+            Err(ParseError::NotNumeric) => Self::parse_f64_special_values(input),
+            Err(e) => Err(e.map(|v, rest| ParseError::PartialMatch(v.into_f64(), rest))),
+        }
+    }
+
+    fn parse_f64_special_values(input: &str) -> Result<f64, ParseError<'_, f64>> {
+        let (sign, rest) = if let Some(input) = input.strip_prefix('-') {
+            (-1.0, input)
+        } else {
+            (1.0, input)
+        };
+        let prefix = rest
+            .chars()
+            .take(3)
+            .map(|c| c.to_ascii_lowercase())
+            .collect::<String>();
+        let special = match prefix.as_str() {
+            "inf" => f64::INFINITY,
+            "nan" => f64::NAN,
+            _ => return Err(ParseError::NotNumeric),
+        }
+        .copysign(sign);
+        if rest.len() == 3 {
+            Ok(special)
+        } else {
+            Err(ParseError::PartialMatch(special, &rest[3..]))
+        }
+    }
+
+    #[allow(clippy::cognitive_complexity)]
+    fn parse(input: &str, integral_only: bool) -> Result<Self, ParseError<'_, Self>> {
+        // Parse the "'" prefix separately
+        if let Some(rest) = input.strip_prefix('\'') {
+            let mut chars = rest.char_indices().fuse();
+            let v = chars.next().map(|(_, c)| Self {
+                base: Base::Decimal,
+                negative: false,
+                integral: u64::from(c),
+                fractional: 0,
+                precision: 0,
+            });
+            return match (v, chars.next()) {
+                (Some(v), None) => Ok(v),
+                (Some(v), Some((i, _))) => Err(ParseError::PartialMatch(v, &rest[i..])),
+                (None, _) => Err(ParseError::NotNumeric),
+            };
+        }
+
+        // Initial minus sign
+        let (negative, unsigned) = if let Some(input) = input.strip_prefix('-') {
+            (true, input)
+        } else {
+            (false, input)
+        };
+
+        // Parse an optional base prefix ("0b" / "0B" / "0" / "0x" / "0X"). "0" is octal unless a
+        // fractional part is allowed in which case it is an insignificant leading 0. A "0" prefix
+        // will not be consumed in case the parsable string contains only "0": the leading extra "0"
+        // will have no influence on the result.
+        let (base, rest) = if let Some(rest) = unsigned.strip_prefix('0') {
+            if let Some(rest) = rest.strip_prefix(['b', 'B']) {
+                (Base::Binary, rest)
+            } else if let Some(rest) = rest.strip_prefix(['x', 'X']) {
+                (Base::Hexadecimal, rest)
+            } else if integral_only {
+                (Base::Octal, unsigned)
+            } else {
+                (Base::Decimal, unsigned)
+            }
+        } else {
+            (Base::Decimal, unsigned)
+        };
+        if rest.is_empty() {
+            return Err(ParseError::NotNumeric);
+        }
+
+        // Parse the integral part of the number
+        let mut chars = rest.chars().enumerate().fuse().peekable();
+        let mut integral = 0u64;
+        while let Some(d) = chars.peek().and_then(|&(_, c)| base.digit(c)) {
+            chars.next();
+            integral = integral
+                .checked_mul(base as u64)
+                .and_then(|n| n.checked_add(d))
+                .ok_or(ParseError::Overflow)?;
+        }
+
+        // Parse the fractional part of the number if there can be one and the input contains
+        // a '.' decimal separator.
+        let (mut fractional, mut precision) = (0u64, 0);
+        if matches!(chars.peek(), Some(&(_, '.')))
+            && matches!(base, Base::Decimal | Base::Hexadecimal)
+            && !integral_only
+        {
+            chars.next();
+            let mut ended = false;
+            while let Some(d) = chars.peek().and_then(|&(_, c)| base.digit(c)) {
+                chars.next();
+                if !ended {
+                    if let Some(f) = fractional
+                        .checked_mul(base as u64)
+                        .and_then(|n| n.checked_add(d))
+                    {
+                        (fractional, precision) = (f, precision + 1);
+                    } else {
+                        ended = true;
+                    }
+                }
+            }
+        }
+
+        // If nothing has been parsed, declare the parsing unsuccessful
+        if let Some((0, _)) = chars.peek() {
+            return Err(ParseError::NotNumeric);
+        }
+
+        // Return what has been parsed so far. It there are extra characters, mark the
+        // parsing as a partial match.
+        let parsed = Self {
+            base,
+            negative,
+            integral,
+            fractional,
+            precision,
+        };
+        if let Some((first_unparsed, _)) = chars.next() {
+            Err(ParseError::PartialMatch(parsed, &rest[first_unparsed..]))
+        } else {
+            Ok(parsed)
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::{ParseError, ParsedNumber};
+
+    #[test]
+    fn test_decimal_u64() {
+        assert_eq!(Ok(123), ParsedNumber::parse_u64("123"));
+        assert_eq!(
+            Ok(u64::MAX),
+            ParsedNumber::parse_u64(&format!("{}", u64::MAX))
+        );
+        assert!(matches!(
+            ParsedNumber::parse_u64("-123"),
+            Err(ParseError::NotNumeric)
+        ));
+        assert!(matches!(
+            ParsedNumber::parse_u64(""),
+            Err(ParseError::NotNumeric)
+        ));
+        assert!(matches!(
+            ParsedNumber::parse_u64("123.15"),
+            Err(ParseError::PartialMatch(123, ".15"))
+        ));
+    }
+
+    #[test]
+    fn test_decimal_i64() {
+        assert_eq!(Ok(123), ParsedNumber::parse_i64("123"));
+        assert_eq!(Ok(-123), ParsedNumber::parse_i64("-123"));
+        assert!(matches!(
+            ParsedNumber::parse_i64("--123"),
+            Err(ParseError::NotNumeric)
+        ));
+        assert_eq!(
+            Ok(i64::MAX),
+            ParsedNumber::parse_i64(&format!("{}", i64::MAX))
+        );
+        assert_eq!(
+            Ok(i64::MIN),
+            ParsedNumber::parse_i64(&format!("{}", i64::MIN))
+        );
+        assert!(matches!(
+            ParsedNumber::parse_i64(&format!("{}", u64::MAX)),
+            Err(ParseError::Overflow)
+        ));
+        assert!(matches!(
+            ParsedNumber::parse_i64(&format!("{}", i64::MAX as u64 + 1)),
+            Err(ParseError::Overflow)
+        ));
+    }
+
+    #[test]
+    fn test_decimal_f64() {
+        assert_eq!(Ok(123.0), ParsedNumber::parse_f64("123"));
+        assert_eq!(Ok(-123.0), ParsedNumber::parse_f64("-123"));
+        assert_eq!(Ok(123.0), ParsedNumber::parse_f64("123."));
+        assert_eq!(Ok(-123.0), ParsedNumber::parse_f64("-123."));
+        assert_eq!(Ok(123.0), ParsedNumber::parse_f64("123.0"));
+        assert_eq!(Ok(-123.0), ParsedNumber::parse_f64("-123.0"));
+        assert_eq!(Ok(123.15), ParsedNumber::parse_f64("123.15"));
+        assert_eq!(Ok(-123.15), ParsedNumber::parse_f64("-123.15"));
+        assert_eq!(Ok(0.15), ParsedNumber::parse_f64(".15"));
+        assert_eq!(Ok(-0.15), ParsedNumber::parse_f64("-.15"));
+        assert_eq!(
+            Ok(0.15),
+            ParsedNumber::parse_f64(".150000000000000000000000000231313")
+        );
+        assert!(matches!(ParsedNumber::parse_f64("1.2.3"),
+                         Err(ParseError::PartialMatch(f, ".3")) if f == 1.2));
+        assert_eq!(Ok(f64::INFINITY), ParsedNumber::parse_f64("inf"));
+        assert_eq!(Ok(f64::NEG_INFINITY), ParsedNumber::parse_f64("-inf"));
+        assert!(ParsedNumber::parse_f64("NaN").unwrap().is_nan());
+        assert!(ParsedNumber::parse_f64("NaN").unwrap().is_sign_positive());
+        assert!(ParsedNumber::parse_f64("-NaN").unwrap().is_nan());
+        assert!(ParsedNumber::parse_f64("-NaN").unwrap().is_sign_negative());
+        assert!(matches!(ParsedNumber::parse_f64("-infinity"),
+                         Err(ParseError::PartialMatch(f, "inity")) if f == f64::NEG_INFINITY));
+        assert!(ParsedNumber::parse_f64(&format!("{}", u64::MAX)).is_ok());
+        assert!(ParsedNumber::parse_f64(&format!("{}", i64::MIN)).is_ok());
+    }
+
+    #[test]
+    fn test_hexadecimal() {
+        assert_eq!(Ok(0x123), ParsedNumber::parse_u64("0x123"));
+        assert_eq!(Ok(0x123), ParsedNumber::parse_u64("0X123"));
+        assert_eq!(Ok(0xfe), ParsedNumber::parse_u64("0xfE"));
+        assert_eq!(Ok(-0x123), ParsedNumber::parse_i64("-0x123"));
+
+        assert_eq!(Ok(0.5), ParsedNumber::parse_f64("0x.8"));
+        assert_eq!(Ok(0.0625), ParsedNumber::parse_f64("0x.1"));
+        assert_eq!(Ok(15.0078125), ParsedNumber::parse_f64("0xf.02"));
+    }
+
+    #[test]
+    fn test_octal() {
+        assert_eq!(Ok(0), ParsedNumber::parse_u64("0"));
+        assert_eq!(Ok(0o123), ParsedNumber::parse_u64("0123"));
+        assert_eq!(Ok(0o123), ParsedNumber::parse_u64("00123"));
+        assert_eq!(Ok(0), ParsedNumber::parse_u64("00"));
+        assert!(matches!(
+            ParsedNumber::parse_u64("008"),
+            Err(ParseError::PartialMatch(0, "8"))
+        ));
+        assert!(matches!(
+            ParsedNumber::parse_u64("08"),
+            Err(ParseError::PartialMatch(0, "8"))
+        ));
+        assert!(matches!(
+            ParsedNumber::parse_u64("0."),
+            Err(ParseError::PartialMatch(0, "."))
+        ));
+    }
+
+    #[test]
+    fn test_binary() {
+        assert_eq!(Ok(0b1011), ParsedNumber::parse_u64("0b1011"));
+        assert_eq!(Ok(0b1011), ParsedNumber::parse_u64("0B1011"));
+    }
+}

From a85a792c886310688373a091374bd33ebaff82f4 Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Mon, 8 Jan 2024 15:04:34 +0100
Subject: [PATCH 384/429] format: use the new number parser and fix the error
 messages

The error messages are more compliant with GNU coreutils.
Also, floating hexadecimal numbers are now supported in
`printf`.
---
 .../src/lib/features/format/argument.rs       | 111 ++++++++----------
 tests/by-util/test_printf.rs                  |  42 ++++++-
 2 files changed, 88 insertions(+), 65 deletions(-)

diff --git a/src/uucore/src/lib/features/format/argument.rs b/src/uucore/src/lib/features/format/argument.rs
index 6f66230cbe0..92d6c1603fb 100644
--- a/src/uucore/src/lib/features/format/argument.rs
+++ b/src/uucore/src/lib/features/format/argument.rs
@@ -3,9 +3,14 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
+use crate::{
+    error::set_exit_code,
+    features::format::num_parser::{ParseError, ParsedNumber},
+    quoting_style::{escape_name, Quotes, QuotingStyle},
+    show_error, show_warning,
+};
 use os_display::Quotable;
-
-use crate::{error::set_exit_code, show_warning};
+use std::ffi::OsStr;
 
 /// An argument for formatting
 ///
@@ -40,9 +45,7 @@ impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
         };
         match next {
             FormatArgument::Char(c) => *c,
-            FormatArgument::Unparsed(s) => {
-                s.chars().next().unwrap_or('\0')
-            }
+            FormatArgument::Unparsed(s) => s.chars().next().unwrap_or('\0'),
             _ => '\0',
         }
     }
@@ -53,25 +56,7 @@ impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
         };
         match next {
             FormatArgument::UnsignedInt(n) => *n,
-            FormatArgument::Unparsed(s) => {
-                let opt = if let Some(s) = s.strip_prefix("0x") {
-                    u64::from_str_radix(s, 16).ok()
-                } else if let Some(s) = s.strip_prefix('0') {
-                    u64::from_str_radix(s, 8).ok()
-                } else if let Some(s) = s.strip_prefix('\'') {
-                    s.chars().next().map(|c| c as u64)
-                } else {
-                    s.parse().ok()
-                };
-                match opt {
-                    Some(n) => n,
-                    None => {
-                        show_warning!("{}: expected a numeric value", s.quote());
-                        set_exit_code(1);
-                        0
-                    }
-                }
-            }
+            FormatArgument::Unparsed(s) => extract_value(ParsedNumber::parse_u64(s), s),
             _ => 0,
         }
     }
@@ -82,29 +67,7 @@ impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
         };
         match next {
             FormatArgument::SignedInt(n) => *n,
-            FormatArgument::Unparsed(s) => {
-                // For hex, we parse `u64` because we do not allow another
-                // minus sign. We might need to do more precise parsing here.
-                let opt = if let Some(s) = s.strip_prefix("-0x") {
-                    u64::from_str_radix(s, 16).ok().map(|x| -(x as i64))
-                } else if let Some(s) = s.strip_prefix("0x") {
-                    u64::from_str_radix(s, 16).ok().map(|x| x as i64)
-                } else if s.starts_with("-0") || s.starts_with('0') {
-                    i64::from_str_radix(s, 8).ok()
-                } else if let Some(s) = s.strip_prefix('\'') {
-                    s.chars().next().map(|x| x as i64)
-                } else {
-                    s.parse().ok()
-                };
-                match opt {
-                    Some(n) => n,
-                    None => {
-                        show_warning!("{}: expected a numeric value", s.quote());
-                        set_exit_code(1);
-                        0
-                    }
-                }
-            }
+            FormatArgument::Unparsed(s) => extract_value(ParsedNumber::parse_i64(s), s),
             _ => 0,
         }
     }
@@ -115,23 +78,7 @@ impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
         };
         match next {
             FormatArgument::Float(n) => *n,
-            FormatArgument::Unparsed(s) => {
-                let opt = if s.starts_with("0x") || s.starts_with("-0x") {
-                    unimplemented!("Hexadecimal floats are unimplemented!")
-                } else if let Some(s) = s.strip_prefix('\'') {
-                    s.chars().next().map(|x| x as u64 as f64)
-                } else {
-                    s.parse().ok()
-                };
-                match opt {
-                    Some(n) => n,
-                    None => {
-                        show_warning!("{}: expected a numeric value", s.quote());
-                        set_exit_code(1);
-                        0.0
-                    }
-                }
-            }
+            FormatArgument::Unparsed(s) => extract_value(ParsedNumber::parse_f64(s), s),
             _ => 0.0,
         }
     }
@@ -143,3 +90,39 @@ impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
         }
     }
 }
+
+fn extract_value<T: Default>(p: Result<T, ParseError<'_, T>>, input: &str) -> T {
+    match p {
+        Ok(v) => v,
+        Err(e) => {
+            set_exit_code(1);
+            let input = escape_name(
+                OsStr::new(input),
+                &QuotingStyle::C {
+                    quotes: Quotes::None,
+                },
+            );
+            match e {
+                ParseError::Overflow => {
+                    show_error!("{}: Numerical result out of range", input.quote());
+                    Default::default()
+                }
+                ParseError::NotNumeric => {
+                    show_error!("{}: expected a numeric value", input.quote());
+                    Default::default()
+                }
+                ParseError::PartialMatch(v, rest) => {
+                    if input.starts_with('\'') {
+                        show_warning!(
+                            "{}: character(s) following character constant have been ignored",
+                            &rest,
+                        );
+                    } else {
+                        show_error!("{}: value not completely converted", input.quote());
+                    }
+                    v
+                }
+            }
+        }
+    }
+}
diff --git a/tests/by-util/test_printf.rs b/tests/by-util/test_printf.rs
index c106e55129b..48fc1e6ace2 100644
--- a/tests/by-util/test_printf.rs
+++ b/tests/by-util/test_printf.rs
@@ -435,7 +435,6 @@ fn sub_float_dec_places() {
 }
 
 #[test]
-#[ignore = "hexadecimal floats are unimplemented"]
 fn sub_float_hex_in() {
     new_ucmd!()
         .args(&["%f", "0xF1.1F"])
@@ -599,3 +598,44 @@ fn sub_general_round_float_leading_zeroes() {
         .succeeds()
         .stdout_only("1.00001");
 }
+
+#[test]
+fn partial_float() {
+    new_ucmd!()
+        .args(&["%.2f is %s", "42.03x", "a lot"])
+        .fails()
+        .code_is(1)
+        .stdout_is("42.03 is a lot")
+        .stderr_is("printf: '42.03x': value not completely converted\n");
+}
+
+#[test]
+fn partial_integer() {
+    new_ucmd!()
+        .args(&["%d is %s", "42x23", "a lot"])
+        .fails()
+        .code_is(1)
+        .stdout_is("42 is a lot")
+        .stderr_is("printf: '42x23': value not completely converted\n");
+}
+
+#[test]
+fn test_overflow() {
+    new_ucmd!()
+        .args(&["%d", "36893488147419103232"])
+        .fails()
+        .code_is(1)
+        .stderr_is("printf: '36893488147419103232': Numerical result out of range\n");
+}
+
+#[test]
+fn partial_char() {
+    new_ucmd!()
+        .args(&["%d", "'abc"])
+        .fails()
+        .code_is(1)
+        .stdout_is("97")
+        .stderr_is(
+            "printf: warning: bc: character(s) following character constant have been ignored\n",
+        );
+}

From 9a76997b0a9d6d8b92b7c1d476f00d5cc45a74cc Mon Sep 17 00:00:00 2001
From: D9nni <lungudaniel31@gmail.com>
Date: Wed, 10 Jan 2024 16:49:52 +0200
Subject: [PATCH 385/429] cksum: fixed clippy and fmt errors

---
 src/uu/cksum/src/cksum.rs | 13 +++----------
 1 file changed, 3 insertions(+), 10 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index 40694fac661..a3e6dfd9e1a 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -177,18 +177,11 @@ where
 
         if options.raw {
             let bytes = match options.algo_name {
-                ALGORITHM_OPTIONS_CRC => {
-                    let bytes = sum.parse::<u32>().unwrap().to_be_bytes();
-                    bytes.to_vec()
-                }
+                ALGORITHM_OPTIONS_CRC => sum.parse::<u32>().unwrap().to_be_bytes().to_vec(),
                 ALGORITHM_OPTIONS_SYSV | ALGORITHM_OPTIONS_BSD => {
-                    let bytes = sum.parse::<u16>().unwrap().to_be_bytes();
-                    bytes.to_vec()
-                }
-                _ => {
-                    let bytes = decode(sum).unwrap();
-                    bytes
+                    sum.parse::<u16>().unwrap().to_be_bytes().to_vec()
                 }
+                _ => decode(sum).unwrap(),
             };
             stdout().write_all(&bytes)?;
             return Ok(());

From 3b884966ac207107feb12a831e63083d746b06cb Mon Sep 17 00:00:00 2001
From: Marras Antoine <antoine.marras@student-cs.fr>
Date: Mon, 8 Jan 2024 14:30:56 +0100
Subject: [PATCH 386/429] printf: added failing tests on alternative hex form

---
 tests/by-util/test_printf.rs | 26 ++++++++++++++++++++++++++
 1 file changed, 26 insertions(+)

diff --git a/tests/by-util/test_printf.rs b/tests/by-util/test_printf.rs
index 48fc1e6ace2..f162df49024 100644
--- a/tests/by-util/test_printf.rs
+++ b/tests/by-util/test_printf.rs
@@ -639,3 +639,29 @@ fn partial_char() {
             "printf: warning: bc: character(s) following character constant have been ignored\n",
         );
 }
+
+#[test]
+fn sub_alternative_lower_hex_0() {
+    new_ucmd!().args(&["%#x", "0"]).succeeds().stdout_only("0");
+}
+
+#[test]
+fn sub_alternative_lower_hex() {
+    new_ucmd!()
+        .args(&["%#x", "42"])
+        .succeeds()
+        .stdout_only("0x2a");
+}
+
+#[test]
+fn sub_alternative_upper_hex_0() {
+    new_ucmd!().args(&["%#X", "0"]).succeeds().stdout_only("0");
+}
+
+#[test]
+fn sub_alternative_upper_hex() {
+    new_ucmd!()
+        .args(&["%#X", "42"])
+        .succeeds()
+        .stdout_only("0x2A");
+}

From 0648321d9796fd709adb7a78b169be3859d93dfb Mon Sep 17 00:00:00 2001
From: Marras Antoine <antoine.marras@student-cs.fr>
Date: Mon, 8 Jan 2024 15:08:18 +0100
Subject: [PATCH 387/429] printf: 0x not shown anymore in front of 0 while in
 alternative mode

---
 src/uucore/src/lib/features/format/num_format.rs | 12 ++++++++++--
 1 file changed, 10 insertions(+), 2 deletions(-)

diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index 325da3ce6e3..9b7e805f0d3 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -156,13 +156,21 @@ impl Formatter for UnsignedInt {
                 format!("{x:x}")
             }
             UnsignedIntVariant::Hexadecimal(Case::Lowercase, Prefix::Yes) => {
-                format!("{x:#x}")
+                if x == 0 {
+                    "0".to_string()
+                } else {
+                    format!("{x:#x}")
+                }
             }
             UnsignedIntVariant::Hexadecimal(Case::Uppercase, Prefix::No) => {
                 format!("{x:X}")
             }
             UnsignedIntVariant::Hexadecimal(Case::Uppercase, Prefix::Yes) => {
-                format!("{x:#X}")
+                if x == 0 {
+                    "0".to_string()
+                } else {
+                    format!("{x:#X}")
+                }
             }
         };
 

From e948d2e8e5e5403dc8afcb505ad86f98a7b159f3 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Wed, 10 Jan 2024 15:14:12 +0100
Subject: [PATCH 388/429] ci: install mingw-w64-x86_64-gcc for windows-gnu

---
 .github/workflows/CICD.yml | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index ea369e4ef6f..89022bbef35 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -615,6 +615,8 @@ jobs:
           arm-unknown-linux-gnueabihf) sudo apt-get -y update ; sudo apt-get -y install gcc-arm-linux-gnueabihf ;;
           aarch64-unknown-linux-*) sudo apt-get -y update ; sudo apt-get -y install gcc-aarch64-linux-gnu ;;
           *-redox*) sudo apt-get -y update ; sudo apt-get -y install fuse3 libfuse-dev ;;
+          # Update binutils if MinGW due to https://github.com/rust-lang/rust/issues/112368
+          x86_64-pc-windows-gnu) C:/msys64/usr/bin/pacman.exe -Syu --needed mingw-w64-x86_64-gcc --noconfirm ; echo "C:\msys64\mingw64\bin" >> $GITHUB_PATH ;;
         esac
         case '${{ matrix.job.os }}' in
           macos-latest) brew install coreutils ;; # needed for testing
@@ -984,6 +986,10 @@ jobs:
             echo "foo" > /home/runner/.plan
             ;;
         esac
+        case '${{ matrix.job.os }}' in
+          # Update binutils if MinGW due to https://github.com/rust-lang/rust/issues/112368
+          windows-latest) C:/msys64/usr/bin/pacman.exe -Syu --needed mingw-w64-x86_64-gcc --noconfirm ; echo "C:\msys64\mingw64\bin" >> $GITHUB_PATH ;;
+        esac
     - name: Initialize toolchain-dependent workflow variables
       id: dep_vars
       shell: bash

From 7d32e49fb907f3fd9e9a1bbb1e152a4083d1b9a5 Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Wed, 10 Jan 2024 18:19:56 +0100
Subject: [PATCH 389/429] printf: %c prints the first byte of its argument

---
 src/uucore/src/lib/features/format/argument.rs | 2 +-
 tests/by-util/test_printf.rs                   | 5 +++++
 2 files changed, 6 insertions(+), 1 deletion(-)

diff --git a/src/uucore/src/lib/features/format/argument.rs b/src/uucore/src/lib/features/format/argument.rs
index 92d6c1603fb..ef81fc3533b 100644
--- a/src/uucore/src/lib/features/format/argument.rs
+++ b/src/uucore/src/lib/features/format/argument.rs
@@ -45,7 +45,7 @@ impl<'a, T: Iterator<Item = &'a FormatArgument>> ArgumentIter<'a> for T {
         };
         match next {
             FormatArgument::Char(c) => *c,
-            FormatArgument::Unparsed(s) => s.chars().next().unwrap_or('\0'),
+            FormatArgument::Unparsed(s) => s.bytes().next().map_or('\0', char::from),
             _ => '\0',
         }
     }
diff --git a/tests/by-util/test_printf.rs b/tests/by-util/test_printf.rs
index 48fc1e6ace2..c3527710669 100644
--- a/tests/by-util/test_printf.rs
+++ b/tests/by-util/test_printf.rs
@@ -639,3 +639,8 @@ fn partial_char() {
             "printf: warning: bc: character(s) following character constant have been ignored\n",
         );
 }
+
+#[test]
+fn char_as_byte() {
+    new_ucmd!().args(&["%c", "🙃"]).succeeds().stdout_only("ð");
+}

From 47e908bc6cbd40c9a937ed8f78dc384c83ff2b42 Mon Sep 17 00:00:00 2001
From: Samuel Tardieu <sam@rfc1149.net>
Date: Wed, 10 Jan 2024 18:59:33 +0100
Subject: [PATCH 390/429] printf: output of double-quote should not be escaped

This is obtained by escaping the sequence `\"` as `"`.
---
 src/uucore/src/lib/features/format/escape.rs | 1 +
 tests/by-util/test_printf.rs                 | 5 +++++
 2 files changed, 6 insertions(+)

diff --git a/src/uucore/src/lib/features/format/escape.rs b/src/uucore/src/lib/features/format/escape.rs
index d20da3e7e38..9420507f3e3 100644
--- a/src/uucore/src/lib/features/format/escape.rs
+++ b/src/uucore/src/lib/features/format/escape.rs
@@ -108,6 +108,7 @@ pub fn parse_escape_code(rest: &mut &[u8]) -> EscapedChar {
         *rest = new_rest;
         match c {
             b'\\' => EscapedChar::Byte(b'\\'),
+            b'"' => EscapedChar::Byte(b'"'),
             b'a' => EscapedChar::Byte(b'\x07'),
             b'b' => EscapedChar::Byte(b'\x08'),
             b'c' => EscapedChar::End,
diff --git a/tests/by-util/test_printf.rs b/tests/by-util/test_printf.rs
index 48fc1e6ace2..a288d7c0842 100644
--- a/tests/by-util/test_printf.rs
+++ b/tests/by-util/test_printf.rs
@@ -36,6 +36,11 @@ fn escaped_slash() {
         .stdout_only("hello\\ world");
 }
 
+#[test]
+fn unescaped_double_quote() {
+    new_ucmd!().args(&["\\\""]).succeeds().stdout_only("\"");
+}
+
 #[test]
 fn escaped_hex() {
     new_ucmd!().args(&["\\x41"]).succeeds().stdout_only("A");

From 2aa8a3502fd049a3ce13164aa8b289daf2940e04 Mon Sep 17 00:00:00 2001
From: Sudhakar Verma <sudhakar.verma@canonical.com>
Date: Fri, 12 Jan 2024 16:08:47 +0530
Subject: [PATCH 391/429] printf : no infinite loop

---
 src/uu/printf/src/printf.rs  | 10 +++++++++-
 tests/by-util/test_printf.rs |  5 +++++
 2 files changed, 14 insertions(+), 1 deletion(-)

diff --git a/src/uu/printf/src/printf.rs b/src/uu/printf/src/printf.rs
index ad42e38941f..64a3a35a7af 100644
--- a/src/uu/printf/src/printf.rs
+++ b/src/uu/printf/src/printf.rs
@@ -11,7 +11,7 @@ use std::ops::ControlFlow;
 
 use clap::{crate_version, Arg, ArgAction, Command};
 use uucore::error::{UResult, UUsageError};
-use uucore::format::{parse_spec_and_escape, FormatArgument};
+use uucore::format::{parse_spec_and_escape, FormatArgument, FormatItem};
 use uucore::{format_usage, help_about, help_section, help_usage};
 
 const VERSION: &str = "version";
@@ -46,6 +46,14 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         };
     }
 
+    // See #5815 - We don't need to iter on args if no format string seen
+    let format_seen = parse_spec_and_escape(format_string.as_ref())
+        .into_iter()
+        .any(|r| matches!(r, Ok(FormatItem::Spec(_))));
+    if !format_seen {
+        return Ok(());
+    }
+
     while args.peek().is_some() {
         for item in parse_spec_and_escape(format_string.as_ref()) {
             match item?.write(stdout(), &mut args)? {
diff --git a/tests/by-util/test_printf.rs b/tests/by-util/test_printf.rs
index 4f2e1dc10e6..411285a0cd2 100644
--- a/tests/by-util/test_printf.rs
+++ b/tests/by-util/test_printf.rs
@@ -649,3 +649,8 @@ fn partial_char() {
 fn char_as_byte() {
     new_ucmd!().args(&["%c", "🙃"]).succeeds().stdout_only("ð");
 }
+
+#[test]
+fn no_infinite_loop() {
+    new_ucmd!().args(&["a", "b"]).succeeds().stdout_only("a");
+}

From 4e5a65ee41372ca9bd35501e251b1b7bf799665e Mon Sep 17 00:00:00 2001
From: Sudhakar Verma <sudhakar.verma@canonical.com>
Date: Fri, 12 Jan 2024 16:23:38 +0530
Subject: [PATCH 392/429] printf: fix clippy warnings

---
 src/uu/printf/src/printf.rs | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/src/uu/printf/src/printf.rs b/src/uu/printf/src/printf.rs
index 64a3a35a7af..b0988f7b45f 100644
--- a/src/uu/printf/src/printf.rs
+++ b/src/uu/printf/src/printf.rs
@@ -47,9 +47,8 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
     }
 
     // See #5815 - We don't need to iter on args if no format string seen
-    let format_seen = parse_spec_and_escape(format_string.as_ref())
-        .into_iter()
-        .any(|r| matches!(r, Ok(FormatItem::Spec(_))));
+    let format_seen =
+        parse_spec_and_escape(format_string.as_ref()).any(|r| matches!(r, Ok(FormatItem::Spec(_))));
     if !format_seen {
         return Ok(());
     }

From cd4568f5d9862ab28dda351c7692c0bd95dcdda7 Mon Sep 17 00:00:00 2001
From: Sudhakar Verma <sudhakar.verma@canonical.com>
Date: Fri, 12 Jan 2024 17:12:30 +0530
Subject: [PATCH 393/429] printf: simplify loop

---
 src/uu/printf/src/printf.rs | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/src/uu/printf/src/printf.rs b/src/uu/printf/src/printf.rs
index b0988f7b45f..c98bb59a1e4 100644
--- a/src/uu/printf/src/printf.rs
+++ b/src/uu/printf/src/printf.rs
@@ -38,17 +38,20 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         None => vec![],
     };
 
+    let mut format_seen = false;
     let mut args = values.iter().peekable();
     for item in parse_spec_and_escape(format_string.as_ref()) {
+        if let Ok(FormatItem::Spec(_)) = item {
+            format_seen = true;
+        }
         match item?.write(stdout(), &mut args)? {
             ControlFlow::Continue(()) => {}
             ControlFlow::Break(()) => return Ok(()),
         };
     }
 
-    // See #5815 - We don't need to iter on args if no format string seen
-    let format_seen =
-        parse_spec_and_escape(format_string.as_ref()).any(|r| matches!(r, Ok(FormatItem::Spec(_))));
+    // Without format specs in the string, the iter would not consume any args,
+    // leading to an infinite loop. Thus, we exit early.
     if !format_seen {
         return Ok(());
     }

From 19e1f26e3d9aa7a4749ed4c21293d111afc41846 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 13 Jan 2024 14:01:38 +0100
Subject: [PATCH 394/429] fuzz: with pipe, also capture stderr

---
 fuzz/fuzz_targets/fuzz_common.rs | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/fuzz/fuzz_targets/fuzz_common.rs b/fuzz/fuzz_targets/fuzz_common.rs
index f0de0b6052f..e8cac8d4048 100644
--- a/fuzz/fuzz_targets/fuzz_common.rs
+++ b/fuzz/fuzz_targets/fuzz_common.rs
@@ -232,7 +232,10 @@ pub fn run_gnu_cmd(
 
     let output = if let Some(input_str) = pipe_input {
         // We have an pipe input
-        command.stdin(Stdio::piped()).stdout(Stdio::piped());
+        command
+            .stdin(Stdio::piped())
+            .stdout(Stdio::piped())
+            .stderr(Stdio::piped());
 
         let mut child = command.spawn().expect("Failed to execute command");
         let child_stdin = child.stdin.as_mut().unwrap();

From 563df4b79d972c27551055e5bf1eb4af02f6955f Mon Sep 17 00:00:00 2001
From: Atomei Alexandru <118962363+Ato2207@users.noreply.github.com>
Date: Sat, 13 Jan 2024 15:43:36 +0200
Subject: [PATCH 395/429] Made cksum return an error if used on a directory.
 (#5822)

* Made cksum to return an error if it is used on a directory regardless of the algorithm

* Added one more test for cksum on folders and deleted an old one that expected it to succeed instead of fail

* Made cksum work on more than one item if it fails and added a test for this case
---
 src/uu/cksum/src/cksum.rs   | 19 ++++++-------
 tests/by-util/test_cksum.rs | 55 +++++++++++++++++++++++++++----------
 2 files changed, 49 insertions(+), 25 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index a3e6dfd9e1a..458177e8a7c 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -15,8 +15,8 @@ use std::io::{self, stdin, stdout, BufReader, Read, Write};
 use std::iter;
 use std::path::Path;
 use uucore::{
-    error::{FromIo, UError, UResult},
-    format_usage, help_about, help_section, help_usage,
+    error::{FromIo, UError, UResult, USimpleError},
+    format_usage, help_about, help_section, help_usage, show,
     sum::{
         div_ceil, Blake2b, Digest, DigestWriter, Md5, Sha1, Sha224, Sha256, Sha384, Sha512, Sm3,
         BSD, CRC, SYSV,
@@ -174,7 +174,13 @@ where
         });
         let (sum, sz) = digest_read(&mut options.digest, &mut file, options.output_bits)
             .map_err_context(|| "failed to read input".to_string())?;
-
+        if filename.is_dir() {
+            show!(USimpleError::new(
+                1,
+                format!("{}: Is a directory", filename.display())
+            ));
+            continue;
+        }
         if options.raw {
             let bytes = match options.algo_name {
                 ALGORITHM_OPTIONS_CRC => sum.parse::<u32>().unwrap().to_be_bytes().to_vec(),
@@ -214,13 +220,6 @@ where
             (ALGORITHM_OPTIONS_CRC, true) => println!("{sum} {sz}"),
             (ALGORITHM_OPTIONS_CRC, false) => println!("{sum} {sz} {}", filename.display()),
             (ALGORITHM_OPTIONS_BLAKE2B, _) if !options.untagged => {
-                if filename.is_dir() {
-                    return Err(io::Error::new(
-                        io::ErrorKind::InvalidInput,
-                        format!("{}: Is a directory", filename.display()),
-                    )
-                    .into());
-                }
                 if let Some(length) = options.length {
                     // Multiply by 8 here, as we want to print the length in bits.
                     println!("BLAKE2b-{} ({}) = {sum}", length * 8, filename.display());
diff --git a/tests/by-util/test_cksum.rs b/tests/by-util/test_cksum.rs
index b3db0bf0a02..80cfc749931 100644
--- a/tests/by-util/test_cksum.rs
+++ b/tests/by-util/test_cksum.rs
@@ -80,18 +80,6 @@ fn test_nonexisting_file() {
         .stderr_contains(format!("cksum: {file_name}: No such file or directory"));
 }
 
-#[test]
-fn test_folder() {
-    let (at, mut ucmd) = at_and_ucmd!();
-
-    let folder_name = "a_folder";
-    at.mkdir(folder_name);
-
-    ucmd.arg(folder_name)
-        .succeeds()
-        .stdout_only(format!("4294967295 0 {folder_name}\n"));
-}
-
 // Make sure crc is correct for files larger than 32 bytes
 // but <128 bytes (1 fold pclmul) // spell-checker:disable-line
 #[test]
@@ -312,15 +300,52 @@ fn test_raw_multiple_files() {
 }
 
 #[test]
-fn test_blake2b_fail_on_directory() {
+fn test_fail_on_folder() {
     let (at, mut ucmd) = at_and_ucmd!();
 
     let folder_name = "a_folder";
     at.mkdir(folder_name);
 
-    ucmd.arg("--algorithm=blake2b")
-        .arg(folder_name)
+    ucmd.arg(folder_name)
         .fails()
         .no_stdout()
         .stderr_contains(format!("cksum: {folder_name}: Is a directory"));
 }
+
+#[test]
+fn test_all_algorithms_fail_on_folder() {
+    let scene = TestScenario::new(util_name!());
+
+    let at = &scene.fixtures;
+
+    let folder_name = "a_folder";
+    at.mkdir(folder_name);
+
+    for algo in ALGOS {
+        scene
+            .ucmd()
+            .arg(format!("--algorithm={algo}"))
+            .arg(folder_name)
+            .fails()
+            .no_stdout()
+            .stderr_contains(format!("cksum: {folder_name}: Is a directory"));
+    }
+}
+
+#[test]
+fn test_folder_and_file() {
+    let scene = TestScenario::new(util_name!());
+
+    let at = &scene.fixtures;
+
+    let folder_name = "a_folder";
+    at.mkdir(folder_name);
+
+    scene
+        .ucmd()
+        .arg(folder_name)
+        .arg("lorem_ipsum.txt")
+        .fails()
+        .stderr_contains(format!("cksum: {folder_name}: Is a directory"))
+        .stdout_is_fixture("crc_single_file.expected");
+}

From c63b5b2a5d919ffd5b98741035c64c9ab83cf508 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Sat, 13 Jan 2024 13:57:26 +0000
Subject: [PATCH 396/429] chore(deps): update rust crate tempfile to 3.9.0

---
 Cargo.lock | 6 +++---
 Cargo.toml | 2 +-
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 0e4a271dfe0..bf83d9accd8 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -2045,15 +2045,15 @@ dependencies = [
 
 [[package]]
 name = "tempfile"
-version = "3.8.1"
+version = "3.9.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "7ef1adac450ad7f4b3c28589471ade84f25f731a7a0fe30d71dfa9f60fd808e5"
+checksum = "01ce4141aa927a6d1bd34a041795abd0db1cccba5d5f24b009f694bdf3a1f3fa"
 dependencies = [
  "cfg-if",
  "fastrand",
  "redox_syscall 0.4.0",
  "rustix 0.38.28",
- "windows-sys 0.48.0",
+ "windows-sys 0.52.0",
 ]
 
 [[package]]
diff --git a/Cargo.toml b/Cargo.toml
index f45d0b2f4e9..a01fcdd2d39 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -319,7 +319,7 @@ self_cell = "1.0.3"
 selinux = "0.4"
 signal-hook = "0.3.17"
 smallvec = { version = "1.11", features = ["union"] }
-tempfile = "3.8.1"
+tempfile = "3.9.0"
 uutils_term_grid = "0.3"
 terminal_size = "0.3.0"
 textwrap = { version = "0.16.0", features = ["terminal_size"] }

From e0abb76c0f5be632b60460ccdce69547baa06c60 Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sat, 16 Dec 2023 14:56:13 +0100
Subject: [PATCH 397/429] Bump redox_syscall to 0.4.1

redox_syscall from 0.3.5 & 0.4.0 -> 0.4.1
filetime from 0.2.22 -> 0.2.23
parking_lot_core from 0.9.8 -> 0.9.9
---
 Cargo.lock | 31 +++++++++++--------------------
 deny.toml  |  2 --
 2 files changed, 11 insertions(+), 22 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 0e4a271dfe0..936d2c1f245 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -813,14 +813,14 @@ checksum = "31a7a908b8f32538a2143e59a6e4e2508988832d5d4d6f7c156b3cbc762643a5"
 
 [[package]]
 name = "filetime"
-version = "0.2.22"
+version = "0.2.23"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "d4029edd3e734da6fe05b6cd7bd2960760a616bd2ddd0d59a0124746d6272af0"
+checksum = "1ee447700ac8aa0b2f2bd7bc4462ad686ba06baa6727ac149a2d6277f0d240fd"
 dependencies = [
  "cfg-if",
  "libc",
- "redox_syscall 0.3.5",
- "windows-sys 0.48.0",
+ "redox_syscall",
+ "windows-sys 0.52.0",
 ]
 
 [[package]]
@@ -1455,13 +1455,13 @@ dependencies = [
 
 [[package]]
 name = "parking_lot_core"
-version = "0.9.8"
+version = "0.9.9"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "93f00c865fe7cabf650081affecd3871070f26767e7b2070a3ffae14c654b447"
+checksum = "4c42a9226546d68acdd9c0a280d17ce19bfe27a46bf68784e4066115788d008e"
 dependencies = [
  "cfg-if",
  "libc",
- "redox_syscall 0.3.5",
+ "redox_syscall",
  "smallvec",
  "windows-targets 0.48.0",
 ]
@@ -1689,18 +1689,9 @@ dependencies = [
 
 [[package]]
 name = "redox_syscall"
-version = "0.3.5"
-source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "567664f262709473930a4bf9e51bf2ebf3348f2e748ccc50dea20646858f8f29"
-dependencies = [
- "bitflags 1.3.2",
-]
-
-[[package]]
-name = "redox_syscall"
-version = "0.4.0"
+version = "0.4.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "ded0bce2d41cc3c57aefa284708ced249a64acb01745dbbe72bd78610bfd644c"
+checksum = "4722d768eff46b75989dd134e5c353f0d6296e5aaa3132e776cbdb56be7731aa"
 dependencies = [
  "bitflags 1.3.2",
 ]
@@ -2051,7 +2042,7 @@ checksum = "7ef1adac450ad7f4b3c28589471ade84f25f731a7a0fe30d71dfa9f60fd808e5"
 dependencies = [
  "cfg-if",
  "fastrand",
- "redox_syscall 0.4.0",
+ "redox_syscall",
  "rustix 0.38.28",
  "windows-sys 0.48.0",
 ]
@@ -3014,7 +3005,7 @@ version = "0.0.23"
 dependencies = [
  "clap",
  "libc",
- "redox_syscall 0.4.0",
+ "redox_syscall",
  "uucore",
 ]
 
diff --git a/deny.toml b/deny.toml
index 986c2b26970..d7c04ad2d5b 100644
--- a/deny.toml
+++ b/deny.toml
@@ -102,8 +102,6 @@ skip = [
   { name = "syn", version = "1.0.109" },
   # various crates
   { name = "bitflags", version = "1.3.2" },
-  # various crates
-  { name = "redox_syscall", version = "0.3.5" },
   # clap_builder, textwrap
   { name = "terminal_size", version = "0.2.6" },
 ]

From bc51b8d2169896ab5c513edb441a6d041a0449f6 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 13 Jan 2024 15:09:08 +0100
Subject: [PATCH 398/429] cut: allow the same option to be passed multiple
 times

---
 src/uu/cut/src/cut.rs     |  1 +
 tests/by-util/test_cut.rs | 10 ++++++++++
 2 files changed, 11 insertions(+)

diff --git a/src/uu/cut/src/cut.rs b/src/uu/cut/src/cut.rs
index 0d5f79b35c1..2a3196d002e 100644
--- a/src/uu/cut/src/cut.rs
+++ b/src/uu/cut/src/cut.rs
@@ -510,6 +510,7 @@ pub fn uu_app() -> Command {
         .about(ABOUT)
         .after_help(AFTER_HELP)
         .infer_long_args(true)
+        .args_override_self(true)
         .arg(
             Arg::new(options::BYTES)
                 .short('b')
diff --git a/tests/by-util/test_cut.rs b/tests/by-util/test_cut.rs
index 112dc0fd3e5..57e6666d304 100644
--- a/tests/by-util/test_cut.rs
+++ b/tests/by-util/test_cut.rs
@@ -255,3 +255,13 @@ fn test_equal_as_delimiter3() {
         .succeeds()
         .stdout_only_bytes("abZcd\n");
 }
+
+#[test]
+fn test_multiple() {
+    let result = new_ucmd!()
+        .args(&["-f2", "-d:", "-d="])
+        .pipe_in("a=b\n")
+        .succeeds();
+    assert_eq!(result.stdout_str(), "b\n");
+    assert_eq!(result.stderr_str(), "");
+}

From e860b32a82acb1ca9840d1b7197d5407e922ef99 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Sun, 14 Jan 2024 00:28:34 +0000
Subject: [PATCH 399/429] chore(deps): update rust crate smallvec to 1.12

---
 Cargo.lock | 4 ++--
 Cargo.toml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index bf83d9accd8..b6a25913477 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1995,9 +1995,9 @@ dependencies = [
 
 [[package]]
 name = "smallvec"
-version = "1.11.0"
+version = "1.12.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "62bb4feee49fdd9f707ef802e22365a35de4b7b299de4763d44bfea899442ff9"
+checksum = "2593d31f82ead8df961d8bd23a64c2ccf2eb5dd34b0a34bfb4dd54011c72009e"
 
 [[package]]
 name = "smawk"
diff --git a/Cargo.toml b/Cargo.toml
index a01fcdd2d39..c6912251560 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -318,7 +318,7 @@ same-file = "1.0.6"
 self_cell = "1.0.3"
 selinux = "0.4"
 signal-hook = "0.3.17"
-smallvec = { version = "1.11", features = ["union"] }
+smallvec = { version = "1.12", features = ["union"] }
 tempfile = "3.9.0"
 uutils_term_grid = "0.3"
 terminal_size = "0.3.0"

From aeee56b3c3bd7ed0f93d875d322b0f9eba4ae95d Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Sun, 14 Jan 2024 15:23:24 +0100
Subject: [PATCH 400/429] head: fix clippy warnings in tests

---
 tests/by-util/test_head.rs | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/by-util/test_head.rs b/tests/by-util/test_head.rs
index cc17cdf950a..0b0e98aa122 100644
--- a/tests/by-util/test_head.rs
+++ b/tests/by-util/test_head.rs
@@ -391,7 +391,7 @@ fn test_read_backwards_bytes_proc_fs_version() {
 
     let args = ["-c", "-1", "/proc/version"];
     let result = ts.ucmd().args(&args).succeeds();
-    assert!(result.stdout().len() > 0);
+    assert!(!result.stdout().is_empty());
 }
 
 #[cfg(all(
@@ -406,7 +406,7 @@ fn test_read_backwards_bytes_proc_fs_modules() {
 
     let args = ["-c", "-1", "/proc/modules"];
     let result = ts.ucmd().args(&args).succeeds();
-    assert!(result.stdout().len() > 0);
+    assert!(!result.stdout().is_empty());
 }
 
 #[cfg(all(
@@ -421,7 +421,7 @@ fn test_read_backwards_lines_proc_fs_modules() {
 
     let args = ["--lines", "-1", "/proc/modules"];
     let result = ts.ucmd().args(&args).succeeds();
-    assert!(result.stdout().len() > 0);
+    assert!(!result.stdout().is_empty());
 }
 
 #[cfg(all(

From e01d5f75f786b5f6953f5d714de92a588e0d5bc1 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 14 Jan 2024 15:57:22 +0100
Subject: [PATCH 401/429] ls: if acl are used, show the + in the perms (#5816)

* ls: if acl are used, show the + in the perms

Tested by tests/mkdir/p-acl.sh

* CICD.yml: fix small formatting issue

---------

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 .github/workflows/CICD.yml | 20 ++++++++++++++++----
 Cargo.lock                 |  1 +
 src/uu/ls/Cargo.toml       |  3 +++
 src/uu/ls/src/ls.rs        | 28 ++++++++++++++++++++++++++--
 tests/by-util/test_ls.rs   | 36 ++++++++++++++++++++++++++++++++++++
 5 files changed, 82 insertions(+), 6 deletions(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index 89022bbef35..20945609230 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -612,11 +612,23 @@ jobs:
       run: |
         ## Install/setup prerequisites
         case '${{ matrix.job.target }}' in
-          arm-unknown-linux-gnueabihf) sudo apt-get -y update ; sudo apt-get -y install gcc-arm-linux-gnueabihf ;;
-          aarch64-unknown-linux-*) sudo apt-get -y update ; sudo apt-get -y install gcc-aarch64-linux-gnu ;;
-          *-redox*) sudo apt-get -y update ; sudo apt-get -y install fuse3 libfuse-dev ;;
+          arm-unknown-linux-gnueabihf) 
+            sudo apt-get -y update
+            sudo apt-get -y install gcc-arm-linux-gnueabihf
+          ;;
+          aarch64-unknown-linux-*) 
+            sudo apt-get -y update
+            sudo apt-get -y install gcc-aarch64-linux-gnu
+          ;;
+          *-redox*) 
+            sudo apt-get -y update
+            sudo apt-get -y install fuse3 libfuse-dev
+          ;;
           # Update binutils if MinGW due to https://github.com/rust-lang/rust/issues/112368
-          x86_64-pc-windows-gnu) C:/msys64/usr/bin/pacman.exe -Syu --needed mingw-w64-x86_64-gcc --noconfirm ; echo "C:\msys64\mingw64\bin" >> $GITHUB_PATH ;;
+          x86_64-pc-windows-gnu)
+            C:/msys64/usr/bin/pacman.exe -Syu --needed mingw-w64-x86_64-gcc --noconfirm
+            echo "C:\msys64\mingw64\bin" >> $GITHUB_PATH
+          ;;
         esac
         case '${{ matrix.job.os }}' in
           macos-latest) brew install coreutils ;; # needed for testing
diff --git a/Cargo.lock b/Cargo.lock
index b6a25913477..56e448fa794 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -2616,6 +2616,7 @@ dependencies = [
  "unicode-width",
  "uucore",
  "uutils_term_grid",
+ "xattr",
 ]
 
 [[package]]
diff --git a/src/uu/ls/Cargo.toml b/src/uu/ls/Cargo.toml
index d11eeb27ce3..38312eefc5e 100644
--- a/src/uu/ls/Cargo.toml
+++ b/src/uu/ls/Cargo.toml
@@ -34,6 +34,9 @@ once_cell = { workspace = true }
 selinux = { workspace = true, optional = true }
 hostname = { workspace = true }
 
+[target.'cfg(unix)'.dependencies]
+xattr = { workspace = true }
+
 [[bin]]
 name = "ls"
 path = "src/main.rs"
diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 0e9b2572289..1c89cd3536d 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3,7 +3,7 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-// spell-checker:ignore (ToDO) somegroup nlink tabsize dired subdired dtype colorterm
+// spell-checker:ignore (ToDO) somegroup nlink tabsize dired subdired dtype colorterm getxattr
 
 use clap::{
     builder::{NonEmptyStringValueParser, ValueParser},
@@ -36,6 +36,7 @@ use std::{
 };
 use term_grid::{Cell, Direction, Filling, Grid, GridOptions};
 use unicode_width::UnicodeWidthStr;
+
 #[cfg(any(
     target_os = "linux",
     target_os = "macos",
@@ -2620,6 +2621,18 @@ fn display_grid(
     Ok(())
 }
 
+#[cfg(all(unix, not(any(target_os = "android", target_os = "macos"))))]
+fn file_has_acl<P: AsRef<Path>>(file: P) -> bool {
+    // don't use exacl here, it is doing more getxattr call then needed
+    match xattr::list(file) {
+        Ok(acl) => {
+            // if we have extra attributes, we have an acl
+            acl.count() > 0
+        }
+        Err(_) => false,
+    }
+}
+
 /// This writes to the BufWriter out a single string of the output of `ls -l`.
 ///
 /// It writes the following keys, in order:
@@ -2663,9 +2676,14 @@ fn display_item_long(
         output_display += "  ";
     }
     if let Some(md) = item.get_metadata(out) {
+        #[cfg(any(not(unix), target_os = "android", target_os = "macos"))]
+        // TODO: See how Mac should work here
+        let is_acl_set = false;
+        #[cfg(all(unix, not(any(target_os = "android", target_os = "macos"))))]
+        let is_acl_set = file_has_acl(item.display_name.as_os_str());
         write!(
             output_display,
-            "{}{} {}",
+            "{}{}{} {}",
             display_permissions(md, true),
             if item.security_context.len() > 1 {
                 // GNU `ls` uses a "." character to indicate a file with a security context,
@@ -2674,6 +2692,12 @@ fn display_item_long(
             } else {
                 ""
             },
+            if is_acl_set {
+                // if acl has been set, we display a "+" at the end of the file permissions
+                "+"
+            } else {
+                ""
+            },
             pad_left(&display_symlink_count(md), padding.link_count)
         )
         .unwrap();
diff --git a/tests/by-util/test_ls.rs b/tests/by-util/test_ls.rs
index 0162b017078..1262c2ab9ec 100644
--- a/tests/by-util/test_ls.rs
+++ b/tests/by-util/test_ls.rs
@@ -4293,3 +4293,39 @@ fn test_term_colorterm() {
         "exe"
     );
 }
+
+#[cfg(all(unix, not(target_os = "macos")))]
+#[test]
+fn test_acl_display() {
+    use std::process::Command;
+
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+    let path = "a42";
+    at.mkdir(path);
+
+    let path = at.plus_as_string(path);
+    // calling the command directly. xattr requires some dev packages to be installed
+    // and it adds a complex dependency just for a test
+    match Command::new("setfacl")
+        .args(["-d", "-m", "group::rwx", &path])
+        .status()
+        .map(|status| status.code())
+    {
+        Ok(Some(0)) => {}
+        Ok(_) => {
+            println!("test skipped: setfacl failed");
+            return;
+        }
+        Err(e) => {
+            println!("test skipped: setfacl failed with {}", e);
+            return;
+        }
+    }
+
+    scene
+        .ucmd()
+        .args(&["-lda", &path])
+        .succeeds()
+        .stdout_contains("+");
+}

From 4f33a375cda8c515db6eb81cd54007fe850dd2cb Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Fri, 5 Jan 2024 20:55:54 +0100
Subject: [PATCH 402/429] factor: handle the '< .' arg

---
 src/uu/factor/src/cli.rs     | 15 ++++++++++++---
 tests/by-util/test_factor.rs |  5 +++++
 2 files changed, 17 insertions(+), 3 deletions(-)

diff --git a/src/uu/factor/src/cli.rs b/src/uu/factor/src/cli.rs
index 63a0632a3b7..d01ca625c7b 100644
--- a/src/uu/factor/src/cli.rs
+++ b/src/uu/factor/src/cli.rs
@@ -73,9 +73,18 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         let stdin = stdin();
         let lines = stdin.lock().lines();
         for line in lines {
-            for number in line.unwrap().split_whitespace() {
-                print_factors_str(number, &mut w, print_exponents)
-                    .map_err_context(|| "write error".into())?;
+            match line {
+                Ok(line) => {
+                    for number in line.split_whitespace() {
+                        print_factors_str(number, &mut w, print_exponents)
+                            .map_err_context(|| "write error".into())?;
+                    }
+                }
+                Err(e) => {
+                    set_exit_code(1);
+                    show_error!("error reading input: {}", e);
+                    return Ok(());
+                }
             }
         }
     }
diff --git a/tests/by-util/test_factor.rs b/tests/by-util/test_factor.rs
index 3326a1ace71..57a2dae0998 100644
--- a/tests/by-util/test_factor.rs
+++ b/tests/by-util/test_factor.rs
@@ -1258,3 +1258,8 @@ const PRIMES50: &[u64] = &[
     1125899906841623,
     1125899906841613,
 ];
+
+#[test]
+fn fails_on_directory() {
+    new_ucmd!().pipe_in(".").fails();
+}

From 8d24036f5cf769f6a10672e6060c615599269f2a Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Fri, 5 Jan 2024 21:15:26 +0100
Subject: [PATCH 403/429] basenc: handle '--base32 .' arg

---
 src/uu/base32/src/base_common.rs        |  3 ++-
 src/uucore/src/lib/features/encoding.rs |  7 +++++--
 tests/by-util/test_basenc.rs            | 13 +++++++++++++
 3 files changed, 20 insertions(+), 3 deletions(-)

diff --git a/src/uu/base32/src/base_common.rs b/src/uu/base32/src/base_common.rs
index 2112a40ead7..68c40287db7 100644
--- a/src/uu/base32/src/base_common.rs
+++ b/src/uu/base32/src/base_common.rs
@@ -6,7 +6,7 @@
 use std::io::{stdout, Read, Write};
 
 use uucore::display::Quotable;
-use uucore::encoding::{wrap_print, Data, Format};
+use uucore::encoding::{wrap_print, Data, EncodeError, Format};
 use uucore::error::{FromIo, UResult, USimpleError, UUsageError};
 use uucore::format_usage;
 
@@ -174,6 +174,7 @@ pub fn handle_input<R: Read>(
                 wrap_print(&data, &s);
                 Ok(())
             }
+            Err(EncodeError::InvalidInput) => Err(USimpleError::new(1, "error: invalid input")),
             Err(_) => Err(USimpleError::new(
                 1,
                 "error: invalid input (length must be multiple of 4 characters)",
diff --git a/src/uucore/src/lib/features/encoding.rs b/src/uucore/src/lib/features/encoding.rs
index 14fdbb38ee7..db218d5f061 100644
--- a/src/uucore/src/lib/features/encoding.rs
+++ b/src/uucore/src/lib/features/encoding.rs
@@ -27,6 +27,7 @@ pub enum DecodeError {
 
 pub enum EncodeError {
     Z85InputLenNotMultipleOf4,
+    InvalidInput,
 }
 
 pub type DecodeResult = Result<Vec<u8>, DecodeError>;
@@ -148,8 +149,10 @@ impl<R: Read> Data<R> {
 
     pub fn encode(&mut self) -> Result<String, EncodeError> {
         let mut buf: Vec<u8> = vec![];
-        self.input.read_to_end(&mut buf).unwrap();
-        encode(self.format, buf.as_slice())
+        match self.input.read_to_end(&mut buf) {
+            Ok(_) => encode(self.format, buf.as_slice()),
+            Err(_) => Err(EncodeError::InvalidInput),
+        }
     }
 }
 
diff --git a/tests/by-util/test_basenc.rs b/tests/by-util/test_basenc.rs
index 6c71b63f79c..13a8967031b 100644
--- a/tests/by-util/test_basenc.rs
+++ b/tests/by-util/test_basenc.rs
@@ -18,3 +18,16 @@ fn test_z85_not_padded() {
         .fails()
         .stderr_only("basenc: error: invalid input (length must be multiple of 4 characters)\n");
 }
+
+#[test]
+fn test_invalid_input() {
+    let error_message = if cfg!(windows) {
+        "basenc: .: Permission denied"
+    } else {
+        "basenc: error: invalid input\n"
+    };
+    new_ucmd!()
+        .args(&["--base32", "."])
+        .fails()
+        .stderr_only(error_message);
+}

From 3d356d47b3f6ada89b4946983d904f578f5263e2 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Fri, 5 Jan 2024 21:44:58 +0100
Subject: [PATCH 404/429] expand: avoid an infinite loop

---
 src/uu/expand/src/expand.rs  | 11 +++++++++--
 tests/by-util/test_expand.rs |  8 ++++++++
 2 files changed, 17 insertions(+), 2 deletions(-)

diff --git a/src/uu/expand/src/expand.rs b/src/uu/expand/src/expand.rs
index eb9766eb4f6..1efb36c654c 100644
--- a/src/uu/expand/src/expand.rs
+++ b/src/uu/expand/src/expand.rs
@@ -11,11 +11,12 @@ use std::fmt;
 use std::fs::File;
 use std::io::{stdin, stdout, BufRead, BufReader, BufWriter, Read, Write};
 use std::num::IntErrorKind;
+use std::path::Path;
 use std::str::from_utf8;
 use unicode_width::UnicodeWidthChar;
 use uucore::display::Quotable;
-use uucore::error::{FromIo, UError, UResult};
-use uucore::{format_usage, help_about, help_usage};
+use uucore::error::{set_exit_code, FromIo, UError, UResult};
+use uucore::{format_usage, help_about, help_usage, show_error};
 
 const ABOUT: &str = help_about!("expand.md");
 const USAGE: &str = help_usage!("expand.md");
@@ -465,6 +466,12 @@ fn expand(options: &Options) -> UResult<()> {
     let mut buf = Vec::new();
 
     for file in &options.files {
+        if Path::new(file).is_dir() {
+            show_error!("{}: Is a directory", file);
+            set_exit_code(1);
+            continue;
+        }
+
         let mut fh = open(file)?;
 
         while match fh.read_until(b'\n', &mut buf) {
diff --git a/tests/by-util/test_expand.rs b/tests/by-util/test_expand.rs
index 1e26b32732c..c420f5ad5b9 100644
--- a/tests/by-util/test_expand.rs
+++ b/tests/by-util/test_expand.rs
@@ -409,3 +409,11 @@ int main() {
 ",
         );
 }
+
+#[test]
+fn test_expand_directory() {
+    new_ucmd!()
+        .args(&["."])
+        .fails()
+        .stderr_contains("expand: .: Is a directory");
+}

From 7914f22cfe13167d14f38b01d4a3b8aa6f5b309e Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Mon, 15 Jan 2024 03:14:26 +0000
Subject: [PATCH 405/429] chore(deps): update rust crate xattr to 1.3.1

---
 Cargo.lock | 16 ++++++++--------
 Cargo.toml |  2 +-
 2 files changed, 9 insertions(+), 9 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index e0d6ffbf5da..55ec59e2d0a 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1589,7 +1589,7 @@ dependencies = [
  "hex",
  "lazy_static",
  "procfs-core",
- "rustix 0.38.28",
+ "rustix 0.38.30",
 ]
 
 [[package]]
@@ -1822,9 +1822,9 @@ dependencies = [
 
 [[package]]
 name = "rustix"
-version = "0.38.28"
+version = "0.38.30"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "72e572a5e8ca657d7366229cdde4bd14c4eb5499a9573d4d366fe1b599daa316"
+checksum = "322394588aaf33c24007e8bb3238ee3e4c5c09c084ab32bc73890b99ff326bca"
 dependencies = [
  "bitflags 2.4.0",
  "errno",
@@ -2043,7 +2043,7 @@ dependencies = [
  "cfg-if",
  "fastrand",
  "redox_syscall",
- "rustix 0.38.28",
+ "rustix 0.38.30",
  "windows-sys 0.52.0",
 ]
 
@@ -2063,7 +2063,7 @@ version = "0.3.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "21bebf2b7c9e0a515f6e0f8c51dc0f8e4696391e6f1ff30379559f8365fb0df7"
 dependencies = [
- "rustix 0.38.28",
+ "rustix 0.38.30",
  "windows-sys 0.48.0",
 ]
 
@@ -3566,13 +3566,13 @@ checksum = "dff9641d1cd4be8d1a070daf9e3773c5f67e78b4d9d42263020c057706765c04"
 
 [[package]]
 name = "xattr"
-version = "1.2.0"
+version = "1.3.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "914566e6413e7fa959cc394fb30e563ba80f3541fbd40816d4c05a0fc3f2a0f1"
+checksum = "8da84f1a25939b27f6820d92aed108f83ff920fdf11a7b19366c27c4cda81d4f"
 dependencies = [
  "libc",
  "linux-raw-sys 0.4.12",
- "rustix 0.38.28",
+ "rustix 0.38.30",
 ]
 
 [[package]]
diff --git a/Cargo.toml b/Cargo.toml
index c6912251560..17efcb6a747 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -331,7 +331,7 @@ utf-8 = "0.7.6"
 walkdir = "2.4"
 winapi-util = "0.1.6"
 windows-sys = { version = "0.48.0", default-features = false }
-xattr = "1.2.0"
+xattr = "1.3.1"
 zip = { version = "0.6.6", default-features = false, features = ["deflate"] }
 
 hex = "0.4.3"

From 076b905513b1ed27cae640ba6cb5d0db42ef5935 Mon Sep 17 00:00:00 2001
From: Biplab Mochan Gartia <45629823+biplab5464@users.noreply.github.com>
Date: Mon, 15 Jan 2024 14:07:56 +0530
Subject: [PATCH 406/429]  cksum: stops when one of given files doesn't exist
 #5809  (#5820)

* cksum: stops when one of given files doesn't exist #5809

* removed printld  cksum: stops when one of given files doesn't exist #5809

* formatting the code cksum: stops when one of given files doesn't exist #5809

* formatting the code cksum: stops when one of given files doesn't exist #5809

* set exist status cksum: stops when one of given files doesn't exist #5809

* code quality formatting issue cksum: stops when one of given files doesn't exist #5809

* tertsdiepraam idea cksum: stops when one of given files doesn't exist #5809

* one new test case and deleted duplicate show cksum: stops when one of given files doesn't exist #5809

* formatting the test cases cksum: stops when one of given files doesn't exist #5809

* Revert "formatting the test cases cksum: stops when one of given files doesn't exist #5809"

This reverts commit 8c382f1e8fa4e9ba3fc0f4fc05ee2fb58ef9dbfd.

* reverting the changes and committing again due to a mistake cksum: stops when one of given files doesn't exist #5809

---------

Co-authored-by: biplab5464 <biplab5464@outlook.com>
---
 src/uu/cksum/src/cksum.rs   |  9 +++++++--
 tests/by-util/test_cksum.rs | 16 ++++++++++++++++
 2 files changed, 23 insertions(+), 2 deletions(-)

diff --git a/src/uu/cksum/src/cksum.rs b/src/uu/cksum/src/cksum.rs
index 458177e8a7c..36dfbbe1e3d 100644
--- a/src/uu/cksum/src/cksum.rs
+++ b/src/uu/cksum/src/cksum.rs
@@ -168,8 +168,13 @@ where
         } else if filename.is_dir() {
             Box::new(BufReader::new(io::empty())) as Box<dyn Read>
         } else {
-            file_buf =
-                File::open(filename).map_err_context(|| filename.to_str().unwrap().to_string())?;
+            file_buf = match File::open(filename) {
+                Ok(file) => file,
+                Err(err) => {
+                    show!(err.map_err_context(|| filename.to_string_lossy().to_string()));
+                    continue;
+                }
+            };
             Box::new(file_buf) as Box<dyn Read>
         });
         let (sum, sz) = digest_read(&mut options.digest, &mut file, options.output_bits)
diff --git a/tests/by-util/test_cksum.rs b/tests/by-util/test_cksum.rs
index 80cfc749931..464de947479 100644
--- a/tests/by-util/test_cksum.rs
+++ b/tests/by-util/test_cksum.rs
@@ -80,6 +80,22 @@ fn test_nonexisting_file() {
         .stderr_contains(format!("cksum: {file_name}: No such file or directory"));
 }
 
+#[test]
+fn test_one_nonexisting_file() {
+    let (at, mut ucmd) = at_and_ucmd!();
+
+    at.touch("abc.txt");
+    at.touch("xyz.txt");
+
+    ucmd.arg("abc.txt")
+        .arg("asdf.txt")
+        .arg("xyz.txt")
+        .fails()
+        .stdout_contains_line("4294967295 0 xyz.txt")
+        .stderr_contains("asdf.txt: No such file or directory")
+        .stdout_contains_line("4294967295 0 abc.txt");
+}
+
 // Make sure crc is correct for files larger than 32 bytes
 // but <128 bytes (1 fold pclmul) // spell-checker:disable-line
 #[test]

From e91540fc0792ab563fe2a35a52299024902b88cf Mon Sep 17 00:00:00 2001
From: Daniel Hofstetter <daniel.hofstetter@42dh.com>
Date: Mon, 15 Jan 2024 10:27:59 +0100
Subject: [PATCH 407/429] uucore: fix clippy warning from if_not_else lint

---
 src/uucore/src/lib/features/format/num_format.rs | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/uucore/src/lib/features/format/num_format.rs b/src/uucore/src/lib/features/format/num_format.rs
index 325da3ce6e3..ea5d6a75316 100644
--- a/src/uucore/src/lib/features/format/num_format.rs
+++ b/src/uucore/src/lib/features/format/num_format.rs
@@ -146,10 +146,10 @@ impl Formatter for UnsignedInt {
                 // We also need to take into account that 0 should not be 00
                 // Since this is an unsigned int, we do not need to take the minus
                 // sign into account.
-                if x != 0 {
-                    format!("0{x:o}")
-                } else {
+                if x == 0 {
                     format!("{x:o}")
+                } else {
+                    format!("0{x:o}")
                 }
             }
             UnsignedIntVariant::Hexadecimal(Case::Lowercase, Prefix::No) => {

From b116a97fdcd8533f296f0c2e0f1a94e3b287d0e5 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 15 Jan 2024 10:43:20 +0100
Subject: [PATCH 408/429] add missing \n

---
 tests/by-util/test_basenc.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/by-util/test_basenc.rs b/tests/by-util/test_basenc.rs
index 13a8967031b..c9e15ef1f61 100644
--- a/tests/by-util/test_basenc.rs
+++ b/tests/by-util/test_basenc.rs
@@ -22,7 +22,7 @@ fn test_z85_not_padded() {
 #[test]
 fn test_invalid_input() {
     let error_message = if cfg!(windows) {
-        "basenc: .: Permission denied"
+        "basenc: .: Permission denied\n"
     } else {
         "basenc: error: invalid input\n"
     };

From fff83995fb2c10fe1b477f4e3879fa0dbd5e247d Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 15 Jan 2024 10:59:04 +0100
Subject: [PATCH 409/429] cp: --preserve should keep xattr (#5834)

* cp: --preserve should keep xattr

Should help with tests/cp/acl.sh

* Update tests/by-util/test_cp.rs

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

* Update tests/by-util/test_cp.rs

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

* Update tests/by-util/test_cp.rs

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>

---------

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 Cargo.lock               |  1 +
 Cargo.toml               |  1 +
 src/uu/cp/src/cp.rs      |  5 ++--
 tests/by-util/test_cp.rs | 58 +++++++++++++++++++++++++++++++++++++++-
 4 files changed, 62 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 55ec59e2d0a..978c7fc3fae 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -507,6 +507,7 @@ dependencies = [
  "uucore",
  "uuhelp_parser",
  "walkdir",
+ "xattr",
  "zip",
 ]
 
diff --git a/Cargo.toml b/Cargo.toml
index 17efcb6a747..a8e9c399b5c 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -500,6 +500,7 @@ rlimit = "0.10.1"
 [target.'cfg(unix)'.dev-dependencies]
 nix = { workspace = true, features = ["process", "signal", "user"] }
 rand_pcg = "0.3"
+xattr = { workspace = true }
 
 [build-dependencies]
 phf_codegen = { workspace = true }
diff --git a/src/uu/cp/src/cp.rs b/src/uu/cp/src/cp.rs
index 52d59ff6198..28e9b678471 100644
--- a/src/uu/cp/src/cp.rs
+++ b/src/uu/cp/src/cp.rs
@@ -826,6 +826,7 @@ impl Attributes {
         ownership: Preserve::Yes { required: true },
         mode: Preserve::Yes { required: true },
         timestamps: Preserve::Yes { required: true },
+        xattr: Preserve::Yes { required: true },
         ..Self::NONE
     };
 
@@ -1441,7 +1442,7 @@ pub(crate) fn copy_attributes(
     })?;
 
     handle_preserve(&attributes.xattr, || -> CopyResult<()> {
-        #[cfg(unix)]
+        #[cfg(all(unix, not(target_os = "android")))]
         {
             let xattrs = xattr::list(source)?;
             for attr in xattrs {
@@ -1450,7 +1451,7 @@ pub(crate) fn copy_attributes(
                 }
             }
         }
-        #[cfg(not(unix))]
+        #[cfg(not(all(unix, not(target_os = "android"))))]
         {
             // The documentation for GNU cp states:
             //
diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index 5d78c5996c0..1271909ecb9 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -2,7 +2,7 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
-// spell-checker:ignore (flags) reflink (fs) tmpfs (linux) rlimit Rlim NOFILE clob btrfs ROOTDIR USERDIR procfs outfile uufs
+// spell-checker:ignore (flags) reflink (fs) tmpfs (linux) rlimit Rlim NOFILE clob btrfs ROOTDIR USERDIR procfs outfile uufs xattrs
 
 use crate::common::util::TestScenario;
 #[cfg(not(windows))]
@@ -56,6 +56,8 @@ static TEST_MOUNT_MOUNTPOINT: &str = "mount";
 static TEST_MOUNT_OTHER_FILESYSTEM_FILE: &str = "mount/DO_NOT_copy_me.txt";
 #[cfg(unix)]
 static TEST_NONEXISTENT_FILE: &str = "nonexistent_file.txt";
+#[cfg(all(unix, not(any(target_os = "android", target_os = "macos"))))]
+use xattr;
 
 /// Assert that mode, ownership, and permissions of two metadata objects match.
 #[cfg(all(not(windows), not(target_os = "freebsd")))]
@@ -3736,3 +3738,57 @@ fn test_cp_no_such() {
         .fails()
         .stderr_is("cp: 'no-such/' is not a directory\n");
 }
+
+#[cfg(all(unix, not(any(target_os = "android", target_os = "macos"))))]
+fn compare_xattrs<P: AsRef<Path>>(path1: P, path2: P) -> bool {
+    let get_sorted_xattrs = |path: P| {
+        xattr::list(path)
+            .map(|attrs| {
+                let mut attrs = attrs.collect::<Vec<_>>();
+                attrs.sort();
+                attrs
+            })
+            .unwrap_or_else(|_| Vec::new())
+    };
+
+    get_sorted_xattrs(path1) == get_sorted_xattrs(path2)
+}
+
+#[cfg(all(unix, not(any(target_os = "android", target_os = "macos"))))]
+#[test]
+fn test_acl_preserve() {
+    use std::process::Command;
+
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+    let path1 = "a";
+    let path2 = "b";
+    let file = "a/file";
+    let file_target = "b/file";
+    at.mkdir(path1);
+    at.mkdir(path2);
+    at.touch(file);
+
+    let path = at.plus_as_string(file);
+    // calling the command directly. xattr requires some dev packages to be installed
+    // and it adds a complex dependency just for a test
+    match Command::new("setfacl")
+        .args(["-m", "group::rwx", &path1])
+        .status()
+        .map(|status| status.code())
+    {
+        Ok(Some(0)) => {}
+        Ok(_) => {
+            println!("test skipped: setfacl failed");
+            return;
+        }
+        Err(e) => {
+            println!("test skipped: setfacl failed with {}", e);
+            return;
+        }
+    }
+
+    scene.ucmd().args(&["-p", &path, path2]).succeeds();
+
+    assert!(compare_xattrs(&file, &file_target));
+}

From fe3f8293ef278e21649e6b891f36c8f0d8a5d696 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 14 Jan 2024 00:01:45 +0100
Subject: [PATCH 410/429] uucore: add a new feature called fsxattr

---
 Cargo.lock                             |   1 +
 src/uucore/Cargo.toml                  |   2 +
 src/uucore/src/lib/features.rs         |   2 +
 src/uucore/src/lib/features/fsxattr.rs | 116 +++++++++++++++++++++++++
 src/uucore/src/lib/lib.rs              |   8 +-
 5 files changed, 127 insertions(+), 2 deletions(-)
 create mode 100644 src/uucore/src/lib/features/fsxattr.rs

diff --git a/Cargo.lock b/Cargo.lock
index 978c7fc3fae..0ef909d732a 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -3209,6 +3209,7 @@ dependencies = [
  "wild",
  "winapi-util",
  "windows-sys 0.48.0",
+ "xattr",
  "z85",
 ]
 
diff --git a/src/uucore/Cargo.toml b/src/uucore/Cargo.toml
index 44f8bb2d13f..557cdc4dde2 100644
--- a/src/uucore/Cargo.toml
+++ b/src/uucore/Cargo.toml
@@ -54,6 +54,7 @@ sm3 = { workspace = true, optional = true }
 [target.'cfg(unix)'.dependencies]
 walkdir = { workspace = true, optional = true }
 nix = { workspace = true, features = ["fs", "uio", "zerocopy", "signal"] }
+xattr = { workspace = true, optional = true }
 
 [dev-dependencies]
 clap = { workspace = true }
@@ -77,6 +78,7 @@ encoding = ["data-encoding", "data-encoding-macro", "z85", "thiserror"]
 entries = ["libc"]
 fs = ["dunce", "libc", "winapi-util", "windows-sys"]
 fsext = ["libc", "time", "windows-sys"]
+fsxattr = [ "xattr" ]
 lines = []
 format = ["itertools"]
 mode = ["libc"]
diff --git a/src/uucore/src/lib/features.rs b/src/uucore/src/lib/features.rs
index e26de487b57..423ff34bad9 100644
--- a/src/uucore/src/lib/features.rs
+++ b/src/uucore/src/lib/features.rs
@@ -46,6 +46,8 @@ pub mod pipes;
 #[cfg(all(unix, feature = "process"))]
 pub mod process;
 
+#[cfg(all(unix, not(target_os = "macos"), feature = "fsxattr"))]
+pub mod fsxattr;
 #[cfg(all(unix, not(target_os = "fuchsia"), feature = "signals"))]
 pub mod signals;
 #[cfg(all(
diff --git a/src/uucore/src/lib/features/fsxattr.rs b/src/uucore/src/lib/features/fsxattr.rs
new file mode 100644
index 00000000000..7bda023f9a7
--- /dev/null
+++ b/src/uucore/src/lib/features/fsxattr.rs
@@ -0,0 +1,116 @@
+// This file is part of the uutils coreutils package.
+//
+// For the full copyright and license information, please view the LICENSE
+// file that was distributed with this source code.
+
+//! Set of functions to manage xattr on files and dirs
+use std::collections::HashMap;
+use std::ffi::OsString;
+use std::path::Path;
+
+/// Copies extended attributes (xattrs) from one file or directory to another.
+///
+/// # Arguments
+///
+/// * `source` - A reference to the source path.
+/// * `dest` - A reference to the destination path.
+///
+/// # Returns
+///
+/// A result indicating success or failure.
+pub fn copy_xattrs<P: AsRef<Path>>(source: P, dest: P) -> std::io::Result<()> {
+    for attr_name in xattr::list(&source)? {
+        if let Some(value) = xattr::get(&source, &attr_name)? {
+            xattr::set(&dest, &attr_name, &value)?;
+        }
+    }
+    Ok(())
+}
+
+/// Retrieves the extended attributes (xattrs) of a given file or directory.
+///
+/// # Arguments
+///
+/// * `source` - A reference to the path of the file or directory.
+///
+/// # Returns
+///
+/// A result containing a HashMap of attributes names and values, or an error.
+pub fn retrieve_xattrs<P: AsRef<Path>>(source: P) -> std::io::Result<HashMap<OsString, Vec<u8>>> {
+    let mut attrs = HashMap::new();
+    for attr_name in xattr::list(&source)? {
+        if let Some(value) = xattr::get(&source, &attr_name)? {
+            attrs.insert(attr_name, value);
+        }
+    }
+    Ok(attrs)
+}
+
+/// Applies extended attributes (xattrs) to a given file or directory.
+///
+/// # Arguments
+///
+/// * `dest` - A reference to the path of the file or directory.
+/// * `xattrs` - A HashMap containing attribute names and their corresponding values.
+///
+/// # Returns
+///
+/// A result indicating success or failure.
+pub fn apply_xattrs<P: AsRef<Path>>(
+    dest: P,
+    xattrs: HashMap<OsString, Vec<u8>>,
+) -> std::io::Result<()> {
+    for (attr, value) in xattrs {
+        xattr::set(&dest, &attr, &value)?;
+    }
+    Ok(())
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use std::fs::File;
+    use tempfile::tempdir;
+
+    #[test]
+    fn test_copy_xattrs() {
+        let temp_dir = tempdir().unwrap();
+        let source_path = temp_dir.path().join("source.txt");
+        let dest_path = temp_dir.path().join("dest.txt");
+
+        File::create(&source_path).unwrap();
+        File::create(&dest_path).unwrap();
+
+        let test_attr = "user.test";
+        let test_value = b"test value";
+        xattr::set(&source_path, test_attr, test_value).unwrap();
+
+        copy_xattrs(&source_path, &dest_path).unwrap();
+
+        let copied_value = xattr::get(&dest_path, test_attr).unwrap().unwrap();
+        assert_eq!(copied_value, test_value);
+    }
+
+    #[test]
+    fn test_apply_and_retrieve_xattrs() {
+        let temp_dir = tempdir().unwrap();
+        let file_path = temp_dir.path().join("test_file.txt");
+
+        File::create(&file_path).unwrap();
+
+        let mut test_xattrs = HashMap::new();
+        let test_attr = "user.test_attr";
+        let test_value = b"test value";
+        test_xattrs.insert(OsString::from(test_attr), test_value.to_vec());
+        apply_xattrs(&file_path, test_xattrs).unwrap();
+
+        let retrieved_xattrs = retrieve_xattrs(&file_path).unwrap();
+        assert!(retrieved_xattrs.contains_key(OsString::from(test_attr).as_os_str()));
+        assert_eq!(
+            retrieved_xattrs
+                .get(OsString::from(test_attr).as_os_str())
+                .unwrap(),
+            test_value
+        );
+    }
+}
diff --git a/src/uucore/src/lib/lib.rs b/src/uucore/src/lib/lib.rs
index 2fc0ae301b3..6f8400589ef 100644
--- a/src/uucore/src/lib/lib.rs
+++ b/src/uucore/src/lib/lib.rs
@@ -43,8 +43,6 @@ pub use crate::features::encoding;
 pub use crate::features::format;
 #[cfg(feature = "fs")]
 pub use crate::features::fs;
-#[cfg(feature = "fsext")]
-pub use crate::features::fsext;
 #[cfg(feature = "lines")]
 pub use crate::features::lines;
 #[cfg(feature = "quoting-style")]
@@ -89,6 +87,12 @@ pub use crate::features::utmpx;
 #[cfg(all(windows, feature = "wide"))]
 pub use crate::features::wide;
 
+#[cfg(feature = "fsext")]
+pub use crate::features::fsext;
+
+#[cfg(all(unix, not(target_os = "macos"), feature = "fsxattr"))]
+pub use crate::features::fsxattr;
+
 //## core functions
 
 use std::ffi::OsString;

From 238fb776ad01146976212ce3e331dd3bbe8a45f4 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 14 Jan 2024 00:38:17 +0100
Subject: [PATCH 411/429] test: add a function to compare the xattr between two
 files. used by cp & mv (at least)

---
 tests/common/util.rs | 42 ++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 42 insertions(+)

diff --git a/tests/common/util.rs b/tests/common/util.rs
index 5dac61f7eac..9055c238e08 100644
--- a/tests/common/util.rs
+++ b/tests/common/util.rs
@@ -756,6 +756,26 @@ pub fn get_root_path() -> &'static str {
     }
 }
 
+/// Compares the extended attributes (xattrs) of two files or directories.
+///
+/// # Returns
+///
+/// `true` if both paths have the same set of extended attributes, `false` otherwise.
+#[cfg(all(unix, not(target_os = "macos")))]
+pub fn compare_xattrs<P: AsRef<std::path::Path>>(path1: P, path2: P) -> bool {
+    let get_sorted_xattrs = |path: P| {
+        xattr::list(path)
+            .map(|attrs| {
+                let mut attrs = attrs.collect::<Vec<_>>();
+                attrs.sort();
+                attrs
+            })
+            .unwrap_or_else(|_| Vec::new())
+    };
+
+    get_sorted_xattrs(path1) == get_sorted_xattrs(path2)
+}
+
 /// Object-oriented path struct that represents and operates on
 /// paths relative to the directory it was constructed for.
 #[derive(Clone)]
@@ -3375,4 +3395,26 @@ mod tests {
         );
         assert!(command.tmpd.is_some());
     }
+
+    #[cfg(all(unix, not(target_os = "macos")))]
+    #[test]
+    fn test_compare_xattrs() {
+        use tempfile::tempdir;
+
+        let temp_dir = tempdir().unwrap();
+        let file_path1 = temp_dir.path().join("test_file1.txt");
+        let file_path2 = temp_dir.path().join("test_file2.txt");
+
+        File::create(&file_path1).unwrap();
+        File::create(&file_path2).unwrap();
+
+        let test_attr = "user.test_attr";
+        let test_value = b"test value";
+        xattr::set(&file_path1, test_attr, test_value).unwrap();
+
+        assert!(!compare_xattrs(&file_path1, &file_path2));
+
+        xattr::set(&file_path2, test_attr, test_value).unwrap();
+        assert!(compare_xattrs(&file_path1, &file_path2));
+    }
 }

From 2ec4e9f78490f5cd8d4ccff4ac87a442da5461b2 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 14 Jan 2024 00:39:00 +0100
Subject: [PATCH 412/429] mv: preserve the xattr

Should make tests/mv/acl pass
---
 .../cspell.dictionaries/jargon.wordlist.txt   |  2 +
 src/uu/mv/Cargo.toml                          |  1 +
 src/uu/mv/src/mv.rs                           | 15 +++++++
 src/uucore/Cargo.toml                         |  2 +-
 tests/by-util/test_mv.rs                      | 41 +++++++++++++++++++
 5 files changed, 60 insertions(+), 1 deletion(-)

diff --git a/.vscode/cspell.dictionaries/jargon.wordlist.txt b/.vscode/cspell.dictionaries/jargon.wordlist.txt
index dca883dc804..20e26990f3b 100644
--- a/.vscode/cspell.dictionaries/jargon.wordlist.txt
+++ b/.vscode/cspell.dictionaries/jargon.wordlist.txt
@@ -42,6 +42,7 @@ fileio
 filesystem
 filesystems
 flamegraph
+fsxattr
 fullblock
 getfacl
 gibi
@@ -133,6 +134,7 @@ urand
 whitespace
 wordlist
 wordlists
+xattrs
 
 # * abbreviations
 consts
diff --git a/src/uu/mv/Cargo.toml b/src/uu/mv/Cargo.toml
index 83a10ef6b7a..83d68bc3d82 100644
--- a/src/uu/mv/Cargo.toml
+++ b/src/uu/mv/Cargo.toml
@@ -21,6 +21,7 @@ indicatif = { workspace = true }
 uucore = { workspace = true, features = [
   "backup-control",
   "fs",
+  "fsxattr",
   "update-control",
 ] }
 
diff --git a/src/uu/mv/src/mv.rs b/src/uu/mv/src/mv.rs
index 223ac9119b6..9f24cf77092 100644
--- a/src/uu/mv/src/mv.rs
+++ b/src/uu/mv/src/mv.rs
@@ -27,7 +27,10 @@ use uucore::fs::{
     are_hardlinks_or_one_way_symlink_to_same_file, are_hardlinks_to_same_file,
     path_ends_with_terminator,
 };
+#[cfg(all(unix, not(target_os = "macos")))]
+use uucore::fsxattr;
 use uucore::update_control;
+
 // These are exposed for projects (e.g. nushell) that want to create an `Options` value, which
 // requires these enums
 pub use uucore::{backup_control::BackupMode, update_control::UpdateMode};
@@ -631,6 +634,10 @@ fn rename_with_fallback(
                     None
                 };
 
+            #[cfg(all(unix, not(target_os = "macos")))]
+            let xattrs =
+                fsxattr::retrieve_xattrs(from).unwrap_or_else(|_| std::collections::HashMap::new());
+
             let result = if let Some(ref pb) = progress_bar {
                 move_dir_with_progress(from, to, &options, |process_info: TransitProcess| {
                     pb.set_position(process_info.copied_bytes);
@@ -641,6 +648,9 @@ fn rename_with_fallback(
                 move_dir(from, to, &options)
             };
 
+            #[cfg(all(unix, not(target_os = "macos")))]
+            fsxattr::apply_xattrs(to, xattrs).unwrap();
+
             if let Err(err) = result {
                 return match err.kind {
                     fs_extra::error::ErrorKind::PermissionDenied => Err(io::Error::new(
@@ -651,6 +661,11 @@ fn rename_with_fallback(
                 };
             }
         } else {
+            #[cfg(all(unix, not(target_os = "macos")))]
+            fs::copy(from, to)
+                .and_then(|_| fsxattr::copy_xattrs(&from, &to))
+                .and_then(|_| fs::remove_file(from))?;
+            #[cfg(any(target_os = "macos", not(unix)))]
             fs::copy(from, to).and_then(|_| fs::remove_file(from))?;
         }
     }
diff --git a/src/uucore/Cargo.toml b/src/uucore/Cargo.toml
index 557cdc4dde2..8500faeff8f 100644
--- a/src/uucore/Cargo.toml
+++ b/src/uucore/Cargo.toml
@@ -78,7 +78,7 @@ encoding = ["data-encoding", "data-encoding-macro", "z85", "thiserror"]
 entries = ["libc"]
 fs = ["dunce", "libc", "winapi-util", "windows-sys"]
 fsext = ["libc", "time", "windows-sys"]
-fsxattr = [ "xattr" ]
+fsxattr = ["xattr"]
 lines = []
 format = ["itertools"]
 mode = ["libc"]
diff --git a/tests/by-util/test_mv.rs b/tests/by-util/test_mv.rs
index 175b91e7dab..dd05ffbcd0a 100644
--- a/tests/by-util/test_mv.rs
+++ b/tests/by-util/test_mv.rs
@@ -1569,6 +1569,47 @@ fn test_mv_dir_into_path_slash() {
     assert!(at.dir_exists("f/b"));
 }
 
+#[cfg(all(unix, not(target_os = "macos")))]
+#[test]
+fn test_acl() {
+    use std::process::Command;
+
+    use crate::common::util::compare_xattrs;
+
+    let scene = TestScenario::new(util_name!());
+    let at = &scene.fixtures;
+    let path1 = "a";
+    let path2 = "b";
+    let file = "a/file";
+    let file_target = "b/file";
+    at.mkdir(path1);
+    at.mkdir(path2);
+    at.touch(file);
+
+    let path = at.plus_as_string(file);
+    // calling the command directly. xattr requires some dev packages to be installed
+    // and it adds a complex dependency just for a test
+    match Command::new("setfacl")
+        .args(["-m", "group::rwx", &path1])
+        .status()
+        .map(|status| status.code())
+    {
+        Ok(Some(0)) => {}
+        Ok(_) => {
+            println!("test skipped: setfacl failed");
+            return;
+        }
+        Err(e) => {
+            println!("test skipped: setfacl failed with {}", e);
+            return;
+        }
+    }
+
+    scene.ucmd().arg(&path).arg(path2).succeeds();
+
+    assert!(compare_xattrs(&file, &file_target));
+}
+
 // Todo:
 
 // $ at.touch a b

From 66637a650321f920d8463155b7afdb1e9c8e113f Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 14 Jan 2024 17:46:45 +0100
Subject: [PATCH 413/429] move the file_has_acl function into uucore

---
 Cargo.lock                             |  1 -
 src/uu/ls/Cargo.toml                   |  4 +--
 src/uu/ls/src/ls.rs                    | 19 +++-----------
 src/uucore/src/lib/features/fsxattr.rs | 36 ++++++++++++++++++++++++++
 4 files changed, 41 insertions(+), 19 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 0ef909d732a..cbff54c4b91 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -2608,7 +2608,6 @@ dependencies = [
  "unicode-width",
  "uucore",
  "uutils_term_grid",
- "xattr",
 ]
 
 [[package]]
diff --git a/src/uu/ls/Cargo.toml b/src/uu/ls/Cargo.toml
index 38312eefc5e..dc79c6f93d0 100644
--- a/src/uu/ls/Cargo.toml
+++ b/src/uu/ls/Cargo.toml
@@ -27,6 +27,7 @@ uucore = { workspace = true, features = [
   "colors",
   "entries",
   "fs",
+  "fsxattr",
   "quoting-style",
   "version-cmp",
 ] }
@@ -34,9 +35,6 @@ once_cell = { workspace = true }
 selinux = { workspace = true, optional = true }
 hostname = { workspace = true }
 
-[target.'cfg(unix)'.dependencies]
-xattr = { workspace = true }
-
 [[bin]]
 name = "ls"
 path = "src/main.rs"
diff --git a/src/uu/ls/src/ls.rs b/src/uu/ls/src/ls.rs
index 1c89cd3536d..ed100477f42 100644
--- a/src/uu/ls/src/ls.rs
+++ b/src/uu/ls/src/ls.rs
@@ -3,7 +3,7 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
-// spell-checker:ignore (ToDO) somegroup nlink tabsize dired subdired dtype colorterm getxattr
+// spell-checker:ignore (ToDO) somegroup nlink tabsize dired subdired dtype colorterm
 
 use clap::{
     builder::{NonEmptyStringValueParser, ValueParser},
@@ -36,7 +36,8 @@ use std::{
 };
 use term_grid::{Cell, Direction, Filling, Grid, GridOptions};
 use unicode_width::UnicodeWidthStr;
-
+#[cfg(all(unix, not(any(target_os = "android", target_os = "macos"))))]
+use uucore::fsxattr::has_acl;
 #[cfg(any(
     target_os = "linux",
     target_os = "macos",
@@ -2621,18 +2622,6 @@ fn display_grid(
     Ok(())
 }
 
-#[cfg(all(unix, not(any(target_os = "android", target_os = "macos"))))]
-fn file_has_acl<P: AsRef<Path>>(file: P) -> bool {
-    // don't use exacl here, it is doing more getxattr call then needed
-    match xattr::list(file) {
-        Ok(acl) => {
-            // if we have extra attributes, we have an acl
-            acl.count() > 0
-        }
-        Err(_) => false,
-    }
-}
-
 /// This writes to the BufWriter out a single string of the output of `ls -l`.
 ///
 /// It writes the following keys, in order:
@@ -2680,7 +2669,7 @@ fn display_item_long(
         // TODO: See how Mac should work here
         let is_acl_set = false;
         #[cfg(all(unix, not(any(target_os = "android", target_os = "macos"))))]
-        let is_acl_set = file_has_acl(item.display_name.as_os_str());
+        let is_acl_set = has_acl(item.display_name.as_os_str());
         write!(
             output_display,
             "{}{}{} {}",
diff --git a/src/uucore/src/lib/features/fsxattr.rs b/src/uucore/src/lib/features/fsxattr.rs
index 7bda023f9a7..36ec0ba8e40 100644
--- a/src/uucore/src/lib/features/fsxattr.rs
+++ b/src/uucore/src/lib/features/fsxattr.rs
@@ -66,6 +66,26 @@ pub fn apply_xattrs<P: AsRef<Path>>(
     Ok(())
 }
 
+/// Checks if a file has an Access Control List (ACL) based on its extended attributes.
+///
+/// # Arguments
+///
+/// * `file` - A reference to the path of the file.
+///
+/// # Returns
+///
+/// `true` if the file has extended attributes (indicating an ACL), `false` otherwise.
+pub fn has_acl<P: AsRef<Path>>(file: P) -> bool {
+    // don't use exacl here, it is doing more getxattr call then needed
+    match xattr::list(file) {
+        Ok(acl) => {
+            // if we have extra attributes, we have an acl
+            acl.count() > 0
+        }
+        Err(_) => false,
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -113,4 +133,20 @@ mod tests {
             test_value
         );
     }
+
+    #[test]
+    fn test_file_has_acl() {
+        let temp_dir = tempdir().unwrap();
+        let file_path = temp_dir.path().join("test_file.txt");
+
+        File::create(&file_path).unwrap();
+
+        assert!(!has_acl(&file_path));
+
+        let test_attr = "user.test_acl";
+        let test_value = b"test value";
+        xattr::set(&file_path, test_attr, test_value).unwrap();
+
+        assert!(has_acl(&file_path));
+    }
 }

From 3872aca9c66a34ea99566e011c1828e6c0ff20be Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sun, 14 Jan 2024 21:39:59 +0100
Subject: [PATCH 414/429] spell: ignore getxattr

---
 src/uucore/src/lib/features/fsxattr.rs | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/src/uucore/src/lib/features/fsxattr.rs b/src/uucore/src/lib/features/fsxattr.rs
index 36ec0ba8e40..3cb00edc0cb 100644
--- a/src/uucore/src/lib/features/fsxattr.rs
+++ b/src/uucore/src/lib/features/fsxattr.rs
@@ -3,6 +3,8 @@
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
 
+// spell-checker:ignore getxattr
+
 //! Set of functions to manage xattr on files and dirs
 use std::collections::HashMap;
 use std::ffi::OsString;

From 69c8753f80947dd56bfc9450be2aa36de89c27f8 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 15 Jan 2024 11:28:29 +0100
Subject: [PATCH 415/429]  cp test: use compare_xattrs from tests/utils

---
 tests/by-util/test_cp.rs | 17 +----------------
 1 file changed, 1 insertion(+), 16 deletions(-)

diff --git a/tests/by-util/test_cp.rs b/tests/by-util/test_cp.rs
index 1271909ecb9..c0d81d9a915 100644
--- a/tests/by-util/test_cp.rs
+++ b/tests/by-util/test_cp.rs
@@ -57,7 +57,7 @@ static TEST_MOUNT_OTHER_FILESYSTEM_FILE: &str = "mount/DO_NOT_copy_me.txt";
 #[cfg(unix)]
 static TEST_NONEXISTENT_FILE: &str = "nonexistent_file.txt";
 #[cfg(all(unix, not(any(target_os = "android", target_os = "macos"))))]
-use xattr;
+use crate::common::util::compare_xattrs;
 
 /// Assert that mode, ownership, and permissions of two metadata objects match.
 #[cfg(all(not(windows), not(target_os = "freebsd")))]
@@ -3739,21 +3739,6 @@ fn test_cp_no_such() {
         .stderr_is("cp: 'no-such/' is not a directory\n");
 }
 
-#[cfg(all(unix, not(any(target_os = "android", target_os = "macos"))))]
-fn compare_xattrs<P: AsRef<Path>>(path1: P, path2: P) -> bool {
-    let get_sorted_xattrs = |path: P| {
-        xattr::list(path)
-            .map(|attrs| {
-                let mut attrs = attrs.collect::<Vec<_>>();
-                attrs.sort();
-                attrs
-            })
-            .unwrap_or_else(|_| Vec::new())
-    };
-
-    get_sorted_xattrs(path1) == get_sorted_xattrs(path2)
-}
-
 #[cfg(all(unix, not(any(target_os = "android", target_os = "macos"))))]
 #[test]
 fn test_acl_preserve() {

From dc533a915a86a367f303f6b79332d50325a30535 Mon Sep 17 00:00:00 2001
From: Ulrich Hornung <hornunguli@gmx.de>
Date: Wed, 17 Jan 2024 10:07:34 +0100
Subject: [PATCH 416/429] install: fix strip program stdout and destination
 hyphen handling #5718 (#5848)

* Fix missing dependency to "process" to make it compile.

* fix issue of not forwarding stdout from strip program

* fix issue of applying "./" redundantly

* cargo fmt
---
 src/uu/install/Cargo.toml     |  1 +
 src/uu/install/src/install.rs | 22 +++++++++-------------
 tests/by-util/test_install.rs | 15 ++++++++++++++-
 3 files changed, 24 insertions(+), 14 deletions(-)

diff --git a/src/uu/install/Cargo.toml b/src/uu/install/Cargo.toml
index 0110380068b..cc687efdb3d 100644
--- a/src/uu/install/Cargo.toml
+++ b/src/uu/install/Cargo.toml
@@ -25,6 +25,7 @@ uucore = { workspace = true, features = [
   "mode",
   "perms",
   "entries",
+  "process",
 ] }
 
 [[bin]]
diff --git a/src/uu/install/src/install.rs b/src/uu/install/src/install.rs
index e568149acf6..9955be7b292 100644
--- a/src/uu/install/src/install.rs
+++ b/src/uu/install/src/install.rs
@@ -776,27 +776,23 @@ fn copy_file(from: &Path, to: &Path) -> UResult<()> {
 ///
 fn strip_file(to: &Path, b: &Behavior) -> UResult<()> {
     // Check if the filename starts with a hyphen and adjust the path
-    let to = if to
-        .file_name()
-        .unwrap_or_default()
-        .to_str()
-        .unwrap_or_default()
-        .starts_with('-')
-    {
+    let to_str = to.as_os_str().to_str().unwrap_or_default();
+    let to = if to_str.starts_with('-') {
         let mut new_path = PathBuf::from(".");
         new_path.push(to);
         new_path
     } else {
         to.to_path_buf()
     };
-    match process::Command::new(&b.strip_program).arg(&to).output() {
-        Ok(o) => {
-            if !o.status.success() {
+    match process::Command::new(&b.strip_program).arg(&to).status() {
+        Ok(status) => {
+            if !status.success() {
                 // Follow GNU's behavior: if strip fails, removes the target
                 let _ = fs::remove_file(to);
-                return Err(InstallError::StripProgramFailed(
-                    String::from_utf8(o.stderr).unwrap_or_default(),
-                )
+                return Err(InstallError::StripProgramFailed(format!(
+                    "strip process terminated abnormally - exit code: {}",
+                    status.code().unwrap()
+                ))
                 .into());
             }
         }
diff --git a/tests/by-util/test_install.rs b/tests/by-util/test_install.rs
index 3db25c81fc2..6b1d76e5527 100644
--- a/tests/by-util/test_install.rs
+++ b/tests/by-util/test_install.rs
@@ -699,7 +699,20 @@ fn test_install_and_strip_with_program_hyphen() {
         .arg("src")
         .arg("-dest")
         .succeeds()
-        .no_stderr();
+        .no_stderr()
+        .stdout_is("./-dest\n");
+
+    scene
+        .ucmd()
+        .arg("-s")
+        .arg("--strip-program")
+        .arg("./no-hyphen")
+        .arg("--")
+        .arg("src")
+        .arg("./-dest")
+        .succeeds()
+        .no_stderr()
+        .stdout_is("./-dest\n");
 }
 
 #[test]

From 61de1dc23ac055237789bf3d54e86eda85af4984 Mon Sep 17 00:00:00 2001
From: Terts Diepraam <terts.diepraam@gmail.com>
Date: Wed, 17 Jan 2024 10:44:33 +0100
Subject: [PATCH 417/429] uucore/sum: fix crlf test

---
 src/uucore/src/lib/features/sum.rs | 13 +++++++------
 1 file changed, 7 insertions(+), 6 deletions(-)

diff --git a/src/uucore/src/lib/features/sum.rs b/src/uucore/src/lib/features/sum.rs
index e079d7a30e3..3a8bb55d59b 100644
--- a/src/uucore/src/lib/features/sum.rs
+++ b/src/uucore/src/lib/features/sum.rs
@@ -484,22 +484,23 @@ mod tests {
     fn test_crlf_across_blocks() {
         use std::io::Write;
 
-        use crate::digest::Digest;
-        use crate::digest::DigestWriter;
+        use super::Digest;
+        use super::DigestWriter;
+        use super::Md5;
 
         // Writing "\r" in one call to `write()`, and then "\n" in another.
-        let mut digest = Box::new(md5::Md5::new()) as Box<dyn Digest>;
+        let mut digest = Box::new(Md5::new()) as Box<dyn Digest>;
         let mut writer_crlf = DigestWriter::new(&mut digest, false);
         writer_crlf.write_all(&[b'\r']).unwrap();
         writer_crlf.write_all(&[b'\n']).unwrap();
-        writer_crlf.hash_finalize();
+        writer_crlf.finalize();
         let result_crlf = digest.result_str();
 
         // We expect "\r\n" to be replaced with "\n" in text mode on Windows.
-        let mut digest = Box::new(md5::Md5::new()) as Box<dyn Digest>;
+        let mut digest = Box::new(Md5::new()) as Box<dyn Digest>;
         let mut writer_lf = DigestWriter::new(&mut digest, false);
         writer_lf.write_all(&[b'\n']).unwrap();
-        writer_lf.hash_finalize();
+        writer_lf.finalize();
         let result_lf = digest.result_str();
 
         assert_eq!(result_crlf, result_lf);

From 12758be6c6ad543c0eb3ba2b6862f40e08b72448 Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Wed, 17 Jan 2024 17:09:22 +0000
Subject: [PATCH 418/429] chore(deps): update actions/cache action to v4

---
 .github/workflows/android.yml | 8 ++++----
 .github/workflows/fuzzing.yml | 4 ++--
 2 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/.github/workflows/android.yml b/.github/workflows/android.yml
index 34dcf910d18..86b5a89e83a 100644
--- a/.github/workflows/android.yml
+++ b/.github/workflows/android.yml
@@ -33,7 +33,7 @@ jobs:
     steps:
     - uses: actions/checkout@v4
     - name: Restore AVD cache
-      uses: actions/cache/restore@v3
+      uses: actions/cache/restore@v4
       id: avd-cache
       with:
         path: |
@@ -57,7 +57,7 @@ jobs:
           util/android-commands.sh init "${{ matrix.arch }}" "${{ matrix.api-level }}" "${{ env.TERMUX }}"
     - name: Save AVD cache
       if: steps.avd-cache.outputs.cache-hit != 'true'
-      uses: actions/cache/save@v3
+      uses: actions/cache/save@v4
       with:
         path: |
           ~/.android/avd/*
@@ -73,7 +73,7 @@ jobs:
         trim: true
     - name: Restore rust cache
       id: rust-cache
-      uses: actions/cache/restore@v3
+      uses: actions/cache/restore@v4
       with:
         path: ~/__rust_cache__
         # The version vX at the end of the key is just a development version to avoid conflicts in
@@ -99,7 +99,7 @@ jobs:
           if [[ "${{ steps.rust-cache.outputs.cache-hit }}" != 'true' ]]; then util/android-commands.sh sync_image; fi; exit 0
     - name: Save rust cache
       if: steps.rust-cache.outputs.cache-hit != 'true'
-      uses: actions/cache/save@v3
+      uses: actions/cache/save@v4
       with:
         path: ~/__rust_cache__
         key: ${{ matrix.arch }}_${{ matrix.target}}_${{ steps.read_rustc_hash.outputs.content }}_${{ hashFiles('**/Cargo.toml', '**/Cargo.lock') }}_v3
diff --git a/.github/workflows/fuzzing.yml b/.github/workflows/fuzzing.yml
index b96f7e4ef22..c60c01ff4be 100644
--- a/.github/workflows/fuzzing.yml
+++ b/.github/workflows/fuzzing.yml
@@ -66,7 +66,7 @@ jobs:
         shared-key: "cargo-fuzz-cache-key"
         cache-directories: "fuzz/target"
     - name: Restore Cached Corpus
-      uses: actions/cache/restore@v3
+      uses: actions/cache/restore@v4
       with:
         key: corpus-cache-${{ matrix.test-target.name }}
         path: |
@@ -77,7 +77,7 @@ jobs:
       run: |
         cargo +nightly fuzz run ${{ matrix.test-target.name }} -- -max_total_time=${{ env.RUN_FOR }} -detect_leaks=0
     - name: Save Corpus Cache
-      uses: actions/cache/save@v3
+      uses: actions/cache/save@v4
       with:
         key: corpus-cache-${{ matrix.test-target.name }}
         path: |

From 667a9469c48d509ce5617dbe270067fa5bb9dc1f Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Fri, 19 Jan 2024 09:23:10 +0000
Subject: [PATCH 419/429] chore(deps): update rust crate smallvec to 1.13

---
 Cargo.lock | 4 ++--
 Cargo.toml | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index cbff54c4b91..fb931cdb815 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1987,9 +1987,9 @@ dependencies = [
 
 [[package]]
 name = "smallvec"
-version = "1.12.0"
+version = "1.13.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "2593d31f82ead8df961d8bd23a64c2ccf2eb5dd34b0a34bfb4dd54011c72009e"
+checksum = "3b187f0231d56fe41bfb12034819dd2bf336422a5866de41bc3fec4b2e3883e8"
 
 [[package]]
 name = "smawk"
diff --git a/Cargo.toml b/Cargo.toml
index a8e9c399b5c..2779ea8fdd3 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -318,7 +318,7 @@ same-file = "1.0.6"
 self_cell = "1.0.3"
 selinux = "0.4"
 signal-hook = "0.3.17"
-smallvec = { version = "1.12", features = ["union"] }
+smallvec = { version = "1.13", features = ["union"] }
 tempfile = "3.9.0"
 uutils_term_grid = "0.3"
 terminal_size = "0.3.0"

From b363064e48d17b9fb9abcb5a370015b4505b87fd Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Fri, 19 Jan 2024 09:38:39 +0000
Subject: [PATCH 420/429] chore(deps): update
 davidanson/markdownlint-cli2-action action to v15

---
 .github/workflows/CICD.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml
index 40d7c018df4..ad12ede6833 100644
--- a/.github/workflows/CICD.yml
+++ b/.github/workflows/CICD.yml
@@ -137,7 +137,7 @@ jobs:
       shell: bash
       run: |
         RUSTDOCFLAGS="-Dwarnings" cargo doc  ${{ steps.vars.outputs.CARGO_FEATURES_OPTION }} --no-deps --workspace --document-private-items
-    - uses: DavidAnson/markdownlint-cli2-action@v14
+    - uses: DavidAnson/markdownlint-cli2-action@v15
       with:
         fix: "true"
         globs: |

From 746a7b14d03f32fb0db6e951b46cbbd3003c5ff7 Mon Sep 17 00:00:00 2001
From: SaHHiiLL <87093947+SaHHiiLL@users.noreply.github.com>
Date: Fri, 19 Jan 2024 14:39:00 +0000
Subject: [PATCH 421/429] tsort: returns error when input is dir - same as GNU
 tsort (#5860)

* fix: return error when input is dir

* test: when tsort is given a dir

* fix: do not need to mention tsort in error message

* test: using concrete directory name

* tsort: fix formatting in test

---------

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 src/uu/tsort/src/tsort.rs   | 9 ++++++++-
 tests/by-util/test_tsort.rs | 9 +++++++++
 2 files changed, 17 insertions(+), 1 deletion(-)

diff --git a/src/uu/tsort/src/tsort.rs b/src/uu/tsort/src/tsort.rs
index 3ae4f4f97e6..2bc9d317576 100644
--- a/src/uu/tsort/src/tsort.rs
+++ b/src/uu/tsort/src/tsort.rs
@@ -32,7 +32,14 @@ pub fn uumain(args: impl uucore::Args) -> UResult<()> {
         stdin_buf = stdin();
         &mut stdin_buf as &mut dyn Read
     } else {
-        file_buf = File::open(Path::new(&input)).map_err_context(|| input.to_string())?;
+        let path = Path::new(&input);
+        if path.is_dir() {
+            return Err(USimpleError::new(
+                1,
+                format!("{}: read error: Is a directory", input),
+            ));
+        }
+        file_buf = File::open(path).map_err_context(|| input.to_string())?;
         &mut file_buf as &mut dyn Read
     });
 
diff --git a/tests/by-util/test_tsort.rs b/tests/by-util/test_tsort.rs
index 18889451629..79195efa211 100644
--- a/tests/by-util/test_tsort.rs
+++ b/tests/by-util/test_tsort.rs
@@ -64,3 +64,12 @@ fn test_multiple_arguments() {
         .fails()
         .stderr_contains("unexpected argument 'invalid_file' found");
 }
+
+#[test]
+fn test_error_on_dir() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    at.mkdir("tsort_test_dir");
+    ucmd.arg("tsort_test_dir")
+        .fails()
+        .stderr_contains("tsort: tsort_test_dir: read error: Is a directory");
+}

From 4589f637ee8b1f33398cd66de8c3ad638593e031 Mon Sep 17 00:00:00 2001
From: Laurent Cheylus <foxy@free.fr>
Date: Fri, 19 Jan 2024 17:35:18 +0100
Subject: [PATCH 422/429] tests: disable tests for tools unsupported on OpenBSD

pinky, uptime and who are not supported on OpenBSD (no support of utmpx feature) => disable tests
for these tools on OpenBSD with conditional compilation

Signed-off-by: Laurent Cheylus <foxy@free.fr>
---
 tests/by-util/test_pinky.rs  | 5 +++++
 tests/by-util/test_uptime.rs | 2 ++
 tests/by-util/test_who.rs    | 8 ++++++++
 3 files changed, 15 insertions(+)

diff --git a/tests/by-util/test_pinky.rs b/tests/by-util/test_pinky.rs
index 57413c4c95e..0fff402df96 100644
--- a/tests/by-util/test_pinky.rs
+++ b/tests/by-util/test_pinky.rs
@@ -21,6 +21,7 @@ fn test_capitalize() {
 }
 
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_long_format() {
     let login = "root";
     let pw: Passwd = Passwd::locate(login).unwrap();
@@ -44,6 +45,7 @@ fn test_long_format() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_long_format_multiple_users() {
     // multiple instances of one account we know exists,
     // the account of the test runner,
@@ -71,6 +73,7 @@ fn test_long_format_wo_user() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_short_format_i() {
     // allow whitespace variation
     // * minor whitespace differences occur between platform built-in outputs; specifically, the number of trailing TABs may be variant
@@ -85,6 +88,7 @@ fn test_short_format_i() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_short_format_q() {
     // allow whitespace variation
     // * minor whitespace differences occur between platform built-in outputs; specifically, the number of trailing TABs may be variant
@@ -99,6 +103,7 @@ fn test_short_format_q() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_no_flag() {
     let ts = TestScenario::new(util_name!());
     let actual = ts.ucmd().succeeds().stdout_move_str();
diff --git a/tests/by-util/test_uptime.rs b/tests/by-util/test_uptime.rs
index 3967d025251..89e5567fba4 100644
--- a/tests/by-util/test_uptime.rs
+++ b/tests/by-util/test_uptime.rs
@@ -11,6 +11,7 @@ fn test_invalid_arg() {
 }
 
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_uptime() {
     TestScenario::new(util_name!())
         .ucmd()
@@ -22,6 +23,7 @@ fn test_uptime() {
 }
 
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_uptime_since() {
     let re = Regex::new(r"\d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}").unwrap();
 
diff --git a/tests/by-util/test_who.rs b/tests/by-util/test_who.rs
index 3bacc38c112..36325fe7c57 100644
--- a/tests/by-util/test_who.rs
+++ b/tests/by-util/test_who.rs
@@ -25,6 +25,7 @@ fn test_count() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_boot() {
     let ts = TestScenario::new(util_name!());
     for opt in ["-b", "--boot", "--b"] {
@@ -65,6 +66,7 @@ fn test_short() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_login() {
     let ts = TestScenario::new(util_name!());
     for opt in ["-l", "--login", "--log"] {
@@ -75,6 +77,7 @@ fn test_login() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_m() {
     let ts = TestScenario::new(util_name!());
     let expected_stdout = unwrap_or_return!(expected_result(&ts, &["-m"])).stdout_move_str();
@@ -83,6 +86,7 @@ fn test_m() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_process() {
     let ts = TestScenario::new(util_name!());
     for opt in ["-p", "--process", "--p"] {
@@ -93,6 +97,7 @@ fn test_process() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_runlevel() {
     let ts = TestScenario::new(util_name!());
     for opt in ["-r", "--runlevel", "--r"] {
@@ -106,6 +111,7 @@ fn test_runlevel() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_time() {
     let ts = TestScenario::new(util_name!());
     for opt in ["-t", "--time", "--t"] {
@@ -141,6 +147,7 @@ fn test_mesg() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_arg1_arg2() {
     let args = ["am", "i"];
     let ts = TestScenario::new(util_name!());
@@ -195,6 +202,7 @@ fn test_lookup() {
 
 #[cfg(unix)]
 #[test]
+#[cfg(not(target_os = "openbsd"))]
 fn test_dead() {
     let ts = TestScenario::new(util_name!());
     for opt in ["-d", "--dead", "--de"] {

From 5e29c60b26cf8fdbef9a733601667c3f6b664c92 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Fri, 19 Jan 2024 20:34:09 +0100
Subject: [PATCH 423/429] hashsum: when the filename contains some special
 chars, escape them

Should fix tests/cksum/md5sum-newline.pl
---
 src/uu/hashsum/src/hashsum.rs | 14 +++++++++++++-
 tests/by-util/test_hashsum.rs | 15 +++++++++++++++
 2 files changed, 28 insertions(+), 1 deletion(-)

diff --git a/src/uu/hashsum/src/hashsum.rs b/src/uu/hashsum/src/hashsum.rs
index 22ef4152070..5e439853a58 100644
--- a/src/uu/hashsum/src/hashsum.rs
+++ b/src/uu/hashsum/src/hashsum.rs
@@ -756,7 +756,9 @@ where
             } else if options.zero {
                 print!("{} {}{}\0", sum, binary_marker, filename.display());
             } else {
-                println!("{} {}{}", sum, binary_marker, filename.display());
+                let (filename, has_prefix) = escape_filename(filename);
+                let prefix = if has_prefix { "\\" } else { "" };
+                println!("{}{} {}{}", prefix, sum, binary_marker, filename);
             }
         }
     }
@@ -781,6 +783,16 @@ where
     Ok(())
 }
 
+fn escape_filename(filename: &Path) -> (String, bool) {
+    let original = filename.as_os_str().to_string_lossy();
+    let escaped = original
+        .replace('\\', "\\\\")
+        .replace('\n', "\\n")
+        .replace('\r', "\\r");
+    let has_changed = escaped != original;
+    (escaped, has_changed)
+}
+
 fn digest_reader<T: Read>(
     digest: &mut Box<dyn Digest>,
     reader: &mut BufReader<T>,
diff --git a/tests/by-util/test_hashsum.rs b/tests/by-util/test_hashsum.rs
index 31471495b07..7edd387c326 100644
--- a/tests/by-util/test_hashsum.rs
+++ b/tests/by-util/test_hashsum.rs
@@ -371,3 +371,18 @@ fn test_tag() {
             "SHA256 (foobar) = 1f2ec52b774368781bed1d1fb140a92e0eb6348090619c9291f9a5a3c8e8d151\n",
         );
 }
+
+#[test]
+#[cfg(not(windows))]
+fn test_with_escape_filename() {
+    let scene = TestScenario::new(util_name!());
+
+    let at = &scene.fixtures;
+    let filename = "a\nb";
+    at.touch(filename);
+    let result = scene.ccmd("md5sum").arg("--text").arg(filename).succeeds();
+    let stdout = result.stdout_str();
+    println!("stdout {}", stdout);
+    assert!(stdout.starts_with('\\'));
+    assert!(stdout.trim().ends_with("a\\nb"));
+}

From dd5c6c2d00316159809393d66164d52c957b16fb Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Sat, 30 Dec 2023 20:17:23 +0100
Subject: [PATCH 424/429] 0.0.23 => 0.0.24

---
 Cargo.lock                             | 214 ++++++++++++-------------
 Cargo.toml                             | 206 ++++++++++++------------
 src/uu/arch/Cargo.toml                 |   2 +-
 src/uu/base32/Cargo.toml               |   2 +-
 src/uu/base64/Cargo.toml               |   2 +-
 src/uu/basename/Cargo.toml             |   2 +-
 src/uu/basenc/Cargo.toml               |   2 +-
 src/uu/cat/Cargo.toml                  |   2 +-
 src/uu/chcon/Cargo.toml                |   2 +-
 src/uu/chgrp/Cargo.toml                |   2 +-
 src/uu/chmod/Cargo.toml                |   2 +-
 src/uu/chown/Cargo.toml                |   2 +-
 src/uu/chroot/Cargo.toml               |   2 +-
 src/uu/cksum/Cargo.toml                |   2 +-
 src/uu/comm/Cargo.toml                 |   2 +-
 src/uu/cp/Cargo.toml                   |   2 +-
 src/uu/csplit/Cargo.toml               |   2 +-
 src/uu/cut/Cargo.toml                  |   2 +-
 src/uu/date/Cargo.toml                 |   2 +-
 src/uu/dd/Cargo.toml                   |   2 +-
 src/uu/df/Cargo.toml                   |   2 +-
 src/uu/dir/Cargo.toml                  |   2 +-
 src/uu/dircolors/Cargo.toml            |   2 +-
 src/uu/dirname/Cargo.toml              |   2 +-
 src/uu/du/Cargo.toml                   |   2 +-
 src/uu/echo/Cargo.toml                 |   2 +-
 src/uu/env/Cargo.toml                  |   2 +-
 src/uu/expand/Cargo.toml               |   2 +-
 src/uu/expr/Cargo.toml                 |   2 +-
 src/uu/factor/Cargo.toml               |   2 +-
 src/uu/false/Cargo.toml                |   2 +-
 src/uu/fmt/Cargo.toml                  |   2 +-
 src/uu/fold/Cargo.toml                 |   2 +-
 src/uu/groups/Cargo.toml               |   2 +-
 src/uu/hashsum/Cargo.toml              |   2 +-
 src/uu/head/Cargo.toml                 |   2 +-
 src/uu/hostid/Cargo.toml               |   2 +-
 src/uu/hostname/Cargo.toml             |   2 +-
 src/uu/id/Cargo.toml                   |   2 +-
 src/uu/install/Cargo.toml              |   2 +-
 src/uu/join/Cargo.toml                 |   2 +-
 src/uu/kill/Cargo.toml                 |   2 +-
 src/uu/link/Cargo.toml                 |   2 +-
 src/uu/ln/Cargo.toml                   |   2 +-
 src/uu/logname/Cargo.toml              |   2 +-
 src/uu/ls/Cargo.toml                   |   2 +-
 src/uu/mkdir/Cargo.toml                |   2 +-
 src/uu/mkfifo/Cargo.toml               |   2 +-
 src/uu/mknod/Cargo.toml                |   2 +-
 src/uu/mktemp/Cargo.toml               |   2 +-
 src/uu/more/Cargo.toml                 |   2 +-
 src/uu/mv/Cargo.toml                   |   2 +-
 src/uu/nice/Cargo.toml                 |   2 +-
 src/uu/nl/Cargo.toml                   |   2 +-
 src/uu/nohup/Cargo.toml                |   2 +-
 src/uu/nproc/Cargo.toml                |   2 +-
 src/uu/numfmt/Cargo.toml               |   2 +-
 src/uu/od/Cargo.toml                   |   2 +-
 src/uu/paste/Cargo.toml                |   2 +-
 src/uu/pathchk/Cargo.toml              |   2 +-
 src/uu/pinky/Cargo.toml                |   2 +-
 src/uu/pr/Cargo.toml                   |   2 +-
 src/uu/printenv/Cargo.toml             |   2 +-
 src/uu/printf/Cargo.toml               |   2 +-
 src/uu/ptx/Cargo.toml                  |   2 +-
 src/uu/pwd/Cargo.toml                  |   2 +-
 src/uu/readlink/Cargo.toml             |   2 +-
 src/uu/realpath/Cargo.toml             |   2 +-
 src/uu/rm/Cargo.toml                   |   2 +-
 src/uu/rmdir/Cargo.toml                |   2 +-
 src/uu/runcon/Cargo.toml               |   2 +-
 src/uu/seq/Cargo.toml                  |   2 +-
 src/uu/shred/Cargo.toml                |   2 +-
 src/uu/shuf/Cargo.toml                 |   2 +-
 src/uu/sleep/Cargo.toml                |   2 +-
 src/uu/sort/Cargo.toml                 |   2 +-
 src/uu/split/Cargo.toml                |   2 +-
 src/uu/stat/Cargo.toml                 |   2 +-
 src/uu/stdbuf/Cargo.toml               |   4 +-
 src/uu/stdbuf/src/libstdbuf/Cargo.toml |   2 +-
 src/uu/stty/Cargo.toml                 |   2 +-
 src/uu/sum/Cargo.toml                  |   2 +-
 src/uu/sync/Cargo.toml                 |   2 +-
 src/uu/tac/Cargo.toml                  |   2 +-
 src/uu/tail/Cargo.toml                 |   2 +-
 src/uu/tee/Cargo.toml                  |   2 +-
 src/uu/test/Cargo.toml                 |   2 +-
 src/uu/timeout/Cargo.toml              |   2 +-
 src/uu/touch/Cargo.toml                |   2 +-
 src/uu/tr/Cargo.toml                   |   2 +-
 src/uu/true/Cargo.toml                 |   2 +-
 src/uu/truncate/Cargo.toml             |   2 +-
 src/uu/tsort/Cargo.toml                |   2 +-
 src/uu/tty/Cargo.toml                  |   2 +-
 src/uu/uname/Cargo.toml                |   2 +-
 src/uu/unexpand/Cargo.toml             |   2 +-
 src/uu/uniq/Cargo.toml                 |   2 +-
 src/uu/unlink/Cargo.toml               |   2 +-
 src/uu/uptime/Cargo.toml               |   2 +-
 src/uu/users/Cargo.toml                |   2 +-
 src/uu/vdir/Cargo.toml                 |   2 +-
 src/uu/wc/Cargo.toml                   |   2 +-
 src/uu/who/Cargo.toml                  |   2 +-
 src/uu/whoami/Cargo.toml               |   2 +-
 src/uu/yes/Cargo.toml                  |   2 +-
 src/uucore/Cargo.toml                  |   2 +-
 src/uucore_procs/Cargo.toml            |   4 +-
 src/uuhelp_parser/Cargo.toml           |   2 +-
 util/update-version.sh                 |   4 +-
 109 files changed, 320 insertions(+), 320 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index fb931cdb815..6b7ba1d5000 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -374,7 +374,7 @@ checksum = "5827cebf4670468b8772dd191856768aedcb1b0278a04f989f7766351917b9dc"
 
 [[package]]
 name = "coreutils"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "chrono",
  "clap",
@@ -2188,7 +2188,7 @@ checksum = "711b9620af191e0cdc7468a8d14e709c3dcdb115b36f838e601583af800a370a"
 
 [[package]]
 name = "uu_arch"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "platform-info",
@@ -2197,7 +2197,7 @@ dependencies = [
 
 [[package]]
 name = "uu_base32"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2205,7 +2205,7 @@ dependencies = [
 
 [[package]]
 name = "uu_base64"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "uu_base32",
  "uucore",
@@ -2213,7 +2213,7 @@ dependencies = [
 
 [[package]]
 name = "uu_basename"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2221,7 +2221,7 @@ dependencies = [
 
 [[package]]
 name = "uu_basenc"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uu_base32",
@@ -2230,7 +2230,7 @@ dependencies = [
 
 [[package]]
 name = "uu_cat"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "nix",
@@ -2240,7 +2240,7 @@ dependencies = [
 
 [[package]]
 name = "uu_chcon"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "fts-sys",
@@ -2252,7 +2252,7 @@ dependencies = [
 
 [[package]]
 name = "uu_chgrp"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2260,7 +2260,7 @@ dependencies = [
 
 [[package]]
 name = "uu_chmod"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2269,7 +2269,7 @@ dependencies = [
 
 [[package]]
 name = "uu_chown"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2277,7 +2277,7 @@ dependencies = [
 
 [[package]]
 name = "uu_chroot"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2285,7 +2285,7 @@ dependencies = [
 
 [[package]]
 name = "uu_cksum"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "hex",
@@ -2294,7 +2294,7 @@ dependencies = [
 
 [[package]]
 name = "uu_comm"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2302,7 +2302,7 @@ dependencies = [
 
 [[package]]
 name = "uu_cp"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "exacl",
@@ -2318,7 +2318,7 @@ dependencies = [
 
 [[package]]
 name = "uu_csplit"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "regex",
@@ -2328,7 +2328,7 @@ dependencies = [
 
 [[package]]
 name = "uu_cut"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "bstr",
  "clap",
@@ -2338,7 +2338,7 @@ dependencies = [
 
 [[package]]
 name = "uu_date"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "chrono",
  "clap",
@@ -2350,7 +2350,7 @@ dependencies = [
 
 [[package]]
 name = "uu_dd"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "gcd",
@@ -2362,7 +2362,7 @@ dependencies = [
 
 [[package]]
 name = "uu_df"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "tempfile",
@@ -2372,7 +2372,7 @@ dependencies = [
 
 [[package]]
 name = "uu_dir"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uu_ls",
@@ -2381,7 +2381,7 @@ dependencies = [
 
 [[package]]
 name = "uu_dircolors"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2389,7 +2389,7 @@ dependencies = [
 
 [[package]]
 name = "uu_dirname"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2397,7 +2397,7 @@ dependencies = [
 
 [[package]]
 name = "uu_du"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "chrono",
  "clap",
@@ -2408,7 +2408,7 @@ dependencies = [
 
 [[package]]
 name = "uu_echo"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2416,7 +2416,7 @@ dependencies = [
 
 [[package]]
 name = "uu_env"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "nix",
@@ -2426,7 +2426,7 @@ dependencies = [
 
 [[package]]
 name = "uu_expand"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "unicode-width",
@@ -2435,7 +2435,7 @@ dependencies = [
 
 [[package]]
 name = "uu_expr"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "num-bigint",
@@ -2446,7 +2446,7 @@ dependencies = [
 
 [[package]]
 name = "uu_factor"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "coz",
@@ -2459,7 +2459,7 @@ dependencies = [
 
 [[package]]
 name = "uu_false"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2467,7 +2467,7 @@ dependencies = [
 
 [[package]]
 name = "uu_fmt"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "unicode-width",
@@ -2476,7 +2476,7 @@ dependencies = [
 
 [[package]]
 name = "uu_fold"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2484,7 +2484,7 @@ dependencies = [
 
 [[package]]
 name = "uu_groups"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2492,7 +2492,7 @@ dependencies = [
 
 [[package]]
 name = "uu_hashsum"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "hex",
@@ -2503,7 +2503,7 @@ dependencies = [
 
 [[package]]
 name = "uu_head"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "memchr",
@@ -2512,7 +2512,7 @@ dependencies = [
 
 [[package]]
 name = "uu_hostid"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2521,7 +2521,7 @@ dependencies = [
 
 [[package]]
 name = "uu_hostname"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "hostname",
@@ -2531,7 +2531,7 @@ dependencies = [
 
 [[package]]
 name = "uu_id"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "selinux",
@@ -2540,7 +2540,7 @@ dependencies = [
 
 [[package]]
 name = "uu_install"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "file_diff",
@@ -2551,7 +2551,7 @@ dependencies = [
 
 [[package]]
 name = "uu_join"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "memchr",
@@ -2560,7 +2560,7 @@ dependencies = [
 
 [[package]]
 name = "uu_kill"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "nix",
@@ -2569,7 +2569,7 @@ dependencies = [
 
 [[package]]
 name = "uu_link"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2577,7 +2577,7 @@ dependencies = [
 
 [[package]]
 name = "uu_ln"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2585,7 +2585,7 @@ dependencies = [
 
 [[package]]
 name = "uu_logname"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2594,7 +2594,7 @@ dependencies = [
 
 [[package]]
 name = "uu_ls"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "chrono",
  "clap",
@@ -2612,7 +2612,7 @@ dependencies = [
 
 [[package]]
 name = "uu_mkdir"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2620,7 +2620,7 @@ dependencies = [
 
 [[package]]
 name = "uu_mkfifo"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2629,7 +2629,7 @@ dependencies = [
 
 [[package]]
 name = "uu_mknod"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2638,7 +2638,7 @@ dependencies = [
 
 [[package]]
 name = "uu_mktemp"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "rand",
@@ -2648,7 +2648,7 @@ dependencies = [
 
 [[package]]
 name = "uu_more"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "crossterm",
@@ -2660,7 +2660,7 @@ dependencies = [
 
 [[package]]
 name = "uu_mv"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "fs_extra",
@@ -2670,7 +2670,7 @@ dependencies = [
 
 [[package]]
 name = "uu_nice"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2680,7 +2680,7 @@ dependencies = [
 
 [[package]]
 name = "uu_nl"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "regex",
@@ -2689,7 +2689,7 @@ dependencies = [
 
 [[package]]
 name = "uu_nohup"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2698,7 +2698,7 @@ dependencies = [
 
 [[package]]
 name = "uu_nproc"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2707,7 +2707,7 @@ dependencies = [
 
 [[package]]
 name = "uu_numfmt"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2715,7 +2715,7 @@ dependencies = [
 
 [[package]]
 name = "uu_od"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "byteorder",
  "clap",
@@ -2725,7 +2725,7 @@ dependencies = [
 
 [[package]]
 name = "uu_paste"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2733,7 +2733,7 @@ dependencies = [
 
 [[package]]
 name = "uu_pathchk"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2742,7 +2742,7 @@ dependencies = [
 
 [[package]]
 name = "uu_pinky"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2750,7 +2750,7 @@ dependencies = [
 
 [[package]]
 name = "uu_pr"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "chrono",
  "clap",
@@ -2762,7 +2762,7 @@ dependencies = [
 
 [[package]]
 name = "uu_printenv"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2770,7 +2770,7 @@ dependencies = [
 
 [[package]]
 name = "uu_printf"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2778,7 +2778,7 @@ dependencies = [
 
 [[package]]
 name = "uu_ptx"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "regex",
@@ -2787,7 +2787,7 @@ dependencies = [
 
 [[package]]
 name = "uu_pwd"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2795,7 +2795,7 @@ dependencies = [
 
 [[package]]
 name = "uu_readlink"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2803,7 +2803,7 @@ dependencies = [
 
 [[package]]
 name = "uu_realpath"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2811,7 +2811,7 @@ dependencies = [
 
 [[package]]
 name = "uu_rm"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2822,7 +2822,7 @@ dependencies = [
 
 [[package]]
 name = "uu_rmdir"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2831,7 +2831,7 @@ dependencies = [
 
 [[package]]
 name = "uu_runcon"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2842,7 +2842,7 @@ dependencies = [
 
 [[package]]
 name = "uu_seq"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "bigdecimal",
  "clap",
@@ -2853,7 +2853,7 @@ dependencies = [
 
 [[package]]
 name = "uu_shred"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2863,7 +2863,7 @@ dependencies = [
 
 [[package]]
 name = "uu_shuf"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "memchr",
@@ -2874,7 +2874,7 @@ dependencies = [
 
 [[package]]
 name = "uu_sleep"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "fundu",
@@ -2883,7 +2883,7 @@ dependencies = [
 
 [[package]]
 name = "uu_sort"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "binary-heap-plus",
  "clap",
@@ -2902,7 +2902,7 @@ dependencies = [
 
 [[package]]
 name = "uu_split"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "memchr",
@@ -2911,7 +2911,7 @@ dependencies = [
 
 [[package]]
 name = "uu_stat"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2919,7 +2919,7 @@ dependencies = [
 
 [[package]]
 name = "uu_stdbuf"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "tempfile",
@@ -2929,7 +2929,7 @@ dependencies = [
 
 [[package]]
 name = "uu_stdbuf_libstdbuf"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "cpp",
  "cpp_build",
@@ -2938,7 +2938,7 @@ dependencies = [
 
 [[package]]
 name = "uu_stty"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "nix",
@@ -2947,7 +2947,7 @@ dependencies = [
 
 [[package]]
 name = "uu_sum"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -2955,7 +2955,7 @@ dependencies = [
 
 [[package]]
 name = "uu_sync"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -2966,7 +2966,7 @@ dependencies = [
 
 [[package]]
 name = "uu_tac"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "memchr",
@@ -2977,7 +2977,7 @@ dependencies = [
 
 [[package]]
 name = "uu_tail"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "fundu",
@@ -2993,7 +2993,7 @@ dependencies = [
 
 [[package]]
 name = "uu_tee"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -3002,7 +3002,7 @@ dependencies = [
 
 [[package]]
 name = "uu_test"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -3012,7 +3012,7 @@ dependencies = [
 
 [[package]]
 name = "uu_timeout"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -3022,7 +3022,7 @@ dependencies = [
 
 [[package]]
 name = "uu_touch"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "chrono",
  "clap",
@@ -3034,7 +3034,7 @@ dependencies = [
 
 [[package]]
 name = "uu_tr"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "nom",
@@ -3043,7 +3043,7 @@ dependencies = [
 
 [[package]]
 name = "uu_true"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -3051,7 +3051,7 @@ dependencies = [
 
 [[package]]
 name = "uu_truncate"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -3059,7 +3059,7 @@ dependencies = [
 
 [[package]]
 name = "uu_tsort"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -3067,7 +3067,7 @@ dependencies = [
 
 [[package]]
 name = "uu_tty"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "nix",
@@ -3076,7 +3076,7 @@ dependencies = [
 
 [[package]]
 name = "uu_uname"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "platform-info",
@@ -3085,7 +3085,7 @@ dependencies = [
 
 [[package]]
 name = "uu_unexpand"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "unicode-width",
@@ -3094,7 +3094,7 @@ dependencies = [
 
 [[package]]
 name = "uu_uniq"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -3102,7 +3102,7 @@ dependencies = [
 
 [[package]]
 name = "uu_unlink"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -3110,7 +3110,7 @@ dependencies = [
 
 [[package]]
 name = "uu_uptime"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "chrono",
  "clap",
@@ -3119,7 +3119,7 @@ dependencies = [
 
 [[package]]
 name = "uu_users"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -3127,7 +3127,7 @@ dependencies = [
 
 [[package]]
 name = "uu_vdir"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uu_ls",
@@ -3136,7 +3136,7 @@ dependencies = [
 
 [[package]]
 name = "uu_wc"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "bytecount",
  "clap",
@@ -3149,7 +3149,7 @@ dependencies = [
 
 [[package]]
 name = "uu_who"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "uucore",
@@ -3157,7 +3157,7 @@ dependencies = [
 
 [[package]]
 name = "uu_whoami"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "libc",
@@ -3167,7 +3167,7 @@ dependencies = [
 
 [[package]]
 name = "uu_yes"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "clap",
  "itertools",
@@ -3177,7 +3177,7 @@ dependencies = [
 
 [[package]]
 name = "uucore"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "blake2b_simd",
  "blake3",
@@ -3214,7 +3214,7 @@ dependencies = [
 
 [[package]]
 name = "uucore_procs"
-version = "0.0.23"
+version = "0.0.24"
 dependencies = [
  "proc-macro2",
  "quote",
@@ -3223,7 +3223,7 @@ dependencies = [
 
 [[package]]
 name = "uuhelp_parser"
-version = "0.0.23"
+version = "0.0.24"
 
 [[package]]
 name = "uuid"
diff --git a/Cargo.toml b/Cargo.toml
index 2779ea8fdd3..f10792a16c0 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -5,7 +5,7 @@
 
 [package]
 name = "coreutils"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "coreutils ~ GNU coreutils (updated); implemented as universal (cross-platform) utils, written in Rust"
@@ -363,109 +363,109 @@ zip = { workspace = true, optional = true }
 uuhelp_parser = { optional = true, version = ">=0.0.19", path = "src/uuhelp_parser" }
 
 # * uutils
-uu_test = { optional = true, version = "0.0.23", package = "uu_test", path = "src/uu/test" }
+uu_test = { optional = true, version = "0.0.24", package = "uu_test", path = "src/uu/test" }
 #
-arch = { optional = true, version = "0.0.23", package = "uu_arch", path = "src/uu/arch" }
-base32 = { optional = true, version = "0.0.23", package = "uu_base32", path = "src/uu/base32" }
-base64 = { optional = true, version = "0.0.23", package = "uu_base64", path = "src/uu/base64" }
-basename = { optional = true, version = "0.0.23", package = "uu_basename", path = "src/uu/basename" }
-basenc = { optional = true, version = "0.0.23", package = "uu_basenc", path = "src/uu/basenc" }
-cat = { optional = true, version = "0.0.23", package = "uu_cat", path = "src/uu/cat" }
-chcon = { optional = true, version = "0.0.23", package = "uu_chcon", path = "src/uu/chcon" }
-chgrp = { optional = true, version = "0.0.23", package = "uu_chgrp", path = "src/uu/chgrp" }
-chmod = { optional = true, version = "0.0.23", package = "uu_chmod", path = "src/uu/chmod" }
-chown = { optional = true, version = "0.0.23", package = "uu_chown", path = "src/uu/chown" }
-chroot = { optional = true, version = "0.0.23", package = "uu_chroot", path = "src/uu/chroot" }
-cksum = { optional = true, version = "0.0.23", package = "uu_cksum", path = "src/uu/cksum" }
-comm = { optional = true, version = "0.0.23", package = "uu_comm", path = "src/uu/comm" }
-cp = { optional = true, version = "0.0.23", package = "uu_cp", path = "src/uu/cp" }
-csplit = { optional = true, version = "0.0.23", package = "uu_csplit", path = "src/uu/csplit" }
-cut = { optional = true, version = "0.0.23", package = "uu_cut", path = "src/uu/cut" }
-date = { optional = true, version = "0.0.23", package = "uu_date", path = "src/uu/date" }
-dd = { optional = true, version = "0.0.23", package = "uu_dd", path = "src/uu/dd" }
-df = { optional = true, version = "0.0.23", package = "uu_df", path = "src/uu/df" }
-dir = { optional = true, version = "0.0.23", package = "uu_dir", path = "src/uu/dir" }
-dircolors = { optional = true, version = "0.0.23", package = "uu_dircolors", path = "src/uu/dircolors" }
-dirname = { optional = true, version = "0.0.23", package = "uu_dirname", path = "src/uu/dirname" }
-du = { optional = true, version = "0.0.23", package = "uu_du", path = "src/uu/du" }
-echo = { optional = true, version = "0.0.23", package = "uu_echo", path = "src/uu/echo" }
-env = { optional = true, version = "0.0.23", package = "uu_env", path = "src/uu/env" }
-expand = { optional = true, version = "0.0.23", package = "uu_expand", path = "src/uu/expand" }
-expr = { optional = true, version = "0.0.23", package = "uu_expr", path = "src/uu/expr" }
-factor = { optional = true, version = "0.0.23", package = "uu_factor", path = "src/uu/factor" }
-false = { optional = true, version = "0.0.23", package = "uu_false", path = "src/uu/false" }
-fmt = { optional = true, version = "0.0.23", package = "uu_fmt", path = "src/uu/fmt" }
-fold = { optional = true, version = "0.0.23", package = "uu_fold", path = "src/uu/fold" }
-groups = { optional = true, version = "0.0.23", package = "uu_groups", path = "src/uu/groups" }
-hashsum = { optional = true, version = "0.0.23", package = "uu_hashsum", path = "src/uu/hashsum" }
-head = { optional = true, version = "0.0.23", package = "uu_head", path = "src/uu/head" }
-hostid = { optional = true, version = "0.0.23", package = "uu_hostid", path = "src/uu/hostid" }
-hostname = { optional = true, version = "0.0.23", package = "uu_hostname", path = "src/uu/hostname" }
-id = { optional = true, version = "0.0.23", package = "uu_id", path = "src/uu/id" }
-install = { optional = true, version = "0.0.23", package = "uu_install", path = "src/uu/install" }
-join = { optional = true, version = "0.0.23", package = "uu_join", path = "src/uu/join" }
-kill = { optional = true, version = "0.0.23", package = "uu_kill", path = "src/uu/kill" }
-link = { optional = true, version = "0.0.23", package = "uu_link", path = "src/uu/link" }
-ln = { optional = true, version = "0.0.23", package = "uu_ln", path = "src/uu/ln" }
-ls = { optional = true, version = "0.0.23", package = "uu_ls", path = "src/uu/ls" }
-logname = { optional = true, version = "0.0.23", package = "uu_logname", path = "src/uu/logname" }
-mkdir = { optional = true, version = "0.0.23", package = "uu_mkdir", path = "src/uu/mkdir" }
-mkfifo = { optional = true, version = "0.0.23", package = "uu_mkfifo", path = "src/uu/mkfifo" }
-mknod = { optional = true, version = "0.0.23", package = "uu_mknod", path = "src/uu/mknod" }
-mktemp = { optional = true, version = "0.0.23", package = "uu_mktemp", path = "src/uu/mktemp" }
-more = { optional = true, version = "0.0.23", package = "uu_more", path = "src/uu/more" }
-mv = { optional = true, version = "0.0.23", package = "uu_mv", path = "src/uu/mv" }
-nice = { optional = true, version = "0.0.23", package = "uu_nice", path = "src/uu/nice" }
-nl = { optional = true, version = "0.0.23", package = "uu_nl", path = "src/uu/nl" }
-nohup = { optional = true, version = "0.0.23", package = "uu_nohup", path = "src/uu/nohup" }
-nproc = { optional = true, version = "0.0.23", package = "uu_nproc", path = "src/uu/nproc" }
-numfmt = { optional = true, version = "0.0.23", package = "uu_numfmt", path = "src/uu/numfmt" }
-od = { optional = true, version = "0.0.23", package = "uu_od", path = "src/uu/od" }
-paste = { optional = true, version = "0.0.23", package = "uu_paste", path = "src/uu/paste" }
-pathchk = { optional = true, version = "0.0.23", package = "uu_pathchk", path = "src/uu/pathchk" }
-pinky = { optional = true, version = "0.0.23", package = "uu_pinky", path = "src/uu/pinky" }
-pr = { optional = true, version = "0.0.23", package = "uu_pr", path = "src/uu/pr" }
-printenv = { optional = true, version = "0.0.23", package = "uu_printenv", path = "src/uu/printenv" }
-printf = { optional = true, version = "0.0.23", package = "uu_printf", path = "src/uu/printf" }
-ptx = { optional = true, version = "0.0.23", package = "uu_ptx", path = "src/uu/ptx" }
-pwd = { optional = true, version = "0.0.23", package = "uu_pwd", path = "src/uu/pwd" }
-readlink = { optional = true, version = "0.0.23", package = "uu_readlink", path = "src/uu/readlink" }
-realpath = { optional = true, version = "0.0.23", package = "uu_realpath", path = "src/uu/realpath" }
-rm = { optional = true, version = "0.0.23", package = "uu_rm", path = "src/uu/rm" }
-rmdir = { optional = true, version = "0.0.23", package = "uu_rmdir", path = "src/uu/rmdir" }
-runcon = { optional = true, version = "0.0.23", package = "uu_runcon", path = "src/uu/runcon" }
-seq = { optional = true, version = "0.0.23", package = "uu_seq", path = "src/uu/seq" }
-shred = { optional = true, version = "0.0.23", package = "uu_shred", path = "src/uu/shred" }
-shuf = { optional = true, version = "0.0.23", package = "uu_shuf", path = "src/uu/shuf" }
-sleep = { optional = true, version = "0.0.23", package = "uu_sleep", path = "src/uu/sleep" }
-sort = { optional = true, version = "0.0.23", package = "uu_sort", path = "src/uu/sort" }
-split = { optional = true, version = "0.0.23", package = "uu_split", path = "src/uu/split" }
-stat = { optional = true, version = "0.0.23", package = "uu_stat", path = "src/uu/stat" }
-stdbuf = { optional = true, version = "0.0.23", package = "uu_stdbuf", path = "src/uu/stdbuf" }
-stty = { optional = true, version = "0.0.23", package = "uu_stty", path = "src/uu/stty" }
-sum = { optional = true, version = "0.0.23", package = "uu_sum", path = "src/uu/sum" }
-sync = { optional = true, version = "0.0.23", package = "uu_sync", path = "src/uu/sync" }
-tac = { optional = true, version = "0.0.23", package = "uu_tac", path = "src/uu/tac" }
-tail = { optional = true, version = "0.0.23", package = "uu_tail", path = "src/uu/tail" }
-tee = { optional = true, version = "0.0.23", package = "uu_tee", path = "src/uu/tee" }
-timeout = { optional = true, version = "0.0.23", package = "uu_timeout", path = "src/uu/timeout" }
-touch = { optional = true, version = "0.0.23", package = "uu_touch", path = "src/uu/touch" }
-tr = { optional = true, version = "0.0.23", package = "uu_tr", path = "src/uu/tr" }
-true = { optional = true, version = "0.0.23", package = "uu_true", path = "src/uu/true" }
-truncate = { optional = true, version = "0.0.23", package = "uu_truncate", path = "src/uu/truncate" }
-tsort = { optional = true, version = "0.0.23", package = "uu_tsort", path = "src/uu/tsort" }
-tty = { optional = true, version = "0.0.23", package = "uu_tty", path = "src/uu/tty" }
-uname = { optional = true, version = "0.0.23", package = "uu_uname", path = "src/uu/uname" }
-unexpand = { optional = true, version = "0.0.23", package = "uu_unexpand", path = "src/uu/unexpand" }
-uniq = { optional = true, version = "0.0.23", package = "uu_uniq", path = "src/uu/uniq" }
-unlink = { optional = true, version = "0.0.23", package = "uu_unlink", path = "src/uu/unlink" }
-uptime = { optional = true, version = "0.0.23", package = "uu_uptime", path = "src/uu/uptime" }
-users = { optional = true, version = "0.0.23", package = "uu_users", path = "src/uu/users" }
-vdir = { optional = true, version = "0.0.23", package = "uu_vdir", path = "src/uu/vdir" }
-wc = { optional = true, version = "0.0.23", package = "uu_wc", path = "src/uu/wc" }
-who = { optional = true, version = "0.0.23", package = "uu_who", path = "src/uu/who" }
-whoami = { optional = true, version = "0.0.23", package = "uu_whoami", path = "src/uu/whoami" }
-yes = { optional = true, version = "0.0.23", package = "uu_yes", path = "src/uu/yes" }
+arch = { optional = true, version = "0.0.24", package = "uu_arch", path = "src/uu/arch" }
+base32 = { optional = true, version = "0.0.24", package = "uu_base32", path = "src/uu/base32" }
+base64 = { optional = true, version = "0.0.24", package = "uu_base64", path = "src/uu/base64" }
+basename = { optional = true, version = "0.0.24", package = "uu_basename", path = "src/uu/basename" }
+basenc = { optional = true, version = "0.0.24", package = "uu_basenc", path = "src/uu/basenc" }
+cat = { optional = true, version = "0.0.24", package = "uu_cat", path = "src/uu/cat" }
+chcon = { optional = true, version = "0.0.24", package = "uu_chcon", path = "src/uu/chcon" }
+chgrp = { optional = true, version = "0.0.24", package = "uu_chgrp", path = "src/uu/chgrp" }
+chmod = { optional = true, version = "0.0.24", package = "uu_chmod", path = "src/uu/chmod" }
+chown = { optional = true, version = "0.0.24", package = "uu_chown", path = "src/uu/chown" }
+chroot = { optional = true, version = "0.0.24", package = "uu_chroot", path = "src/uu/chroot" }
+cksum = { optional = true, version = "0.0.24", package = "uu_cksum", path = "src/uu/cksum" }
+comm = { optional = true, version = "0.0.24", package = "uu_comm", path = "src/uu/comm" }
+cp = { optional = true, version = "0.0.24", package = "uu_cp", path = "src/uu/cp" }
+csplit = { optional = true, version = "0.0.24", package = "uu_csplit", path = "src/uu/csplit" }
+cut = { optional = true, version = "0.0.24", package = "uu_cut", path = "src/uu/cut" }
+date = { optional = true, version = "0.0.24", package = "uu_date", path = "src/uu/date" }
+dd = { optional = true, version = "0.0.24", package = "uu_dd", path = "src/uu/dd" }
+df = { optional = true, version = "0.0.24", package = "uu_df", path = "src/uu/df" }
+dir = { optional = true, version = "0.0.24", package = "uu_dir", path = "src/uu/dir" }
+dircolors = { optional = true, version = "0.0.24", package = "uu_dircolors", path = "src/uu/dircolors" }
+dirname = { optional = true, version = "0.0.24", package = "uu_dirname", path = "src/uu/dirname" }
+du = { optional = true, version = "0.0.24", package = "uu_du", path = "src/uu/du" }
+echo = { optional = true, version = "0.0.24", package = "uu_echo", path = "src/uu/echo" }
+env = { optional = true, version = "0.0.24", package = "uu_env", path = "src/uu/env" }
+expand = { optional = true, version = "0.0.24", package = "uu_expand", path = "src/uu/expand" }
+expr = { optional = true, version = "0.0.24", package = "uu_expr", path = "src/uu/expr" }
+factor = { optional = true, version = "0.0.24", package = "uu_factor", path = "src/uu/factor" }
+false = { optional = true, version = "0.0.24", package = "uu_false", path = "src/uu/false" }
+fmt = { optional = true, version = "0.0.24", package = "uu_fmt", path = "src/uu/fmt" }
+fold = { optional = true, version = "0.0.24", package = "uu_fold", path = "src/uu/fold" }
+groups = { optional = true, version = "0.0.24", package = "uu_groups", path = "src/uu/groups" }
+hashsum = { optional = true, version = "0.0.24", package = "uu_hashsum", path = "src/uu/hashsum" }
+head = { optional = true, version = "0.0.24", package = "uu_head", path = "src/uu/head" }
+hostid = { optional = true, version = "0.0.24", package = "uu_hostid", path = "src/uu/hostid" }
+hostname = { optional = true, version = "0.0.24", package = "uu_hostname", path = "src/uu/hostname" }
+id = { optional = true, version = "0.0.24", package = "uu_id", path = "src/uu/id" }
+install = { optional = true, version = "0.0.24", package = "uu_install", path = "src/uu/install" }
+join = { optional = true, version = "0.0.24", package = "uu_join", path = "src/uu/join" }
+kill = { optional = true, version = "0.0.24", package = "uu_kill", path = "src/uu/kill" }
+link = { optional = true, version = "0.0.24", package = "uu_link", path = "src/uu/link" }
+ln = { optional = true, version = "0.0.24", package = "uu_ln", path = "src/uu/ln" }
+ls = { optional = true, version = "0.0.24", package = "uu_ls", path = "src/uu/ls" }
+logname = { optional = true, version = "0.0.24", package = "uu_logname", path = "src/uu/logname" }
+mkdir = { optional = true, version = "0.0.24", package = "uu_mkdir", path = "src/uu/mkdir" }
+mkfifo = { optional = true, version = "0.0.24", package = "uu_mkfifo", path = "src/uu/mkfifo" }
+mknod = { optional = true, version = "0.0.24", package = "uu_mknod", path = "src/uu/mknod" }
+mktemp = { optional = true, version = "0.0.24", package = "uu_mktemp", path = "src/uu/mktemp" }
+more = { optional = true, version = "0.0.24", package = "uu_more", path = "src/uu/more" }
+mv = { optional = true, version = "0.0.24", package = "uu_mv", path = "src/uu/mv" }
+nice = { optional = true, version = "0.0.24", package = "uu_nice", path = "src/uu/nice" }
+nl = { optional = true, version = "0.0.24", package = "uu_nl", path = "src/uu/nl" }
+nohup = { optional = true, version = "0.0.24", package = "uu_nohup", path = "src/uu/nohup" }
+nproc = { optional = true, version = "0.0.24", package = "uu_nproc", path = "src/uu/nproc" }
+numfmt = { optional = true, version = "0.0.24", package = "uu_numfmt", path = "src/uu/numfmt" }
+od = { optional = true, version = "0.0.24", package = "uu_od", path = "src/uu/od" }
+paste = { optional = true, version = "0.0.24", package = "uu_paste", path = "src/uu/paste" }
+pathchk = { optional = true, version = "0.0.24", package = "uu_pathchk", path = "src/uu/pathchk" }
+pinky = { optional = true, version = "0.0.24", package = "uu_pinky", path = "src/uu/pinky" }
+pr = { optional = true, version = "0.0.24", package = "uu_pr", path = "src/uu/pr" }
+printenv = { optional = true, version = "0.0.24", package = "uu_printenv", path = "src/uu/printenv" }
+printf = { optional = true, version = "0.0.24", package = "uu_printf", path = "src/uu/printf" }
+ptx = { optional = true, version = "0.0.24", package = "uu_ptx", path = "src/uu/ptx" }
+pwd = { optional = true, version = "0.0.24", package = "uu_pwd", path = "src/uu/pwd" }
+readlink = { optional = true, version = "0.0.24", package = "uu_readlink", path = "src/uu/readlink" }
+realpath = { optional = true, version = "0.0.24", package = "uu_realpath", path = "src/uu/realpath" }
+rm = { optional = true, version = "0.0.24", package = "uu_rm", path = "src/uu/rm" }
+rmdir = { optional = true, version = "0.0.24", package = "uu_rmdir", path = "src/uu/rmdir" }
+runcon = { optional = true, version = "0.0.24", package = "uu_runcon", path = "src/uu/runcon" }
+seq = { optional = true, version = "0.0.24", package = "uu_seq", path = "src/uu/seq" }
+shred = { optional = true, version = "0.0.24", package = "uu_shred", path = "src/uu/shred" }
+shuf = { optional = true, version = "0.0.24", package = "uu_shuf", path = "src/uu/shuf" }
+sleep = { optional = true, version = "0.0.24", package = "uu_sleep", path = "src/uu/sleep" }
+sort = { optional = true, version = "0.0.24", package = "uu_sort", path = "src/uu/sort" }
+split = { optional = true, version = "0.0.24", package = "uu_split", path = "src/uu/split" }
+stat = { optional = true, version = "0.0.24", package = "uu_stat", path = "src/uu/stat" }
+stdbuf = { optional = true, version = "0.0.24", package = "uu_stdbuf", path = "src/uu/stdbuf" }
+stty = { optional = true, version = "0.0.24", package = "uu_stty", path = "src/uu/stty" }
+sum = { optional = true, version = "0.0.24", package = "uu_sum", path = "src/uu/sum" }
+sync = { optional = true, version = "0.0.24", package = "uu_sync", path = "src/uu/sync" }
+tac = { optional = true, version = "0.0.24", package = "uu_tac", path = "src/uu/tac" }
+tail = { optional = true, version = "0.0.24", package = "uu_tail", path = "src/uu/tail" }
+tee = { optional = true, version = "0.0.24", package = "uu_tee", path = "src/uu/tee" }
+timeout = { optional = true, version = "0.0.24", package = "uu_timeout", path = "src/uu/timeout" }
+touch = { optional = true, version = "0.0.24", package = "uu_touch", path = "src/uu/touch" }
+tr = { optional = true, version = "0.0.24", package = "uu_tr", path = "src/uu/tr" }
+true = { optional = true, version = "0.0.24", package = "uu_true", path = "src/uu/true" }
+truncate = { optional = true, version = "0.0.24", package = "uu_truncate", path = "src/uu/truncate" }
+tsort = { optional = true, version = "0.0.24", package = "uu_tsort", path = "src/uu/tsort" }
+tty = { optional = true, version = "0.0.24", package = "uu_tty", path = "src/uu/tty" }
+uname = { optional = true, version = "0.0.24", package = "uu_uname", path = "src/uu/uname" }
+unexpand = { optional = true, version = "0.0.24", package = "uu_unexpand", path = "src/uu/unexpand" }
+uniq = { optional = true, version = "0.0.24", package = "uu_uniq", path = "src/uu/uniq" }
+unlink = { optional = true, version = "0.0.24", package = "uu_unlink", path = "src/uu/unlink" }
+uptime = { optional = true, version = "0.0.24", package = "uu_uptime", path = "src/uu/uptime" }
+users = { optional = true, version = "0.0.24", package = "uu_users", path = "src/uu/users" }
+vdir = { optional = true, version = "0.0.24", package = "uu_vdir", path = "src/uu/vdir" }
+wc = { optional = true, version = "0.0.24", package = "uu_wc", path = "src/uu/wc" }
+who = { optional = true, version = "0.0.24", package = "uu_who", path = "src/uu/who" }
+whoami = { optional = true, version = "0.0.24", package = "uu_whoami", path = "src/uu/whoami" }
+yes = { optional = true, version = "0.0.24", package = "uu_yes", path = "src/uu/yes" }
 
 # this breaks clippy linting with: "tests/by-util/test_factor_benches.rs: No such file or directory (os error 2)"
 # factor_benches = { optional = true, version = "0.0.0", package = "uu_factor_benches", path = "tests/benches/factor" }
diff --git a/src/uu/arch/Cargo.toml b/src/uu/arch/Cargo.toml
index edb15f846c2..b4d07b26c59 100644
--- a/src/uu/arch/Cargo.toml
+++ b/src/uu/arch/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_arch"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "arch ~ (uutils) display machine architecture"
diff --git a/src/uu/base32/Cargo.toml b/src/uu/base32/Cargo.toml
index 71fbe325fe8..1c27e14cf3f 100644
--- a/src/uu/base32/Cargo.toml
+++ b/src/uu/base32/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_base32"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "base32 ~ (uutils) decode/encode input (base32-encoding)"
diff --git a/src/uu/base64/Cargo.toml b/src/uu/base64/Cargo.toml
index e52665bb692..204b880bf72 100644
--- a/src/uu/base64/Cargo.toml
+++ b/src/uu/base64/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_base64"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "base64 ~ (uutils) decode/encode input (base64-encoding)"
diff --git a/src/uu/basename/Cargo.toml b/src/uu/basename/Cargo.toml
index 3de240e04a9..51202235b15 100644
--- a/src/uu/basename/Cargo.toml
+++ b/src/uu/basename/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_basename"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "basename ~ (uutils) display PATHNAME with leading directory components removed"
diff --git a/src/uu/basenc/Cargo.toml b/src/uu/basenc/Cargo.toml
index 54a5a53a118..26a2364282f 100644
--- a/src/uu/basenc/Cargo.toml
+++ b/src/uu/basenc/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_basenc"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "basenc ~ (uutils) decode/encode input"
diff --git a/src/uu/cat/Cargo.toml b/src/uu/cat/Cargo.toml
index 14383895e7d..cce6561c084 100644
--- a/src/uu/cat/Cargo.toml
+++ b/src/uu/cat/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_cat"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "cat ~ (uutils) concatenate and display input"
diff --git a/src/uu/chcon/Cargo.toml b/src/uu/chcon/Cargo.toml
index d21da4cf04d..021e435823a 100644
--- a/src/uu/chcon/Cargo.toml
+++ b/src/uu/chcon/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_chcon"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "chcon ~ (uutils) change file security context"
diff --git a/src/uu/chgrp/Cargo.toml b/src/uu/chgrp/Cargo.toml
index 79942033f1e..bbad8d31e6e 100644
--- a/src/uu/chgrp/Cargo.toml
+++ b/src/uu/chgrp/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_chgrp"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "chgrp ~ (uutils) change the group ownership of FILE"
diff --git a/src/uu/chmod/Cargo.toml b/src/uu/chmod/Cargo.toml
index ebfe00fe1c5..e779469deda 100644
--- a/src/uu/chmod/Cargo.toml
+++ b/src/uu/chmod/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_chmod"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "chmod ~ (uutils) change mode of FILE"
diff --git a/src/uu/chown/Cargo.toml b/src/uu/chown/Cargo.toml
index aab8f20b6c1..dfa9dba32a1 100644
--- a/src/uu/chown/Cargo.toml
+++ b/src/uu/chown/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_chown"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "chown ~ (uutils) change the ownership of FILE"
diff --git a/src/uu/chroot/Cargo.toml b/src/uu/chroot/Cargo.toml
index a78c89685bf..12533b6542a 100644
--- a/src/uu/chroot/Cargo.toml
+++ b/src/uu/chroot/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_chroot"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "chroot ~ (uutils) run COMMAND under a new root directory"
diff --git a/src/uu/cksum/Cargo.toml b/src/uu/cksum/Cargo.toml
index 9a811fafdbc..47b4d73592a 100644
--- a/src/uu/cksum/Cargo.toml
+++ b/src/uu/cksum/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_cksum"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "cksum ~ (uutils) display CRC and size of input"
diff --git a/src/uu/comm/Cargo.toml b/src/uu/comm/Cargo.toml
index 71ed0ad717f..cd759aad246 100644
--- a/src/uu/comm/Cargo.toml
+++ b/src/uu/comm/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_comm"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "comm ~ (uutils) compare sorted inputs"
diff --git a/src/uu/cp/Cargo.toml b/src/uu/cp/Cargo.toml
index 179b4668e68..7db6b202bb2 100644
--- a/src/uu/cp/Cargo.toml
+++ b/src/uu/cp/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_cp"
-version = "0.0.23"
+version = "0.0.24"
 authors = [
   "Jordy Dickinson <jordy.dickinson@gmail.com>",
   "Joshua S. Miller <jsmiller@uchicago.edu>",
diff --git a/src/uu/csplit/Cargo.toml b/src/uu/csplit/Cargo.toml
index e68b1258253..5e2f310cb51 100644
--- a/src/uu/csplit/Cargo.toml
+++ b/src/uu/csplit/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_csplit"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "csplit ~ (uutils) Output pieces of FILE separated by PATTERN(s) to files 'xx00', 'xx01', ..., and output byte counts of each piece to standard output"
diff --git a/src/uu/cut/Cargo.toml b/src/uu/cut/Cargo.toml
index e572d987ec4..c98bec5bc42 100644
--- a/src/uu/cut/Cargo.toml
+++ b/src/uu/cut/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_cut"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "cut ~ (uutils) display byte/field columns of input lines"
diff --git a/src/uu/date/Cargo.toml b/src/uu/date/Cargo.toml
index c5682f83e5a..11ad64bbef7 100644
--- a/src/uu/date/Cargo.toml
+++ b/src/uu/date/Cargo.toml
@@ -1,7 +1,7 @@
 # spell-checker:ignore datetime
 [package]
 name = "uu_date"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "date ~ (uutils) display or set the current time"
diff --git a/src/uu/dd/Cargo.toml b/src/uu/dd/Cargo.toml
index 410ebf4d6a8..1dbb37bde55 100644
--- a/src/uu/dd/Cargo.toml
+++ b/src/uu/dd/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_dd"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "dd ~ (uutils) copy and convert files"
diff --git a/src/uu/df/Cargo.toml b/src/uu/df/Cargo.toml
index d074e6be74f..e9aa192e820 100644
--- a/src/uu/df/Cargo.toml
+++ b/src/uu/df/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_df"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "df ~ (uutils) display file system information"
diff --git a/src/uu/dir/Cargo.toml b/src/uu/dir/Cargo.toml
index 628c0fb8cfe..b82298ce319 100644
--- a/src/uu/dir/Cargo.toml
+++ b/src/uu/dir/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_dir"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "shortcut to ls -C -b"
diff --git a/src/uu/dircolors/Cargo.toml b/src/uu/dircolors/Cargo.toml
index 66ee792f839..1bf87c22cc1 100644
--- a/src/uu/dircolors/Cargo.toml
+++ b/src/uu/dircolors/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_dircolors"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "dircolors ~ (uutils) display commands to set LS_COLORS"
diff --git a/src/uu/dirname/Cargo.toml b/src/uu/dirname/Cargo.toml
index b093ce3c55c..85391859663 100644
--- a/src/uu/dirname/Cargo.toml
+++ b/src/uu/dirname/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_dirname"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "dirname ~ (uutils) display parent directory of PATHNAME"
diff --git a/src/uu/du/Cargo.toml b/src/uu/du/Cargo.toml
index 5e87b2f4381..8b9eb062e48 100644
--- a/src/uu/du/Cargo.toml
+++ b/src/uu/du/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_du"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "du ~ (uutils) display disk usage"
diff --git a/src/uu/echo/Cargo.toml b/src/uu/echo/Cargo.toml
index e63977e57f7..ddb896c3389 100644
--- a/src/uu/echo/Cargo.toml
+++ b/src/uu/echo/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_echo"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "echo ~ (uutils) display TEXT"
diff --git a/src/uu/env/Cargo.toml b/src/uu/env/Cargo.toml
index a1df3563b20..26fa1ebbec8 100644
--- a/src/uu/env/Cargo.toml
+++ b/src/uu/env/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_env"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "env ~ (uutils) set each NAME to VALUE in the environment and run COMMAND"
diff --git a/src/uu/expand/Cargo.toml b/src/uu/expand/Cargo.toml
index 63425bc5ea1..87f8f8f7716 100644
--- a/src/uu/expand/Cargo.toml
+++ b/src/uu/expand/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_expand"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "expand ~ (uutils) convert input tabs to spaces"
diff --git a/src/uu/expr/Cargo.toml b/src/uu/expr/Cargo.toml
index a867c27c80a..17d37413e26 100644
--- a/src/uu/expr/Cargo.toml
+++ b/src/uu/expr/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_expr"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "expr ~ (uutils) display the value of EXPRESSION"
diff --git a/src/uu/factor/Cargo.toml b/src/uu/factor/Cargo.toml
index aee67eeeaf0..a149056888a 100644
--- a/src/uu/factor/Cargo.toml
+++ b/src/uu/factor/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_factor"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "factor ~ (uutils) display the prime factors of each NUMBER"
diff --git a/src/uu/false/Cargo.toml b/src/uu/false/Cargo.toml
index 50b5bc027d8..e88fa99783f 100644
--- a/src/uu/false/Cargo.toml
+++ b/src/uu/false/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_false"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "false ~ (uutils) do nothing and fail"
diff --git a/src/uu/fmt/Cargo.toml b/src/uu/fmt/Cargo.toml
index 688525e3b00..de415310f2f 100644
--- a/src/uu/fmt/Cargo.toml
+++ b/src/uu/fmt/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_fmt"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "fmt ~ (uutils) reformat each paragraph of input"
diff --git a/src/uu/fold/Cargo.toml b/src/uu/fold/Cargo.toml
index 1887f1bbd3a..02cf1115ec2 100644
--- a/src/uu/fold/Cargo.toml
+++ b/src/uu/fold/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_fold"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "fold ~ (uutils) wrap each line of input"
diff --git a/src/uu/groups/Cargo.toml b/src/uu/groups/Cargo.toml
index 9c513517500..dac52fc5864 100644
--- a/src/uu/groups/Cargo.toml
+++ b/src/uu/groups/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_groups"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "groups ~ (uutils) display group memberships for USERNAME"
diff --git a/src/uu/hashsum/Cargo.toml b/src/uu/hashsum/Cargo.toml
index 1ecb5f8403c..a20fe0d7826 100644
--- a/src/uu/hashsum/Cargo.toml
+++ b/src/uu/hashsum/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_hashsum"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "hashsum ~ (uutils) display or check input digests"
diff --git a/src/uu/head/Cargo.toml b/src/uu/head/Cargo.toml
index 12872c80820..45e51b881b2 100644
--- a/src/uu/head/Cargo.toml
+++ b/src/uu/head/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_head"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "head ~ (uutils) display the first lines of input"
diff --git a/src/uu/hostid/Cargo.toml b/src/uu/hostid/Cargo.toml
index 602e7ef3751..8e551befb4a 100644
--- a/src/uu/hostid/Cargo.toml
+++ b/src/uu/hostid/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_hostid"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "hostid ~ (uutils) display the numeric identifier of the current host"
diff --git a/src/uu/hostname/Cargo.toml b/src/uu/hostname/Cargo.toml
index 1fe10170964..7dd6eabe5ad 100644
--- a/src/uu/hostname/Cargo.toml
+++ b/src/uu/hostname/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_hostname"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "hostname ~ (uutils) display or set the host name of the current host"
diff --git a/src/uu/id/Cargo.toml b/src/uu/id/Cargo.toml
index b62df1eebd2..6d332acfc3c 100644
--- a/src/uu/id/Cargo.toml
+++ b/src/uu/id/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_id"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "id ~ (uutils) display user and group information for USER"
diff --git a/src/uu/install/Cargo.toml b/src/uu/install/Cargo.toml
index cc687efdb3d..647e0958ee0 100644
--- a/src/uu/install/Cargo.toml
+++ b/src/uu/install/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_install"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["Ben Eills <ben@beneills.com>", "uutils developers"]
 license = "MIT"
 description = "install ~ (uutils) copy files from SOURCE to DESTINATION (with specified attributes)"
diff --git a/src/uu/join/Cargo.toml b/src/uu/join/Cargo.toml
index 20853527d83..759b04af712 100644
--- a/src/uu/join/Cargo.toml
+++ b/src/uu/join/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_join"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "join ~ (uutils) merge lines from inputs with matching join fields"
diff --git a/src/uu/kill/Cargo.toml b/src/uu/kill/Cargo.toml
index 6cb8cee6e3d..e60faa1c455 100644
--- a/src/uu/kill/Cargo.toml
+++ b/src/uu/kill/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_kill"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "kill ~ (uutils) send a signal to a process"
diff --git a/src/uu/link/Cargo.toml b/src/uu/link/Cargo.toml
index cba12c95c3b..d3643c5dcf6 100644
--- a/src/uu/link/Cargo.toml
+++ b/src/uu/link/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_link"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "link ~ (uutils) create a hard (file system) link to FILE"
diff --git a/src/uu/ln/Cargo.toml b/src/uu/ln/Cargo.toml
index 4243075ea0a..ba97c84e365 100644
--- a/src/uu/ln/Cargo.toml
+++ b/src/uu/ln/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_ln"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "ln ~ (uutils) create a (file system) link to TARGET"
diff --git a/src/uu/logname/Cargo.toml b/src/uu/logname/Cargo.toml
index 2e8553f12c4..d9870b1d99c 100644
--- a/src/uu/logname/Cargo.toml
+++ b/src/uu/logname/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_logname"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "logname ~ (uutils) display the login name of the current user"
diff --git a/src/uu/ls/Cargo.toml b/src/uu/ls/Cargo.toml
index dc79c6f93d0..49c64ba0937 100644
--- a/src/uu/ls/Cargo.toml
+++ b/src/uu/ls/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_ls"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "ls ~ (uutils) display directory contents"
diff --git a/src/uu/mkdir/Cargo.toml b/src/uu/mkdir/Cargo.toml
index 4f6ddb3cc02..a0ba24b42e8 100644
--- a/src/uu/mkdir/Cargo.toml
+++ b/src/uu/mkdir/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_mkdir"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "mkdir ~ (uutils) create DIRECTORY"
diff --git a/src/uu/mkfifo/Cargo.toml b/src/uu/mkfifo/Cargo.toml
index d7f787511a8..10ff3661686 100644
--- a/src/uu/mkfifo/Cargo.toml
+++ b/src/uu/mkfifo/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_mkfifo"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "mkfifo ~ (uutils) create FIFOs (named pipes)"
diff --git a/src/uu/mknod/Cargo.toml b/src/uu/mknod/Cargo.toml
index 58caa5d9dc4..000fe4d01a5 100644
--- a/src/uu/mknod/Cargo.toml
+++ b/src/uu/mknod/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_mknod"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "mknod ~ (uutils) create special file NAME of TYPE"
diff --git a/src/uu/mktemp/Cargo.toml b/src/uu/mktemp/Cargo.toml
index 2913e4b6e02..504c46350d7 100644
--- a/src/uu/mktemp/Cargo.toml
+++ b/src/uu/mktemp/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_mktemp"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "mktemp ~ (uutils) create and display a temporary file or directory from TEMPLATE"
diff --git a/src/uu/more/Cargo.toml b/src/uu/more/Cargo.toml
index 9f0bc9d3d65..58957a08c74 100644
--- a/src/uu/more/Cargo.toml
+++ b/src/uu/more/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_more"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "more ~ (uutils) input perusal filter"
diff --git a/src/uu/mv/Cargo.toml b/src/uu/mv/Cargo.toml
index 83d68bc3d82..4193f9595cb 100644
--- a/src/uu/mv/Cargo.toml
+++ b/src/uu/mv/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_mv"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "mv ~ (uutils) move (rename) SOURCE to DESTINATION"
diff --git a/src/uu/nice/Cargo.toml b/src/uu/nice/Cargo.toml
index 6fab5cefc24..7285318ef63 100644
--- a/src/uu/nice/Cargo.toml
+++ b/src/uu/nice/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_nice"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "nice ~ (uutils) run PROGRAM with modified scheduling priority"
diff --git a/src/uu/nl/Cargo.toml b/src/uu/nl/Cargo.toml
index 56cb8d8e94e..35b0f3d848b 100644
--- a/src/uu/nl/Cargo.toml
+++ b/src/uu/nl/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_nl"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "nl ~ (uutils) display input with added line numbers"
diff --git a/src/uu/nohup/Cargo.toml b/src/uu/nohup/Cargo.toml
index 24d8f659c7e..8e8bd50cb4d 100644
--- a/src/uu/nohup/Cargo.toml
+++ b/src/uu/nohup/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_nohup"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "nohup ~ (uutils) run COMMAND, ignoring hangup signals"
diff --git a/src/uu/nproc/Cargo.toml b/src/uu/nproc/Cargo.toml
index 54bb1d83c09..9e6efc559c1 100644
--- a/src/uu/nproc/Cargo.toml
+++ b/src/uu/nproc/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_nproc"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "nproc ~ (uutils) display the number of processing units available"
diff --git a/src/uu/numfmt/Cargo.toml b/src/uu/numfmt/Cargo.toml
index 79e6d5401aa..71505d4b7db 100644
--- a/src/uu/numfmt/Cargo.toml
+++ b/src/uu/numfmt/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_numfmt"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "numfmt ~ (uutils) reformat NUMBER"
diff --git a/src/uu/od/Cargo.toml b/src/uu/od/Cargo.toml
index 84c89ee8611..e2c0a236b93 100644
--- a/src/uu/od/Cargo.toml
+++ b/src/uu/od/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_od"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "od ~ (uutils) display formatted representation of input"
diff --git a/src/uu/paste/Cargo.toml b/src/uu/paste/Cargo.toml
index 68255c82ddd..0ab1015b9df 100644
--- a/src/uu/paste/Cargo.toml
+++ b/src/uu/paste/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_paste"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "paste ~ (uutils) merge lines from inputs"
diff --git a/src/uu/pathchk/Cargo.toml b/src/uu/pathchk/Cargo.toml
index dee85deae55..eeb667ac349 100644
--- a/src/uu/pathchk/Cargo.toml
+++ b/src/uu/pathchk/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_pathchk"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "pathchk ~ (uutils) diagnose invalid or non-portable PATHNAME"
diff --git a/src/uu/pinky/Cargo.toml b/src/uu/pinky/Cargo.toml
index f64cb758510..ba1dbc09688 100644
--- a/src/uu/pinky/Cargo.toml
+++ b/src/uu/pinky/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_pinky"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "pinky ~ (uutils) display user information"
diff --git a/src/uu/pr/Cargo.toml b/src/uu/pr/Cargo.toml
index ab54593837f..4d09ad7afc8 100644
--- a/src/uu/pr/Cargo.toml
+++ b/src/uu/pr/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_pr"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "pr ~ (uutils) convert text files for printing"
diff --git a/src/uu/printenv/Cargo.toml b/src/uu/printenv/Cargo.toml
index a6d7c91d046..32765a1f1e9 100644
--- a/src/uu/printenv/Cargo.toml
+++ b/src/uu/printenv/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_printenv"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "printenv ~ (uutils) display value of environment VAR"
diff --git a/src/uu/printf/Cargo.toml b/src/uu/printf/Cargo.toml
index 0404654e207..0033c31494b 100644
--- a/src/uu/printf/Cargo.toml
+++ b/src/uu/printf/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_printf"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["Nathan Ross", "uutils developers"]
 license = "MIT"
 description = "printf ~ (uutils) FORMAT and display ARGUMENTS"
diff --git a/src/uu/ptx/Cargo.toml b/src/uu/ptx/Cargo.toml
index 4ea395dc5cc..30bee8642b1 100644
--- a/src/uu/ptx/Cargo.toml
+++ b/src/uu/ptx/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_ptx"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "ptx ~ (uutils) display a permuted index of input"
diff --git a/src/uu/pwd/Cargo.toml b/src/uu/pwd/Cargo.toml
index 8bd0ccece58..82cd4cf8ee1 100644
--- a/src/uu/pwd/Cargo.toml
+++ b/src/uu/pwd/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_pwd"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "pwd ~ (uutils) display current working directory"
diff --git a/src/uu/readlink/Cargo.toml b/src/uu/readlink/Cargo.toml
index 4d1574c50be..cb17296129f 100644
--- a/src/uu/readlink/Cargo.toml
+++ b/src/uu/readlink/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_readlink"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "readlink ~ (uutils) display resolved path of PATHNAME"
diff --git a/src/uu/realpath/Cargo.toml b/src/uu/realpath/Cargo.toml
index 8b21d6c7f8d..942f9601640 100644
--- a/src/uu/realpath/Cargo.toml
+++ b/src/uu/realpath/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_realpath"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "realpath ~ (uutils) display resolved absolute path of PATHNAME"
diff --git a/src/uu/rm/Cargo.toml b/src/uu/rm/Cargo.toml
index 34ada60e865..a36251838d5 100644
--- a/src/uu/rm/Cargo.toml
+++ b/src/uu/rm/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_rm"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "rm ~ (uutils) remove PATHNAME"
diff --git a/src/uu/rmdir/Cargo.toml b/src/uu/rmdir/Cargo.toml
index f17db50b0ee..e567b98b69d 100644
--- a/src/uu/rmdir/Cargo.toml
+++ b/src/uu/rmdir/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_rmdir"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "rmdir ~ (uutils) remove empty DIRECTORY"
diff --git a/src/uu/runcon/Cargo.toml b/src/uu/runcon/Cargo.toml
index 72237ece95a..e22f2e9d1ca 100644
--- a/src/uu/runcon/Cargo.toml
+++ b/src/uu/runcon/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_runcon"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "runcon ~ (uutils) run command with specified security context"
diff --git a/src/uu/seq/Cargo.toml b/src/uu/seq/Cargo.toml
index afa4f9ecaf5..dca08f5d064 100644
--- a/src/uu/seq/Cargo.toml
+++ b/src/uu/seq/Cargo.toml
@@ -1,7 +1,7 @@
 # spell-checker:ignore bigdecimal
 [package]
 name = "uu_seq"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "seq ~ (uutils) display a sequence of numbers"
diff --git a/src/uu/shred/Cargo.toml b/src/uu/shred/Cargo.toml
index 8721cd624f0..97fab64e1f6 100644
--- a/src/uu/shred/Cargo.toml
+++ b/src/uu/shred/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_shred"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "shred ~ (uutils) hide former FILE contents with repeated overwrites"
diff --git a/src/uu/shuf/Cargo.toml b/src/uu/shuf/Cargo.toml
index 2bbf2af149d..c1d2de7c8bd 100644
--- a/src/uu/shuf/Cargo.toml
+++ b/src/uu/shuf/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_shuf"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "shuf ~ (uutils) display random permutations of input lines"
diff --git a/src/uu/sleep/Cargo.toml b/src/uu/sleep/Cargo.toml
index d3d1fe61e9f..94789f31312 100644
--- a/src/uu/sleep/Cargo.toml
+++ b/src/uu/sleep/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_sleep"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "sleep ~ (uutils) pause for DURATION"
diff --git a/src/uu/sort/Cargo.toml b/src/uu/sort/Cargo.toml
index 8c1c03dc638..7f5938c7034 100644
--- a/src/uu/sort/Cargo.toml
+++ b/src/uu/sort/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_sort"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "sort ~ (uutils) sort input lines"
diff --git a/src/uu/split/Cargo.toml b/src/uu/split/Cargo.toml
index 6253dbf2be3..5a7ded4bc8b 100644
--- a/src/uu/split/Cargo.toml
+++ b/src/uu/split/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_split"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "split ~ (uutils) split input into output files"
diff --git a/src/uu/stat/Cargo.toml b/src/uu/stat/Cargo.toml
index 5ed91a88cb6..dd28fc5f382 100644
--- a/src/uu/stat/Cargo.toml
+++ b/src/uu/stat/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_stat"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "stat ~ (uutils) display FILE status"
diff --git a/src/uu/stdbuf/Cargo.toml b/src/uu/stdbuf/Cargo.toml
index ed7a0e2e11e..fdee4f68433 100644
--- a/src/uu/stdbuf/Cargo.toml
+++ b/src/uu/stdbuf/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_stdbuf"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "stdbuf ~ (uutils) run COMMAND with modified standard stream buffering"
@@ -20,7 +20,7 @@ tempfile = { workspace = true }
 uucore = { workspace = true }
 
 [build-dependencies]
-libstdbuf = { version = "0.0.23", package = "uu_stdbuf_libstdbuf", path = "src/libstdbuf" }
+libstdbuf = { version = "0.0.24", package = "uu_stdbuf_libstdbuf", path = "src/libstdbuf" }
 
 [[bin]]
 name = "stdbuf"
diff --git a/src/uu/stdbuf/src/libstdbuf/Cargo.toml b/src/uu/stdbuf/src/libstdbuf/Cargo.toml
index eaa82e6e73d..eab74dc089e 100644
--- a/src/uu/stdbuf/src/libstdbuf/Cargo.toml
+++ b/src/uu/stdbuf/src/libstdbuf/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_stdbuf_libstdbuf"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "stdbuf/libstdbuf ~ (uutils); dynamic library required for stdbuf"
diff --git a/src/uu/stty/Cargo.toml b/src/uu/stty/Cargo.toml
index a353c66030f..51863220d5f 100644
--- a/src/uu/stty/Cargo.toml
+++ b/src/uu/stty/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_stty"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "stty ~ (uutils) print or change terminal characteristics"
diff --git a/src/uu/sum/Cargo.toml b/src/uu/sum/Cargo.toml
index 04be0fe72db..56711b6fd29 100644
--- a/src/uu/sum/Cargo.toml
+++ b/src/uu/sum/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_sum"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "sum ~ (uutils) display checksum and block counts for input"
diff --git a/src/uu/sync/Cargo.toml b/src/uu/sync/Cargo.toml
index 4048115243a..0c93433928c 100644
--- a/src/uu/sync/Cargo.toml
+++ b/src/uu/sync/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_sync"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "sync ~ (uutils) synchronize cache writes to storage"
diff --git a/src/uu/tac/Cargo.toml b/src/uu/tac/Cargo.toml
index 164972c5f45..a89f179e388 100644
--- a/src/uu/tac/Cargo.toml
+++ b/src/uu/tac/Cargo.toml
@@ -2,7 +2,7 @@
 
 [package]
 name = "uu_tac"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "tac ~ (uutils) concatenate and display input lines in reverse order"
diff --git a/src/uu/tail/Cargo.toml b/src/uu/tail/Cargo.toml
index 636480e08ba..826f7f83daf 100644
--- a/src/uu/tail/Cargo.toml
+++ b/src/uu/tail/Cargo.toml
@@ -1,7 +1,7 @@
 # spell-checker:ignore (libs) kqueue fundu
 [package]
 name = "uu_tail"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "tail ~ (uutils) display the last lines of input"
diff --git a/src/uu/tee/Cargo.toml b/src/uu/tee/Cargo.toml
index 441b891a4ad..b84e7cb314a 100644
--- a/src/uu/tee/Cargo.toml
+++ b/src/uu/tee/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_tee"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "tee ~ (uutils) display input and copy to FILE"
diff --git a/src/uu/test/Cargo.toml b/src/uu/test/Cargo.toml
index 93a77b11d4a..35132cd27b2 100644
--- a/src/uu/test/Cargo.toml
+++ b/src/uu/test/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_test"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "test ~ (uutils) evaluate comparison and file type expressions"
diff --git a/src/uu/timeout/Cargo.toml b/src/uu/timeout/Cargo.toml
index 4f6c062bb8a..3a9500a2e96 100644
--- a/src/uu/timeout/Cargo.toml
+++ b/src/uu/timeout/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_timeout"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "timeout ~ (uutils) run COMMAND with a DURATION time limit"
diff --git a/src/uu/touch/Cargo.toml b/src/uu/touch/Cargo.toml
index d67cd1f8a16..51cc4ac3f41 100644
--- a/src/uu/touch/Cargo.toml
+++ b/src/uu/touch/Cargo.toml
@@ -1,7 +1,7 @@
 # spell-checker:ignore datetime
 [package]
 name = "uu_touch"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "touch ~ (uutils) change FILE timestamps"
diff --git a/src/uu/tr/Cargo.toml b/src/uu/tr/Cargo.toml
index a07679dd187..ff1efbe921f 100644
--- a/src/uu/tr/Cargo.toml
+++ b/src/uu/tr/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_tr"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "tr ~ (uutils) translate characters within input and display"
diff --git a/src/uu/true/Cargo.toml b/src/uu/true/Cargo.toml
index 8c4080724b6..eae893d2176 100644
--- a/src/uu/true/Cargo.toml
+++ b/src/uu/true/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_true"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "true ~ (uutils) do nothing and succeed"
diff --git a/src/uu/truncate/Cargo.toml b/src/uu/truncate/Cargo.toml
index 254a004e779..2ea443ce7f4 100644
--- a/src/uu/truncate/Cargo.toml
+++ b/src/uu/truncate/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_truncate"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "truncate ~ (uutils) truncate (or extend) FILE to SIZE"
diff --git a/src/uu/tsort/Cargo.toml b/src/uu/tsort/Cargo.toml
index 567d41e0b79..f0430b41b3b 100644
--- a/src/uu/tsort/Cargo.toml
+++ b/src/uu/tsort/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_tsort"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "tsort ~ (uutils) topologically sort input (partially ordered) pairs"
diff --git a/src/uu/tty/Cargo.toml b/src/uu/tty/Cargo.toml
index 95734e6c933..d6065d4679e 100644
--- a/src/uu/tty/Cargo.toml
+++ b/src/uu/tty/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_tty"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "tty ~ (uutils) display the name of the terminal connected to standard input"
diff --git a/src/uu/uname/Cargo.toml b/src/uu/uname/Cargo.toml
index cfd459c5bf1..f9883eef93c 100644
--- a/src/uu/uname/Cargo.toml
+++ b/src/uu/uname/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_uname"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "uname ~ (uutils) display system information"
diff --git a/src/uu/unexpand/Cargo.toml b/src/uu/unexpand/Cargo.toml
index 459a67b9015..d10239b960e 100644
--- a/src/uu/unexpand/Cargo.toml
+++ b/src/uu/unexpand/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_unexpand"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "unexpand ~ (uutils) convert input spaces to tabs"
diff --git a/src/uu/uniq/Cargo.toml b/src/uu/uniq/Cargo.toml
index efe5ca8ee53..52d1d22e16a 100644
--- a/src/uu/uniq/Cargo.toml
+++ b/src/uu/uniq/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_uniq"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "uniq ~ (uutils) filter identical adjacent lines from input"
diff --git a/src/uu/unlink/Cargo.toml b/src/uu/unlink/Cargo.toml
index c6bfcd66bb7..854df092c1b 100644
--- a/src/uu/unlink/Cargo.toml
+++ b/src/uu/unlink/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_unlink"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "unlink ~ (uutils) remove a (file system) link to FILE"
diff --git a/src/uu/uptime/Cargo.toml b/src/uu/uptime/Cargo.toml
index 899a30dfaa5..0013e980a67 100644
--- a/src/uu/uptime/Cargo.toml
+++ b/src/uu/uptime/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_uptime"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "uptime ~ (uutils) display dynamic system information"
diff --git a/src/uu/users/Cargo.toml b/src/uu/users/Cargo.toml
index 030c7d62551..8e29b119e8a 100644
--- a/src/uu/users/Cargo.toml
+++ b/src/uu/users/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_users"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "users ~ (uutils) display names of currently logged-in users"
diff --git a/src/uu/vdir/Cargo.toml b/src/uu/vdir/Cargo.toml
index d14e10d9565..3c7e55eda69 100644
--- a/src/uu/vdir/Cargo.toml
+++ b/src/uu/vdir/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_vdir"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "shortcut to ls -l -b"
diff --git a/src/uu/wc/Cargo.toml b/src/uu/wc/Cargo.toml
index 8471472f867..516e3be46a3 100644
--- a/src/uu/wc/Cargo.toml
+++ b/src/uu/wc/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_wc"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "wc ~ (uutils) display newline, word, and byte counts for input"
diff --git a/src/uu/who/Cargo.toml b/src/uu/who/Cargo.toml
index 249d5a8eeec..f343942fc4b 100644
--- a/src/uu/who/Cargo.toml
+++ b/src/uu/who/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_who"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "who ~ (uutils) display information about currently logged-in users"
diff --git a/src/uu/whoami/Cargo.toml b/src/uu/whoami/Cargo.toml
index 5336568334f..3d2abb034a7 100644
--- a/src/uu/whoami/Cargo.toml
+++ b/src/uu/whoami/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_whoami"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "whoami ~ (uutils) display user name of current effective user ID"
diff --git a/src/uu/yes/Cargo.toml b/src/uu/yes/Cargo.toml
index dd562cab675..1f59bdb16f5 100644
--- a/src/uu/yes/Cargo.toml
+++ b/src/uu/yes/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "uu_yes"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "yes ~ (uutils) repeatedly display a line with STRING (or 'y')"
diff --git a/src/uucore/Cargo.toml b/src/uucore/Cargo.toml
index 8500faeff8f..78c01cd071c 100644
--- a/src/uucore/Cargo.toml
+++ b/src/uucore/Cargo.toml
@@ -2,7 +2,7 @@
 
 [package]
 name = "uucore"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["uutils developers"]
 license = "MIT"
 description = "uutils ~ 'core' uutils code library (cross-platform)"
diff --git a/src/uucore_procs/Cargo.toml b/src/uucore_procs/Cargo.toml
index f6b92fe6353..2411bb6c166 100644
--- a/src/uucore_procs/Cargo.toml
+++ b/src/uucore_procs/Cargo.toml
@@ -1,7 +1,7 @@
 # spell-checker:ignore uuhelp
 [package]
 name = "uucore_procs"
-version = "0.0.23"
+version = "0.0.24"
 authors = ["Roy Ivy III <rivy.dev@gmail.com>"]
 license = "MIT"
 description = "uutils ~ 'uucore' proc-macros"
@@ -19,4 +19,4 @@ proc-macro = true
 [dependencies]
 proc-macro2 = "1.0"
 quote = "1.0"
-uuhelp_parser = { path = "../uuhelp_parser", version = "0.0.23" }
+uuhelp_parser = { path = "../uuhelp_parser", version = "0.0.24" }
diff --git a/src/uuhelp_parser/Cargo.toml b/src/uuhelp_parser/Cargo.toml
index cbf049f9dba..018aa1d898f 100644
--- a/src/uuhelp_parser/Cargo.toml
+++ b/src/uuhelp_parser/Cargo.toml
@@ -1,7 +1,7 @@
 # spell-checker:ignore uuhelp
 [package]
 name = "uuhelp_parser"
-version = "0.0.23"
+version = "0.0.24"
 edition = "2021"
 license = "MIT"
 description = "A collection of functions to parse the markdown code of help files"
diff --git a/util/update-version.sh b/util/update-version.sh
index 244a7a7b29a..7f785f1d7af 100755
--- a/util/update-version.sh
+++ b/util/update-version.sh
@@ -17,8 +17,8 @@
 # 10) Create the release on github https://github.com/uutils/coreutils/releases/new
 # 11) Make sure we have good release notes
 
-FROM="0.0.22"
-TO="0.0.23"
+FROM="0.0.23"
+TO="0.0.24"
 
 PROGS=$(ls -1d src/uu/*/Cargo.toml src/uu/stdbuf/src/libstdbuf/Cargo.toml src/uucore/Cargo.toml Cargo.toml)
 

From 5006db2e9225992aa75706f7fccf2db48e44fe2d Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Sun, 21 Jan 2024 16:53:53 +0000
Subject: [PATCH 425/429] chore(deps): update rust crate regex to 1.10.3

---
 Cargo.lock | 8 ++++----
 Cargo.toml | 2 +-
 2 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 6b7ba1d5000..732e56efc4e 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1705,9 +1705,9 @@ checksum = "f1bfbf25d7eb88ddcbb1ec3d755d0634da8f7657b2cb8b74089121409ab8228f"
 
 [[package]]
 name = "regex"
-version = "1.10.2"
+version = "1.10.3"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "380b951a9c5e80ddfd6136919eef32310721aa4aacd4889a8d39124b026ab343"
+checksum = "b62dbe01f0b06f9d8dc7d49e05a0785f153b00b2c227856282f671e0318c9b15"
 dependencies = [
  "aho-corasick",
  "memchr",
@@ -1717,9 +1717,9 @@ dependencies = [
 
 [[package]]
 name = "regex-automata"
-version = "0.4.3"
+version = "0.4.4"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "5f804c7828047e88b2d32e2d7fe5a105da8ee3264f01902f796c8e067dc2483f"
+checksum = "3b7fa1134405e2ec9353fd416b17f8dacd46c473d7d3fd1cf202706a14eb792a"
 dependencies = [
  "aho-corasick",
  "memchr",
diff --git a/Cargo.toml b/Cargo.toml
index f10792a16c0..f63fae178cb 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -311,7 +311,7 @@ rand = { version = "0.8", features = ["small_rng"] }
 rand_core = "0.6"
 rayon = "1.8"
 redox_syscall = "0.4"
-regex = "1.10.2"
+regex = "1.10.3"
 rstest = "0.18.2"
 rust-ini = "0.19.0"
 same-file = "1.0.6"

From 8493800d4f1549ba38bf33790a6d58fad523b3cb Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Mon, 22 Jan 2024 08:06:13 +0100
Subject: [PATCH 426/429] fuzzing: print the diff in case of issue (#5866)

* fuzzing: print the diff in case of issue

* Simplify the code

* fuzz: remove unused import similar::ChangeTag

---------

Co-authored-by: Daniel Hofstetter <daniel.hofstetter@42dh.com>
---
 fuzz/Cargo.toml                  |  1 +
 fuzz/fuzz_targets/fuzz_common.rs | 13 +++++++++++++
 2 files changed, 14 insertions(+)

diff --git a/fuzz/Cargo.toml b/fuzz/Cargo.toml
index 076e274ec8a..dfb62aba5e1 100644
--- a/fuzz/Cargo.toml
+++ b/fuzz/Cargo.toml
@@ -12,6 +12,7 @@ libfuzzer-sys = "0.4"
 libc = "0.2"
 tempfile = "3"
 rand = { version = "0.8", features = ["small_rng"] }
+similar = "2"
 
 uucore = { path = "../src/uucore/" }
 uu_date = { path = "../src/uu/date/" }
diff --git a/fuzz/fuzz_targets/fuzz_common.rs b/fuzz/fuzz_targets/fuzz_common.rs
index e8cac8d4048..cf56268d75a 100644
--- a/fuzz/fuzz_targets/fuzz_common.rs
+++ b/fuzz/fuzz_targets/fuzz_common.rs
@@ -7,6 +7,7 @@ use libc::STDIN_FILENO;
 use libc::{close, dup, dup2, pipe, STDERR_FILENO, STDOUT_FILENO};
 use rand::prelude::SliceRandom;
 use rand::Rng;
+use similar::TextDiff;
 use std::ffi::OsString;
 use std::io::{Seek, SeekFrom, Write};
 use std::os::fd::{AsRawFd, RawFd};
@@ -321,12 +322,14 @@ pub fn compare_result(
         discrepancies.push("stdout differs");
         println!("Rust stdout: {}", rust_result.stdout);
         println!("GNU stdout: {}", gnu_result.stdout);
+        print_diff(&rust_result.stdout, &gnu_result.stdout);
         should_panic = true;
     }
     if rust_result.stderr.trim() != gnu_result.stderr.trim() {
         discrepancies.push("stderr differs");
         println!("Rust stderr: {}", rust_result.stderr);
         println!("GNU stderr: {}", gnu_result.stderr);
+        print_diff(&rust_result.stderr, &gnu_result.stderr);
         if fail_on_stderr_diff {
             should_panic = true;
         }
@@ -353,6 +356,16 @@ pub fn compare_result(
     }
 }
 
+/// When we have different outputs, print the diff
+fn print_diff(rust_output: &str, gnu_output: &str) {
+    println!("Diff=");
+    let diff = TextDiff::from_lines(rust_output, gnu_output);
+    for change in diff.iter_all_changes() {
+        print!("{}{}", change.tag(), change);
+    }
+    println!();
+}
+
 pub fn generate_random_string(max_length: usize) -> String {
     let mut rng = rand::thread_rng();
     let valid_utf8: Vec<char> = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789"

From e050fa9c8cb1f74cdfa929cc1e061b0be56ca2ee Mon Sep 17 00:00:00 2001
From: "renovate[bot]" <29139614+renovate[bot]@users.noreply.github.com>
Date: Mon, 22 Jan 2024 23:21:22 +0000
Subject: [PATCH 427/429] chore(deps): update rust crate chrono to ^0.4.32

---
 Cargo.lock | 6 +++---
 Cargo.toml | 2 +-
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 732e56efc4e..e8c0ce0ca28 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -238,14 +238,14 @@ checksum = "baf1de4339761588bc0619e3cbc0120ee582ebb74b53b4efbf79117bd2da40fd"
 
 [[package]]
 name = "chrono"
-version = "0.4.31"
+version = "0.4.32"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "7f2c685bad3eb3d45a01354cedb7d5faa66194d1d58ba6e267a8de788f79db38"
+checksum = "41daef31d7a747c5c847246f36de49ced6f7403b4cdabc807a97b5cc184cda7a"
 dependencies = [
  "android-tzdata",
  "iana-time-zone",
  "num-traits",
- "windows-targets 0.48.0",
+ "windows-targets 0.52.0",
 ]
 
 [[package]]
diff --git a/Cargo.toml b/Cargo.toml
index f63fae178cb..757cacf3492 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -263,7 +263,7 @@ binary-heap-plus = "0.5.0"
 bstr = "1.9"
 bytecount = "0.6.7"
 byteorder = "1.5.0"
-chrono = { version = "^0.4.31", default-features = false, features = [
+chrono = { version = "^0.4.32", default-features = false, features = [
   "std",
   "alloc",
   "clock",

From 150b287fe8ab268a6ef3fded5aa0e4ce3aa6cd2d Mon Sep 17 00:00:00 2001
From: Biplab Mochan Gartia <45629823+biplab5464@users.noreply.github.com>
Date: Wed, 24 Jan 2024 20:31:26 +0530
Subject: [PATCH 428/429] unexpand: allow multiple files & show error message
 if a directory is specified

* unexpand: should allow multiple files #5852 and unexpand: show error message if a directory is specified #5845

* test file added for #5845 #5852

* test case test_multiple_files improve

* cakebaker suggestion for a better code #5845 #5852

---------

Co-authored-by: biplab5464 <biplab5464@outlook.com>
---
 src/uu/unexpand/src/unexpand.rs | 18 +++++++++++++-----
 tests/by-util/test_unexpand.rs  | 32 ++++++++++++++++++++++++++++++++
 2 files changed, 45 insertions(+), 5 deletions(-)

diff --git a/src/uu/unexpand/src/unexpand.rs b/src/uu/unexpand/src/unexpand.rs
index 66d9a0187b6..7336376eb6c 100644
--- a/src/uu/unexpand/src/unexpand.rs
+++ b/src/uu/unexpand/src/unexpand.rs
@@ -11,11 +11,12 @@ use std::fmt;
 use std::fs::File;
 use std::io::{stdin, stdout, BufRead, BufReader, BufWriter, Read, Stdout, Write};
 use std::num::IntErrorKind;
+use std::path::Path;
 use std::str::from_utf8;
 use unicode_width::UnicodeWidthChar;
 use uucore::display::Quotable;
 use uucore::error::{FromIo, UError, UResult, USimpleError};
-use uucore::{crash_if_err, format_usage, help_about, help_usage};
+use uucore::{crash_if_err, format_usage, help_about, help_usage, show};
 
 const USAGE: &str = help_usage!("unexpand.md");
 const ABOUT: &str = help_about!("unexpand.md");
@@ -105,8 +106,8 @@ impl Options {
             && !matches.get_flag(options::FIRST_ONLY);
         let uflag = !matches.get_flag(options::NO_UTF8);
 
-        let files = match matches.get_one::<String>(options::FILE) {
-            Some(v) => vec![v.to_string()],
+        let files = match matches.get_many::<String>(options::FILE) {
+            Some(v) => v.cloned().collect(),
             None => vec!["-".to_owned()],
         };
 
@@ -211,7 +212,13 @@ pub fn uu_app() -> Command {
 
 fn open(path: &str) -> UResult<BufReader<Box<dyn Read + 'static>>> {
     let file_buf;
-    if path == "-" {
+    let filename = Path::new(path);
+    if filename.is_dir() {
+        Err(Box::new(USimpleError {
+            code: 1,
+            message: format!("{}: Is a directory", filename.display()),
+        }))
+    } else if path == "-" {
         Ok(BufReader::new(Box::new(stdin()) as Box<dyn Read>))
     } else {
         file_buf = File::open(path).map_err_context(|| path.to_string())?;
@@ -401,7 +408,8 @@ fn unexpand(options: &Options) -> UResult<()> {
         let mut fh = match open(file) {
             Ok(reader) => reader,
             Err(err) => {
-                return Err(USimpleError::new(1, err.to_string()));
+                show!(err);
+                continue;
             }
         };
 
diff --git a/tests/by-util/test_unexpand.rs b/tests/by-util/test_unexpand.rs
index ddbe3343efa..c1310be01a3 100644
--- a/tests/by-util/test_unexpand.rs
+++ b/tests/by-util/test_unexpand.rs
@@ -2,6 +2,7 @@
 //
 // For the full copyright and license information, please view the LICENSE
 // file that was distributed with this source code.
+// spell-checker:ignore contenta
 use crate::common::util::TestScenario;
 
 #[test]
@@ -235,3 +236,34 @@ fn test_tabs_shortcut_with_too_large_size() {
 
     new_ucmd!().arg(arg).fails().stderr_contains(expected_error);
 }
+
+#[test]
+fn test_is_directory() {
+    let (at, mut ucmd) = at_and_ucmd!();
+    let dir_name = "dir";
+    at.mkdir(dir_name);
+
+    ucmd.arg(dir_name)
+        .fails()
+        .stderr_contains(format!("unexpand: {}: Is a directory", dir_name));
+}
+
+#[test]
+fn test_multiple_files() {
+    let (at, mut ucmd) = at_and_ucmd!();
+
+    at.write("file", "content");
+    at.write("file1", "a        b");
+
+    ucmd.args(&["file", "file1"])
+        .succeeds()
+        .stdout_is("contenta        b");
+}
+
+#[test]
+fn test_one_nonexisting_file() {
+    new_ucmd!()
+        .arg("asdf.txt")
+        .fails()
+        .stderr_contains("asdf.txt: No such file or directory");
+}

From 169364044677bdea1e7d497fc638f947fd29c460 Mon Sep 17 00:00:00 2001
From: Sylvestre Ledru <sylvestre@debian.org>
Date: Wed, 24 Jan 2024 21:33:25 +0100
Subject: [PATCH 429/429] whoami: add missing feature

---
 src/uu/whoami/Cargo.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/uu/whoami/Cargo.toml b/src/uu/whoami/Cargo.toml
index 3d2abb034a7..7e47898efa2 100644
--- a/src/uu/whoami/Cargo.toml
+++ b/src/uu/whoami/Cargo.toml
@@ -16,7 +16,7 @@ path = "src/whoami.rs"
 
 [dependencies]
 clap = { workspace = true }
-uucore = { workspace = true, features = ["entries"] }
+uucore = { workspace = true, features = ["entries", "process"] }
 
 [target.'cfg(target_os = "windows")'.dependencies]
 windows-sys = { workspace = true, features = [