This increases throughput on systems with unlocked stdio functions.
E.g., 2.5x in the following case:

    $ timeout 1m taskset 1 shuf -r -i 0-100 \
        | taskset 2 uniq -c \
        | taskset 3 pv -r > /dev/null
    [ 100MiB/s]
    $ timeout 1m taskset 1 shuf -r -i 0-100 \
        | taskset 2 uniq -c \
        | taskset 3 pv -r > /dev/null
    [ 246MiB/s]

* src/uniq.c: Include assure.h.
(writeline): Convert the value to a string by hand and use fwrite, which
may be unlocked, instead of printf.
* tests/uniq/uniq-c-width.sh: New test to verify the padding logic.
* tests/local.mk (all_tests): Add the test case.
* NEWS: Mention the improvement.
---
 NEWS                       |  4 ++++
 src/uniq.c                 | 19 ++++++++++++++++++-
 tests/local.mk             |  1 +
 tests/uniq/uniq-c-width.sh | 33 +++++++++++++++++++++++++++++++++
 4 files changed, 56 insertions(+), 1 deletion(-)
 create mode 100755 tests/uniq/uniq-c-width.sh

diff --git a/NEWS b/NEWS
index 613bda0a2..2ae329509 100644
--- a/NEWS
+++ b/NEWS
@@ -59,6 +59,10 @@ GNU coreutils NEWS                                    -*- 
outline -*-
   'sort' will now better use available memory and parallel operation
   when reading from unknown sized inputs like pipes.
 
+  'uniq -c' now operates up to 2.5x times faster on systems with unlocked stdio
+  functions.
+
+
 ** Build-related
 
   configure no longer accepts the --with-linux-crypto option, which allowed
diff --git a/src/uniq.c b/src/uniq.c
index 5834596f9..f91c4212c 100644
--- a/src/uniq.c
+++ b/src/uniq.c
@@ -23,6 +23,7 @@
 
 #include "system.h"
 #include "argmatch.h"
+#include "assure.h"
 #include "linebuffer.h"
 #include "fadvise.h"
 #include "mcel.h"
@@ -324,7 +325,23 @@ writeline (struct linebuffer const *line,
     return;
 
   if (count_occurrences)
-    printf ("%7jd ", linecount + 1);
+    {
+      char buf[7 + INT_BUFSIZE_BOUND (intmax_t)];
+      char *end = buf + sizeof buf;
+      char *p = end;
+      *--p = ' ';
+      intmax_t i = linecount + 1;
+      affirm (0 < i);
+      do
+        *--p = '0' + i % 10;
+      while ((i /= 10));
+      /* 7 characters, padded with spaces if LINECOUNT + 1 is too small.  */
+      while (end - p < 8)
+        *--p = ' ';
+      const idx_t nbytes = end - p;
+      if (fwrite (p, sizeof (char), nbytes, stdout) != nbytes)
+        write_error ();
+    }
 
   if (fwrite (line->buffer, sizeof (char), line->length, stdout)
       != line->length)
diff --git a/tests/local.mk b/tests/local.mk
index 154b591ce..0001534ac 100644
--- a/tests/local.mk
+++ b/tests/local.mk
@@ -531,6 +531,7 @@ all_tests =                                 \
   tests/uniq/uniq.pl                           \
   tests/uniq/uniq-perf.sh                      \
   tests/uniq/uniq-collate.sh                   \
+  tests/uniq/uniq-c-width.sh                   \
   tests/misc/xattr.sh                          \
   tests/misc/yes.sh                            \
   tests/tail/wait.sh                           \
diff --git a/tests/uniq/uniq-c-width.sh b/tests/uniq/uniq-c-width.sh
new file mode 100755
index 000000000..27f8eef0a
--- /dev/null
+++ b/tests/uniq/uniq-c-width.sh
@@ -0,0 +1,33 @@
+#!/bin/sh
+# Test 'uniq -c' with various integer widths.
+
+# Copyright (C) 2026 Free Software Foundation, Inc.
+
+# This program is free software: you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# (at your option) any later version.
+
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+
+# You should have received a copy of the GNU General Public License
+# along with this program.  If not, see <https://www.gnu.org/licenses/>.
+
+. "${srcdir=.}/tests/init.sh"; path_prepend_ ./src
+print_ver_ uniq
+expensive_
+
+count=$(shuf -i 10000000-99999999 -n 1) || framework_failure_
+
+while test $count -gt 0; do
+  printf '%7d y\n' $count >exp || framework_failure_
+  yes | head -n $count | uniq -c >out 2>err || fail=1
+  compare exp out || fail=1
+  compare /dev/null err || fail=1
+  count=$((count / 10))
+done
+
+Exit $fail
-- 
2.54.0


Reply via email to