I was looking at changing announce-gen to use SHA-256 and SHA3-256
instead of SHA-1 and SHA-256. That lead me to discovering the following:
$ cksum -a sha3 --length=256 --base64 --untagged \
Makefile > Makefile.sum
$ cksum -a sha3 --check Makefile.sum
cksum: Makefile.sum: no properly formatted checksum lines found
The same issue exists for --algorithm=sha2. This patch fixes it:
$ ./src/cksum -a sha3 --check Makefile.sum
Makefile: OK
$ sed 's|[[:graph:]] Makefile$| Makefile|g' \
Makefile.sum > truncated
$ ./src/cksum -a sha3 --check truncated
cksum: truncated: no properly formatted checksum lines found
I left the behavior the same for blake2b since 'b2sum' does not support
--base64. I'm not sure if 'cksum -a blake2b' and 'b2sum' should differ
in this case...
Collin
>From bd5afe3ada0fadc4b47b27725dbf06ee0f50999e Mon Sep 17 00:00:00 2001
Message-ID: <bd5afe3ada0fadc4b47b27725dbf06ee0f50999e.1759624110.git.collin.fu...@gmail.com>
From: Collin Funk <[email protected]>
Date: Sat, 4 Oct 2025 17:18:01 -0700
Subject: [PATCH] cksum: allow --algorithm={sha2,sha3} --check to work on
base64
* NEWS: Mention the bug.
* src/digest.c (split_3): Check for the number of base64 characters.
* tests/cksum/cksum-base64-untagged.sh: New file.
* tests/local.mk (all_tests): Add the new test.
---
NEWS | 5 ++++
src/digest.c | 22 ++++++++++++--
tests/cksum/cksum-base64-untagged.sh | 43 ++++++++++++++++++++++++++++
tests/local.mk | 1 +
4 files changed, 68 insertions(+), 3 deletions(-)
create mode 100755 tests/cksum/cksum-base64-untagged.sh
diff --git a/NEWS b/NEWS
index b8c4ed4ef..2fa8464dd 100644
--- a/NEWS
+++ b/NEWS
@@ -15,6 +15,11 @@ GNU coreutils NEWS -*- outline -*-
that use the GNU extension /NUM or +NUM formats.
[bug introduced in coreutils-8.28]
+ 'cksum --algorithm={sha2,sha3} --check' can now operate on files
+ generated using 'cksum --algorithm={sha2,sha3} --base64 --untagged'.
+ [bug introduced in coreutils-9.8]
+
+
** Improvements
wc -l now operates 10% faster on hosts that support AVX512 instructions.
diff --git a/src/digest.c b/src/digest.c
index ce0e222e1..2f6daf23a 100644
--- a/src/digest.c
+++ b/src/digest.c
@@ -930,15 +930,31 @@ split_3 (char *s, size_t s_len,
# endif
unsigned char const *hp = *digest;
digest_hex_bytes = 0;
- while (c_isxdigit (*hp++))
- digest_hex_bytes++;
+ for (; c_isxdigit (*hp); ++hp, ++digest_hex_bytes)
+ ;
# if HASH_ALGO_CKSUM
+ /* Check the number of base64 characters. This works because the hexadecimal
+ character set is a subset of the base64 character set. */
+ size_t digest_base64_bytes = digest_hex_bytes;
+ for (; isubase64 (*hp) || *hp == '='; ++hp, ++digest_base64_bytes)
+ ;
if ((cksum_algorithm == sha2 || cksum_algorithm == sha3)
&& digest_hex_bytes / 2 != SHA224_DIGEST_SIZE
&& digest_hex_bytes / 2 != SHA256_DIGEST_SIZE
&& digest_hex_bytes / 2 != SHA384_DIGEST_SIZE
&& digest_hex_bytes / 2 != SHA512_DIGEST_SIZE)
- return false;
+ {
+ if (digest_base64_bytes == BASE64_LENGTH (SHA224_DIGEST_SIZE))
+ digest_hex_bytes = SHA224_DIGEST_SIZE * 2;
+ else if (digest_base64_bytes == BASE64_LENGTH (SHA256_DIGEST_SIZE))
+ digest_hex_bytes = SHA256_DIGEST_SIZE * 2;
+ else if (digest_base64_bytes == BASE64_LENGTH (SHA384_DIGEST_SIZE))
+ digest_hex_bytes = SHA384_DIGEST_SIZE * 2;
+ else if (digest_base64_bytes == BASE64_LENGTH (SHA512_DIGEST_SIZE))
+ digest_hex_bytes = SHA512_DIGEST_SIZE * 2;
+ else
+ return false;
+ }
# endif
if (digest_hex_bytes < 2 || digest_hex_bytes % 2
|| DIGEST_MAX_LEN * 2 < digest_hex_bytes)
diff --git a/tests/cksum/cksum-base64-untagged.sh b/tests/cksum/cksum-base64-untagged.sh
new file mode 100755
index 000000000..0e2eb9cb8
--- /dev/null
+++ b/tests/cksum/cksum-base64-untagged.sh
@@ -0,0 +1,43 @@
+#!/bin/sh
+# Test that cksum can guess the digest length from base64 checksums.
+
+# Copyright (C) 2025 Free Software Foundation, Inc.
+
+# This program is free software: you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# (at your option) any later version.
+
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+# GNU General Public License for more details.
+
+# You should have received a copy of the GNU General Public License
+# along with this program. If not, see <https://www.gnu.org/licenses/>.
+
+. "${srcdir=.}/tests/init.sh"; path_prepend_ ./src
+print_ver_ cksum
+getlimits_
+
+echo 'test input' > inp
+echo 'inp: OK' > expout
+echo 'cksum: truncated: no properly formatted checksum lines found' > experr
+
+for algorithm in sha2 sha3; do
+ for length in 224 256 384 512; do
+ # Create files with base64 checksums in the untagged format.
+ cksum -a $algorithm --length $length --base64 --untagged inp \
+ > check || fail=1
+ # Check that the length can be determined from the base64 checksum.
+ cksum -a $algorithm --check check > out || fail=1
+ compare expout out || fail=1
+ # Check that only valid lengths are supported.
+ sed 's|[[:graph:]] inp$| inp|g' check > truncated || fail=1
+ cp truncated $HOME
+ returns_ 1 cksum -a $algorithm --check truncated 2> err || fail=1
+ compare experr err || fail=1
+ done
+done
+
+Exit $fail
diff --git a/tests/local.mk b/tests/local.mk
index 19bc194fb..52184b7ac 100644
--- a/tests/local.mk
+++ b/tests/local.mk
@@ -305,6 +305,7 @@ all_tests = \
tests/cksum/cksum-a.sh \
tests/cksum/cksum-c.sh \
tests/cksum/cksum-base64.pl \
+ tests/cksum/cksum-base64-untagged.sh \
tests/cksum/cksum-raw.sh \
tests/misc/comm.pl \
tests/csplit/csplit.sh \
--
2.51.0