https://sourceware.org/git/gitweb.cgi?p=newlib-cygwin.git;h=e18542110635cd1aa0ee754987c501002320cd2b
commit e18542110635cd1aa0ee754987c501002320cd2b Author: Corinna Vinschen <cori...@vinschen.de> Date: Tue Apr 12 15:06:05 2016 +0200 strxfrm/wcsxfrm: Always return length of the transformed string Cygwin's strxfrm/wcsfrm treated a too short output buffer as an error condition and always returned the size value provided as third parameter. This is not as it's documented in POSIX.1-2008. Rather, the only error condition is an invalid input string(*). Other than that, the functions are supposed to return the length of the resulting sort key, even if the output buffer is too small. In the latter case the content of the output array is unspecified, but it's the job of the application to check that the return value is greater or equal to the provided buffer size. (*) We have to make an exception in Cygwin: strxfrm has to call the UNICODE function LCMapStringW for reasons outlined in a source comment. If the incoming multibyte string is so large that we fail to malloc the space required to convert it to a wchar_t string, we have to ser errno as well since we have nothing to call LCMapStringW with. * nlsfuncs.cc (wcsxfrm): Fix expression computing offset of trailing wchar_t NUL. Compute correct return value even if output buffer is too small. (strxfrm): Handle failing malloc. Compute correct return value even if output buffer is too small. Signed-off-by: Corinna Vinschen <cori...@vinschen.de> Diff: --- winsup/cygwin/nlsfuncs.cc | 36 ++++++++++++++++++++++++------------ 1 file changed, 24 insertions(+), 12 deletions(-) diff --git a/winsup/cygwin/nlsfuncs.cc b/winsup/cygwin/nlsfuncs.cc index 9dbd9b1..172188d 100644 --- a/winsup/cygwin/nlsfuncs.cc +++ b/winsup/cygwin/nlsfuncs.cc @@ -1271,21 +1271,27 @@ wcsxfrm (wchar_t *__restrict ws1, const wchar_t *__restrict ws2, size_t wsn) the result is wchar_t-NUL terminated. */ if (ret) { - ret = (ret + 1) / sizeof (wchar_t); - if (ret >= wsn) - return wsn; - ws1[ret] = L'\0'; + ret /= sizeof (wchar_t); + if (ret < wsn) + ws1[ret] = L'\0'; return ret; } if (GetLastError () != ERROR_INSUFFICIENT_BUFFER) set_errno (EINVAL); + else + { + ret = LCMapStringW (collate_lcid, LCMAP_SORTKEY | LCMAP_BYTEREV, ws2, -1, + NULL, 0); + if (ret) + wsn = ret / sizeof (wchar_t); + } return wsn; } extern "C" size_t strxfrm (char *__restrict s1, const char *__restrict s2, size_t sn) { - size_t ret; + size_t ret = 0; size_t n2; wchar_t *ws2; tmp_pathbuf tp; @@ -1297,17 +1303,23 @@ strxfrm (char *__restrict s1, const char *__restrict s2, size_t sn) n2 = lc_mbstowcs (collate_mbtowc, collate_charset, NULL, s2, 0) + 1; ws2 = (n2 > NT_MAX_PATH ? (wchar_t *) malloc (n2 * sizeof (wchar_t)) : tp.w_get ()); - lc_mbstowcs (collate_mbtowc, collate_charset, ws2, s2, n2); - /* The sort key is a NUL-terminated byte string. */ - ret = LCMapStringW (collate_lcid, LCMAP_SORTKEY, ws2, -1, (PWCHAR) s1, sn); - if (n2 > NT_MAX_PATH) - free (ws2); + if (ws2) + { + lc_mbstowcs (collate_mbtowc, collate_charset, ws2, s2, n2); + /* The sort key is a NUL-terminated byte string. */ + ret = LCMapStringW (collate_lcid, LCMAP_SORTKEY, ws2, -1, + (PWCHAR) s1, sn); + } if (ret == 0) { - if (GetLastError () != ERROR_INSUFFICIENT_BUFFER) + ret = sn + 1; + if (!ws2 || GetLastError () != ERROR_INSUFFICIENT_BUFFER) set_errno (EINVAL); - return sn; + else + ret = LCMapStringW (collate_lcid, LCMAP_SORTKEY, ws2, -1, NULL, 0); } + if (ws2 && n2 > NT_MAX_PATH) + free (ws2); /* LCMapStringW returns byte count including the terminating NUL character. strxfrm is supposed to return length excluding the NUL. */ return ret - 1;