forked from pool/glibc
Andreas Schwab
c2c4c80482
- Update to glibc 2.28 * The localization data for ISO 14651 is updated to match the 2016 Edition 4 release of the standard; this matches data provided by Unicode 9.0.0 * Unicode 11.0.0 Support: Character encoding, character type info, and transliteration tables are all updated to Unicode 11.0.0, using generator scripts contributed by Mike FABIAN (Red Hat) * <math.h> functions that round their results to a narrower type are added from TS 18661-1:2014 and TS 18661-3:2015 * Two grammatical forms of month names are now supported * The renameat2 function has been added, a variant of the renameat function which has a flags argument * The statx function has been added, a variant of the fstatat64 function with an additional flags argument * IDN domain names in getaddrinfo and getnameinfo now use the system libidn2 library if installed * Parsing of dynamic string tokens in DT_RPATH, DT_RUNPATH, DT_NEEDED, DT_AUXILIARY, and DT_FILTER has been expanded to support the full range of ELF gABI expressions including such constructs as '$ORIGIN$ORIGIN' (if valid) * Support for ISO C threads (ISO/IEC 9899:2011) has been added. * The nonstandard header files <libio.h> and <_G_config.h> are no longer installed * The stdio functions 'getc' and 'putc' are no longer defined as macros * All stdio functions now treat end-of-file as a sticky condition * The macros 'major', 'minor', and 'makedev' are now only available from the header <sys/sysmacros.h> * The obsolete function ustat is no longer available to newly linked binaries; the headers <ustat.h> and <sys/ustat.h> have been removed * The obsolete function nfsservctl is no longer available to newly linked binaries OBS-URL: https://build.opensuse.org/request/show/627715 OBS-URL: https://build.opensuse.org/package/show/Base:System/glibc?expand=0&rev=509
479 lines
13 KiB
Diff
479 lines
13 KiB
Diff
Fix fnmatch handling of collating elements (BZ #17396, BZ #16976)
|
|
|
|
[BZ #16976]
|
|
[BZ #17396]
|
|
* posix/fnmatch_loop.c (internal_fnmatch, internal_fnwmatch): When
|
|
looking up collating elements, match against the (wide) character
|
|
sequence instead of the name. Correct alignment adjustment.
|
|
* posix/fnmatch.c: Don't include "../locale/elem-hash.h".
|
|
* posix/Makefile (tests): Add tst-fnmatch4 and tst-fnmatch5.
|
|
(LOCALES): Add cs_CZ.ISO-8859-2.
|
|
* posix/tst-fnmatch4.c: New file.
|
|
* posix/tst-fnmatch5.c: New file.
|
|
|
|
Index: glibc-2.27/posix/Makefile
|
|
===================================================================
|
|
--- glibc-2.27.orig/posix/Makefile
|
|
+++ glibc-2.27/posix/Makefile
|
|
@@ -92,6 +92,7 @@ tests := test-errno tstgetopt testfnm r
|
|
bug-getopt5 tst-getopt_long1 bug-regex34 bug-regex35 \
|
|
tst-pathconf tst-rxspencer-no-utf8 \
|
|
tst-fnmatch3 bug-regex36 \
|
|
+ tst-fnmatch4 tst-fnmatch5 \
|
|
tst-posix_spawn-fd tst-posix_spawn-setsid \
|
|
tst-posix_fadvise tst-posix_fadvise64 \
|
|
tst-sysconf-empty-chroot tst-glob_symlinks tst-fexecve \
|
|
@@ -165,7 +166,8 @@ $(objpfx)wordexp-tst.out: wordexp-tst.sh $(objpfx)wordexp-test
|
|
endif
|
|
|
|
LOCALES := cs_CZ.UTF-8 da_DK.ISO-8859-1 de_DE.ISO-8859-1 de_DE.UTF-8 \
|
|
- en_US.UTF-8 es_US.ISO-8859-1 es_US.UTF-8 ja_JP.EUC-JP tr_TR.UTF-8
|
|
+ en_US.UTF-8 es_US.ISO-8859-1 es_US.UTF-8 ja_JP.EUC-JP tr_TR.UTF-8 \
|
|
+ cs_CZ.ISO-8859-2
|
|
include ../gen-locales.mk
|
|
|
|
$(objpfx)bug-regex1.out: $(gen-locales)
|
|
Index: glibc-2.27/posix/fnmatch.c
|
|
===================================================================
|
|
--- glibc-2.27.orig/posix/fnmatch.c
|
|
+++ glibc-2.27/posix/fnmatch.c
|
|
@@ -53,7 +53,6 @@
|
|
we support a correct implementation only in glibc. */
|
|
#ifdef _LIBC
|
|
# include "../locale/localeinfo.h"
|
|
-# include "../locale/elem-hash.h"
|
|
# include "../locale/coll-lookup.h"
|
|
# include <shlib-compat.h>
|
|
|
|
Index: glibc-2.27/posix/fnmatch_loop.c
|
|
===================================================================
|
|
--- glibc-2.27.orig/posix/fnmatch_loop.c
|
|
+++ glibc-2.27/posix/fnmatch_loop.c
|
|
@@ -494,26 +494,12 @@ FCT (const CHAR *pattern, const CHAR *st
|
|
{
|
|
int32_t table_size;
|
|
const int32_t *symb_table;
|
|
-# if WIDE_CHAR_VERSION
|
|
- char str[c1];
|
|
- unsigned int strcnt;
|
|
-# else
|
|
-# define str (startp + 1)
|
|
-# endif
|
|
const unsigned char *extra;
|
|
int32_t idx;
|
|
int32_t elem;
|
|
- int32_t second;
|
|
- int32_t hash;
|
|
-
|
|
# if WIDE_CHAR_VERSION
|
|
- /* We have to convert the name to a single-byte
|
|
- string. This is possible since the names
|
|
- consist of ASCII characters and the internal
|
|
- representation is UCS4. */
|
|
- for (strcnt = 0; strcnt < c1; ++strcnt)
|
|
- str[strcnt] = startp[1 + strcnt];
|
|
-#endif
|
|
+ int32_t *wextra;
|
|
+# endif
|
|
|
|
table_size =
|
|
_NL_CURRENT_WORD (LC_COLLATE,
|
|
@@ -525,71 +511,55 @@ FCT (const CHAR *pattern, const CHAR *st
|
|
_NL_CURRENT (LC_COLLATE,
|
|
_NL_COLLATE_SYMB_EXTRAMB);
|
|
|
|
- /* Locate the character in the hashing table. */
|
|
- hash = elem_hash (str, c1);
|
|
-
|
|
- idx = 0;
|
|
- elem = hash % table_size;
|
|
- if (symb_table[2 * elem] != 0)
|
|
- {
|
|
- second = hash % (table_size - 2) + 1;
|
|
-
|
|
- do
|
|
- {
|
|
- /* First compare the hashing value. */
|
|
- if (symb_table[2 * elem] == hash
|
|
- && (c1
|
|
- == extra[symb_table[2 * elem + 1]])
|
|
- && memcmp (str,
|
|
- &extra[symb_table[2 * elem
|
|
- + 1]
|
|
- + 1], c1) == 0)
|
|
- {
|
|
- /* Yep, this is the entry. */
|
|
- idx = symb_table[2 * elem + 1];
|
|
- idx += 1 + extra[idx];
|
|
- break;
|
|
- }
|
|
-
|
|
- /* Next entry. */
|
|
- elem += second;
|
|
- }
|
|
- while (symb_table[2 * elem] != 0);
|
|
- }
|
|
+ for (elem = 0; elem < table_size; elem++)
|
|
+ if (symb_table[2 * elem] != 0)
|
|
+ {
|
|
+ idx = symb_table[2 * elem + 1];
|
|
+ /* Skip the name of collating element. */
|
|
+ idx += 1 + extra[idx];
|
|
+# if WIDE_CHAR_VERSION
|
|
+ /* Skip the byte sequence of the
|
|
+ collating element. */
|
|
+ idx += 1 + extra[idx];
|
|
+ /* Adjust for the alignment. */
|
|
+ idx = (idx + 3) & ~3;
|
|
+
|
|
+ wextra = (int32_t *) &extra[idx + 4];
|
|
+
|
|
+ if (/* Compare the length of the sequence. */
|
|
+ c1 == wextra[0]
|
|
+ /* Compare the wide char sequence. */
|
|
+ && memcmp (startp + 1, &wextra[1],
|
|
+ c1 * sizeof (UCHAR)) == 0)
|
|
+ /* Yep, this is the entry. */
|
|
+ break;
|
|
+# else
|
|
+ if (/* Compare the length of the sequence. */
|
|
+ c1 == extra[idx]
|
|
+ /* Compare the byte sequence. */
|
|
+ && memcmp (startp + 1,
|
|
+ &extra[idx + 1], c1) == 0)
|
|
+ /* Yep, this is the entry. */
|
|
+ break;
|
|
+# endif
|
|
+ }
|
|
|
|
- if (symb_table[2 * elem] != 0)
|
|
+ if (elem < table_size)
|
|
{
|
|
/* Compare the byte sequence but only if
|
|
this is not part of a range. */
|
|
-# if WIDE_CHAR_VERSION
|
|
- int32_t *wextra;
|
|
+ if (! is_range
|
|
|
|
- idx += 1 + extra[idx];
|
|
- /* Adjust for the alignment. */
|
|
- idx = (idx + 3) & ~3;
|
|
-
|
|
- wextra = (int32_t *) &extra[idx + 4];
|
|
-# endif
|
|
-
|
|
- if (! is_range)
|
|
- {
|
|
# if WIDE_CHAR_VERSION
|
|
- for (c1 = 0;
|
|
- (int32_t) c1 < wextra[idx];
|
|
- ++c1)
|
|
- if (n[c1] != wextra[1 + c1])
|
|
- break;
|
|
-
|
|
- if ((int32_t) c1 == wextra[idx])
|
|
- goto matched;
|
|
+ && memcmp (n, &wextra[1],
|
|
+ c1 * sizeof (UCHAR)) == 0
|
|
# else
|
|
- for (c1 = 0; c1 < extra[idx]; ++c1)
|
|
- if (n[c1] != extra[1 + c1])
|
|
- break;
|
|
-
|
|
- if (c1 == extra[idx])
|
|
- goto matched;
|
|
+ && memcmp (n, &extra[idx + 1], c1) == 0
|
|
# endif
|
|
+ )
|
|
+ {
|
|
+ n += c1 - 1;
|
|
+ goto matched;
|
|
}
|
|
|
|
/* Get the collation sequence value. */
|
|
@@ -597,9 +567,9 @@ FCT (const CHAR *pattern, const CHAR *st
|
|
# if WIDE_CHAR_VERSION
|
|
cold = wextra[1 + wextra[idx]];
|
|
# else
|
|
- /* Adjust for the alignment. */
|
|
idx += 1 + extra[idx];
|
|
- idx = (idx + 3) & ~4;
|
|
+ /* Adjust for the alignment. */
|
|
+ idx = (idx + 3) & ~3;
|
|
cold = *((int32_t *) &extra[idx]);
|
|
# endif
|
|
|
|
@@ -609,10 +579,10 @@ FCT (const CHAR *pattern, const CHAR *st
|
|
{
|
|
/* No valid character. Match it as a
|
|
single byte. */
|
|
- if (!is_range && *n == str[0])
|
|
+ if (!is_range && *n == startp[1])
|
|
goto matched;
|
|
|
|
- cold = str[0];
|
|
+ cold = startp[1];
|
|
c = *p++;
|
|
}
|
|
else
|
|
@@ -620,7 +590,6 @@ FCT (const CHAR *pattern, const CHAR *st
|
|
}
|
|
}
|
|
else
|
|
-# undef str
|
|
#endif
|
|
{
|
|
c = FOLD (c);
|
|
@@ -712,25 +681,11 @@ FCT (const CHAR *pattern, const CHAR *st
|
|
{
|
|
int32_t table_size;
|
|
const int32_t *symb_table;
|
|
-# if WIDE_CHAR_VERSION
|
|
- char str[c1];
|
|
- unsigned int strcnt;
|
|
-# else
|
|
-# define str (startp + 1)
|
|
-# endif
|
|
const unsigned char *extra;
|
|
int32_t idx;
|
|
int32_t elem;
|
|
- int32_t second;
|
|
- int32_t hash;
|
|
-
|
|
# if WIDE_CHAR_VERSION
|
|
- /* We have to convert the name to a single-byte
|
|
- string. This is possible since the names
|
|
- consist of ASCII characters and the internal
|
|
- representation is UCS4. */
|
|
- for (strcnt = 0; strcnt < c1; ++strcnt)
|
|
- str[strcnt] = startp[1 + strcnt];
|
|
+ int32_t *wextra;
|
|
# endif
|
|
|
|
table_size =
|
|
@@ -743,51 +698,44 @@ FCT (const CHAR *pattern, const CHAR *st
|
|
_NL_CURRENT (LC_COLLATE,
|
|
_NL_COLLATE_SYMB_EXTRAMB);
|
|
|
|
- /* Locate the character in the hashing
|
|
- table. */
|
|
- hash = elem_hash (str, c1);
|
|
-
|
|
- idx = 0;
|
|
- elem = hash % table_size;
|
|
- if (symb_table[2 * elem] != 0)
|
|
- {
|
|
- second = hash % (table_size - 2) + 1;
|
|
-
|
|
- do
|
|
- {
|
|
- /* First compare the hashing value. */
|
|
- if (symb_table[2 * elem] == hash
|
|
- && (c1
|
|
- == extra[symb_table[2 * elem + 1]])
|
|
- && memcmp (str,
|
|
- &extra[symb_table[2 * elem + 1]
|
|
- + 1], c1) == 0)
|
|
- {
|
|
- /* Yep, this is the entry. */
|
|
- idx = symb_table[2 * elem + 1];
|
|
- idx += 1 + extra[idx];
|
|
- break;
|
|
- }
|
|
-
|
|
- /* Next entry. */
|
|
- elem += second;
|
|
- }
|
|
- while (symb_table[2 * elem] != 0);
|
|
- }
|
|
-
|
|
- if (symb_table[2 * elem] != 0)
|
|
- {
|
|
- /* Compare the byte sequence but only if
|
|
- this is not part of a range. */
|
|
+ for (elem = 0; elem < table_size; elem++)
|
|
+ if (symb_table[2 * elem] != 0)
|
|
+ {
|
|
+ idx = symb_table[2 * elem + 1];
|
|
+ /* Skip the name of collating
|
|
+ element. */
|
|
+ idx += 1 + extra[idx];
|
|
# if WIDE_CHAR_VERSION
|
|
- int32_t *wextra;
|
|
-
|
|
- idx += 1 + extra[idx];
|
|
- /* Adjust for the alignment. */
|
|
- idx = (idx + 3) & ~4;
|
|
-
|
|
- wextra = (int32_t *) &extra[idx + 4];
|
|
+ /* Skip the byte sequence of the
|
|
+ collating element. */
|
|
+ idx += 1 + extra[idx];
|
|
+ /* Adjust for the alignment. */
|
|
+ idx = (idx + 3) & ~3;
|
|
+
|
|
+ wextra = (int32_t *) &extra[idx + 4];
|
|
+
|
|
+ if (/* Compare the length of the
|
|
+ sequence. */
|
|
+ c1 == wextra[0]
|
|
+ /* Compare the wide char sequence. */
|
|
+ && memcmp (startp + 1, &wextra[1],
|
|
+ c1 * sizeof (int32_t)) == 0)
|
|
+ /* Yep, this is the entry. */
|
|
+ break;
|
|
+# else
|
|
+ if (/* Compare the length of the
|
|
+ sequence. */
|
|
+ c1 == extra[idx]
|
|
+ /* Compare the byte sequence. */
|
|
+ && memcmp (startp + 1,
|
|
+ &extra[idx + 1], c1) == 0)
|
|
+ /* Yep, this is the entry. */
|
|
+ break;
|
|
# endif
|
|
+ }
|
|
+
|
|
+ if (elem < table_size)
|
|
+ {
|
|
/* Get the collation sequence value. */
|
|
is_seqval = 1;
|
|
# if WIDE_CHAR_VERSION
|
|
@@ -795,19 +743,18 @@ FCT (const CHAR *pattern, const CHAR *st
|
|
# else
|
|
/* Adjust for the alignment. */
|
|
idx += 1 + extra[idx];
|
|
- idx = (idx + 3) & ~4;
|
|
+ idx = (idx + 3) & ~3;
|
|
cend = *((int32_t *) &extra[idx]);
|
|
# endif
|
|
}
|
|
- else if (symb_table[2 * elem] != 0 && c1 == 1)
|
|
+ else if (c1 == 1)
|
|
{
|
|
- cend = str[0];
|
|
+ cend = startp[1];
|
|
c = *p++;
|
|
}
|
|
else
|
|
return FNM_NOMATCH;
|
|
}
|
|
-# undef str
|
|
}
|
|
else
|
|
{
|
|
Index: glibc-2.27/posix/tst-fnmatch4.c
|
|
===================================================================
|
|
--- /dev/null
|
|
+++ glibc-2.27/posix/tst-fnmatch4.c
|
|
@@ -0,0 +1,51 @@
|
|
+/* Test for fnmatch matching of the collating element [.ch.]
|
|
+ Copyright (C) 2015 Free Software Foundation, Inc.
|
|
+ This file is part of the GNU C Library.
|
|
+
|
|
+ The GNU C Library is free software; you can redistribute it and/or
|
|
+ modify it under the terms of the GNU Lesser General Public
|
|
+ License as published by the Free Software Foundation; either
|
|
+ version 2.1 of the License, or (at your option) any later version.
|
|
+
|
|
+ The GNU C Library is distributed in the hope that it will be useful,
|
|
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
+ Lesser General Public License for more details.
|
|
+
|
|
+ You should have received a copy of the GNU Lesser General Public
|
|
+ License along with the GNU C Library; if not, see
|
|
+ <http://www.gnu.org/licenses/>. */
|
|
+
|
|
+#include <stdio.h>
|
|
+#include <locale.h>
|
|
+#include <fnmatch.h>
|
|
+
|
|
+static int
|
|
+do_test_locale (const char *locale)
|
|
+{
|
|
+ const char *pattern = "[[.ch.]]";
|
|
+
|
|
+ if (setlocale (LC_ALL, locale) == NULL)
|
|
+ {
|
|
+ printf ("could not set locale %s\n", locale);
|
|
+ return 1;
|
|
+ }
|
|
+
|
|
+ if (fnmatch (pattern, "ch", 0) != 0)
|
|
+ {
|
|
+ printf ("%s didn't match in locale %s\n", pattern, locale);
|
|
+ return 1;
|
|
+ }
|
|
+
|
|
+ return 0;
|
|
+}
|
|
+
|
|
+static int
|
|
+do_test (void)
|
|
+{
|
|
+ return (do_test_locale ("cs_CZ.ISO-8859-2")
|
|
+ || do_test_locale ("cs_CZ.UTF-8"));
|
|
+}
|
|
+
|
|
+#define TEST_FUNCTION do_test ()
|
|
+#include "../test-skeleton.c"
|
|
Index: glibc-2.27/posix/tst-fnmatch5.c
|
|
===================================================================
|
|
--- /dev/null
|
|
+++ glibc-2.27/posix/tst-fnmatch5.c
|
|
@@ -0,0 +1,53 @@
|
|
+/* Test for fnmatch handling of an overlong, invalid collating element
|
|
+ Copyright (C) 2015 Free Software Foundation, Inc.
|
|
+ This file is part of the GNU C Library.
|
|
+
|
|
+ The GNU C Library is free software; you can redistribute it and/or
|
|
+ modify it under the terms of the GNU Lesser General Public
|
|
+ License as published by the Free Software Foundation; either
|
|
+ version 2.1 of the License, or (at your option) any later version.
|
|
+
|
|
+ The GNU C Library is distributed in the hope that it will be useful,
|
|
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
+ Lesser General Public License for more details.
|
|
+
|
|
+ You should have received a copy of the GNU Lesser General Public
|
|
+ License along with the GNU C Library; if not, see
|
|
+ <http://www.gnu.org/licenses/>. */
|
|
+
|
|
+#include <fnmatch.h>
|
|
+#include <locale.h>
|
|
+#include <stdio.h>
|
|
+#include <string.h>
|
|
+
|
|
+#define LENGTH 20000000
|
|
+
|
|
+char pattern[LENGTH + 7];
|
|
+
|
|
+static int
|
|
+do_test (void)
|
|
+{
|
|
+ if (setlocale (LC_ALL, "en_US.UTF-8") == NULL)
|
|
+ {
|
|
+ puts ("could not set locale");
|
|
+ return 1;
|
|
+ }
|
|
+ pattern[0] = '[';
|
|
+ pattern[1] = '[';
|
|
+ pattern[2] = '.';
|
|
+ memset (pattern + 3, 'a', LENGTH);
|
|
+ pattern[LENGTH + 3] = '.';
|
|
+ pattern[LENGTH + 4] = ']';
|
|
+ pattern[LENGTH + 5] = ']';
|
|
+ int ret = fnmatch (pattern, "a", 0);
|
|
+ if (ret == 0)
|
|
+ {
|
|
+ puts ("fnmatch returned 0 for invalid pattern");
|
|
+ return 1;
|
|
+ }
|
|
+ return 0;
|
|
+}
|
|
+
|
|
+#define TEST_FUNCTION do_test ()
|
|
+#include "../test-skeleton.c"
|