From 2d0aea11b0637e7ad3c5df6da3395a8248416811 Mon Sep 17 00:00:00 2001 From: Ulrich Drepper Date: Thu, 15 Feb 2001 22:27:29 +0000 Subject: Update. 2001-02-15 Jakub Jelinek * posix/regex.c (init_syntax_once): Add prototype. (TRANSLATE): If MBS_SUPPORT, translate all characters up to '\xff'. (re_search_2): Avoid warning. (count_mbs_length): Add prototype. * posix/bug-regex3.c: New file. * posix/Makefile (tests): Add bug-regex3. --- ChangeLog | 9 +++++++++ localedata/ChangeLog | 7 +++++++ localedata/locales/i18n | 6 +++--- posix/Makefile | 2 +- posix/bug-regex3.c | 44 ++++++++++++++++++++++++++++++++++++++++++++ posix/regex.c | 15 +++++++++++---- 6 files changed, 75 insertions(+), 8 deletions(-) create mode 100644 posix/bug-regex3.c diff --git a/ChangeLog b/ChangeLog index cf9187cb02..d2614717b6 100644 --- a/ChangeLog +++ b/ChangeLog @@ -1,3 +1,12 @@ +2001-02-15 Jakub Jelinek + + * posix/regex.c (init_syntax_once): Add prototype. + (TRANSLATE): If MBS_SUPPORT, translate all characters up to '\xff'. + (re_search_2): Avoid warning. + (count_mbs_length): Add prototype. + * posix/bug-regex3.c: New file. + * posix/Makefile (tests): Add bug-regex3. + 2001-02-15 Ulrich Drepper * stdio-common/Makefile (tests): Add tst-gets. diff --git a/localedata/ChangeLog b/localedata/ChangeLog index bd2debb725..d8a6996324 100644 --- a/localedata/ChangeLog +++ b/localedata/ChangeLog @@ -1,3 +1,10 @@ +2001-02-15 Ulrich Drepper + + * locales/i18n: Correct classification of Thai characters. This + differs from Unicode's tables but is in line with linguistic rules + in Thailand. + Patch by Theppitak Karoonboonyanan. + 2001-02-14 Ulrich Drepper * charmaps/GB18030: Update for Dec 2000 re-release of GB18030. 
diff --git a/localedata/locales/i18n b/localedata/locales/i18n index 96aec61e16..7c5319dd71 100644 --- a/localedata/locales/i18n +++ b/localedata/locales/i18n @@ -222,7 +222,7 @@ alpha / ..;..;..;;/ ..;/ % TABLE 26 THAI/ - ..;;;..;/ + ..;..;..;..;/ % TABLE 27 LAO/ ..;;..;;;/ ..;..;..;;;/ @@ -394,8 +394,8 @@ punct / ..;..;..;..;/ ..;..;..;..;/ ..;;..;;..;/ - ;..;..;;..;/ - ;..;..;;..;/ + ;..;..;;;;/ + ;..;;..;/ ..;..;..;..;/ ..;..;..;..;/ ;..;..;..;/ diff --git a/posix/Makefile b/posix/Makefile index c20fa389a2..e61bf6565a 100644 --- a/posix/Makefile +++ b/posix/Makefile @@ -69,7 +69,7 @@ tests := tstgetopt testfnm runtests runptests \ tst-preadwrite tst-preadwrite64 test-vfork regexbug1 \ tst-getlogin tst-mmap tst-getaddrinfo tst-truncate \ tst-truncate64 tst-fork tst-fnmatch tst-regexloc tst-dir \ - tst-chmod bug-regex1 bug-regex2 tst-gnuglob + tst-chmod bug-regex1 bug-regex2 bug-regex3 tst-gnuglob ifeq (yes,$(build-shared)) test-srcs := globtest tests += wordexp-test tst-exec tst-spawn diff --git a/posix/bug-regex3.c b/posix/bug-regex3.c new file mode 100644 index 0000000000..90da85a8be --- /dev/null +++ b/posix/bug-regex3.c @@ -0,0 +1,44 @@ +/* Test for case handling in regex. + Copyright (C) 2001 Free Software Foundation, Inc. + Contributed by Jakub Jelinek , 2001. + + The GNU C Library is free software; you can redistribute it and/or + modify it under the terms of the GNU Library General Public License as + published by the Free Software Foundation; either version 2 of the + License, or (at your option) any later version. + + The GNU C Library is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + Library General Public License for more details. + + You should have received a copy of the GNU Library General Public + License along with the GNU C Library; see the file COPYING.LIB. 
If not, + write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330, + Boston, MA 02111-1307, USA. */ + +#include +#include +#include +#include + + +int +main (void) +{ + regex_t re; + int n; + + n = regcomp (&re, "[a-bA-B]", REG_ICASE); + if (n != 0) + { + char buf[500]; + regerror (n, &re, buf, sizeof (buf)); + printf ("regcomp failed: %s\n", buf); + exit (1); + } + + regfree (&re); + + return 0; +} diff --git a/posix/regex.c b/posix/regex.c index 2b1a62b799..fc25bb0c14 100644 --- a/posix/regex.c +++ b/posix/regex.c @@ -290,6 +290,8 @@ extern char *re_syntax_table; static char re_syntax_table[CHAR_SET_SIZE]; +static void init_syntax_once PARAMS ((void)); + static void init_syntax_once () { @@ -1906,7 +1908,8 @@ static reg_errcode_t compile_range _RE_ARGS ((unsigned int range_start, #ifndef TRANSLATE # ifdef MBS_SUPPORT # define TRANSLATE(d) \ - (translate && (sizeof(d) <= 1)? (char) translate[(unsigned char) (d)] : (d)) + ((translate && ((US_CHAR_TYPE) (d)) <= 0xff) \ + ? (char) translate[(unsigned char) (d)] : (d)) #else # define TRANSLATE(d) \ (translate ? (char) translate[(unsigned char) (d)] : (d)) @@ -5058,9 +5061,9 @@ re_search_2 (bufp, string1, size1, string2, size2, startpos, range, regs, stop) } else /* Searching backwards. */ { - register char c = (size1 == 0 || startpos >= size1 - ? string2[startpos - size1] - : string1[startpos]); + register CHAR_TYPE c = (size1 == 0 || startpos >= size1 + ? string2[startpos - size1] + : string1[startpos]); if (!fastmap[(unsigned char) TRANSLATE (c)]) goto advance; @@ -5309,10 +5312,14 @@ weak_alias (__re_match_2, re_match_2) #endif #ifdef MBS_SUPPORT + +static int count_mbs_length PARAMS ((int *, int)); + /* This check the substring (from 0, to length) of the multibyte string, to which offset_buffer correspond. And count how many wchar_t_characters the substring occupy. We use offset_buffer to optimization. See convert_mbs_to_wcs. 
*/ + static int count_mbs_length(offset_buffer, length) int *offset_buffer; -- cgit v1.2.3