glibc/posix/tst-regexloc.c

47 lines
1.4 KiB
C
Raw Normal View History

/* Copyright (C) 2001-2018 Free Software Foundation, Inc.
2001-06-26 00:01:14 +00:00
This file is part of the GNU C Library.
The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
2001-06-26 00:01:14 +00:00
The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
2001-06-26 00:01:14 +00:00
You should have received a copy of the GNU Lesser General Public
License along with the GNU C Library; if not, see
<http://www.gnu.org/licenses/>. */
2001-06-26 00:01:14 +00:00
#include <sys/types.h>
#include <regex.h>
#include <locale.h>
#include <stdio.h>
static int
do_test (void)
{
regex_t re;
regmatch_t mat[1];
int res = 1;
if (setlocale (LC_ALL, "de_DE.ISO-8859-1") == NULL)
puts ("cannot set locale");
Fix test cases tst-fnmatch and tst-regexloc for the new iso14651_t1_common file. See: http://pubs.opengroup.org/onlinepubs/7908799/xbd/re.html > A range expression represents the set of collating elements that fall > between two elements in the current collation sequence, > inclusively. It is expressed as the starting point and the ending > point separated by a hyphen (-). > > Range expressions must not be used in portable applications because > their behaviour is dependent on the collating sequence. Ranges will be > treated according to the current collating sequence, and include such > characters that fall within the range based on that collating > sequence, regardless of character values. This, however, means that > the interpretation will differ depending on collating sequence. If, > for instance, one collating sequence defines ä as a variant of a, > while another defines it as a letter following z, then the expression > [ä-z] is valid in the first language and invalid in the second. Therefore, using [a-z] does not make much sense except in the C/POSIX locale. The new iso14651_t1_common lists upper case and lower case Latin characters in a different order than the old one which causes surprising results for example in the de_DE locale: [a-z] now includes A because A comes after a in iso14651_t1_common but does not include Z because that comes after z in iso14651_t1_common. * posix/tst-fnmatch.input: Fix results for range expressions for non C locales. * posix/tst-regexloc.c: Do not use a range expression for de_DE.ISO-8859-1 locale.
2018-01-23 16:29:36 +00:00
else if (regcomp (&re, "[abcdef]*", 0) != REG_NOERROR)
puts ("cannot compile expression \"[abcdef]*\"");
else if (regexec (&re, "abcdefCDEF", 1, mat, 0) == REG_NOMATCH)
puts ("no match");
else
{
printf ("match from %d to %d\n", mat[0].rm_so, mat[0].rm_eo);
res = mat[0].rm_so != 0 || mat[0].rm_eo != 6;
}
return res;
}
#define TEST_FUNCTION do_test ()
#include "../test-skeleton.c"