]> git.ipfire.org Git - thirdparty/glibc.git/blame - posix/bug-regex30.c
Fix ranges with multibyte characters as endpoints.
[thirdparty/glibc.git] / posix / bug-regex30.c
CommitLineData
815d8147
PB
1/* Russian regular expression tests.
2 Copyright (C) 2009 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
4 Contributed by Paolo Bonzini <pbonzini@redhat.com>, 2009.
5
6 The GNU C Library is free software; you can redistribute it and/or
7 modify it under the terms of the GNU Lesser General Public
8 License as published by the Free Software Foundation; either
9 version 2.1 of the License, or (at your option) any later version.
10
11 The GNU C Library is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
15
16 You should have received a copy of the GNU Lesser General Public
17 License along with the GNU C Library; if not, write to the Free
18 Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
19 02111-1307 USA. */
20
21#include <sys/types.h>
22#include <mcheck.h>
23#include <regex.h>
24#include <stdio.h>
25#include <stdlib.h>
26#include <locale.h>
27
28/* Tests supposed to match. */
29struct
30{
31 const char *pattern;
32 const char *string;
33 int flags, nmatch;
34 regmatch_t rm[5];
35} tests[] = {
36 /* U+0413 \xd0\x93 CYRILLIC CAPITAL LETTER GHE
37 U+0420 \xd0\xa0 CYRILLIC CAPITAL LETTER ER
38 U+0430 \xd0\xb0 CYRILLIC SMALL LETTER A
39 U+0433 \xd0\xb3 CYRILLIC SMALL LETTER GHE
40 U+0440 \xd1\x80 CYRILLIC SMALL LETTER ER
41 U+044F \xd1\x8f CYRILLIC SMALL LETTER YA */
42 { "[\xd0\xb0-\xd1\x8f]", "\xd0\xb3", 0, 1,
43 { { 0, 2 } } },
44 { "[\xd0\xb0-\xd1\x8f]", "\xd0\x93", REG_ICASE, 1,
45 { { 0, 2 } } },
46 { "[\xd1\x80-\xd1\x8f]", "\xd0\xa0", REG_ICASE, 1,
47 { { 0, 2 } } },
48};
49
50
51static int
52do_test (void)
53{
54 if (setlocale (LC_ALL, "de_DE.UTF-8") == NULL)
55 {
56 puts ("setlocale failed");
57 return 1;
58 }
59
60 int ret = 0;
61
62 for (size_t i = 0; i < sizeof (tests) / sizeof (tests[0]); ++i)
63 {
64 regex_t re;
65 regmatch_t rm[5];
66 int n = regcomp (&re, tests[i].pattern, tests[i].flags);
67 if (n != 0)
68 {
69 char buf[500];
70 regerror (n, &re, buf, sizeof (buf));
71 printf ("regcomp %zd failed: %s\n", i, buf);
72 ret = 1;
73 continue;
74 }
75
76 if (regexec (&re, tests[i].string, tests[i].nmatch, rm, 0))
77 {
78 printf ("regexec %zd failed\n", i);
79 ret = 1;
80 regfree (&re);
81 continue;
82 }
83
84 for (n = 0; n < tests[i].nmatch; ++n)
85 if (rm[n].rm_so != tests[i].rm[n].rm_so
86 || rm[n].rm_eo != tests[i].rm[n].rm_eo)
87 {
88 if (tests[i].rm[n].rm_so == -1 && tests[i].rm[n].rm_eo == -1)
89 break;
90 printf ("regexec match failure rm[%d] %d..%d\n",
91 n, rm[n].rm_so, rm[n].rm_eo);
92 ret = 1;
93 break;
94 }
95
96 regfree (&re);
97 }
98
99 return ret;
100}
101
102#define TEST_FUNCTION do_test ()
103#include "../test-skeleton.c"