]>
Commit | Line | Data |
---|---|---|
692de4b3 MS |
1 | /* bug 19432: iconv rejects redundant escape sequences in IBM903, |
2 | IBM905, IBM907, and IBM909 | |
3 | ||
bfff8b1b | 4 | Copyright (C) 2016-2017 Free Software Foundation, Inc. |
692de4b3 MS |
5 | This file is part of the GNU C Library. |
6 | ||
7 | The GNU C Library is free software; you can redistribute it and/or | |
8 | modify it under the terms of the GNU Lesser General Public | |
9 | License as published by the Free Software Foundation; either | |
10 | version 2.1 of the License, or (at your option) any later version. | |
11 | ||
12 | The GNU C Library is distributed in the hope that it will be useful, | |
13 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
14 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
15 | Lesser General Public License for more details. | |
16 | ||
17 | You should have received a copy of the GNU Lesser General Public | |
18 | License along with the GNU C Library; if not, see | |
19 | <http://www.gnu.org/licenses/>. */ | |
20 | ||
21 | #include <iconv.h> | |
22 | #include <stdio.h> | |
23 | #include <stdlib.h> | |
24 | #include <string.h> | |
25 | #include <errno.h> | |
26 | ||
27 | // The longest test input sequence. | |
28 | #define MAXINBYTES 8 | |
29 | #define MAXOUTBYTES (MAXINBYTES * MB_LEN_MAX) | |
30 | ||
31 | /* Verify that a conversion of the INPUT sequence consisting of | |
32 | INBYTESLEFT bytes in the encoding specified by the codeset | |
33 | named by FROM_SET is successful. | |
34 | Return 0 on success, non-zero on iconv() failure. */ | |
35 | ||
36 | static int | |
37 | test_ibm93x (const char *from_set, const char *input, size_t inbytesleft) | |
38 | { | |
39 | const char to_set[] = "UTF-8"; | |
40 | iconv_t cd = iconv_open (to_set, from_set); | |
41 | if (cd == (iconv_t) -1) | |
42 | { | |
43 | printf ("iconv_open(\"%s\", \"%s\"): %s\n", | |
44 | from_set, to_set, strerror (errno)); | |
45 | return 1; | |
46 | } | |
47 | ||
48 | char output [MAXOUTBYTES]; | |
49 | size_t outbytesleft = sizeof output; | |
50 | ||
51 | char *inbuf = (char*)input; | |
52 | char *outbuf = output; | |
53 | ||
54 | printf ("iconv(cd, %p, %zu, %p, %zu)\n", | |
55 | inbuf, inbytesleft, outbuf, outbytesleft); | |
56 | ||
57 | errno = 0; | |
58 | size_t ret = iconv (cd, &inbuf, &inbytesleft, &outbuf, &outbytesleft); | |
ab9f6255 | 59 | printf (" ==> %zu: %s\n" |
692de4b3 MS |
60 | " inbuf%+td, inbytesleft=%zu, outbuf%+td, outbytesleft=%zu\n", |
61 | ret, strerror (errno), | |
62 | inbuf - input, inbytesleft, outbuf - output, outbytesleft); | |
63 | ||
64 | // Return 0 on success, non-zero on iconv() failure. | |
65 | return ret == (size_t)-1 || errno; | |
66 | } | |
67 | ||
68 | static int | |
69 | do_test (void) | |
70 | { | |
71 | // State-dependent encodings to exercise. | |
72 | static const char* const to_code[] = { | |
73 | "IBM930", "IBM933", "IBM935", "IBM937", "IBM939" | |
74 | }; | |
75 | ||
76 | static const size_t ncodesets = sizeof to_code / sizeof *to_code; | |
77 | ||
78 | static const struct { | |
79 | char txt[MAXINBYTES]; | |
80 | size_t len; | |
81 | } input[] = { | |
82 | #define DATA(s) { s, sizeof s - 1 } | |
83 | /* <SI>: denotes the shift-in 1-byte escape sequence, changing | |
84 | the encoder from a sigle-byte encoding to multibyte | |
85 | <SO>: denotes the shift-out 1-byte escape sequence, switching | |
86 | the encoder from a multibyte to a single-byte state */ | |
87 | ||
88 | DATA ("\x0e"), // <SI> (not redundant) | |
89 | DATA ("\x0f"), // <S0> (redundant with initial state) | |
90 | DATA ("\x0e\x0e"), // <SI><SI> | |
91 | DATA ("\x0e\x0f\x0f"), // <SI><SO><SO> | |
92 | DATA ("\x0f\x0f"), // <SO><SO> | |
93 | DATA ("\x0f\x0e\x0e"), // <SO><SI><SI> | |
94 | DATA ("\x0e\x0f\xc7\x0f"), // <SI><SO><G><SO> | |
95 | DATA ("\xc7\x0f") // <G><SO> (redundant with initial state) | |
96 | }; | |
97 | ||
98 | static const size_t ninputs = sizeof input / sizeof *input; | |
99 | ||
100 | int ret = 0; | |
101 | ||
102 | size_t i, j; | |
103 | ||
104 | /* Iterate over the IBM93x codesets above and exercise each with | |
105 | the input sequences above. */ | |
106 | for (i = 0; i != ncodesets; ++i) | |
107 | for (j = 0; j != ninputs; ++j) | |
108 | ret += test_ibm93x (to_code [i], input [i].txt, input [i].len); | |
109 | ||
110 | return ret; | |
111 | } | |
112 | ||
113 | #define TEST_FUNCTION do_test () | |
114 | #include "../test-skeleton.c" |