]>
Commit | Line | Data |
---|---|---|
d001ce5f | 1 | // { dg-require-iconv "UCS-2BE" } |
2 | // { dg-require-iconv "ISO-8859-15" } | |
3 | ||
4 | // 2000-08-22 Benjamin Kosnik <bkoz@cygnus.com> | |
5 | ||
f1717362 | 6 | // Copyright (C) 2000-2016 Free Software Foundation, Inc. |
d001ce5f | 7 | // |
8 | // This file is part of the GNU ISO C++ Library. This library is free | |
9 | // software; you can redistribute it and/or modify it under the | |
10 | // terms of the GNU General Public License as published by the | |
6bc9506f | 11 | // Free Software Foundation; either version 3, or (at your option) |
d001ce5f | 12 | // any later version. |
13 | ||
14 | // This library is distributed in the hope that it will be useful, | |
15 | // but WITHOUT ANY WARRANTY; without even the implied warranty of | |
16 | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
17 | // GNU General Public License for more details. | |
18 | ||
19 | // You should have received a copy of the GNU General Public License along | |
6bc9506f | 20 | // with this library; see the file COPYING3. If not see |
21 | // <http://www.gnu.org/licenses/>. | |
d001ce5f | 22 | |
23 | // 22.2.1.5 - Template class codecvt [lib.locale.codecvt] | |
24 | #include <locale> | |
1f3fc4aa | 25 | #include <cstring> |
d001ce5f | 26 | #include <testsuite_hooks.h> |
27 | #include <ext/codecvt_specializations.h> | |
28 | ||
29 | /* | |
30 | > how do I check that these conversions are correct? | |
31 | Very easy. Since all the characters are from ASCII you simply | |
32 | zero-extend the values. | |
33 | ||
34 | drepper$ echo 'black pearl jasmine tea' | od -t x1 | |
35 | 0000000 62 6c 61 63 6b 20 70 65 61 72 6c 20 6a 61 73 6d | |
36 | 0000020 69 6e 65 20 74 65 61 0a | |
37 | ||
38 | So the UCS-2 string is | |
39 | ||
40 | 0x0062, 0x006c, 0x0061, ... | |
41 | ||
42 | You get the idea. With iconv() you have to take care of the | |
43 | byte-order, though. UCS-2 can mean little- or big endian. Looking at | |
44 | your result | |
45 | ||
46 | > $9 = 25856 | |
47 | ||
48 | it shows that the other byte-order is used (25856 == 0x6500). | |
49 | */ | |
50 | ||
51 | // Partial specialization using encoding_state. | |
52 | // codecvt<unicode_t, char, encoding_state> | |
53 | // UNICODE - UCS2 (big endian) | |
54 | void test01() | |
55 | { | |
56 | using namespace std; | |
57 | typedef codecvt_base::result result; | |
58 | typedef unsigned short int_type; | |
59 | typedef char ext_type; | |
60 | typedef __gnu_cxx::encoding_state state_type; | |
61 | typedef codecvt<int_type, ext_type, state_type> unicode_codecvt; | |
62 | typedef char_traits<int_type> int_traits; | |
63 | typedef char_traits<ext_type> ext_traits; | |
64 | ||
65 | bool test __attribute__((unused)) = true; | |
66 | const ext_type* e_lit = "black pearl jasmine tea"; | |
67 | int size = strlen(e_lit); | |
68 | ||
69 | char i_lit_base[50] __attribute__((aligned(__alignof__(int_type)))) = | |
70 | { | |
9927c753 | 71 | char(0x00), char(0x62), char(0x00), char(0x6c), char(0x00), char(0x61), |
72 | char(0x00), char(0x63), char(0x00), char(0x6b), char(0x00), char(0x20), | |
73 | char(0x00), char(0x70), char(0x00), char(0x65), char(0x00), char(0x61), | |
74 | char(0x00), char(0x72), char(0x00), char(0x6c), char(0x00), char(0x20), | |
75 | char(0x00), char(0x6a), char(0x00), char(0x61), char(0x00), char(0x73), | |
76 | char(0x00), char(0x6d), char(0x00), char(0x69), char(0x00), char(0x6e), | |
77 | char(0x00), char(0x65), char(0x00), char(0x20), char(0x00), char(0x74), | |
78 | char(0x00), char(0x65), char(0x00), char(0x61), char(0x00), char(0xa0) | |
d001ce5f | 79 | }; |
80 | const int_type* i_lit = reinterpret_cast<int_type*>(i_lit_base); | |
81 | ||
82 | const ext_type* efrom_next; | |
83 | const int_type* ifrom_next; | |
84 | ext_type* e_arr = new ext_type[size + 1]; | |
85 | ext_type* eto_next; | |
86 | int_type* i_arr = new int_type[size + 1]; | |
87 | int_type* ito_next; | |
88 | ||
89 | // construct a locale object with the specialized facet. | |
90 | locale loc(locale::classic(), new unicode_codecvt); | |
91 | // sanity check the constructed locale has the specialized facet. | |
92 | VERIFY( has_facet<unicode_codecvt>(loc) ); | |
93 | const unicode_codecvt& cvt = use_facet<unicode_codecvt>(loc); | |
94 | ||
95 | // in | |
96 | // unicode_codecvt::state_type state01("UCS-2BE", "ISO-8859-15", 0xfeff, 0); | |
97 | unicode_codecvt::state_type state01("UCS-2BE", "ISO-8859-15", 0, 0); | |
98 | ||
99 | // internal encoding is bigger because of bom | |
100 | result r1 = cvt.in(state01, e_lit, e_lit + size, efrom_next, | |
101 | i_arr, i_arr + size + 1, ito_next); | |
102 | VERIFY( r1 == codecvt_base::ok ); | |
103 | VERIFY( !int_traits::compare(i_arr, i_lit, size) ); | |
104 | VERIFY( efrom_next == e_lit + size ); | |
105 | VERIFY( ito_next == i_arr + size ); | |
106 | ||
107 | // out | |
108 | unicode_codecvt::state_type state02("UCS-2BE", "ISO-8859-15", 0, 0); | |
109 | result r2 = cvt.out(state02, i_lit, i_lit + size, ifrom_next, | |
110 | e_arr, e_arr + size, eto_next); | |
111 | VERIFY( r2 == codecvt_base::ok ); | |
112 | VERIFY( !ext_traits::compare(e_arr, e_lit, size) ); | |
113 | VERIFY( ifrom_next == i_lit + size ); | |
114 | VERIFY( eto_next == e_arr + size ); | |
115 | ||
116 | // unshift | |
117 | ext_traits::copy(e_arr, e_lit, size); | |
118 | unicode_codecvt::state_type state03("UCS-2BE", "ISO-8859-15", 0, 0); | |
119 | result r3 = cvt.unshift(state03, e_arr, e_arr + size, eto_next); | |
120 | VERIFY( r3 == codecvt_base::noconv ); | |
121 | VERIFY( !ext_traits::compare(e_arr, e_lit, size) ); | |
122 | VERIFY( eto_next == e_arr ); | |
123 | ||
124 | int i = cvt.encoding(); | |
125 | VERIFY( i == 2 ); // Target-dependent. | |
126 | ||
127 | VERIFY( !cvt.always_noconv() ); | |
128 | ||
129 | unicode_codecvt::state_type state04("UCS-2BE", "ISO-8859-15", 0, 0); | |
130 | int j = cvt.length(state03, e_lit, e_lit + size, 5); | |
131 | VERIFY( j == 5 ); | |
132 | ||
133 | int k = cvt.max_length(); | |
134 | VERIFY( k == 1 ); | |
135 | ||
136 | delete [] e_arr; | |
137 | delete [] i_arr; | |
138 | } | |
139 | ||
140 | int main () | |
141 | { | |
142 | test01(); | |
143 | return 0; | |
144 | } |