]>
Commit | Line | Data |
---|---|---|
4ffe6e87 BK |
1 | // { dg-require-iconv "UCS-2LE" } |
2 | // { dg-require-iconv "ISO-8859-15" } | |
3 | ||
4 | // 2000-08-22 Benjamin Kosnik <bkoz@cygnus.com> | |
5 | ||
83ffe9cd | 6 | // Copyright (C) 2000-2023 Free Software Foundation, Inc. |
4ffe6e87 BK |
7 | // |
8 | // This file is part of the GNU ISO C++ Library. This library is free | |
9 | // software; you can redistribute it and/or modify it under the | |
10 | // terms of the GNU General Public License as published by the | |
748086b7 | 11 | // Free Software Foundation; either version 3, or (at your option) |
4ffe6e87 BK |
12 | // any later version. |
13 | ||
14 | // This library is distributed in the hope that it will be useful, | |
15 | // but WITHOUT ANY WARRANTY; without even the implied warranty of | |
16 | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
17 | // GNU General Public License for more details. | |
18 | ||
19 | // You should have received a copy of the GNU General Public License along | |
748086b7 JJ |
20 | // with this library; see the file COPYING3. If not see |
21 | // <http://www.gnu.org/licenses/>. | |
4ffe6e87 BK |
22 | |
23 | // 22.2.1.5 - Template class codecvt [lib.locale.codecvt] | |
24 | #include <locale> | |
1b716e90 | 25 | #include <cstring> |
4ffe6e87 BK |
26 | #include <testsuite_hooks.h> |
27 | #include <ext/codecvt_specializations.h> | |
28 | ||
29 | /* | |
30 | > how do I check that these conversions are correct? | |
31 | Very easy. Since all the characters are from ASCII you simply | |
32 | zero-extend the values. | |
33 | ||
34 | drepper$ echo 'black pearl jasmine tea' | od -t x1 | |
35 | 0000000 62 6c 61 63 6b 20 70 65 61 72 6c 20 6a 61 73 6d | |
36 | 0000020 69 6e 65 20 74 65 61 0a | |
37 | ||
38 | So the UCS-2 string is | |
39 | ||
40 | 0x0062, 0x006c, 0x0061, ... | |
41 | ||
42 | You get the idea. With iconv() you have to take care of the | |
43 | byte-order, though. UCS-2 can mean little- or big endian. Looking at | |
44 | your result | |
45 | ||
46 | > $9 = 25856 | |
47 | ||
48 | it shows that the other byte-order is used (25856 == 0x6500). | |
49 | */ | |
50 | ||
51 | // Partial specialization using encoding_state. | |
52 | // codecvt<unicode_t, char, encoding_state> | |
53 | // UNICODE - UCS2 (little endian) | |
54 | void test02() | |
55 | { | |
56 | using namespace std; | |
57 | typedef codecvt_base::result result; | |
58 | typedef unsigned short int_type; | |
59 | typedef char ext_type; | |
60 | typedef __gnu_cxx::encoding_state state_type; | |
61 | typedef codecvt<int_type, ext_type, state_type> unicode_codecvt; | |
62 | typedef char_traits<int_type> int_traits; | |
63 | typedef char_traits<ext_type> ext_traits; | |
64 | ||
4ffe6e87 BK |
65 | const ext_type* e_lit = "black pearl jasmine tea"; |
66 | int size = strlen(e_lit); | |
67 | ||
68 | char i_lit_base[50] __attribute__((aligned(__alignof__(int_type)))) = | |
69 | { | |
5847ec93 PC |
70 | char(0x62), char(0x00), char(0x6c), char(0x00), char(0x61), char(0x00), |
71 | char(0x63), char(0x00), char(0x6b), char(0x00), char(0x20), char(0x00), | |
72 | char(0x70), char(0x00), char(0x65), char(0x00), char(0x61), char(0x00), | |
73 | char(0x72), char(0x00), char(0x6c), char(0x00), char(0x20), char(0x00), | |
74 | char(0x6a), char(0x00), char(0x61), char(0x00), char(0x73), char(0x00), | |
75 | char(0x6d), char(0x00), char(0x69), char(0x00), char(0x6e), char(0x00), | |
76 | char(0x65), char(0x00), char(0x20), char(0x00), char(0x74), char(0x00), | |
77 | char(0x65), char(0x00), char(0x61), char(0x00), char(0xa0), char(0x00) | |
4ffe6e87 BK |
78 | }; |
79 | const int_type* i_lit = reinterpret_cast<int_type*>(i_lit_base); | |
80 | ||
81 | const ext_type* efrom_next; | |
82 | const int_type* ifrom_next; | |
83 | ext_type* e_arr = new ext_type[size + 1]; | |
84 | ext_type* eto_next; | |
85 | int_type* i_arr = new int_type[size + 1]; | |
86 | int_type* ito_next; | |
87 | ||
88 | // construct a locale object with the specialized facet. | |
89 | locale loc(locale::classic(), new unicode_codecvt); | |
90 | // sanity check the constructed locale has the specialized facet. | |
91 | VERIFY( has_facet<unicode_codecvt>(loc) ); | |
92 | const unicode_codecvt& cvt = use_facet<unicode_codecvt>(loc); | |
93 | ||
94 | // in | |
95 | unicode_codecvt::state_type state01("UCS-2LE", "ISO-8859-15", 0, 0); | |
96 | // internal encoding is bigger because of bom | |
97 | result r1 = cvt.in(state01, e_lit, e_lit + size, efrom_next, | |
98 | i_arr, i_arr + size + 1, ito_next); | |
99 | VERIFY( r1 == codecvt_base::ok ); | |
100 | VERIFY( !int_traits::compare(i_arr, i_lit, size) ); | |
101 | VERIFY( efrom_next == e_lit + size ); | |
102 | VERIFY( ito_next == i_arr + size ); | |
103 | ||
104 | // out | |
105 | unicode_codecvt::state_type state02("UCS-2LE", "ISO-8859-15", 0, 0); | |
106 | result r2 = cvt.out(state02, i_lit, i_lit + size, ifrom_next, | |
107 | e_arr, e_arr + size, eto_next); | |
108 | VERIFY( r2 == codecvt_base::ok ); | |
109 | VERIFY( !ext_traits::compare(e_arr, e_lit, size) ); | |
110 | VERIFY( ifrom_next == i_lit + size ); | |
111 | VERIFY( eto_next == e_arr + size ); | |
112 | ||
113 | // unshift | |
114 | ext_traits::copy(e_arr, e_lit, size); | |
115 | unicode_codecvt::state_type state03("UCS-2LE", "ISO-8859-15", 0, 0); | |
116 | result r3 = cvt.unshift(state03, e_arr, e_arr + size, eto_next); | |
117 | VERIFY( r3 == codecvt_base::noconv ); | |
118 | VERIFY( !ext_traits::compare(e_arr, e_lit, size) ); | |
119 | VERIFY( eto_next == e_arr ); | |
120 | ||
121 | int i = cvt.encoding(); | |
122 | VERIFY( i == 2 ); // Target-dependent. | |
123 | ||
124 | VERIFY( !cvt.always_noconv() ); | |
125 | ||
126 | unicode_codecvt::state_type state04("UCS-2LE", "ISO-8859-15", 0, 0); | |
127 | int j = cvt.length(state03, e_lit, e_lit + size, 5); | |
128 | VERIFY( j == 5 ); | |
129 | ||
130 | int k = cvt.max_length(); | |
131 | VERIFY( k == 1 ); | |
132 | ||
133 | delete [] e_arr; | |
134 | delete [] i_arr; | |
135 | } | |
136 | ||
137 | int main () | |
138 | { | |
139 | test02(); | |
140 | return 0; | |
141 | } |