]>
Commit | Line | Data |
---|---|---|
4a4839c9 | 1 | # -*- coding: utf-8 -*- |
6d7e8eda | 2 | # Copyright (C) 2014-2023 Free Software Foundation, Inc. |
4a4839c9 AO |
3 | # This file is part of the GNU C Library. |
4 | # | |
5 | # The GNU C Library is free software; you can redistribute it and/or | |
6 | # modify it under the terms of the GNU Lesser General Public | |
7 | # License as published by the Free Software Foundation; either | |
8 | # version 2.1 of the License, or (at your option) any later version. | |
9 | # | |
10 | # The GNU C Library is distributed in the hope that it will be useful, | |
11 | # but WITHOUT ANY WARRANTY; without even the implied warranty of | |
12 | # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
13 | # Lesser General Public License for more details. | |
14 | # | |
15 | # You should have received a copy of the GNU Lesser General Public | |
16 | # License along with the GNU C Library; if not, see | |
5a82c748 | 17 | # <https://www.gnu.org/licenses/>. |
4a4839c9 AO |
18 | |
19 | ''' | |
20 | This file contains a list of test cases used by | |
21 | the ctype_compatibility.py script. | |
22 | ''' | |
23 | ||
24 | TEST_CASES = [ | |
25 | [[0x0E2F, 0x0E46], [('alpha', True), ('punct', False)], | |
26 | '''Theppitak Karoonboonyanan <thep@links.nectec.or.th> says | |
27 | <U0E2F>, <U0E46> should belong to punct. DerivedCoreProperties.txt | |
28 | says it is alpha. We trust DerivedCoreProperties.txt.''' | |
29 | ], | |
30 | [[0x0E31, (0x0E34, 0x0E3A)], [('alpha', True)], | |
31 | '''gen-unicode-ctype.c: Theppitak Karoonboonyanan | |
32 | <thep@links.nectec.or.th> says <U0E31>, <U0E34>..<U0E3A> | |
33 | are alpha. DerivedCoreProperties.txt agrees.''' | |
34 | ], | |
35 | [[(0x0E47, 0x0E4C), 0x0E4E], [('alpha', False)], | |
36 | '''gen-unicode-ctype.c: Theppitak Karoonboonyanan | |
37 | <thep@links.nectec.or.th> says <U0E47>..<U0E4E> are | |
38 | is_alpha. DerivedCoreProperties.txt says *only* <U0E4D> | |
39 | in that range is alphabetic, the others are *not*. We | |
40 | trust DerivedCoreProperties.txt.''' | |
41 | ], | |
42 | [[0x0E4D], [('alpha', True)], | |
43 | '''gen-unicode-ctype.c: Theppitak Karoonboonyanan | |
44 | <thep@links.nectec.or.th> says <U0E47>..<U0E4E> are | |
45 | is_alpha. DerivedCoreProperties.txt says *only* <U0E4D> | |
46 | in that range is alphabetic, the others are *not*. We | |
47 | trust DerivedCoreProperties.txt. | |
48 | ''' | |
49 | ], | |
50 | [[0x0345], [('alpha', True), ('lower', True)], | |
51 | '''COMBINING GREEK YPOGEGRAMMENI | |
52 | According to DerivedCoreProperties.txt, this is “Alphabetic” | |
53 | and “Lowercase”.''' | |
54 | ], | |
55 | [[(0x2160, 0x2188)], [('alpha', True)], | |
56 | '''Roman Numerals are “Alphabetic” according to | |
57 | DerivedCoreProperties.txt''' | |
58 | ], | |
59 | [[(0x24B6, 0x24E9)], [('alpha', True)], | |
60 | '''Circled Latin letters are “Alphabetic” according to | |
61 | DerivedCoreProperties.txt''' | |
62 | ], | |
63 | [[0x661], [('alpha', True), ('digit', False)], | |
64 | '''gen-unicode-ctype.c: All non-ASCII digits should be alphabetic. | |
65 | ISO C 99 forbids us to have them in category "digit", but we | |
66 | want iswalnum to return true on them. Don’t forget to | |
67 | have a look at all the other digits, 0x661 is just one | |
68 | example tested here.''' | |
69 | ], | |
70 | [[(0x0030, 0x0039)], [('digit', True)], | |
71 | '''gen-unicode-ctype.c: All ASCII digits should be digits.''' | |
72 | ], | |
73 | [[0x0009], [('blank', True)], | |
74 | '''gen-unicode-ctype.c: CHARACTER TABULATION''' | |
75 | ], | |
76 | [[0x2007], [('blank', False), ('space', False)], | |
77 | '''gen-unicode-ctype.c: FIGURE SPACE, because it has <noBreak> | |
78 | in the description.''' | |
79 | ], | |
80 | [[0x0009, 0x000A, 0x000B, 0x000C, 0x000D], [('space', True)], | |
81 | '''gen-unicode-ctype.c: CHARACTER TABULATION, LINE FEED (LF), LINE | |
82 | TABULATION, FORM FEED (FF), CARRIAGE RETURN (CR)''' | |
83 | ], | |
84 | [[0x2028, 0x2029], [('cntrl', True)], | |
85 | '''gen-unicode-ctype.c: LINE SEPARATOR and PARAGRAPH SEPARATOR | |
86 | should be cntrl.''' | |
87 | ], | |
88 | [[(0x0030, 0x0039), (0x0041, 0x0046), (0x0061, 0x0066)], | |
89 | [('xdigit', True)], | |
90 | '''gen-unicode-ctype.c: ISO C 99 says (6.4.4.1): hexadecimal-digit: | |
91 | one of 0 1 2 3 4 5 6 7 8 9 a b c d e f A B C D E F (nothing else | |
92 | should be considered as a hexadecimal-digit)''' | |
93 | ], | |
94 | [[0x0330], [('combining', True), ('combining_level3', False)], | |
95 | '''gen-unicode-ctype.c: COMBINING TILDE BELOW, canonical combining | |
96 | class value >= 200, should be in combining but not in | |
97 | combining_level3''' | |
98 | ], | |
99 | [[0x0250, 0x0251, 0x0271], [('lower', True)], | |
100 | '''Should be lower in Unicode 7.0.0 (was not lower in | |
101 | Unicode 5.0.0). | |
102 | ''' | |
103 | ], | |
104 | [[0x2184], [('lower', True)], | |
105 | '''Should be lower both in Unicode 5.0.0 and 7.0.0''' | |
106 | ], | |
107 | [[0xA67F], [('punct', False), ('alpha', True)], | |
108 | '''0xa67f CYRILLIC PAYEROK. Not in Unicode 5.0.0. In Unicode | |
109 | 7.0.0. General category Lm (Letter | |
110 | modifier). DerivedCoreProperties.txt says it is | |
111 | “Alphabetic”. Apparently added manually to punct by mistake in | |
112 | glibc’s old LC_CTYPE.''' | |
113 | ], | |
114 | [[0xA60C], [('punct', False), ('alpha', True)], | |
115 | '''0xa60c VAI SYLLABLE LENGTHENER. Not in Unicode 5.0.0. | |
116 | In Unicode 7.0.0. General category Lm (Letter | |
117 | modifier). DerivedCoreProperties.txt says it is | |
118 | “Alphabetic”. Apparently added manually to punct by mistake in | |
119 | glibc’s old LC_CTYPE.''' | |
120 | ], | |
121 | [[0x2E2F], [('punct', False), ('alpha', True)], | |
122 | '''0x2E2F VERTICAL TILDE. Not in Unicode 5.0.0. In Unicode | |
123 | 7.0.0. General category Lm (Letter | |
124 | modifier). DerivedCoreProperties.txt says it is | |
125 | “Alphabetic”. Apparently added manually to punct by mistake in | |
126 | glibc’s old LC_CTYPE.''' | |
127 | ], | |
128 | [[(0x1090, 0x1099)], [('punct', False), ('alpha', True)], | |
129 | '''MYANMAR SHAN DIGIT ZERO - MYANMAR SHAN DIGIT NINE. | |
130 | These are digits, but because ISO C 99 forbids to | |
131 | put them into digit they should go into alpha.''' | |
132 | ], | |
133 | [[0x103F], [('punct', False), ('alpha', True)], | |
134 | '''0x103F MYANMAR LETTER GREAT SA. Not in Unicode 5.0.0. | |
135 | In Unicode 7.0.0. General category Lo | |
136 | (Other_Letter). DerivedCoreProperties.txt says it is | |
137 | “Alphabetic”. Apparently added manually to punct by | |
138 | mistake in glibc’s old LC_CTYPE.''' | |
139 | ], | |
140 | [[0x0374], [('punct', False), ('alpha', True)], | |
141 | '''0x0374 GREEK NUMERAL SIGN. Unicode 5.0.0: general category | |
142 | Sk. Unicode 7.0.0: General category Lm | |
143 | (Modifier_Letter). DerivedCoreProperties.txt says it is | |
144 | “Alphabetic”.''' | |
145 | ], | |
146 | [[0x02EC], [('punct', False), ('alpha', True)], | |
147 | '''0x02EC MODIFIER LETTER VOICING. Unicode 5.0.0: general category | |
148 | Sk. Unicode 7.0.0: General category Lm | |
149 | (Modifier_Letter). DerivedCoreProperties.txt says it is | |
150 | “Alphabetic”.''' | |
151 | ], | |
152 | [[0x180E], [('space', False), ('blank', False)], | |
153 | '''0x180e MONGOLIAN VOWEL SEPARATOR. Unicode 5.0.0: General | |
154 | category Zs (Space_Separator) Unicode 7.0.0: General category Cf | |
155 | (Format).''' | |
156 | ], | |
157 | [[0x1E9C, 0x1E9D, 0x1E9F], | |
158 | [('lower', True), ('upper', False), ('tolower', False), | |
159 | ('toupper', False), ('totitle', False)], | |
160 | '''ẜ 0x1e9c LATIN SMALL LETTER LONG S WITH DIAGONAL STROKE, | |
161 | ẝ 0x1e9d LATIN SMALL LETTER LONG S WITH HIGH STROKE, | |
162 | ẟ 0x1e9f LATIN SMALL LETTER DELTA. These are “Lowercase” | |
163 | according to DerivedCoreProperties.txt but no upper case versions | |
164 | exist.''' | |
165 | ], | |
166 | [[0x1E9E], | |
167 | [('lower', False), ('upper', True), ('tolower', True), | |
168 | ('toupper', False), ('totitle', False)], | |
169 | '''0x1E9E ẞ LATIN CAPITAL LETTER SHARP S. This is “Uppercase” | |
170 | according to DerivedCoreProperties.txt and the lower case | |
171 | version is 0x00DF ß LATIN SMALL LETTER SHARP S.''' | |
172 | ], | |
173 | [[0x2188], | |
174 | [('alpha', True), ('lower', False), ('upper', False), | |
175 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
176 | '''0x2188 ROMAN NUMERAL ONE HUNDRED THOUSAND. This is “Alphabetic” | |
177 | according to DerivedCoreProperties.txt. In glibc’s old | |
178 | LC_CTYPE, it was in “lower”, which seems to be a | |
179 | mistake. It is not “Lowercase” in | |
180 | DerivedCoreProperties.txt and does not have case mappings | |
181 | in UnicodeData.txt either.''' | |
182 | ], | |
183 | [[0x2C71, 0x2C74, (0x2C77, 0x2C7A)], | |
184 | [('alpha', True), ('lower', True), ('upper', False), | |
185 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
186 | '''These are Latin small letters which were not in Unicode 5.0.0 | |
187 | but are in Unicode 7.0.0. According to | |
188 | DerivedCoreProperties.txt they are “Lowercase”. But no | |
189 | uppercase versions exist. They have apparently been added | |
190 | manually to glibc’s old LC_CTYPE.''' | |
191 | ], | |
192 | [[0xA730, 0xA731], | |
193 | [('alpha', True), ('lower', True), ('upper', False), | |
194 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
195 | '''These are Latin small “capital” letters which were not in | |
196 | Unicode 5.0.0 but are in Unicode 7.0.0. According to | |
197 | DerivedCoreProperties.txt they are “Lowercase”. But no | |
198 | uppercase versions exist. They have apparently been added | |
199 | manually to glibc’s old LC_CTYPE.''' | |
200 | ], | |
201 | [[(0xA771, 0xA778)], | |
202 | [('alpha', True), ('lower', True), ('upper', False), | |
203 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
204 | '''These are Latin small (or small “capital”) letters which | |
205 | were not in Unicode 5.0.0 but are in Unicode 7.0.0. According to | |
206 | DerivedCoreProperties.txt they are “Lowercase”. But no | |
207 | uppercase versions exist. They have apparently been added | |
208 | manually to glibc’s old LC_CTYPE.''' | |
209 | ], | |
210 | [[0x0375], | |
211 | [('combining', False), ('combining_level3', False), | |
212 | ('alpha', False), ('lower', False), ('upper', False), | |
213 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
214 | '''“0375;GREEK LOWER NUMERAL SIGN;Sk;0;ON;;;;;N;;;;;”. Has | |
215 | apparently been added manually to glibc’s old LC_CTYPE as | |
216 | “combining_level3”. That seems wrong, it is no combining | |
217 | character because it does not have one of the general | |
218 | categories Mn, Mc, or Me. According to | |
219 | DerivedCoreProperties.txt it is not “Alphabetic”.''' | |
220 | ], | |
221 | [[0x108D], | |
222 | [('combining', True), ('combining_level3', False), | |
86bdd49d | 223 | ('alpha', True), ('lower', False), ('upper', False), |
4a4839c9 AO |
224 | ('tolower', False), ('toupper', False), ('totitle', False)], |
225 | '''“108D;MYANMAR SIGN SHAN COUNCIL EMPHATIC | |
226 | TONE;Mn;220;NSM;;;;;N;;;;;”. Has apparently been added | |
227 | manually to glibc’s old LC_CTYPE as | |
228 | “combining_level3”. That seems wrong, although it is a | |
229 | combining character because it has the general category | |
230 | Mn, it is not “combining_level3” because the canonical | |
231 | combining class value is 220 which is >= 200. According to | |
232 | gen-unicode-ctype.c, “combining_level3” needs a | |
233 | canonical combining class value < 200. According to | |
86bdd49d MF |
234 | DerivedCoreProperties.txt it was not “Alphabetic” |
235 | until Unicode 11.0.0 but in 12.0.0 it became “Alphabetic”.''' | |
4a4839c9 AO |
236 | ], |
237 | [[0x06DE], | |
238 | [('combining', False), ('combining_level3', False), | |
239 | ('alpha', False), ('lower', False), ('upper', False), | |
240 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
241 | ''' UnicodeData.txt 5.0.0: “06DE;ARABIC START OF RUB EL | |
242 | HIZB;Me;0;NSM;;;;;N;;;;;”; UnicodeData.txt 7.0.0: | |
243 | “06DE;ARABIC START OF RUB EL | |
244 | HIZB;So;0;ON;;;;;N;;;;;”. I.e. this used to be a | |
245 | combining character in Unicode 5.0.0 but not anymore in | |
246 | 7.0.0. According to DerivedCoreProperties.txt it is not | |
247 | “Alphabetic”.''' | |
248 | ], | |
249 | [[0x0BD0], | |
250 | [('combining', False), ('combining_level3', False), | |
251 | ('alpha', True), ('lower', False), ('upper', False), | |
252 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
253 | '''Not in UnicodeData.txt 5.0.0. UnicodeData.txt 7.0.0: | |
254 | “0BD0;TAMIL OM;Lo;0;L;;;;;N;;;;;”. Apparently manually added to | |
255 | “combining” and “combining_level3” in glibc’s old | |
256 | LC_CTYPE. That seems wrong. According to | |
257 | DerivedCoreProperties.txt it is “Alphabetic”.''' | |
258 | ], | |
259 | [[0x103F], | |
260 | [('combining', False), ('combining_level3', False), | |
261 | ('alpha', True), ('lower', False), ('upper', False), | |
262 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
263 | '''Not in UnicodeData.txt 5.0.0. UnicodeData.txt 7.0.0: | |
264 | “103F;MYANMAR LETTER GREAT SA;Lo;0;L;;;;;N;;;;;”. | |
265 | Apparently manually added to “combining” and | |
266 | “combining_level3” in glibc’s old LC_CTYPE. That seems | |
267 | wrong. According to DerivedCoreProperties.txt it is | |
268 | “Alphabetic”.''' | |
269 | ], | |
270 | [[(0x0901, 0x0903)], | |
271 | [('combining', True), ('combining_level3', True), | |
272 | ('alpha', True), ('lower', False), ('upper', False), | |
273 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
274 | '''These have general category “Mn” i.e. these are combining | |
275 | characters (both in UnicodeData.txt 5.0.0 and 7.0.0): | |
276 | “0901;DEVANAGARI SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;”, | |
277 | “0902;DEVANAGARI SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;”, | |
278 | “0903;DEVANAGARI SIGN VISARGA;Mc;0;L;;;;;N;;;;;”. | |
279 | According to DerivedCoreProperties.txt (7.0.0) these are | |
280 | “Alphabetic”.''' | |
281 | ], | |
282 | [[0x093C], | |
283 | [('combining', True), ('combining_level3', True), | |
284 | ('alpha', False), ('lower', False), ('upper', False), | |
285 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
286 | '''UnicodeData.txt (5.0.0 and 7.0.0): “093C;DEVANAGARI SIGN | |
287 | NUKTA;Mn;7;NSM;;;;;N;;;;;” According to | |
288 | DerivedCoreProperties.txt (7.0.0) this is *not* | |
289 | “Alphabetic”. glibc’s old LC_CTYPE has this in “alpha”.''' | |
290 | ], | |
291 | [[(0x093E, 0x093F)], | |
292 | [('combining', True), ('combining_level3', True), | |
293 | ('alpha', True), ('lower', False), ('upper', False), | |
294 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
295 | '''These have general category “Mc” i.e. these are combining | |
296 | characters (both in UnicodeData.txt 5.0.0 and 7.0.0): | |
297 | “093E;DEVANAGARI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
298 | “093F;DEVANAGARI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
299 | According to DerivedCoreProperties.txt (7.0.0) these are | |
300 | “Alphabetic”.''' | |
301 | ], | |
302 | [[(0x0940, 0x094C)], | |
303 | [('combining', True), ('combining_level3', True), | |
304 | ('alpha', True), ('lower', False), ('upper', False), | |
305 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
306 | '''These are all combining | |
307 | characters (“Mc” or “Mn” both in UnicodeData.txt 5.0.0 and 7.0.0). | |
308 | According to DerivedCoreProperties.txt (7.0.0) these are | |
309 | “Alphabetic”.''' | |
310 | ], | |
311 | [[0x094D], | |
312 | [('combining', True), ('combining_level3', True), | |
313 | ('alpha', False), ('lower', False), ('upper', False), | |
314 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
315 | '''Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
316 | “094D;DEVANAGARI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
317 | According to DerivedCoreProperties.txt (7.0.0) it is *not* | |
318 | “Alphabetic”.''' | |
319 | ], | |
320 | [[(0x0951, 0x0954)], | |
321 | [('combining', True), ('combining_level3', False), | |
322 | ('alpha', False), ('lower', False), ('upper', False), | |
323 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
324 | '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
325 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
326 | “Alphabetic”.''' | |
327 | ], | |
328 | [[(0x0962, 0x0963), (0x0981, 0x0983)], | |
329 | [('combining', True), ('combining_level3', True), | |
330 | ('alpha', True), ('lower', False), ('upper', False), | |
331 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
332 | '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
333 | According to DerivedCoreProperties.txt (7.0.0) these are | |
334 | “Alphabetic”.''' | |
335 | ], | |
336 | [[0x09BC], | |
337 | [('combining', True), ('combining_level3', True), | |
338 | ('alpha', False), ('lower', False), ('upper', False), | |
339 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
340 | ''' | |
341 | “09BC;BENGALI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;” | |
342 | Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
343 | According to DerivedCoreProperties.txt (7.0.0) it is *not* | |
344 | “Alphabetic”.''' | |
345 | ], | |
346 | [[(0x09BE, 0x09BF), (0x09C0, 0x09C4), (0x09C7, 0x09C8), | |
347 | (0x09CB, 0x09CC)], | |
348 | [('combining', True), ('combining_level3', True), | |
349 | ('alpha', True), ('lower', False), ('upper', False), | |
350 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
351 | ''' | |
352 | “09BE;BENGALI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
353 | “09BF;BENGALI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
354 | “09C0;BENGALI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;” | |
355 | “09C1;BENGALI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;” | |
356 | “09C2;BENGALI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;” | |
357 | “09C3;BENGALI VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;” | |
358 | “09C4;BENGALI VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;” | |
359 | “09C7;BENGALI VOWEL SIGN E;Mc;0;L;;;;;N;;;;;” | |
360 | “09C8;BENGALI VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;” | |
361 | “09CB;BENGALI VOWEL SIGN O;Mc;0;L;09C7 09BE;;;;N;;;;;” | |
362 | “09CC;BENGALI VOWEL SIGN AU;Mc;0;L;09C7 09D7;;;;N;;;;;” | |
363 | Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
364 | According to DerivedCoreProperties.txt (7.0.0) these are | |
365 | “Alphabetic”.''' | |
366 | ], | |
367 | [[0x09CD], | |
368 | [('combining', True), ('combining_level3', True), | |
369 | ('alpha', False), ('lower', False), ('upper', False), | |
370 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
371 | ''' | |
372 | “09CD;BENGALI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
373 | Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
374 | According to DerivedCoreProperties.txt (7.0.0) it is *not* | |
375 | “Alphabetic”.''' | |
376 | ], | |
377 | [[0x09D7, (0x09E2, 0x09E3)], | |
378 | [('combining', True), ('combining_level3', True), | |
379 | ('alpha', True), ('lower', False), ('upper', False), | |
380 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
381 | '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
382 | According to DerivedCoreProperties.txt (7.0.0) these are | |
383 | “Alphabetic”.''' | |
384 | ], | |
385 | [[0x09F2, 0x09F3], | |
386 | [('combining', False), ('combining_level3', False), | |
387 | ('alpha', False), ('lower', False), ('upper', False), | |
388 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
389 | ''' | |
390 | “09F2;BENGALI RUPEE MARK;Sc;0;ET;;;;;N;;;;;” | |
391 | “09F3;BENGALI RUPEE SIGN;Sc;0;ET;;;;;N;;;;;” | |
392 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
393 | “Alphabetic”.''' | |
394 | ], | |
395 | [[(0x09F4, 0x09FA)], | |
396 | [('combining', False), ('combining_level3', False), | |
397 | ('alpha', False), ('lower', False), ('upper', False), | |
398 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
399 | ''' | |
400 | “09F4;BENGALI CURRENCY NUMERATOR ONE;No;0;L;;;;1/16;N;;;;;” | |
401 | “09F5;BENGALI CURRENCY NUMERATOR TWO;No;0;L;;;;1/8;N;;;;;” | |
402 | “09F6;BENGALI CURRENCY NUMERATOR THREE;No;0;L;;;;3/16;N;;;;;” | |
403 | “09F7;BENGALI CURRENCY NUMERATOR FOUR;No;0;L;;;;1/4;N;;;;;” | |
404 | “09F8;BENGALI CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR; | |
405 | No;0;L;;;;3/4;N;;;;;” | |
406 | “09F9;BENGALI CURRENCY DENOMINATOR SIXTEEN;No;0;L;;;;16;N;;;;;” | |
407 | “09FA;BENGALI ISSHAR;So;0;L;;;;;N;;;;;” | |
408 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
409 | “Alphabetic”.''' | |
410 | ], | |
411 | [[(0x0A01, 0x0A03)], | |
412 | [('combining', True), ('combining_level3', True), | |
413 | ('alpha', True), ('lower', False), ('upper', False), | |
414 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
415 | ''' | |
416 | “0A01;GURMUKHI SIGN ADAK BINDI;Mn;0;NSM;;;;;N;;;;;” | |
417 | “0A02;GURMUKHI SIGN BINDI;Mn;0;NSM;;;;;N;;;;;” | |
418 | “0A03;GURMUKHI SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
419 | According to DerivedCoreProperties.txt (7.0.0) these are | |
420 | “Alphabetic”.''' | |
421 | ], | |
422 | [[0x0A3C], | |
423 | [('combining', True), ('combining_level3', True), | |
424 | ('alpha', False), ('lower', False), ('upper', False), | |
425 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
426 | ''' | |
427 | “0A3C;GURMUKHI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;” | |
428 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
429 | “Alphabetic”.''' | |
430 | ], | |
431 | [[(0x0A3E, 0x0A40), (0x0A41, 0x0A42), (0x0A47, 0x0A48), | |
432 | (0x0A4B, 0x0A4C)], | |
433 | [('combining', True), ('combining_level3', True), | |
434 | ('alpha', True), ('lower', False), ('upper', False), | |
435 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
436 | ''' | |
437 | “0A3E;GURMUKHI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
438 | “0A3F;GURMUKHI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
439 | “0A40;GURMUKHI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;” | |
440 | “0A41;GURMUKHI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;” | |
441 | “0A42;GURMUKHI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;” | |
442 | “0A47;GURMUKHI VOWEL SIGN EE;Mn;0;NSM;;;;;N;;;;;” | |
443 | “0A48;GURMUKHI VOWEL SIGN AI;Mn;0;NSM;;;;;N;;;;;” | |
444 | “0A4B;GURMUKHI VOWEL SIGN OO;Mn;0;NSM;;;;;N;;;;;” | |
445 | “0A4C;GURMUKHI VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;” | |
446 | According to DerivedCoreProperties.txt (7.0.0) these are | |
447 | “Alphabetic”.''' | |
448 | ], | |
449 | [[0x0A4D], | |
450 | [('combining', True), ('combining_level3', True), | |
451 | ('alpha', False), ('lower', False), ('upper', False), | |
452 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
453 | ''' | |
454 | “0A4D;GURMUKHI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
455 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
456 | “Alphabetic”.''' | |
457 | ], | |
458 | [[0x0A51, (0x0A70, 0x0A71), 0x0A75, (0x0A81, 0x0A83)], | |
459 | [('combining', True), ('combining_level3', True), | |
460 | ('alpha', True), ('lower', False), ('upper', False), | |
461 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
462 | ''' | |
463 | “0A51;GURMUKHI SIGN UDAAT;Mn;0;NSM;;;;;N;;;;;” | |
464 | “0A70;GURMUKHI TIPPI;Mn;0;NSM;;;;;N;;;;;” | |
465 | “0A71;GURMUKHI ADDAK;Mn;0;NSM;;;;;N;;;;;” | |
466 | “0A75;GURMUKHI SIGN YAKASH;Mn;0;NSM;;;;;N;;;;;” | |
467 | “0A81;GUJARATI SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;” | |
468 | “0A82;GUJARATI SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;” | |
469 | “0A83;GUJARATI SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
470 | According to DerivedCoreProperties.txt (7.0.0) these are | |
471 | “Alphabetic”.''' | |
472 | ], | |
473 | [[0x0ABC], | |
474 | [('combining', True), ('combining_level3', True), | |
475 | ('alpha', False), ('lower', False), ('upper', False), | |
476 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
477 | ''' | |
478 | “0ABC;GUJARATI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;” | |
479 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
480 | “Alphabetic”.''' | |
481 | ], | |
482 | [[(0x0ABE, 0x0AC5), (0x0AC7, 0x0AC9), (0x0ACB, 0x0ACC)], | |
483 | [('combining', True), ('combining_level3', True), | |
484 | ('alpha', True), ('lower', False), ('upper', False), | |
485 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
486 | ''' | |
487 | “0ABE;GUJARATI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
488 | “0ABF;GUJARATI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
489 | “0AC0;GUJARATI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;” | |
490 | “0AC1;GUJARATI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;” | |
491 | “0AC2;GUJARATI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;” | |
492 | “0AC3;GUJARATI VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;” | |
493 | “0AC4;GUJARATI VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;” | |
494 | “0AC5;GUJARATI VOWEL SIGN CANDRA E;Mn;0;NSM;;;;;N;;;;;” | |
495 | “0AC7;GUJARATI VOWEL SIGN E;Mn;0;NSM;;;;;N;;;;;” | |
496 | “0AC8;GUJARATI VOWEL SIGN AI;Mn;0;NSM;;;;;N;;;;;” | |
497 | “0AC9;GUJARATI VOWEL SIGN CANDRA O;Mc;0;L;;;;;N;;;;;” | |
498 | “0ACB;GUJARATI VOWEL SIGN O;Mc;0;L;;;;;N;;;;;” | |
499 | “0ACC;GUJARATI VOWEL SIGN AU;Mc;0;L;;;;;N;;;;;” | |
500 | According to DerivedCoreProperties.txt (7.0.0) these are | |
501 | “Alphabetic”.''' | |
502 | ], | |
503 | [[0x0ACD], | |
504 | [('combining', True), ('combining_level3', True), | |
505 | ('alpha', False), ('lower', False), ('upper', False), | |
506 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
507 | ''' | |
508 | “0ACD;GUJARATI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
509 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
510 | “Alphabetic”.''' | |
511 | ], | |
512 | [[(0x0AE2, 0x0AE3)], | |
513 | [('combining', True), ('combining_level3', True), | |
514 | ('alpha', True), ('lower', False), ('upper', False), | |
515 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
516 | ''' | |
517 | “0AE2;GUJARATI VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;” | |
518 | “0AE3;GUJARATI VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;” | |
519 | According to DerivedCoreProperties.txt (7.0.0) these are | |
520 | “Alphabetic”.''' | |
521 | ], | |
522 | [[0x0AF1], | |
523 | [('combining', False), ('combining_level3', False), | |
524 | ('alpha', False), ('lower', False), ('upper', False), | |
525 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
526 | ''' | |
527 | “0AF1;GUJARATI RUPEE SIGN;Sc;0;ET;;;;;N;;;;;” | |
528 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
529 | “Alphabetic”.''' | |
530 | ], | |
531 | [[(0x0B01, 0x0B03)], | |
532 | [('combining', True), ('combining_level3', True), | |
533 | ('alpha', True), ('lower', False), ('upper', False), | |
534 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
535 | ''' | |
536 | “0B01;ORIYA SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;” | |
537 | “0B02;ORIYA SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;” | |
538 | “0B03;ORIYA SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
539 | According to DerivedCoreProperties.txt (7.0.0) these are | |
540 | “Alphabetic”.''' | |
541 | ], | |
542 | [[0x0B3C], | |
543 | [('combining', True), ('combining_level3', True), | |
544 | ('alpha', False), ('lower', False), ('upper', False), | |
545 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
546 | ''' | |
547 | “0B3C;ORIYA SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;” | |
548 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
549 | “Alphabetic”.''' | |
550 | ], | |
551 | [[(0x0B3E, 0x0B44), (0x0B47, 0x0B48), (0x0B4B, 0x0B4C)], | |
552 | [('combining', True), ('combining_level3', True), | |
553 | ('alpha', True), ('lower', False), ('upper', False), | |
554 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
555 | ''' | |
556 | “0B3E;ORIYA VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
557 | “0B3F;ORIYA VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;;” | |
558 | “0B40;ORIYA VOWEL SIGN II;Mc;0;L;;;;;N;;;;;” | |
559 | “0B41;ORIYA VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;” | |
560 | “0B42;ORIYA VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;” | |
561 | “0B43;ORIYA VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;” | |
562 | “0B44;ORIYA VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;” | |
563 | “0B47;ORIYA VOWEL SIGN E;Mc;0;L;;;;;N;;;;;” | |
564 | “0B48;ORIYA VOWEL SIGN AI;Mc;0;L;0B47 0B56;;;;N;;;;;” | |
565 | “0B4B;ORIYA VOWEL SIGN O;Mc;0;L;0B47 0B3E;;;;N;;;;;” | |
566 | “0B4C;ORIYA VOWEL SIGN AU;Mc;0;L;0B47 0B57;;;;N;;;;;” | |
567 | According to DerivedCoreProperties.txt (7.0.0) these are | |
568 | “Alphabetic”.''' | |
569 | ], | |
570 | [[0x0B4D], | |
571 | [('combining', True), ('combining_level3', True), | |
572 | ('alpha', False), ('lower', False), ('upper', False), | |
573 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
574 | ''' | |
575 | “0B4D;ORIYA SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
576 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
577 | “Alphabetic”.''' | |
578 | ], | |
579 | [[(0x0B56, 0x0B57), (0x0B62, 0x0B63)], | |
580 | [('combining', True), ('combining_level3', True), | |
581 | ('alpha', True), ('lower', False), ('upper', False), | |
582 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
583 | ''' | |
584 | “0B56;ORIYA AI LENGTH MARK;Mn;0;NSM;;;;;N;;;;;” | |
585 | “0B57;ORIYA AU LENGTH MARK;Mc;0;L;;;;;N;;;;;” | |
586 | “0B62;ORIYA VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;” | |
587 | “0B63;ORIYA VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;” | |
588 | According to DerivedCoreProperties.txt (7.0.0) these are | |
589 | “Alphabetic”.''' | |
590 | ], | |
591 | [[0x0B70], | |
592 | [('combining', False), ('combining_level3', False), | |
593 | ('alpha', False), ('lower', False), ('upper', False), | |
594 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
595 | ''' | |
596 | “0B70;ORIYA ISSHAR;So;0;L;;;;;N;;;;;” | |
597 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
598 | “Alphabetic”.''' | |
599 | ], | |
600 | [[0x0B82], | |
601 | [('combining', True), ('combining_level3', True), | |
602 | ('alpha', True), ('lower', False), ('upper', False), | |
603 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
604 | ''' | |
605 | “0B82;TAMIL SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;” | |
606 | According to DerivedCoreProperties.txt (7.0.0) this is | |
607 | “Alphabetic”.''' | |
608 | ], | |
609 | [[(0x0BBE, 0x0BC2), (0x0BC6, 0x0BC8), (0x0BCA, 0x0BCC)], | |
610 | [('combining', True), ('combining_level3', True), | |
611 | ('alpha', True), ('lower', False), ('upper', False), | |
612 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
613 | ''' | |
614 | “0BBE;TAMIL VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
615 | “0BBF;TAMIL VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
616 | “0BC0;TAMIL VOWEL SIGN II;Mn;0;NSM;;;;;N;;;;;” | |
617 | “0BC1;TAMIL VOWEL SIGN U;Mc;0;L;;;;;N;;;;;” | |
618 | “0BC2;TAMIL VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;” | |
619 | “0BC6;TAMIL VOWEL SIGN E;Mc;0;L;;;;;N;;;;;” | |
620 | “0BC7;TAMIL VOWEL SIGN EE;Mc;0;L;;;;;N;;;;;” | |
621 | “0BC8;TAMIL VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;” | |
622 | “0BCA;TAMIL VOWEL SIGN O;Mc;0;L;0BC6 0BBE;;;;N;;;;;” | |
623 | “0BCB;TAMIL VOWEL SIGN OO;Mc;0;L;0BC7 0BBE;;;;N;;;;;” | |
624 | “0BCC;TAMIL VOWEL SIGN AU;Mc;0;L;0BC6 0BD7;;;;N;;;;;” | |
625 | According to DerivedCoreProperties.txt (7.0.0) these are | |
626 | “Alphabetic”.''' | |
627 | ], | |
628 | [[0x0BCD], | |
629 | [('combining', True), ('combining_level3', True), | |
630 | ('alpha', False), ('lower', False), ('upper', False), | |
631 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
632 | ''' | |
633 | “0BCD;TAMIL SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
634 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
635 | “Alphabetic”.''' | |
636 | ], | |
637 | [[0x0BD7], | |
638 | [('combining', True), ('combining_level3', True), | |
639 | ('alpha', True), ('lower', False), ('upper', False), | |
640 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
641 | ''' | |
642 | “0BD7;TAMIL AU LENGTH MARK;Mc;0;L;;;;;N;;;;;” | |
643 | According to DerivedCoreProperties.txt (7.0.0) this is | |
644 | “Alphabetic”.''' | |
645 | ], | |
646 | [[(0x0BF0, 0x0BFA)], | |
647 | [('combining', False), ('combining_level3', False), | |
648 | ('alpha', False), ('lower', False), ('upper', False), | |
649 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
650 | ''' | |
651 | “0BF0;TAMIL NUMBER TEN;No;0;L;;;;10;N;;;;;” | |
652 | “0BF1;TAMIL NUMBER ONE HUNDRED;No;0;L;;;;100;N;;;;;” | |
653 | “0BF2;TAMIL NUMBER ONE THOUSAND;No;0;L;;;;1000;N;;;;;” | |
654 | “0BF3;TAMIL DAY SIGN;So;0;ON;;;;;N;;;;;” | |
655 | “0BF4;TAMIL MONTH SIGN;So;0;ON;;;;;N;;;;;” | |
656 | “0BF5;TAMIL YEAR SIGN;So;0;ON;;;;;N;;;;;” | |
657 | “0BF6;TAMIL DEBIT SIGN;So;0;ON;;;;;N;;;;;” | |
658 | “0BF7;TAMIL CREDIT SIGN;So;0;ON;;;;;N;;;;;” | |
659 | “0BF8;TAMIL AS ABOVE SIGN;So;0;ON;;;;;N;;;;;” | |
660 | “0BF9;TAMIL RUPEE SIGN;Sc;0;ET;;;;;N;;;;;” | |
661 | “0BFA;TAMIL NUMBER SIGN;So;0;ON;;;;;N;;;;;” | |
662 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
663 | “Alphabetic”.''' | |
664 | ], | |
665 | [[(0x0C01, 0x0C03)], | |
666 | [('combining', True), ('combining_level3', True), | |
667 | ('alpha', True), ('lower', False), ('upper', False), | |
668 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
669 | ''' | |
670 | “0C01;TELUGU SIGN CANDRABINDU;Mc;0;L;;;;;N;;;;;” | |
671 | “0C02;TELUGU SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;” | |
672 | “0C03;TELUGU SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
673 | According to DerivedCoreProperties.txt (7.0.0) these are | |
674 | “Alphabetic”.''' | |
675 | ], | |
676 | [[(0x0C3E, 0x0C44), (0x0C46, 0x0C48), (0x0C4A, 0x0C4C)], | |
677 | [('combining', True), ('combining_level3', True), | |
678 | ('alpha', True), ('lower', False), ('upper', False), | |
679 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
680 | ''' | |
681 | “0C3E;TELUGU VOWEL SIGN AA;Mn;0;NSM;;;;;N;;;;;” | |
682 | “0C3F;TELUGU VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;;” | |
683 | “0C40;TELUGU VOWEL SIGN II;Mn;0;NSM;;;;;N;;;;;” | |
684 | “0C41;TELUGU VOWEL SIGN U;Mc;0;L;;;;;N;;;;;” | |
685 | “0C42;TELUGU VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;” | |
686 | “0C43;TELUGU VOWEL SIGN VOCALIC R;Mc;0;L;;;;;N;;;;;” | |
687 | “0C44;TELUGU VOWEL SIGN VOCALIC RR;Mc;0;L;;;;;N;;;;;” | |
688 | “0C46;TELUGU VOWEL SIGN E;Mn;0;NSM;;;;;N;;;;;” | |
689 | “0C47;TELUGU VOWEL SIGN EE;Mn;0;NSM;;;;;N;;;;;” | |
690 | “0C48;TELUGU VOWEL SIGN AI;Mn;0;NSM;0C46 0C56;;;;N;;;;;” | |
691 | “0C4A;TELUGU VOWEL SIGN O;Mn;0;NSM;;;;;N;;;;;” | |
692 | “0C4B;TELUGU VOWEL SIGN OO;Mn;0;NSM;;;;;N;;;;;” | |
693 | “0C4C;TELUGU VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;” | |
694 | According to DerivedCoreProperties.txt (7.0.0) these are | |
695 | “Alphabetic”.''' | |
696 | ], | |
697 | [[0x0C4D], | |
698 | [('combining', True), ('combining_level3', True), | |
699 | ('alpha', False), ('lower', False), ('upper', False), | |
700 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
701 | ''' | |
702 | “0C4D;TELUGU SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
703 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
704 | “Alphabetic”.''' | |
705 | ], | |
706 | [[(0x0C55, 0x0C56), (0x0C62, 0x0C63)], | |
707 | [('combining', True), ('combining_level3', True), | |
708 | ('alpha', True), ('lower', False), ('upper', False), | |
709 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
710 | ''' | |
711 | “0C55;TELUGU LENGTH MARK;Mn;84;NSM;;;;;N;;;;;” | |
712 | “0C56;TELUGU AI LENGTH MARK;Mn;91;NSM;;;;;N;;;;;” | |
713 | “0C62;TELUGU VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;” | |
714 | “0C63;TELUGU VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;” | |
715 | According to DerivedCoreProperties.txt (7.0.0) these are | |
716 | “Alphabetic”.''' | |
717 | ], | |
718 | [[(0x0C78, 0x0C7F)], | |
719 | [('combining', False), ('combining_level3', False), | |
720 | ('alpha', False), ('lower', False), ('upper', False), | |
721 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
722 | ''' | |
723 | “0C78;TELUGU FRACTION DIGIT ZERO FOR ODD POWERS OF FOUR; | |
724 | No;0;ON;;;;0;N;;;;;” | |
725 | “0C79;TELUGU FRACTION DIGIT ONE FOR ODD POWERS OF FOUR; | |
726 | No;0;ON;;;;1;N;;;;;” | |
727 | “0C7A;TELUGU FRACTION DIGIT TWO FOR ODD POWERS OF FOUR; | |
728 | No;0;ON;;;;2;N;;;;;” | |
729 | “0C7B;TELUGU FRACTION DIGIT THREE FOR ODD POWERS OF FOUR; | |
730 | No;0;ON;;;;3;N;;;;;” | |
731 | “0C7C;TELUGU FRACTION DIGIT ONE FOR EVEN POWERS OF FOUR; | |
732 | No;0;ON;;;;1;N;;;;;” | |
733 | “0C7D;TELUGU FRACTION DIGIT TWO FOR EVEN POWERS OF FOUR; | |
734 | No;0;ON;;;;2;N;;;;;” | |
735 | “0C7E;TELUGU FRACTION DIGIT THREE FOR EVEN POWERS OF FOUR; | |
736 | No;0;ON;;;;3;N;;;;;” | |
737 | “0C7F;TELUGU SIGN TUUMU;So;0;L;;;;;N;;;;;” | |
738 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
739 | “Alphabetic”.''' | |
740 | ], | |
741 | [[(0x0C82, 0x0C83)], | |
742 | [('combining', True), ('combining_level3', True), | |
743 | ('alpha', True), ('lower', False), ('upper', False), | |
744 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
745 | ''' | |
746 | “0C81;KANNADA SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;” | |
747 | “0C82;KANNADA SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;” | |
748 | “0C83;KANNADA SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
749 | According to DerivedCoreProperties.txt (7.0.0) these are | |
750 | “Alphabetic”.''' | |
751 | ], | |
752 | [[0x0CBC], | |
753 | [('combining', True), ('combining_level3', True), | |
754 | ('alpha', False), ('lower', False), ('upper', False), | |
755 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
756 | ''' | |
757 | “0CBC;KANNADA SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;” | |
758 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
759 | “Alphabetic”.''' | |
760 | ], | |
761 | [[(0x0CBE, 0x0CC4), (0x0CC6, 0x0CC8), (0x0CCA, 0x0CCC)], | |
762 | [('combining', True), ('combining_level3', True), | |
763 | ('alpha', True), ('lower', False), ('upper', False), | |
764 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
765 | ''' | |
766 | “0CBE;KANNADA VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
767 | “0CBF;KANNADA VOWEL SIGN I;Mn;0;L;;;;;N;;;;;” | |
768 | “0CC0;KANNADA VOWEL SIGN II;Mc;0;L;0CBF 0CD5;;;;N;;;;;” | |
769 | “0CC1;KANNADA VOWEL SIGN U;Mc;0;L;;;;;N;;;;;” | |
770 | “0CC2;KANNADA VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;” | |
771 | “0CC3;KANNADA VOWEL SIGN VOCALIC R;Mc;0;L;;;;;N;;;;;” | |
772 | “0CC4;KANNADA VOWEL SIGN VOCALIC RR;Mc;0;L;;;;;N;;;;;” | |
773 | “0CC6;KANNADA VOWEL SIGN E;Mn;0;L;;;;;N;;;;;” | |
774 | “0CC7;KANNADA VOWEL SIGN EE;Mc;0;L;0CC6 0CD5;;;;N;;;;;” | |
775 | “0CC8;KANNADA VOWEL SIGN AI;Mc;0;L;0CC6 0CD6;;;;N;;;;;” | |
776 | “0CCA;KANNADA VOWEL SIGN O;Mc;0;L;0CC6 0CC2;;;;N;;;;;” | |
777 | “0CCB;KANNADA VOWEL SIGN OO;Mc;0;L;0CCA 0CD5;;;;N;;;;;” | |
778 | “0CCC;KANNADA VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;” | |
779 | According to DerivedCoreProperties.txt (7.0.0) these are | |
780 | “Alphabetic”.''' | |
781 | ], | |
782 | [[0x0CCD], | |
783 | [('combining', True), ('combining_level3', True), | |
784 | ('alpha', False), ('lower', False), ('upper', False), | |
785 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
786 | ''' | |
787 | “0CCD;KANNADA SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
788 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
789 | “Alphabetic”.''' | |
790 | ], | |
791 | [[(0x0CD5, 0x0CD6), (0x0CE2, 0x0CE3)], | |
792 | [('combining', True), ('combining_level3', True), | |
793 | ('alpha', True), ('lower', False), ('upper', False), | |
794 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
795 | ''' | |
796 | “0CD5;KANNADA LENGTH MARK;Mc;0;L;;;;;N;;;;;” | |
797 | “0CD6;KANNADA AI LENGTH MARK;Mc;0;L;;;;;N;;;;;” | |
798 | “0CE2;KANNADA VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;” | |
799 | “0CE3;KANNADA VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;” | |
800 | According to DerivedCoreProperties.txt (7.0.0) these are | |
801 | “Alphabetic”.''' | |
802 | ], | |
803 | [[(0x0D02, 0x0D03), (0x0D3E, 0x0D44), (0x0D46, 0x0D48), | |
804 | (0x0D4A, 0x0D4C)], | |
805 | [('combining', True), ('combining_level3', True), | |
806 | ('alpha', True), ('lower', False), ('upper', False), | |
807 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
808 | ''' | |
809 | “0D02;MALAYALAM SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;” | |
810 | “0D03;MALAYALAM SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
811 | “0D3E;MALAYALAM VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
812 | “0D3F;MALAYALAM VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
813 | “0D40;MALAYALAM VOWEL SIGN II;Mc;0;L;;;;;N;;;;;” | |
814 | “0D41;MALAYALAM VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;” | |
815 | “0D42;MALAYALAM VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;” | |
816 | “0D43;MALAYALAM VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;” | |
817 | “0D44;MALAYALAM VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;” | |
818 | “0D46;MALAYALAM VOWEL SIGN E;Mc;0;L;;;;;N;;;;;” | |
819 | “0D47;MALAYALAM VOWEL SIGN EE;Mc;0;L;;;;;N;;;;;” | |
820 | “0D48;MALAYALAM VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;” | |
821 | “0D4A;MALAYALAM VOWEL SIGN O;Mc;0;L;0D46 0D3E;;;;N;;;;;” | |
822 | “0D4B;MALAYALAM VOWEL SIGN OO;Mc;0;L;0D47 0D3E;;;;N;;;;;” | |
823 | “0D4C;MALAYALAM VOWEL SIGN AU;Mc;0;L;0D46 0D57;;;;N;;;;;” | |
824 | According to DerivedCoreProperties.txt (7.0.0) these are | |
825 | “Alphabetic”.''' | |
826 | ], | |
827 | [[0x0D4D], | |
828 | [('combining', True), ('combining_level3', True), | |
829 | ('alpha', False), ('lower', False), ('upper', False), | |
830 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
831 | ''' | |
832 | “0D4D;MALAYALAM SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
833 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
834 | “Alphabetic”.''' | |
835 | ], | |
836 | [[0x0D57, (0x0D62, 0x0D63)], | |
837 | [('combining', True), ('combining_level3', True), | |
838 | ('alpha', True), ('lower', False), ('upper', False), | |
839 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
840 | ''' | |
841 | “0D57;MALAYALAM AU LENGTH MARK;Mc;0;L;;;;;N;;;;;” | |
842 | “0D62;MALAYALAM VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;” | |
843 | “0D63;MALAYALAM VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;” | |
844 | According to DerivedCoreProperties.txt (7.0.0) these are | |
845 | “Alphabetic”.''' | |
846 | ], | |
847 | [[(0x0D70, 0x0D79)], | |
848 | [('combining', False), ('combining_level3', False), | |
849 | ('alpha', False), ('lower', False), ('upper', False), | |
850 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
851 | ''' | |
852 | “0D70;MALAYALAM NUMBER TEN;No;0;L;;;;10;N;;;;;” | |
853 | “0D71;MALAYALAM NUMBER ONE HUNDRED;No;0;L;;;;100;N;;;;;” | |
854 | “0D72;MALAYALAM NUMBER ONE THOUSAND;No;0;L;;;;1000;N;;;;;” | |
855 | “0D73;MALAYALAM FRACTION ONE QUARTER;No;0;L;;;;1/4;N;;;;;” | |
856 | “0D74;MALAYALAM FRACTION ONE HALF;No;0;L;;;;1/2;N;;;;;” | |
857 | “0D75;MALAYALAM FRACTION THREE QUARTERS;No;0;L;;;;3/4;N;;;;;” | |
858 | “0D79;MALAYALAM DATE MARK;So;0;L;;;;;N;;;;;” | |
859 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
860 | “Alphabetic”.''' | |
861 | ], | |
862 | [[(0x0D82, 0x0D83)], | |
863 | [('combining', True), ('combining_level3', True), | |
864 | ('alpha', True), ('lower', False), ('upper', False), | |
865 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
866 | ''' | |
867 | “0D82;SINHALA SIGN ANUSVARAYA;Mc;0;L;;;;;N;;;;;” | |
868 | “0D83;SINHALA SIGN VISARGAYA;Mc;0;L;;;;;N;;;;;” | |
869 | According to DerivedCoreProperties.txt (7.0.0) these are | |
870 | “Alphabetic”.''' | |
871 | ], | |
872 | [[0x0DCA], | |
873 | [('combining', True), ('combining_level3', True), | |
874 | ('alpha', False), ('lower', False), ('upper', False), | |
875 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
876 | ''' | |
877 | “0DCA;SINHALA SIGN AL-LAKUNA;Mn;9;NSM;;;;;N;;;;;” | |
878 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
879 | “Alphabetic”.''' | |
880 | ], | |
881 | [[(0x0DCF, 0x0DD4), 0x0DD6, (0x0DD8, 0x0DDF), (0x0DF2, 0x0DF3)], | |
882 | [('combining', True), ('combining_level3', True), | |
883 | ('alpha', True), ('lower', False), ('upper', False), | |
884 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
885 | ''' | |
886 | “0DCF;SINHALA VOWEL SIGN AELA-PILLA;Mc;0;L;;;;;N;;;;;” | |
887 | “0DD0;SINHALA VOWEL SIGN KETTI AEDA-PILLA;Mc;0;L;;;;;N;;;;;” | |
888 | “0DD1;SINHALA VOWEL SIGN DIGA AEDA-PILLA;Mc;0;L;;;;;N;;;;;” | |
889 | “0DD2;SINHALA VOWEL SIGN KETTI IS-PILLA;Mn;0;NSM;;;;;N;;;;;” | |
890 | “0DD3;SINHALA VOWEL SIGN DIGA IS-PILLA;Mn;0;NSM;;;;;N;;;;;” | |
891 | “0DD4;SINHALA VOWEL SIGN KETTI PAA-PILLA;Mn;0;NSM;;;;;N;;;;;” | |
892 | “0DD6;SINHALA VOWEL SIGN DIGA PAA-PILLA;Mn;0;NSM;;;;;N;;;;;” | |
893 | “0DD8;SINHALA VOWEL SIGN GAETTA-PILLA;Mc;0;L;;;;;N;;;;;” | |
894 | “0DD9;SINHALA VOWEL SIGN KOMBUVA;Mc;0;L;;;;;N;;;;;” | |
895 | “0DDA;SINHALA VOWEL SIGN DIGA KOMBUVA;Mc;0;L;0DD9 0DCA;;;;N;;;;;” | |
896 | “0DDB;SINHALA VOWEL SIGN KOMBU DEKA;Mc;0;L;;;;;N;;;;;” | |
897 | “0DDC;SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA; | |
898 | Mc;0;L;0DD9 0DCF;;;;N;;;;;” | |
899 | “0DDD;SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA; | |
900 | Mc;0;L;0DDC 0DCA;;;;N;;;;;” | |
901 | “0DDE;SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA; | |
902 | Mc;0;L;0DD9 0DDF;;;;N;;;;;” | |
903 | “0DDF;SINHALA VOWEL SIGN GAYANUKITTA;Mc;0;L;;;;;N;;;;;” | |
904 | “0DF2;SINHALA VOWEL SIGN DIGA GAETTA-PILLA;Mc;0;L;;;;;N;;;;;” | |
905 | “0DF3;SINHALA VOWEL SIGN DIGA GAYANUKITTA;Mc;0;L;;;;;N;;;;;” | |
906 | According to DerivedCoreProperties.txt (7.0.0) these are | |
907 | “Alphabetic”.''' | |
908 | ], | |
909 | [[0x0DF4], | |
910 | [('combining', False), ('combining_level3', False), | |
911 | ('alpha', False), ('lower', False), ('upper', False), | |
912 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
913 | ''' | |
914 | “0DF4;SINHALA PUNCTUATION KUNDDALIYA;Po;0;L;;;;;N;;;;;” | |
915 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
916 | “Alphabetic”.''' | |
917 | ], | |
918 | [[(0xA789, 0xA78A)], | |
919 | [('combining', False), ('combining_level3', False), | |
920 | ('alpha', False), ('lower', False), ('upper', False), | |
921 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
922 | ''' | |
923 | “A789;MODIFIER LETTER COLON;Sk;0;L;;;;;N;;;;;” | |
924 | “A78A;MODIFIER LETTER SHORT EQUALS SIGN;Sk;0;L;;;;;N;;;;;” | |
925 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
926 | “Alphabetic”.''' | |
927 | ], | |
928 | [[(0xA926, 0xA92A)], | |
929 | [('combining', True), ('combining_level3', True), | |
930 | ('alpha', True), ('lower', False), ('upper', False), | |
931 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
932 | ''' | |
933 | “A926;KAYAH LI VOWEL UE;Mn;0;NSM;;;;;N;;;;;” | |
934 | “A927;KAYAH LI VOWEL E;Mn;0;NSM;;;;;N;;;;;” | |
935 | “A928;KAYAH LI VOWEL U;Mn;0;NSM;;;;;N;;;;;” | |
936 | “A929;KAYAH LI VOWEL EE;Mn;0;NSM;;;;;N;;;;;” | |
937 | “A92A;KAYAH LI VOWEL O;Mn;0;NSM;;;;;N;;;;;” | |
938 | According to DerivedCoreProperties.txt (7.0.0) these are | |
939 | “Alphabetic”.''' | |
940 | ], | |
941 | [[(0xA92B, 0xA92D)], | |
942 | [('combining', True), ('combining_level3', False), | |
943 | ('alpha', False), ('lower', False), ('upper', False), | |
944 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
945 | ''' | |
946 | “A92B;KAYAH LI TONE PLOPHU;Mn;220;NSM;;;;;N;;;;;” | |
947 | “A92C;KAYAH LI TONE CALYA;Mn;220;NSM;;;;;N;;;;;” | |
948 | “A92D;KAYAH LI TONE CALYA PLOPHU;Mn;220;NSM;;;;;N;;;;;” | |
949 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
950 | “Alphabetic”.''' | |
951 | ] | |
952 | ] |