]>
Commit | Line | Data |
---|---|---|
4a4839c9 | 1 | # -*- coding: utf-8 -*- |
688903eb | 2 | # Copyright (C) 2014-2018 Free Software Foundation, Inc. |
4a4839c9 AO |
3 | # This file is part of the GNU C Library. |
4 | # | |
5 | # The GNU C Library is free software; you can redistribute it and/or | |
6 | # modify it under the terms of the GNU Lesser General Public | |
7 | # License as published by the Free Software Foundation; either | |
8 | # version 2.1 of the License, or (at your option) any later version. | |
9 | # | |
10 | # The GNU C Library is distributed in the hope that it will be useful, | |
11 | # but WITHOUT ANY WARRANTY; without even the implied warranty of | |
12 | # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
13 | # Lesser General Public License for more details. | |
14 | # | |
15 | # You should have received a copy of the GNU Lesser General Public | |
16 | # License along with the GNU C Library; if not, see | |
17 | # <http://www.gnu.org/licenses/>. | |
18 | ||
19 | ''' | |
20 | This file contains a list of test cases used by | |
21 | the ctype_compatibility.py script. | |
22 | ''' | |
23 | ||
24 | TEST_CASES = [ | |
25 | [[0x0E2F, 0x0E46], [('alpha', True), ('punct', False)], | |
26 | '''Theppitak Karoonboonyanan <thep@links.nectec.or.th> says | |
27 | <U0E2F>, <U0E46> should belong to punct. DerivedCoreProperties.txt | |
28 | says it is alpha. We trust DerivedCoreProperties.txt.''' | |
29 | ], | |
30 | [[0x0E31, (0x0E34, 0x0E3A)], [('alpha', True)], | |
31 | '''gen-unicode-ctype.c: Theppitak Karoonboonyanan | |
32 | <thep@links.nectec.or.th> says <U0E31>, <U0E34>..<U0E3A> | |
33 | are alpha. DerivedCoreProperties.txt agrees.''' | |
34 | ], | |
35 | [[(0x0E47, 0x0E4C), 0x0E4E], [('alpha', False)], | |
36 | '''gen-unicode-ctype.c: Theppitak Karoonboonyanan | |
37 | <thep@links.nectec.or.th> says <U0E47>..<U0E4E> are | |
38 | is_alpha. DerivedCoreProperties says *only* <U0E4D> | |
39 | in that range is alphabetic, the others are *not*. We | |
40 | trust DerivedCoreProperties.txt.''' | |
41 | ], | |
42 | [[0x0E4D], [('alpha', True)], | |
43 | '''gen-unicode-ctype.c: Theppitak Karoonboonyanan | |
44 | <thep@links.nectec.or.th> says <U0E47>..<U0E4E> are | |
45 | is_alpha. DerivedCoreProperties says *only* <U0E4D> | |
46 | in that range is alphabetic, the others are *not*. We | |
47 | trust DerivedCoreProperties.txt. | |
48 | ''' | |
49 | ], | |
50 | [[0x0345], [('alpha', True), ('lower', True)], | |
51 | '''COMBINING GREEK YPOGEGRAMMENI | |
52 | According to DerivedCoreProperties.txt, this is “Alphabetic” | |
53 | and “Lowercase”.''' | |
54 | ], | |
55 | [[(0x2160, 0x2188)], [('alpha', True)], | |
56 | '''Roman Numerals are “Alphabetic” according to | |
57 | DerivedCoreProperties.txt''' | |
58 | ], | |
59 | [[(0x24B6, 0x24E9)], [('alpha', True)], | |
60 | '''Circled Latin letters are “Alphabetic” according to | |
61 | DerivedCoreProperties.txt''' | |
62 | ], | |
63 | [[0x661], [('alpha', True), ('digit', False)], | |
64 | '''gen-unicode-ctype.c: All non-ASCII digits should be alphabetic. | |
65 | ISO C 99 forbids us to have them in category "digit", but we | |
66 | want iswalnum to return true on them. Don’t forget to | |
67 | have a look at all the other digits, 0x661 is just one | |
68 | example tested here.''' | |
69 | ], | |
70 | [[(0x0030, 0x0039)], [('digit', True)], | |
71 | '''gen-unicode-ctype.c: All ASCII digits should be digits.''' | |
72 | ], | |
73 | [[0x0009], [('blank', True)], | |
74 | '''gen-unicode-ctype.c: CHARACTER TABULATION''' | |
75 | ], | |
76 | [[0x2007], [('blank', False), ('space', False)], | |
77 | '''gen-unicode-ctype.c: FIGURE SPACE, because it has <noBreak> | |
78 | in the description.''' | |
79 | ], | |
80 | [[0x0009, 0x000A, 0x000B, 0x000C, 0x000D], [('space', True)], | |
81 | '''gen-unicode-ctype.c: CHARACTER TABULATION, LINE FEED (LF), LINE | |
82 | TABULATION, FORM FEED (FF), CARRIAGE RETURN (CR)''' | |
83 | ], | |
84 | [[0x2028, 0x2029], [('cntrl', True)], | |
85 | '''gen-unicode-ctype.c: LINE SEPARATOR and PARAGRAPH SEPARATOR | |
86 | should be cntrl.''' | |
87 | ], | |
88 | [[(0x0030, 0x0039), (0x0041, 0x0046), (0x0061, 0x0066)], | |
89 | [('xdigit', True)], | |
90 | '''gen-unicode-ctype.c: ISO C 99 says (6.4.4.1): hexadecimal-digit: | |
91 | one of 0 1 2 3 4 5 6 7 8 9 a b c d e f A B C D E F (nothing else | |
92 | should be considered as a hexadecimal-digit)''' | |
93 | ], | |
94 | [[0x0330], [('combining', True), ('combining_level3', False)], | |
95 | '''gen-unicode-ctype.c: COMBINING TILDE BELOW, canonical combining | |
96 | class value >= 200, should be in combining but not in | |
97 | combining_level3''' | |
98 | ], | |
99 | [[0x0250, 0x0251, 0x0271], [('lower', True)], | |
100 | '''Should be lower in Unicode 7.0.0 (was not lower in | |
101 | Unicode 5.0.0). | |
102 | ''' | |
103 | ], | |
104 | [[0x2184], [('lower', True)], | |
105 | '''Should be lower both in Unicode 5.0.0 and 7.0.0''' | |
106 | ], | |
107 | [[0xA67F], [('punct', False), ('alpha', True)], | |
108 | '''0xa67f CYRILLIC PAYEROK. Not in Unicode 5.0.0. In Unicode | |
109 | 7.0.0. General category Lm (Letter | |
110 | modifier). DerivedCoreProperties.txt says it is | |
111 | “Alphabetic”. Apparently added manually to punct by mistake in | |
112 | glibc’s old LC_CTYPE.''' | |
113 | ], | |
114 | [[0xA60C], [('punct', False), ('alpha', True)], | |
115 | '''0xa60c VAI SYLLABLE LENGTHENER. Not in Unicode 5.0.0. | |
116 | In Unicode 7.0.0. General category Lm (Letter | |
117 | modifier). DerivedCoreProperties.txt says it is | |
118 | “Alphabetic”. Apparently added manually to punct by mistake in | |
119 | glibc’s old LC_CTYPE.''' | |
120 | ], | |
121 | [[0x2E2F], [('punct', False), ('alpha', True)], | |
122 | '''0x2E2F VERTICAL TILDE. Not in Unicode 5.0.0. In Unicode | |
123 | 7.0.0. General category Lm (Letter | |
124 | modifier). DerivedCoreProperties.txt says it is | |
125 | “Alphabetic”. Apparently added manually to punct by mistake in | |
126 | glibc’s old LC_CTYPE.''' | |
127 | ], | |
128 | [[(0x1090, 0x1099)], [('punct', False), ('alpha', True)], | |
129 | '''MYANMAR SHAN DIGIT ZERO - MYANMAR SHAN DIGIT NINE. | |
130 | These are digits, but because ISO C 99 forbids to | |
131 | put them into digit they should go into alpha.''' | |
132 | ], | |
133 | [[0x103F], [('punct', False), ('alpha', True)], | |
134 | '''0x103F MYANMAR LETTER GREAT SA. Not in Unicode 5.0.0. | |
135 | In Unicode 7.0.0. General category Lo | |
136 | (Other_Letter). DerivedCoreProperties.txt says it is | |
137 | “Alphabetic”. Apparently added manually to punct by | |
138 | mistake in glibc’s old LC_CTYPE.''' | |
139 | ], | |
140 | [[0x0374], [('punct', False), ('alpha', True)], | |
141 | '''0x0374 GREEK NUMERAL SIGN. Unicode 5.0.0: general category | |
142 | Sk. Unicode 7.0.0: General category Lm | |
143 | (Modifier_Letter). DerivedCoreProperties.txt says it is | |
144 | “Alphabetic”.''' | |
145 | ], | |
146 | [[0x02EC], [('punct', False), ('alpha', True)], | |
147 | '''0x02EC MODIFIER LETTER VOICING. Unicode 5.0.0: general category | |
148 | Sk. Unicode 7.0.0: General category Lm | |
149 | (Modifier_Letter). DerivedCoreProperties.txt says it is | |
150 | “Alphabetic”.''' | |
151 | ], | |
152 | [[0x180E], [('space', False), ('blank', False)], | |
153 | '''0x180e MONGOLIAN VOWEL SEPARATOR. Unicode 5.0.0: General | |
154 | category Zs (Space_Separator) Unicode 7.0.0: General category Cf | |
155 | (Format).''' | |
156 | ], | |
157 | [[0x1E9C, 0x1E9D, 0x1E9F], | |
158 | [('lower', True), ('upper', False), ('tolower', False), | |
159 | ('toupper', False), ('totitle', False)], | |
160 | '''ẜ 0x1e9c LATIN SMALL LETTER LONG S WITH DIAGONAL STROKE, | |
161 | ẝ 0x1e9d LATIN SMALL LETTER LONG S WITH HIGH STROKE, | |
162 | ẟ 0x1e9f LATIN SMALL LETTER DELTA. These are “Lowercase” | |
163 | according to DerivedCoreProperties.txt but no upper case versions | |
164 | exist.''' | |
165 | ], | |
166 | [[0x1E9E], | |
167 | [('lower', False), ('upper', True), ('tolower', True), | |
168 | ('toupper', False), ('totitle', False)], | |
169 | '''0x1E9E ẞ LATIN CAPITAL LETTER SHARP S This is “Uppercase” | |
170 | according to DerivedCoreProperties.txt and the lower case | |
171 | version is 0x00DF ß LATIN SMALL LETTER SHARP S.''' | |
172 | ], | |
173 | [[0x2188], | |
174 | [('alpha', True), ('lower', False), ('upper', False), | |
175 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
176 | '''0x2188 ROMAN NUMERAL ONE HUNDRED THOUSAND. This is “Alphabetic” | |
177 | according to DerivedCoreProperties.txt. In glibc’s old | |
178 | LC_CTYPE, it was in “lower”, which seems to be a | |
179 | mistake. It is not “Lowercase” in | |
180 | DerivedCoreProperties.txt and does not have case mappings | |
181 | in UnicodeData.txt either.''' | |
182 | ], | |
183 | [[0x2C71, 0x2C74, (0x2C77, 0x2C7A)], | |
184 | [('alpha', True), ('lower', True), ('upper', False), | |
185 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
186 | '''These are Latin small letters which were not in Unicode 5.0.0 | |
187 | but are in Unicode 7.0.0. According to | |
188 | DerivedCoreProperties.txt they are “Lowercase”. But no | |
189 | uppercase versions exist. They have apparently been added | |
190 | manually to glibc’s old LC_CTYPE.''' | |
191 | ], | |
192 | [[0xA730, 0xA731], | |
193 | [('alpha', True), ('lower', True), ('upper', False), | |
194 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
195 | '''These are Latin small “capital” letters which were not in | |
196 | Unicode 5.0.0 but are in Unicode 7.0.0. According to | |
197 | DerivedCoreProperties.txt they are “Lowercase”. But no | |
198 | uppercase versions exist. They have apparently been added | |
199 | manually to glibc’s old LC_CTYPE.''' | |
200 | ], | |
201 | [[(0xA771, 0xA778)], | |
202 | [('alpha', True), ('lower', True), ('upper', False), | |
203 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
204 | '''These are Latin small (or small “capital”) letters which | |
205 | were not in Unicode 5.0.0 but are in Unicode 7.0.0. According to | |
206 | DerivedCoreProperties.txt they are “Lowercase”. But no | |
207 | uppercase versions exist. They have apparently been added | |
208 | manually to glibc’s old LC_CTYPE.''' | |
209 | ], | |
210 | [[0x0375], | |
211 | [('combining', False), ('combining_level3', False), | |
212 | ('alpha', False), ('lower', False), ('upper', False), | |
213 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
214 | '''“0375;GREEK LOWER NUMERAL SIGN;Sk;0;ON;;;;;N;;;;;”. Has | |
215 | apparently been added manually to glibc’s old LC_CTYPE as | |
216 | “combining_level3”. That seems wrong, it is no combining | |
217 | character because it does not have one of the general | |
218 | categories Mn, Mc, or Me. According to | |
219 | DerivedCoreProperties.txt it is not “Alphabetic”.''' | |
220 | ], | |
221 | [[0x108D], | |
222 | [('combining', True), ('combining_level3', False), | |
223 | ('alpha', False), ('lower', False), ('upper', False), | |
224 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
225 | '''“108D;MYANMAR SIGN SHAN COUNCIL EMPHATIC | |
226 | TONE;Mn;220;NSM;;;;;N;;;;;”. Has apparently been added | |
227 | manually to glibc’s old LC_CTYPE as | |
228 | “combining_level3”. That seems wrong, although it is a | |
229 | combining character because it has the general category | |
230 | Mn, it is not “combining_level3” because the canonical | |
231 | combining class value is 220 which is >= 200. According to | |
232 | gen-unicode-ctype.c, “combining_level3” needs a | |
233 | canonical combining class value < 200. According to | |
234 | DerivedCoreProperties.txt it is not “Alphabetic”.''' | |
235 | ], | |
236 | [[0x06DE], | |
237 | [('combining', False), ('combining_level3', False), | |
238 | ('alpha', False), ('lower', False), ('upper', False), | |
239 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
240 | ''' UnicodeData.txt 5.0.0: “06DE;ARABIC START OF RUB EL | |
241 | HIZB;Me;0;NSM;;;;;N;;;;;”; UnicodeData.txt 7.0.0: | |
242 | “06DE;ARABIC START OF RUB EL | |
243 | HIZB;So;0;ON;;;;;N;;;;;”. I.e. this used to be a | |
244 | combining character in Unicode 5.0.0 but not anymore in | |
245 | 7.0.0. According to DerivedCoreProperties.txt it is not | |
246 | “Alphabetic”.''' | |
247 | ], | |
248 | [[0x0BD0], | |
249 | [('combining', False), ('combining_level3', False), | |
250 | ('alpha', True), ('lower', False), ('upper', False), | |
251 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
252 | '''Not in UnicodeData.txt 5.0.0. UnicodeData.txt 7.0.0: | |
253 | “0BD0;TAMIL OM;Lo;0;L;;;;;N;;;;;”. Apparently manually added to | |
254 | “combining” and “combining_level3” in glibc’s old | |
255 | LC_CTYPE. That seems wrong. According to | |
256 | DerivedCoreProperties.txt it is “Alphabetic”.''' | |
257 | ], | |
258 | [[0x103F], | |
259 | [('combining', False), ('combining_level3', False), | |
260 | ('alpha', True), ('lower', False), ('upper', False), | |
261 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
262 | '''Not in UnicodeData.txt 5.0.0. UnicodeData.txt 7.0.0: | |
263 | “103F;MYANMAR LETTER GREAT SA;Lo;0;L;;;;;N;;;;;”. | |
264 | Apparently manually added to “combining” and | |
265 | “combining_level3” in glibc’s old LC_CTYPE. That seems | |
266 | wrong. According to DerivedCoreProperties.txt it is | |
267 | “Alphabetic”.''' | |
268 | ], | |
269 | [[(0x0901, 0x0903)], | |
270 | [('combining', True), ('combining_level3', True), | |
271 | ('alpha', True), ('lower', False), ('upper', False), | |
272 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
273 | '''These have general category “Mn” or “Mc” i.e. these are combining | |
274 | characters (both in UnicodeData.txt 5.0.0 and 7.0.0): | |
275 | “0901;DEVANAGARI SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;”, | |
276 | “0902;DEVANAGARI SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;”, | |
277 | “0903;DEVANAGARI SIGN VISARGA;Mc;0;L;;;;;N;;;;;”. | |
278 | According to DerivedCoreProperties.txt (7.0.0) these are | |
279 | “Alphabetic”.''' | |
280 | ], | |
281 | [[0x093C], | |
282 | [('combining', True), ('combining_level3', True), | |
283 | ('alpha', False), ('lower', False), ('upper', False), | |
284 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
285 | '''UnicodeData.txt (5.0.0 and 7.0.0): “093C;DEVANAGARI SIGN | |
286 | NUKTA;Mn;7;NSM;;;;;N;;;;;” According to | |
287 | DerivedCoreProperties.txt (7.0.0) this is *not* | |
288 | “Alphabetic”. glibc’s old LC_CTYPE has this in “alpha”.''' | |
289 | ], | |
290 | [[(0x093E, 0x093F)], | |
291 | [('combining', True), ('combining_level3', True), | |
292 | ('alpha', True), ('lower', False), ('upper', False), | |
293 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
294 | '''These have general category “Mc” i.e. these are combining | |
295 | characters (both in UnicodeData.txt 5.0.0 and 7.0.0): | |
296 | “093E;DEVANAGARI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
297 | “093F;DEVANAGARI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
298 | According to DerivedCoreProperties.txt (7.0.0) these are | |
299 | “Alphabetic”.''' | |
300 | ], | |
301 | [[(0x0940, 0x094C)], | |
302 | [('combining', True), ('combining_level3', True), | |
303 | ('alpha', True), ('lower', False), ('upper', False), | |
304 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
305 | '''These are all combining | |
306 | characters (“Mc” or “Mn” both in UnicodeData.txt 5.0.0 and 7.0.0). | |
307 | According to DerivedCoreProperties.txt (7.0.0) these are | |
308 | “Alphabetic”.''' | |
309 | ], | |
310 | [[0x094D], | |
311 | [('combining', True), ('combining_level3', True), | |
312 | ('alpha', False), ('lower', False), ('upper', False), | |
313 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
314 | '''Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
315 | “094D;DEVANAGARI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
316 | According to DerivedCoreProperties.txt (7.0.0) it is *not* | |
317 | “Alphabetic”.''' | |
318 | ], | |
319 | [[(0x0951, 0x0954)], | |
320 | [('combining', True), ('combining_level3', False), | |
321 | ('alpha', False), ('lower', False), ('upper', False), | |
322 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
323 | '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
324 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
325 | “Alphabetic”.''' | |
326 | ], | |
327 | [[(0x0962, 0x0963), (0x0981, 0x0983)], | |
328 | [('combining', True), ('combining_level3', True), | |
329 | ('alpha', True), ('lower', False), ('upper', False), | |
330 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
331 | '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
332 | According to DerivedCoreProperties.txt (7.0.0) these are | |
333 | “Alphabetic”.''' | |
334 | ], | |
335 | [[0x09BC], | |
336 | [('combining', True), ('combining_level3', True), | |
337 | ('alpha', False), ('lower', False), ('upper', False), | |
338 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
339 | ''' | |
340 | “09BC;BENGALI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;” | |
341 | Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
342 | According to DerivedCoreProperties.txt (7.0.0) it is *not* | |
343 | “Alphabetic”.''' | |
344 | ], | |
345 | [[(0x09BE, 0x09BF), (0x09C0, 0x09C4), (0x09C7, 0x09C8), | |
346 | (0x09CB, 0x09CC)], | |
347 | [('combining', True), ('combining_level3', True), | |
348 | ('alpha', True), ('lower', False), ('upper', False), | |
349 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
350 | ''' | |
351 | “09BE;BENGALI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
352 | “09BF;BENGALI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
353 | “09C0;BENGALI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;” | |
354 | “09C1;BENGALI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;” | |
355 | “09C2;BENGALI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;” | |
356 | “09C3;BENGALI VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;” | |
357 | “09C4;BENGALI VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;” | |
358 | “09C7;BENGALI VOWEL SIGN E;Mc;0;L;;;;;N;;;;;” | |
359 | “09C8;BENGALI VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;” | |
360 | “09CB;BENGALI VOWEL SIGN O;Mc;0;L;09C7 09BE;;;;N;;;;;” | |
361 | “09CC;BENGALI VOWEL SIGN AU;Mc;0;L;09C7 09D7;;;;N;;;;;” | |
362 | Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
363 | According to DerivedCoreProperties.txt (7.0.0) these are | |
364 | “Alphabetic”.''' | |
365 | ], | |
366 | [[0x09CD], | |
367 | [('combining', True), ('combining_level3', True), | |
368 | ('alpha', False), ('lower', False), ('upper', False), | |
369 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
370 | ''' | |
371 | “09CD;BENGALI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
372 | Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
373 | According to DerivedCoreProperties.txt (7.0.0) it is *not* | |
374 | “Alphabetic”.''' | |
375 | ], | |
376 | [[0x09D7, (0x09E2, 0x09E3)], | |
377 | [('combining', True), ('combining_level3', True), | |
378 | ('alpha', True), ('lower', False), ('upper', False), | |
379 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
380 | '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0. | |
381 | According to DerivedCoreProperties.txt (7.0.0) these are | |
382 | “Alphabetic”.''' | |
383 | ], | |
384 | [[0x09F2, 0x09F3], | |
385 | [('combining', False), ('combining_level3', False), | |
386 | ('alpha', False), ('lower', False), ('upper', False), | |
387 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
388 | ''' | |
389 | “09F2;BENGALI RUPEE MARK;Sc;0;ET;;;;;N;;;;;” | |
390 | “09F3;BENGALI RUPEE SIGN;Sc;0;ET;;;;;N;;;;;” | |
391 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
392 | “Alphabetic”.''' | |
393 | ], | |
394 | [[(0x09F4, 0x09FA)], | |
395 | [('combining', False), ('combining_level3', False), | |
396 | ('alpha', False), ('lower', False), ('upper', False), | |
397 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
398 | ''' | |
399 | “09F4;BENGALI CURRENCY NUMERATOR ONE;No;0;L;;;;1/16;N;;;;;” | |
400 | “09F5;BENGALI CURRENCY NUMERATOR TWO;No;0;L;;;;1/8;N;;;;;” | |
401 | “09F6;BENGALI CURRENCY NUMERATOR THREE;No;0;L;;;;3/16;N;;;;;” | |
402 | “09F7;BENGALI CURRENCY NUMERATOR FOUR;No;0;L;;;;1/4;N;;;;;” | |
403 | “09F8;BENGALI CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR; | |
404 | No;0;L;;;;3/4;N;;;;;” | |
405 | “09F9;BENGALI CURRENCY DENOMINATOR SIXTEEN;No;0;L;;;;16;N;;;;;” | |
406 | “09FA;BENGALI ISSHAR;So;0;L;;;;;N;;;;;” | |
407 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
408 | “Alphabetic”.''' | |
409 | ], | |
410 | [[(0x0A01, 0x0A03)], | |
411 | [('combining', True), ('combining_level3', True), | |
412 | ('alpha', True), ('lower', False), ('upper', False), | |
413 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
414 | ''' | |
415 | “0A01;GURMUKHI SIGN ADAK BINDI;Mn;0;NSM;;;;;N;;;;;” | |
416 | “0A02;GURMUKHI SIGN BINDI;Mn;0;NSM;;;;;N;;;;;” | |
417 | “0A03;GURMUKHI SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
418 | According to DerivedCoreProperties.txt (7.0.0) these are | |
419 | “Alphabetic”.''' | |
420 | ], | |
421 | [[0x0A3C], | |
422 | [('combining', True), ('combining_level3', True), | |
423 | ('alpha', False), ('lower', False), ('upper', False), | |
424 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
425 | ''' | |
426 | “0A3C;GURMUKHI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;” | |
427 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
428 | “Alphabetic”.''' | |
429 | ], | |
430 | [[(0x0A3E, 0x0A40), (0x0A41, 0x0A42), (0x0A47, 0x0A48), | |
431 | (0x0A4B, 0x0A4C)], | |
432 | [('combining', True), ('combining_level3', True), | |
433 | ('alpha', True), ('lower', False), ('upper', False), | |
434 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
435 | ''' | |
436 | “0A3E;GURMUKHI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
437 | “0A3F;GURMUKHI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
438 | “0A40;GURMUKHI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;” | |
439 | “0A41;GURMUKHI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;” | |
440 | “0A42;GURMUKHI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;” | |
441 | “0A47;GURMUKHI VOWEL SIGN EE;Mn;0;NSM;;;;;N;;;;;” | |
442 | “0A48;GURMUKHI VOWEL SIGN AI;Mn;0;NSM;;;;;N;;;;;” | |
443 | “0A4B;GURMUKHI VOWEL SIGN OO;Mn;0;NSM;;;;;N;;;;;” | |
444 | “0A4C;GURMUKHI VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;” | |
445 | According to DerivedCoreProperties.txt (7.0.0) these are | |
446 | “Alphabetic”.''' | |
447 | ], | |
448 | [[0x0A4D], | |
449 | [('combining', True), ('combining_level3', True), | |
450 | ('alpha', False), ('lower', False), ('upper', False), | |
451 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
452 | ''' | |
453 | “0A4D;GURMUKHI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
454 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
455 | “Alphabetic”.''' | |
456 | ], | |
457 | [[0x0A51, (0x0A70, 0x0A71), 0x0A75, (0x0A81, 0x0A83)], | |
458 | [('combining', True), ('combining_level3', True), | |
459 | ('alpha', True), ('lower', False), ('upper', False), | |
460 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
461 | ''' | |
462 | “0A51;GURMUKHI SIGN UDAAT;Mn;0;NSM;;;;;N;;;;;” | |
463 | “0A70;GURMUKHI TIPPI;Mn;0;NSM;;;;;N;;;;;” | |
464 | “0A71;GURMUKHI ADDAK;Mn;0;NSM;;;;;N;;;;;” | |
465 | “0A75;GURMUKHI SIGN YAKASH;Mn;0;NSM;;;;;N;;;;;” | |
466 | “0A81;GUJARATI SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;” | |
467 | “0A82;GUJARATI SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;” | |
468 | “0A83;GUJARATI SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
469 | According to DerivedCoreProperties.txt (7.0.0) these are | |
470 | “Alphabetic”.''' | |
471 | ], | |
472 | [[0x0ABC], | |
473 | [('combining', True), ('combining_level3', True), | |
474 | ('alpha', False), ('lower', False), ('upper', False), | |
475 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
476 | ''' | |
477 | “0ABC;GUJARATI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;” | |
478 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
479 | “Alphabetic”.''' | |
480 | ], | |
481 | [[(0x0ABE, 0x0AC5), (0x0AC7, 0x0AC9), (0x0ACB, 0x0ACC)], | |
482 | [('combining', True), ('combining_level3', True), | |
483 | ('alpha', True), ('lower', False), ('upper', False), | |
484 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
485 | ''' | |
486 | “0ABE;GUJARATI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
487 | “0ABF;GUJARATI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
488 | “0AC0;GUJARATI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;” | |
489 | “0AC1;GUJARATI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;” | |
490 | “0AC2;GUJARATI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;” | |
491 | “0AC3;GUJARATI VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;” | |
492 | “0AC4;GUJARATI VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;” | |
493 | “0AC5;GUJARATI VOWEL SIGN CANDRA E;Mn;0;NSM;;;;;N;;;;;” | |
494 | “0AC7;GUJARATI VOWEL SIGN E;Mn;0;NSM;;;;;N;;;;;” | |
495 | “0AC8;GUJARATI VOWEL SIGN AI;Mn;0;NSM;;;;;N;;;;;” | |
496 | “0AC9;GUJARATI VOWEL SIGN CANDRA O;Mc;0;L;;;;;N;;;;;” | |
497 | “0ACB;GUJARATI VOWEL SIGN O;Mc;0;L;;;;;N;;;;;” | |
498 | “0ACC;GUJARATI VOWEL SIGN AU;Mc;0;L;;;;;N;;;;;” | |
499 | According to DerivedCoreProperties.txt (7.0.0) these are | |
500 | “Alphabetic”.''' | |
501 | ], | |
502 | [[0x0ACD], | |
503 | [('combining', True), ('combining_level3', True), | |
504 | ('alpha', False), ('lower', False), ('upper', False), | |
505 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
506 | ''' | |
507 | “0ACD;GUJARATI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
508 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
509 | “Alphabetic”.''' | |
510 | ], | |
511 | [[(0x0AE2, 0x0AE3)], | |
512 | [('combining', True), ('combining_level3', True), | |
513 | ('alpha', True), ('lower', False), ('upper', False), | |
514 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
515 | ''' | |
516 | “0AE2;GUJARATI VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;” | |
517 | “0AE3;GUJARATI VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;” | |
518 | According to DerivedCoreProperties.txt (7.0.0) these are | |
519 | “Alphabetic”.''' | |
520 | ], | |
521 | [[0x0AF1], | |
522 | [('combining', False), ('combining_level3', False), | |
523 | ('alpha', False), ('lower', False), ('upper', False), | |
524 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
525 | ''' | |
526 | “0AF1;GUJARATI RUPEE SIGN;Sc;0;ET;;;;;N;;;;;” | |
527 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
528 | “Alphabetic”.''' | |
529 | ], | |
530 | [[(0x0B01, 0x0B03)], | |
531 | [('combining', True), ('combining_level3', True), | |
532 | ('alpha', True), ('lower', False), ('upper', False), | |
533 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
534 | ''' | |
535 | “0B01;ORIYA SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;” | |
536 | “0B02;ORIYA SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;” | |
537 | “0B03;ORIYA SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
538 | According to DerivedCoreProperties.txt (7.0.0) these are | |
539 | “Alphabetic”.''' | |
540 | ], | |
541 | [[0x0B3C], | |
542 | [('combining', True), ('combining_level3', True), | |
543 | ('alpha', False), ('lower', False), ('upper', False), | |
544 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
545 | ''' | |
546 | “0B3C;ORIYA SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;” | |
547 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
548 | “Alphabetic”.''' | |
549 | ], | |
550 | [[(0x0B3E, 0x0B44), (0x0B47, 0x0B48), (0x0B4B, 0x0B4C)], | |
551 | [('combining', True), ('combining_level3', True), | |
552 | ('alpha', True), ('lower', False), ('upper', False), | |
553 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
554 | ''' | |
555 | “0B3E;ORIYA VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
556 | “0B3F;ORIYA VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;;” | |
557 | “0B40;ORIYA VOWEL SIGN II;Mc;0;L;;;;;N;;;;;” | |
558 | “0B41;ORIYA VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;” | |
559 | “0B42;ORIYA VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;” | |
560 | “0B43;ORIYA VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;” | |
561 | “0B44;ORIYA VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;” | |
562 | “0B47;ORIYA VOWEL SIGN E;Mc;0;L;;;;;N;;;;;” | |
563 | “0B48;ORIYA VOWEL SIGN AI;Mc;0;L;0B47 0B56;;;;N;;;;;” | |
564 | “0B4B;ORIYA VOWEL SIGN O;Mc;0;L;0B47 0B3E;;;;N;;;;;” | |
565 | “0B4C;ORIYA VOWEL SIGN AU;Mc;0;L;0B47 0B57;;;;N;;;;;” | |
566 | According to DerivedCoreProperties.txt (7.0.0) these are | |
567 | “Alphabetic”.''' | |
568 | ], | |
569 | [[0x0B4D], | |
570 | [('combining', True), ('combining_level3', True), | |
571 | ('alpha', False), ('lower', False), ('upper', False), | |
572 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
573 | ''' | |
574 | “0B4D;ORIYA SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
575 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
576 | “Alphabetic”.''' | |
577 | ], | |
578 | [[(0x0B56, 0x0B57), (0x0B62, 0x0B63)], | |
579 | [('combining', True), ('combining_level3', True), | |
580 | ('alpha', True), ('lower', False), ('upper', False), | |
581 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
582 | ''' | |
583 | “0B56;ORIYA AI LENGTH MARK;Mn;0;NSM;;;;;N;;;;;” | |
584 | “0B57;ORIYA AU LENGTH MARK;Mc;0;L;;;;;N;;;;;” | |
585 | “0B62;ORIYA VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;” | |
586 | “0B63;ORIYA VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;” | |
587 | According to DerivedCoreProperties.txt (7.0.0) these are | |
588 | “Alphabetic”.''' | |
589 | ], | |
590 | [[0x0B70], | |
591 | [('combining', False), ('combining_level3', False), | |
592 | ('alpha', False), ('lower', False), ('upper', False), | |
593 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
594 | ''' | |
595 | “0B70;ORIYA ISSHAR;So;0;L;;;;;N;;;;;” | |
596 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
597 | “Alphabetic”.''' | |
598 | ], | |
599 | [[0x0B82], | |
600 | [('combining', True), ('combining_level3', True), | |
601 | ('alpha', True), ('lower', False), ('upper', False), | |
602 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
603 | ''' | |
604 | “0B82;TAMIL SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;” | |
605 | According to DerivedCoreProperties.txt (7.0.0) this is | |
606 | “Alphabetic”.''' | |
607 | ], | |
608 | [[(0x0BBE, 0x0BC2), (0x0BC6, 0x0BC8), (0x0BCA, 0x0BCC)], | |
609 | [('combining', True), ('combining_level3', True), | |
610 | ('alpha', True), ('lower', False), ('upper', False), | |
611 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
612 | ''' | |
613 | “0BBE;TAMIL VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
614 | “0BBF;TAMIL VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
615 | “0BC0;TAMIL VOWEL SIGN II;Mn;0;NSM;;;;;N;;;;;” | |
616 | “0BC1;TAMIL VOWEL SIGN U;Mc;0;L;;;;;N;;;;;” | |
617 | “0BC2;TAMIL VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;” | |
618 | “0BC6;TAMIL VOWEL SIGN E;Mc;0;L;;;;;N;;;;;” | |
619 | “0BC7;TAMIL VOWEL SIGN EE;Mc;0;L;;;;;N;;;;;” | |
620 | “0BC8;TAMIL VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;” | |
621 | “0BCA;TAMIL VOWEL SIGN O;Mc;0;L;0BC6 0BBE;;;;N;;;;;” | |
622 | “0BCB;TAMIL VOWEL SIGN OO;Mc;0;L;0BC7 0BBE;;;;N;;;;;” | |
623 | “0BCC;TAMIL VOWEL SIGN AU;Mc;0;L;0BC6 0BD7;;;;N;;;;;” | |
624 | According to DerivedCoreProperties.txt (7.0.0) these are | |
625 | “Alphabetic”.''' | |
626 | ], | |
627 | [[0x0BCD], | |
628 | [('combining', True), ('combining_level3', True), | |
629 | ('alpha', False), ('lower', False), ('upper', False), | |
630 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
631 | ''' | |
632 | “0BCD;TAMIL SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
633 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
634 | “Alphabetic”.''' | |
635 | ], | |
636 | [[0x0BD7], | |
637 | [('combining', True), ('combining_level3', True), | |
638 | ('alpha', True), ('lower', False), ('upper', False), | |
639 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
640 | ''' | |
641 | “0BD7;TAMIL AU LENGTH MARK;Mc;0;L;;;;;N;;;;;” | |
642 | According to DerivedCoreProperties.txt (7.0.0) this is | |
643 | “Alphabetic”.''' | |
644 | ], | |
645 | [[(0x0BF0, 0x0BFA)], | |
646 | [('combining', False), ('combining_level3', False), | |
647 | ('alpha', False), ('lower', False), ('upper', False), | |
648 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
649 | ''' | |
650 | “0BF0;TAMIL NUMBER TEN;No;0;L;;;;10;N;;;;;” | |
651 | “0BF1;TAMIL NUMBER ONE HUNDRED;No;0;L;;;;100;N;;;;;” | |
652 | “0BF2;TAMIL NUMBER ONE THOUSAND;No;0;L;;;;1000;N;;;;;” | |
653 | “0BF3;TAMIL DAY SIGN;So;0;ON;;;;;N;;;;;” | |
654 | “0BF4;TAMIL MONTH SIGN;So;0;ON;;;;;N;;;;;” | |
655 | “0BF5;TAMIL YEAR SIGN;So;0;ON;;;;;N;;;;;” | |
656 | “0BF6;TAMIL DEBIT SIGN;So;0;ON;;;;;N;;;;;” | |
657 | “0BF7;TAMIL CREDIT SIGN;So;0;ON;;;;;N;;;;;” | |
658 | “0BF8;TAMIL AS ABOVE SIGN;So;0;ON;;;;;N;;;;;” | |
659 | “0BF9;TAMIL RUPEE SIGN;Sc;0;ET;;;;;N;;;;;” | |
660 | “0BFA;TAMIL NUMBER SIGN;So;0;ON;;;;;N;;;;;” | |
661 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
662 | “Alphabetic”.''' | |
663 | ], | |
664 | [[(0x0C01, 0x0C03)], | |
665 | [('combining', True), ('combining_level3', True), | |
666 | ('alpha', True), ('lower', False), ('upper', False), | |
667 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
668 | ''' | |
669 | “0C01;TELUGU SIGN CANDRABINDU;Mc;0;L;;;;;N;;;;;” | |
670 | “0C02;TELUGU SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;” | |
671 | “0C03;TELUGU SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
672 | According to DerivedCoreProperties.txt (7.0.0) these are | |
673 | “Alphabetic”.''' | |
674 | ], | |
675 | [[(0x0C3E, 0x0C44), (0x0C46, 0x0C48), (0x0C4A, 0x0C4C)], | |
676 | [('combining', True), ('combining_level3', True), | |
677 | ('alpha', True), ('lower', False), ('upper', False), | |
678 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
679 | ''' | |
680 | “0C3E;TELUGU VOWEL SIGN AA;Mn;0;NSM;;;;;N;;;;;” | |
681 | “0C3F;TELUGU VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;;” | |
682 | “0C40;TELUGU VOWEL SIGN II;Mn;0;NSM;;;;;N;;;;;” | |
683 | “0C41;TELUGU VOWEL SIGN U;Mc;0;L;;;;;N;;;;;” | |
684 | “0C42;TELUGU VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;” | |
685 | “0C43;TELUGU VOWEL SIGN VOCALIC R;Mc;0;L;;;;;N;;;;;” | |
686 | “0C44;TELUGU VOWEL SIGN VOCALIC RR;Mc;0;L;;;;;N;;;;;” | |
687 | “0C46;TELUGU VOWEL SIGN E;Mn;0;NSM;;;;;N;;;;;” | |
688 | “0C47;TELUGU VOWEL SIGN EE;Mn;0;NSM;;;;;N;;;;;” | |
689 | “0C48;TELUGU VOWEL SIGN AI;Mn;0;NSM;0C46 0C56;;;;N;;;;;” | |
690 | “0C4A;TELUGU VOWEL SIGN O;Mn;0;NSM;;;;;N;;;;;” | |
691 | “0C4B;TELUGU VOWEL SIGN OO;Mn;0;NSM;;;;;N;;;;;” | |
692 | “0C4C;TELUGU VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;” | |
693 | According to DerivedCoreProperties.txt (7.0.0) these are | |
694 | “Alphabetic”.''' | |
695 | ], | |
696 | [[0x0C4D], | |
697 | [('combining', True), ('combining_level3', True), | |
698 | ('alpha', False), ('lower', False), ('upper', False), | |
699 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
700 | ''' | |
701 | “0C4D;TELUGU SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
702 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
703 | “Alphabetic”.''' | |
704 | ], | |
705 | [[(0x0C55, 0x0C56), (0x0C62, 0x0C63)], | |
706 | [('combining', True), ('combining_level3', True), | |
707 | ('alpha', True), ('lower', False), ('upper', False), | |
708 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
709 | ''' | |
710 | “0C55;TELUGU LENGTH MARK;Mn;84;NSM;;;;;N;;;;;” | |
711 | “0C56;TELUGU AI LENGTH MARK;Mn;91;NSM;;;;;N;;;;;” | |
712 | “0C62;TELUGU VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;” | |
713 | “0C63;TELUGU VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;” | |
714 | According to DerivedCoreProperties.txt (7.0.0) these are | |
715 | “Alphabetic”.''' | |
716 | ], | |
717 | [[(0x0C78, 0x0C7F)], | |
718 | [('combining', False), ('combining_level3', False), | |
719 | ('alpha', False), ('lower', False), ('upper', False), | |
720 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
721 | ''' | |
722 | “0C78;TELUGU FRACTION DIGIT ZERO FOR ODD POWERS OF FOUR; | |
723 | No;0;ON;;;;0;N;;;;;” | |
724 | “0C79;TELUGU FRACTION DIGIT ONE FOR ODD POWERS OF FOUR; | |
725 | No;0;ON;;;;1;N;;;;;” | |
726 | “0C7A;TELUGU FRACTION DIGIT TWO FOR ODD POWERS OF FOUR; | |
727 | No;0;ON;;;;2;N;;;;;” | |
728 | “0C7B;TELUGU FRACTION DIGIT THREE FOR ODD POWERS OF FOUR; | |
729 | No;0;ON;;;;3;N;;;;;” | |
730 | “0C7C;TELUGU FRACTION DIGIT ONE FOR EVEN POWERS OF FOUR; | |
731 | No;0;ON;;;;1;N;;;;;” | |
732 | “0C7D;TELUGU FRACTION DIGIT TWO FOR EVEN POWERS OF FOUR; | |
733 | No;0;ON;;;;2;N;;;;;” | |
734 | “0C7E;TELUGU FRACTION DIGIT THREE FOR EVEN POWERS OF FOUR; | |
735 | No;0;ON;;;;3;N;;;;;” | |
736 | “0C7F;TELUGU SIGN TUUMU;So;0;L;;;;;N;;;;;” | |
737 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
738 | “Alphabetic”.''' | |
739 | ], | |
740 | [[(0x0C82, 0x0C83)], | |
741 | [('combining', True), ('combining_level3', True), | |
742 | ('alpha', True), ('lower', False), ('upper', False), | |
743 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
744 | ''' | |
745 | “0C81;KANNADA SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;” | |
746 | “0C82;KANNADA SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;” | |
747 | “0C83;KANNADA SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
748 | According to DerivedCoreProperties.txt (7.0.0) these are | |
749 | “Alphabetic”.''' | |
750 | ], | |
751 | [[0x0CBC], | |
752 | [('combining', True), ('combining_level3', True), | |
753 | ('alpha', False), ('lower', False), ('upper', False), | |
754 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
755 | ''' | |
756 | “0CBC;KANNADA SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;” | |
757 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
758 | “Alphabetic”.''' | |
759 | ], | |
760 | [[(0x0CBE, 0x0CC4), (0x0CC6, 0x0CC8), (0x0CCA, 0x0CCC)], | |
761 | [('combining', True), ('combining_level3', True), | |
762 | ('alpha', True), ('lower', False), ('upper', False), | |
763 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
764 | ''' | |
765 | “0CBE;KANNADA VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
766 | “0CBF;KANNADA VOWEL SIGN I;Mn;0;L;;;;;N;;;;;” | |
767 | “0CC0;KANNADA VOWEL SIGN II;Mc;0;L;0CBF 0CD5;;;;N;;;;;” | |
768 | “0CC1;KANNADA VOWEL SIGN U;Mc;0;L;;;;;N;;;;;” | |
769 | “0CC2;KANNADA VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;” | |
770 | “0CC3;KANNADA VOWEL SIGN VOCALIC R;Mc;0;L;;;;;N;;;;;” | |
771 | “0CC4;KANNADA VOWEL SIGN VOCALIC RR;Mc;0;L;;;;;N;;;;;” | |
772 | “0CC6;KANNADA VOWEL SIGN E;Mn;0;L;;;;;N;;;;;” | |
773 | “0CC7;KANNADA VOWEL SIGN EE;Mc;0;L;0CC6 0CD5;;;;N;;;;;” | |
774 | “0CC8;KANNADA VOWEL SIGN AI;Mc;0;L;0CC6 0CD6;;;;N;;;;;” | |
775 | “0CCA;KANNADA VOWEL SIGN O;Mc;0;L;0CC6 0CC2;;;;N;;;;;” | |
776 | “0CCB;KANNADA VOWEL SIGN OO;Mc;0;L;0CCA 0CD5;;;;N;;;;;” | |
777 | “0CCC;KANNADA VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;” | |
778 | According to DerivedCoreProperties.txt (7.0.0) these are | |
779 | “Alphabetic”.''' | |
780 | ], | |
781 | [[0x0CCD], | |
782 | [('combining', True), ('combining_level3', True), | |
783 | ('alpha', False), ('lower', False), ('upper', False), | |
784 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
785 | ''' | |
786 | “0CCD;KANNADA SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
787 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
788 | “Alphabetic”.''' | |
789 | ], | |
790 | [[(0x0CD5, 0x0CD6), (0x0CE2, 0x0CE3)], | |
791 | [('combining', True), ('combining_level3', True), | |
792 | ('alpha', True), ('lower', False), ('upper', False), | |
793 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
794 | ''' | |
795 | “0CD5;KANNADA LENGTH MARK;Mc;0;L;;;;;N;;;;;” | |
796 | “0CD6;KANNADA AI LENGTH MARK;Mc;0;L;;;;;N;;;;;” | |
797 | “0CE2;KANNADA VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;” | |
798 | “0CE3;KANNADA VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;” | |
799 | According to DerivedCoreProperties.txt (7.0.0) these are | |
800 | “Alphabetic”.''' | |
801 | ], | |
802 | [[(0x0D02, 0x0D03), (0x0D3E, 0x0D44), (0x0D46, 0x0D48), | |
803 | (0x0D4A, 0x0D4C)], | |
804 | [('combining', True), ('combining_level3', True), | |
805 | ('alpha', True), ('lower', False), ('upper', False), | |
806 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
807 | ''' | |
808 | “0D02;MALAYALAM SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;” | |
809 | “0D03;MALAYALAM SIGN VISARGA;Mc;0;L;;;;;N;;;;;” | |
810 | “0D3E;MALAYALAM VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;” | |
811 | “0D3F;MALAYALAM VOWEL SIGN I;Mc;0;L;;;;;N;;;;;” | |
812 | “0D40;MALAYALAM VOWEL SIGN II;Mc;0;L;;;;;N;;;;;” | |
813 | “0D41;MALAYALAM VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;” | |
814 | “0D42;MALAYALAM VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;” | |
815 | “0D43;MALAYALAM VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;” | |
816 | “0D44;MALAYALAM VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;” | |
817 | “0D46;MALAYALAM VOWEL SIGN E;Mc;0;L;;;;;N;;;;;” | |
818 | “0D47;MALAYALAM VOWEL SIGN EE;Mc;0;L;;;;;N;;;;;” | |
819 | “0D48;MALAYALAM VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;” | |
820 | “0D4A;MALAYALAM VOWEL SIGN O;Mc;0;L;0D46 0D3E;;;;N;;;;;” | |
821 | “0D4B;MALAYALAM VOWEL SIGN OO;Mc;0;L;0D47 0D3E;;;;N;;;;;” | |
822 | “0D4C;MALAYALAM VOWEL SIGN AU;Mc;0;L;0D46 0D57;;;;N;;;;;” | |
823 | According to DerivedCoreProperties.txt (7.0.0) these are | |
824 | “Alphabetic”.''' | |
825 | ], | |
826 | [[0x0D4D], | |
827 | [('combining', True), ('combining_level3', True), | |
828 | ('alpha', False), ('lower', False), ('upper', False), | |
829 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
830 | ''' | |
831 | “0D4D;MALAYALAM SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;” | |
832 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
833 | “Alphabetic”.''' | |
834 | ], | |
835 | [[0x0D57, (0x0D62, 0x0D63)], | |
836 | [('combining', True), ('combining_level3', True), | |
837 | ('alpha', True), ('lower', False), ('upper', False), | |
838 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
839 | ''' | |
840 | “0D57;MALAYALAM AU LENGTH MARK;Mc;0;L;;;;;N;;;;;” | |
841 | “0D62;MALAYALAM VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;” | |
842 | “0D63;MALAYALAM VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;” | |
843 | According to DerivedCoreProperties.txt (7.0.0) these are | |
844 | “Alphabetic”.''' | |
845 | ], | |
846 | [[(0x0D70, 0x0D79)], | |
847 | [('combining', False), ('combining_level3', False), | |
848 | ('alpha', False), ('lower', False), ('upper', False), | |
849 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
850 | ''' | |
851 | “0D70;MALAYALAM NUMBER TEN;No;0;L;;;;10;N;;;;;” | |
852 | “0D71;MALAYALAM NUMBER ONE HUNDRED;No;0;L;;;;100;N;;;;;” | |
853 | “0D72;MALAYALAM NUMBER ONE THOUSAND;No;0;L;;;;1000;N;;;;;” | |
854 | “0D73;MALAYALAM FRACTION ONE QUARTER;No;0;L;;;;1/4;N;;;;;” | |
855 | “0D74;MALAYALAM FRACTION ONE HALF;No;0;L;;;;1/2;N;;;;;” | |
856 | “0D75;MALAYALAM FRACTION THREE QUARTERS;No;0;L;;;;3/4;N;;;;;” | |
857 | “0D79;MALAYALAM DATE MARK;So;0;L;;;;;N;;;;;” | |
858 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
859 | “Alphabetic”.''' | |
860 | ], | |
861 | [[(0x0D82, 0x0D83)], | |
862 | [('combining', True), ('combining_level3', True), | |
863 | ('alpha', True), ('lower', False), ('upper', False), | |
864 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
865 | ''' | |
866 | “0D82;SINHALA SIGN ANUSVARAYA;Mc;0;L;;;;;N;;;;;” | |
867 | “0D83;SINHALA SIGN VISARGAYA;Mc;0;L;;;;;N;;;;;” | |
868 | According to DerivedCoreProperties.txt (7.0.0) these are | |
869 | “Alphabetic”.''' | |
870 | ], | |
871 | [[0x0DCA], | |
872 | [('combining', True), ('combining_level3', True), | |
873 | ('alpha', False), ('lower', False), ('upper', False), | |
874 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
875 | ''' | |
876 | “0DCA;SINHALA SIGN AL-LAKUNA;Mn;9;NSM;;;;;N;;;;;” | |
877 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
878 | “Alphabetic”.''' | |
879 | ], | |
880 | [[(0x0DCF, 0x0DD4), 0x0DD6, (0x0DD8, 0x0DDF), (0x0DF2, 0x0DF3)], | |
881 | [('combining', True), ('combining_level3', True), | |
882 | ('alpha', True), ('lower', False), ('upper', False), | |
883 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
884 | ''' | |
885 | “0DCF;SINHALA VOWEL SIGN AELA-PILLA;Mc;0;L;;;;;N;;;;;” | |
886 | “0DD0;SINHALA VOWEL SIGN KETTI AEDA-PILLA;Mc;0;L;;;;;N;;;;;” | |
887 | “0DD1;SINHALA VOWEL SIGN DIGA AEDA-PILLA;Mc;0;L;;;;;N;;;;;” | |
888 | “0DD2;SINHALA VOWEL SIGN KETTI IS-PILLA;Mn;0;NSM;;;;;N;;;;;” | |
889 | “0DD3;SINHALA VOWEL SIGN DIGA IS-PILLA;Mn;0;NSM;;;;;N;;;;;” | |
890 | “0DD4;SINHALA VOWEL SIGN KETTI PAA-PILLA;Mn;0;NSM;;;;;N;;;;;” | |
891 | “0DD6;SINHALA VOWEL SIGN DIGA PAA-PILLA;Mn;0;NSM;;;;;N;;;;;” | |
892 | “0DD8;SINHALA VOWEL SIGN GAETTA-PILLA;Mc;0;L;;;;;N;;;;;” | |
893 | “0DD9;SINHALA VOWEL SIGN KOMBUVA;Mc;0;L;;;;;N;;;;;” | |
894 | “0DDA;SINHALA VOWEL SIGN DIGA KOMBUVA;Mc;0;L;0DD9 0DCA;;;;N;;;;;” | |
895 | “0DDB;SINHALA VOWEL SIGN KOMBU DEKA;Mc;0;L;;;;;N;;;;;” | |
896 | “0DDC;SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA; | |
897 | Mc;0;L;0DD9 0DCF;;;;N;;;;;” | |
898 | “0DDD;SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA; | |
899 | Mc;0;L;0DDC 0DCA;;;;N;;;;;” | |
900 | “0DDE;SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA; | |
901 | Mc;0;L;0DD9 0DDF;;;;N;;;;;” | |
902 | “0DDF;SINHALA VOWEL SIGN GAYANUKITTA;Mc;0;L;;;;;N;;;;;” | |
903 | “0DF2;SINHALA VOWEL SIGN DIGA GAETTA-PILLA;Mc;0;L;;;;;N;;;;;” | |
904 | “0DF3;SINHALA VOWEL SIGN DIGA GAYANUKITTA;Mc;0;L;;;;;N;;;;;” | |
905 | According to DerivedCoreProperties.txt (7.0.0) these are | |
906 | “Alphabetic”.''' | |
907 | ], | |
908 | [[0x0DF4], | |
909 | [('combining', False), ('combining_level3', False), | |
910 | ('alpha', False), ('lower', False), ('upper', False), | |
911 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
912 | ''' | |
913 | “0DF4;SINHALA PUNCTUATION KUNDDALIYA;Po;0;L;;;;;N;;;;;” | |
914 | According to DerivedCoreProperties.txt (7.0.0) this is *not* | |
915 | “Alphabetic”.''' | |
916 | ], | |
917 | [[(0xA789, 0xA78A)], | |
918 | [('combining', False), ('combining_level3', False), | |
919 | ('alpha', False), ('lower', False), ('upper', False), | |
920 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
921 | ''' | |
922 | “A789;MODIFIER LETTER COLON;Sk;0;L;;;;;N;;;;;” | |
923 | “A78A;MODIFIER LETTER SHORT EQUALS SIGN;Sk;0;L;;;;;N;;;;;” | |
924 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
925 | “Alphabetic”.''' | |
926 | ], | |
927 | [[(0xA926, 0xA92A)], | |
928 | [('combining', True), ('combining_level3', True), | |
929 | ('alpha', True), ('lower', False), ('upper', False), | |
930 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
931 | ''' | |
932 | “A926;KAYAH LI VOWEL UE;Mn;0;NSM;;;;;N;;;;;” | |
933 | “A927;KAYAH LI VOWEL E;Mn;0;NSM;;;;;N;;;;;” | |
934 | “A928;KAYAH LI VOWEL U;Mn;0;NSM;;;;;N;;;;;” | |
935 | “A929;KAYAH LI VOWEL EE;Mn;0;NSM;;;;;N;;;;;” | |
936 | “A92A;KAYAH LI VOWEL O;Mn;0;NSM;;;;;N;;;;;” | |
937 | According to DerivedCoreProperties.txt (7.0.0) these are | |
938 | “Alphabetic”.''' | |
939 | ], | |
940 | [[(0xA92B, 0xA92D)], | |
941 | [('combining', True), ('combining_level3', False), | |
942 | ('alpha', False), ('lower', False), ('upper', False), | |
943 | ('tolower', False), ('toupper', False), ('totitle', False)], | |
944 | ''' | |
945 | “A92B;KAYAH LI TONE PLOPHU;Mn;220;NSM;;;;;N;;;;;” | |
946 | “A92C;KAYAH LI TONE CALYA;Mn;220;NSM;;;;;N;;;;;” | |
947 | “A92D;KAYAH LI TONE CALYA PLOPHU;Mn;220;NSM;;;;;N;;;;;” | |
948 | According to DerivedCoreProperties.txt (7.0.0) these are *not* | |
949 | “Alphabetic”.''' | |
950 | ] | |
951 | ] |