]> git.ipfire.org Git - thirdparty/glibc.git/blob - localedata/unicode-gen/ctype_compatibility_test_cases.py
b7e709a53c74ebcf8ade236d7bf34d928bafbeb9
[thirdparty/glibc.git] / localedata / unicode-gen / ctype_compatibility_test_cases.py
1 # -*- coding: utf-8 -*-
2 # Copyright (C) 2014-2018 Free Software Foundation, Inc.
3 # This file is part of the GNU C Library.
4 #
5 # The GNU C Library is free software; you can redistribute it and/or
6 # modify it under the terms of the GNU Lesser General Public
7 # License as published by the Free Software Foundation; either
8 # version 2.1 of the License, or (at your option) any later version.
9 #
10 # The GNU C Library is distributed in the hope that it will be useful,
11 # but WITHOUT ANY WARRANTY; without even the implied warranty of
12 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 # Lesser General Public License for more details.
14 #
15 # You should have received a copy of the GNU Lesser General Public
16 # License along with the GNU C Library; if not, see
17 # <http://www.gnu.org/licenses/>.
18
19 '''
20 This file contains a list of test cases used by
21 the ctype_compatibility.py script.
22 '''
23
24 TEST_CASES = [
25 [[0x0E2F, 0x0E46], [('alpha', True), ('punct', False)],
26 '''Theppitak Karoonboonyanan <thep@links.nectec.or.th> says
27 <U0E2F>, <U0E46> should belong to punct. DerivedCoreProperties.txt
28 says it is alpha. We trust DerivedCoreProperties.txt.'''
29 ],
30 [[0x0E31, (0x0E34, 0x0E3A)], [('alpha', True)],
31 '''gen-unicode-ctype.c: Theppitak Karoonboonyanan
32 <thep@links.nectec.or.th> says <U0E31>, <U0E34>..<U0E3A>
33 are alpha. DerivedCoreProperties.txt agrees.'''
34 ],
35 [[(0x0E47, 0x0E4C), 0x0E4E], [('alpha', False)],
36 '''gen-unicode-ctype.c: Theppitak Karoonboonyanan
37 <thep@links.nectec.or.th> says <U0E47>..<U0E4E> are
38 is_alpha. DerivedCoreProperties does says *only* <U0E4D>
39 in that range is alphabetic, the others are *not*. We
40 trust DerivedCoreProperties.txt.'''
41 ],
42 [[0x0E4D], [('alpha', True)],
43 '''gen-unicode-ctype.c: Theppitak Karoonboonyanan
44 <thep@links.nectec.or.th> says <U0E47>..<U0E4E> are
45 is_alpha. DerivedCoreProperties does says *only* <U0E4D>
46 in that range is alphabetic, the others are *not*. We
47 trust DerivedCoreProperties.txt.
48 '''
49 ],
50 [[0x0345], [('alpha', True), ('lower', True)],
51 '''COMBINING GREEK YPOGEGRAMMENI
52 According to DerivedCoreProperties.txt, this is “Alphabetic”
53 and “Lowercase”.'''
54 ],
55 [[(0x2160, 0x2188)], [('alpha', True)],
56 '''Roman Numerals are “Alphabetic” according to
57 DerivedCoreProperties.txt'''
58 ],
59 [[(0x24B6, 0x24E9)], [('alpha', True)],
60 '''Circled Latin letters are “Alphabetic” according to
61 DerivedCoreProperties.txt'''
62 ],
63 [[0x661], [('alpha', True), ('digit', False)],
64 '''gen-unicode-ctype.c: All non-ASCII digits should be alphabetic.
65 ISO C 99 forbids us to have them in category "digit", but we
66 want iswalnum to return true on them. Don’t forget to
67 have a look at all the other digits, 0x661 is just one
68 example tested here.'''
69 ],
70 [[(0x0030, 0x0039)], [('digit', True)],
71 '''gen-unicode-ctype.c: All ASCII digits should be digits.'''
72 ],
73 [[0x0009], [('blank', True)],
74 '''gen-unicode-ctype.c: CHARACTER TABULATION'''
75 ],
76 [[0x2007], [('blank', False), ('space', False)],
77 '''gen-unicode-ctype.c: FIGURE SPACE, because it has <noBreak>
78 in the description.'''
79 ],
80 [[0x0009, 0x000A, 0x000B, 0x000C, 0x000D], [('space', True)],
81 '''gen-unicode-ctype.c: CHARACTER TABULATION, LINE FEED (LF), LINE
82 TABULATION, ;FORM FEED (FF), CARRIAGE RETURN (CR)'''
83 ],
84 [[0x2028, 0x2029], [('cntrl', True)],
85 '''gen-unicode-ctype.c: LINE SEPARATOR and PARAGRAPH SEPARATOR
86 should be cntrl.'''
87 ],
88 [[(0x0030, 0x0039), (0x0041, 0x0046), (0x0061, 0x0066)],
89 [('xdigit', True)],
90 '''gen-unicode-ctype.c: ISO C 99 says (6.4.4.1): hexadecimal-digit:
91 one of 0 1 2 3 4 5 6 7 8 9 a b c d e f A B C D E F (nothing else
92 should be considered as a hexadecimal-digit)'''
93 ],
94 [[0x0330], [('combining', True), ('combining_level3', False)],
95 '''gen-unicode-ctype.c: COMBINING TILDE BELOW, canonical combining
96 class value >= 200, should be in combining but not in
97 combining_level3'''
98 ],
99 [[0x0250, 0x0251, 0x0271], [('lower', True)],
100 '''Should be lower in Unicode 7.0.0 (was not lower in
101 Unicode 5.0.0).
102 '''
103 ],
104 [[0x2184], [('lower', True)],
105 '''Should be lower both in Unicode 5.0.0 and 7.0.0'''
106 ],
107 [[0xA67F], [('punct', False), ('alpha', True)],
108 '''0xa67f CYRILLIC PAYEROK. Not in Unicode 5.0.0. In Unicode
109 7.0.0. General category Lm (Letter
110 modifier). DerivedCoreProperties.txt says it is
111 “Alphabetic”. Apparently added manually to punct by mistake in
112 glibc’s old LC_CTYPE.'''
113 ],
114 [[0xA60C], [('punct', False), ('alpha', True)],
115 '''0xa60c VAI SYLLABLE LENGTHENER. Not in Unicode 5.0.0.
116 In Unicode 7.0.0. General category Lm (Letter
117 modifier). DerivedCoreProperties.txt says it is
118 “Alphabetic”. Apparently added manually to punct by mistake in
119 glibc’s old LC_CTYPE.'''
120 ],
121 [[0x2E2F], [('punct', False), ('alpha', True)],
122 '''0x2E2F VERTICAL TILDE. Not in Unicode 5.0.0. In Unicode
123 7.0.0. General category Lm (Letter
124 modifier). DerivedCoreProperties.txt says it is
125 “Alphabetic”. Apparently added manually to punct by mistake in
126 glibc’s old LC_CTYPE.'''
127 ],
128 [[(0x1090, 0x1099)], [('punct', False), ('alpha', True)],
129 '''MYANMAR SHAN DIGIT ZERO - MYANMAR SHAN DIGIT NINE.
130 These are digits, but because ISO C 99 forbids to
131 put them into digit they should go into alpha.'''
132 ],
133 [[0x103F], [('punct', False), ('alpha', True)],
134 '''0x103F MYANMAR LETTER GREAT SA. Not in Unicode 5.0.0.
135 In Unicode 7.0.0. General category Lo
136 (Other_Letter). DerivedCoreProperties.txt says it is
137 “Alphabetic”. Apparently added manually to punct by
138 mistake in glibc’s old LC_CTYPE.'''
139 ],
140 [[0x0374], [('punct', False), ('alpha', True)],
141 '''0x0374 GREEK NUMERAL SIGN. Unicode 5.0.0: general category
142 Sk. Unicode 7.0.0: General category Lm
143 (Modifier_Letter). DerivedCoreProperties.txt says it is
144 “Alphabetic”.'''
145 ],
146 [[0x02EC], [('punct', False), ('alpha', True)],
147 '''0x02EC MODIFIER LETTER VOICING. Unicode 5.0.0: general category
148 Sk. Unicode 7.0.0: General category Lm
149 (Modifier_Letter). DerivedCoreProperties.txt says it is
150 “Alphabetic”.'''
151 ],
152 [[0x180E], [('space', False), ('blank', False)],
153 '''0x180e MONGOLIAN VOWEL SEPARATOR. Unicode 5.0.0: General
154 category Zs (Space_Separator) Unicode 7.0.0: General category Cf
155 (Format).'''
156 ],
157 [[0x1E9C, 0x1E9D, 0x1E9F],
158 [('lower', True), ('upper', False), ('tolower', False),
159 ('toupper', False), ('totitle', False)],
160 '''ẜ 0x1e9c LATIN SMALL LETTER LONG S WITH DIAGONAL STROKE,
161 ẝ 0x1e9d LATIN SMALL LETTER LONG S WITH HIGH STROKE,
162 ẟ 0x1e9f LATIN SMALL LETTER DELTA. These are “Lowercase”
163 according to DerivedCoreProperties.txt but no upper case versions
164 exist.'''
165 ],
166 [[0x1E9E],
167 [('lower', False), ('upper', True), ('tolower', True),
168 ('toupper', False), ('totitle', False)],
169 '''0x1E9E ẞ LATIN CAPITAL LETTER SHARP S This is “Uppercase”
170 according to DerivedCoreProperties.txt and the lower case
171 version is 0x00DF ß LATIN SMALL LETTER SHARP S.'''
172 ],
173 [[0x2188],
174 [('alpha', True), ('lower', False), ('upper', False),
175 ('tolower', False), ('toupper', False), ('totitle', False)],
176 '''0x2188 ROMAN NUMERAL ONE HUNDRED THOUSAND. This is “Alphabetic”
177 according to DerivedCoreProperties.txt. In glibc’s old
178 LC_CTYPE, it was in “lower”, which seems to be a
179 mistake. It is not “Lowercase” in
180 DerivedCoreProperties.txt and does not have case mappings
181 in UnicodeData.txt either.'''
182 ],
183 [[0x2C71, 0x2C74, (0x2C77, 0x2C7A)],
184 [('alpha', True), ('lower', True), ('upper', False),
185 ('tolower', False), ('toupper', False), ('totitle', False)],
186 '''These are Latin small letters which were not in Unicode 5.0.0
187 but are in Unicode 7.0.0. According to
188 DerivedCoreProperties.txt they are “Lowercase”. But no
189 uppercase versions exist. They have apparently been added
190 manually to glibc’s old LC_CTYPE.'''
191 ],
192 [[0xA730, 0xA731],
193 [('alpha', True), ('lower', True), ('upper', False),
194 ('tolower', False), ('toupper', False), ('totitle', False)],
195 '''These are Latin small “capital” letters which were not in
196 Unicode 5.0.0 but are in Unicode 7.0.0. According to
197 DerivedCoreProperties.txt they are “Lowercase”. But no
198 uppercase versions exist. They have apparently been added
199 manually to glibc’s old LC_CTYPE.'''
200 ],
201 [[(0xA771, 0xA778)],
202 [('alpha', True), ('lower', True), ('upper', False),
203 ('tolower', False), ('toupper', False), ('totitle', False)],
204 '''These are Latin small (or small “capital”) letters which
205 were not in Unicodee 5.0.0 but are in Unicode 7.0.0. According to
206 DerivedCoreProperties.txt they are “Lowercase”. But no
207 uppercase versions exist. They have apparently been added
208 manually to glibc’s old LC_CTYPE.'''
209 ],
210 [[0x0375],
211 [('combining', False), ('combining_level3', False),
212 ('alpha', False), ('lower', False), ('upper', False),
213 ('tolower', False), ('toupper', False), ('totitle', False)],
214 '''“0375;GREEK LOWER NUMERAL SIGN;Sk;0;ON;;;;;N;;;;;”. Has
215 apparently been added manually to glibc’s old LC_CTYPE as
216 “combining_level3”. That seems wrong, it is no combining
217 character because it does not have one of the general
218 categories Mn, Mc, or Me. According to
219 DerivedCoreProperties.txt it is not “Alphabetic”.'''
220 ],
221 [[0x108D],
222 [('combining', True), ('combining_level3', False),
223 ('alpha', False), ('lower', False), ('upper', False),
224 ('tolower', False), ('toupper', False), ('totitle', False)],
225 '''“108D;MYANMAR SIGN SHAN COUNCIL EMPHATIC
226 TONE;Mn;220;NSM;;;;;N;;;;;”. Has apparently been added
227 manually to glibc’s old LC_CTYPE as
228 “combining_level3”. That seems wrong, although it is a
229 combining character because it has the general category
230 Mn, it is not “combining_level3” because the canonical
231 combining class value is 220 which is >= 200. According to
232 gen-unicode-ctype.c, “combining_level3” needs a
233 canonical combining class value < 200. According to
234 DerivedCoreProperties.txt it is not “Alphabetic”.'''
235 ],
236 [[0x06DE],
237 [('combining', False), ('combining_level3', False),
238 ('alpha', False), ('lower', False), ('upper', False),
239 ('tolower', False), ('toupper', False), ('totitle', False)],
240 ''' UnicodeData.txt 5.0.0: “06DE;ARABIC START OF RUB EL
241 HIZB;Me;0;NSM;;;;;N;;;;;”; UnicodeData.txt 7.0.0:
242 “06DE;ARABIC START OF RUB EL
243 HIZB;So;0;ON;;;;;N;;;;;”. I.e. this used to be a
244 combining character in Unicode 5.0.0 but not anymore in
245 7.0.0. According to DerivedCoreProperties.txt it is not
246 “Alphabetic”.'''
247 ],
248 [[0x0BD0],
249 [('combining', False), ('combining_level3', False),
250 ('alpha', True), ('lower', False), ('upper', False),
251 ('tolower', False), ('toupper', False), ('totitle', False)],
252 '''Not in UnicodeData.txt 5.0.0. UnicodeData.txt 7.0.0:
253 “0BD0;TAMIL OM;Lo;0;L;;;;;N;;;;;”. Apparently manually added to
254 “combining” and “combining_level3” in glibc’s old
255 LC_CTYPE. That seems wrong. According to
256 DerivedCoreProperties.txt it is “Alphabetic”.'''
257 ],
258 [[0x103F],
259 [('combining', False), ('combining_level3', False),
260 ('alpha', True), ('lower', False), ('upper', False),
261 ('tolower', False), ('toupper', False), ('totitle', False)],
262 '''Not in UnicodeData.txt 5.0.0. UnicodeData.txt 7.0.0:
263 “103F;MYANMAR LETTER GREAT SA;Lo;0;L;;;;;N;;;;;”.
264 Apparently manually added to “combining” and
265 “combining_level3” in glibc’s old LC_CTYPE. That seems
266 wrong. According to DerivedCoreProperties.txt it is
267 “Alphabetic”.'''
268 ],
269 [[(0x0901, 0x0903)],
270 [('combining', True), ('combining_level3', True),
271 ('alpha', True), ('lower', False), ('upper', False),
272 ('tolower', False), ('toupper', False), ('totitle', False)],
273 '''These have general category “Mn” i.e. these are combining
274 characters (both in UnicodeData.txt 5.0.0 and 7.0.0):
275 “0901;DEVANAGARI SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;”,
276 ”0902;DEVANAGARI SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;”,
277 “0903;DEVANAGARI SIGN VISARGA;Mc;0;L;;;;;N;;;;;”.
278 According to DerivedCoreProperties.txt (7.0.0) these are
279 “Alphabetic”.'''
280 ],
281 [[0x093C],
282 [('combining', True), ('combining_level3', True),
283 ('alpha', False), ('lower', False), ('upper', False),
284 ('tolower', False), ('toupper', False), ('totitle', False)],
285 '''UnicodeData.txt (5.0.0 and 7.0.0): “093C;DEVANAGARI SIGN
286 NUKTA;Mn;7;NSM;;;;;N;;;;;” According to
287 DerivedCoreProperties.txt (7.0.0) this is *not*
288 “Alphabetic”. glibc’s old LC_TYPE has this in “alpha”.'''
289 ],
290 [[(0x093E, 0x093F)],
291 [('combining', True), ('combining_level3', True),
292 ('alpha', True), ('lower', False), ('upper', False),
293 ('tolower', False), ('toupper', False), ('totitle', False)],
294 '''These have general category “Mc” i.e. these are combining
295 characters (both in UnicodeData.txt 5.0.0 and 7.0.0):
296 “093E;DEVANAGARI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
297 “093F;DEVANAGARI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
298 According to DerivedCoreProperties.txt (7.0.0) these are
299 “Alphabetic”.'''
300 ],
301 [[(0x0940, 0x094C)],
302 [('combining', True), ('combining_level3', True),
303 ('alpha', True), ('lower', False), ('upper', False),
304 ('tolower', False), ('toupper', False), ('totitle', False)],
305 '''These are all combining
306 characters (“Mc” or “Mn” both in UnicodeData.txt 5.0.0 and 7.0.0).
307 According to DerivedCoreProperties.txt (7.0.0) these are
308 “Alphabetic”.'''
309 ],
310 [[0x094D],
311 [('combining', True), ('combining_level3', True),
312 ('alpha', False), ('lower', False), ('upper', False),
313 ('tolower', False), ('toupper', False), ('totitle', False)],
314 '''Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0.
315 “094D;DEVANAGARI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
316 According to DerivedCoreProperties.txt (7.0.0) it is *not*
317 “Alphabetic”.'''
318 ],
319 [[(0x0951, 0x0954)],
320 [('combining', True), ('combining_level3', False),
321 ('alpha', False), ('lower', False), ('upper', False),
322 ('tolower', False), ('toupper', False), ('totitle', False)],
323 '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0.
324 According to DerivedCoreProperties.txt (7.0.0) these are *not*
325 “Alphabetic”.'''
326 ],
327 [[(0x0962, 0x0963), (0x0981, 0x0983)],
328 [('combining', True), ('combining_level3', True),
329 ('alpha', True), ('lower', False), ('upper', False),
330 ('tolower', False), ('toupper', False), ('totitle', False)],
331 '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0.
332 According to DerivedCoreProperties.txt (7.0.0) these are
333 “Alphabetic”.'''
334 ],
335 [[0x09BC],
336 [('combining', True), ('combining_level3', True),
337 ('alpha', False), ('lower', False), ('upper', False),
338 ('tolower', False), ('toupper', False), ('totitle', False)],
339 '''
340 “09BC;BENGALI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;”
341 Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0.
342 According to DerivedCoreProperties.txt (7.0.0) it is *not*
343 “Alphabetic”.'''
344 ],
345 [[(0x09BE, 0x09BF), (0x09C0, 0x09C4), (0x09C7, 0x09C8),
346 (0x09CB, 0x09CC)],
347 [('combining', True), ('combining_level3', True),
348 ('alpha', True), ('lower', False), ('upper', False),
349 ('tolower', False), ('toupper', False), ('totitle', False)],
350 '''
351 “09BE;BENGALI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
352 “09BF;BENGALI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
353 “09C0;BENGALI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;”
354 “09C1;BENGALI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;”
355 “09C2;BENGALI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;”
356 “09C3;BENGALI VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;”
357 “09C4;BENGALI VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;”
358 “09C7;BENGALI VOWEL SIGN E;Mc;0;L;;;;;N;;;;;”
359 “09C8;BENGALI VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;”
360 “09CB;BENGALI VOWEL SIGN O;Mc;0;L;09C7 09BE;;;;N;;;;;”
361 “09CC;BENGALI VOWEL SIGN AU;Mc;0;L;09C7 09D7;;;;N;;;;;”
362 Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0.
363 According to DerivedCoreProperties.txt (7.0.0) these are
364 “Alphabetic”.'''
365 ],
366 [[0x09CD],
367 [('combining', True), ('combining_level3', True),
368 ('alpha', False), ('lower', False), ('upper', False),
369 ('tolower', False), ('toupper', False), ('totitle', False)],
370 '''
371 “09CD;BENGALI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
372 Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0.
373 According to DerivedCoreProperties.txt (7.0.0) it is *not*
374 “Alphabetic”.'''
375 ],
376 [[0x09D7, (0x09E2, 0x09E3)],
377 [('combining', True), ('combining_level3', True),
378 ('alpha', True), ('lower', False), ('upper', False),
379 ('tolower', False), ('toupper', False), ('totitle', False)],
380 '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0.
381 According to DerivedCoreProperties.txt (7.0.0) these are
382 “Alphabetic”.'''
383 ],
384 [[0x09F2, 0x09F3],
385 [('combining', False), ('combining_level3', False),
386 ('alpha', False), ('lower', False), ('upper', False),
387 ('tolower', False), ('toupper', False), ('totitle', False)],
388 '''
389 “09F2;BENGALI RUPEE MARK;Sc;0;ET;;;;;N;;;;;”
390 “09F3;BENGALI RUPEE SIGN;Sc;0;ET;;;;;N;;;;;”
391 According to DerivedCoreProperties.txt (7.0.0) these are *not*
392 “Alphabetic”.'''
393 ],
394 [[(0x09F4, 0x09FA)],
395 [('combining', False), ('combining_level3', False),
396 ('alpha', False), ('lower', False), ('upper', False),
397 ('tolower', False), ('toupper', False), ('totitle', False)],
398 '''
399 “09F4;BENGALI CURRENCY NUMERATOR ONE;No;0;L;;;;1/16;N;;;;;”
400 “09F5;BENGALI CURRENCY NUMERATOR TWO;No;0;L;;;;1/8;N;;;;;”
401 “09F6;BENGALI CURRENCY NUMERATOR THREE;No;0;L;;;;3/16;N;;;;;”
402 “09F7;BENGALI CURRENCY NUMERATOR FOUR;No;0;L;;;;1/4;N;;;;;”
403 “09F8;BENGALI CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR;
404 No;0;L;;;;3/4;N;;;;;”
405 “09F9;BENGALI CURRENCY DENOMINATOR SIXTEEN;No;0;L;;;;16;N;;;;;”
406 “09FA;BENGALI ISSHAR;So;0;L;;;;;N;;;;;”
407 According to DerivedCoreProperties.txt (7.0.0) these are *not*
408 “Alphabetic”.'''
409 ],
410 [[(0x0A01, 0x0A03)],
411 [('combining', True), ('combining_level3', True),
412 ('alpha', True), ('lower', False), ('upper', False),
413 ('tolower', False), ('toupper', False), ('totitle', False)],
414 '''
415 “0A01;GURMUKHI SIGN ADAK BINDI;Mn;0;NSM;;;;;N;;;;;”
416 “0A02;GURMUKHI SIGN BINDI;Mn;0;NSM;;;;;N;;;;;”
417 “0A03;GURMUKHI SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
418 According to DerivedCoreProperties.txt (7.0.0) these are
419 “Alphabetic”.'''
420 ],
421 [[0x0A3C],
422 [('combining', True), ('combining_level3', True),
423 ('alpha', False), ('lower', False), ('upper', False),
424 ('tolower', False), ('toupper', False), ('totitle', False)],
425 '''
426 “0A3C;GURMUKHI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;”
427 According to DerivedCoreProperties.txt (7.0.0) this is *not*
428 “Alphabetic”.'''
429 ],
430 [[(0x0A3E, 0x0A40), (0x0A41, 0x0A42), (0x0A47, 0x0A48),
431 (0x0A4B, 0x0A4C)],
432 [('combining', True), ('combining_level3', True),
433 ('alpha', True), ('lower', False), ('upper', False),
434 ('tolower', False), ('toupper', False), ('totitle', False)],
435 '''
436 “0A3E;GURMUKHI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
437 “0A3F;GURMUKHI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
438 “0A40;GURMUKHI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;”
439 “0A41;GURMUKHI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;”
440 “0A42;GURMUKHI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;”
441 “0A47;GURMUKHI VOWEL SIGN EE;Mn;0;NSM;;;;;N;;;;;”
442 “0A48;GURMUKHI VOWEL SIGN AI;Mn;0;NSM;;;;;N;;;;;”
443 “0A4B;GURMUKHI VOWEL SIGN OO;Mn;0;NSM;;;;;N;;;;;”
444 “0A4C;GURMUKHI VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;”
445 According to DerivedCoreProperties.txt (7.0.0) these are
446 “Alphabetic”.'''
447 ],
448 [[0x0A4D],
449 [('combining', True), ('combining_level3', True),
450 ('alpha', False), ('lower', False), ('upper', False),
451 ('tolower', False), ('toupper', False), ('totitle', False)],
452 '''
453 “0A4D;GURMUKHI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
454 According to DerivedCoreProperties.txt (7.0.0) this is *not*
455 “Alphabetic”.'''
456 ],
457 [[0x0A51, (0x0A70, 0x0A71), 0x0A75, (0x0A81, 0x0A83)],
458 [('combining', True), ('combining_level3', True),
459 ('alpha', True), ('lower', False), ('upper', False),
460 ('tolower', False), ('toupper', False), ('totitle', False)],
461 '''
462 “0A4D;GURMUKHI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
463 “0A70;GURMUKHI TIPPI;Mn;0;NSM;;;;;N;;;;;”
464 “0A71;GURMUKHI ADDAK;Mn;0;NSM;;;;;N;;;;;”
465 “0A75;GURMUKHI SIGN YAKASH;Mn;0;NSM;;;;;N;;;;;”
466 “0A81;GUJARATI SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;”
467 “0A82;GUJARATI SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;”
468 “0A83;GUJARATI SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
469 According to DerivedCoreProperties.txt (7.0.0) these are
470 “Alphabetic”.'''
471 ],
472 [[0x0ABC],
473 [('combining', True), ('combining_level3', True),
474 ('alpha', False), ('lower', False), ('upper', False),
475 ('tolower', False), ('toupper', False), ('totitle', False)],
476 '''
477 “0ABC;GUJARATI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;”
478 According to DerivedCoreProperties.txt (7.0.0) this is *not*
479 “Alphabetic”.'''
480 ],
481 [[(0x0ABE, 0x0AC5), (0x0AC7, 0x0AC9), (0x0ACB, 0x0ACC)],
482 [('combining', True), ('combining_level3', True),
483 ('alpha', True), ('lower', False), ('upper', False),
484 ('tolower', False), ('toupper', False), ('totitle', False)],
485 '''
486 “0ABE;GUJARATI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
487 “0ABF;GUJARATI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
488 “0AC0;GUJARATI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;”
489 “0AC1;GUJARATI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;”
490 “0AC2;GUJARATI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;”
491 “0AC3;GUJARATI VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;”
492 “0AC4;GUJARATI VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;”
493 “0AC5;GUJARATI VOWEL SIGN CANDRA E;Mn;0;NSM;;;;;N;;;;;”
494 “0AC7;GUJARATI VOWEL SIGN E;Mn;0;NSM;;;;;N;;;;;”
495 “0AC8;GUJARATI VOWEL SIGN AI;Mn;0;NSM;;;;;N;;;;;”
496 “0AC9;GUJARATI VOWEL SIGN CANDRA O;Mc;0;L;;;;;N;;;;;”
497 “0ACB;GUJARATI VOWEL SIGN O;Mc;0;L;;;;;N;;;;;”
498 “0ACC;GUJARATI VOWEL SIGN AU;Mc;0;L;;;;;N;;;;;”
499 According to DerivedCoreProperties.txt (7.0.0) these are
500 “Alphabetic”.'''
501 ],
502 [[0x0ACD],
503 [('combining', True), ('combining_level3', True),
504 ('alpha', False), ('lower', False), ('upper', False),
505 ('tolower', False), ('toupper', False), ('totitle', False)],
506 '''
507 “0ACD;GUJARATI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
508 According to DerivedCoreProperties.txt (7.0.0) this is *not*
509 “Alphabetic”.'''
510 ],
511 [[(0x0AE2, 0x0AE3)],
512 [('combining', True), ('combining_level3', True),
513 ('alpha', True), ('lower', False), ('upper', False),
514 ('tolower', False), ('toupper', False), ('totitle', False)],
515 '''
516 “0AE2;GUJARATI VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;”
517 “0AE3;GUJARATI VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;”
518 According to DerivedCoreProperties.txt (7.0.0) these are
519 “Alphabetic”.'''
520 ],
521 [[0x0AF1],
522 [('combining', False), ('combining_level3', False),
523 ('alpha', False), ('lower', False), ('upper', False),
524 ('tolower', False), ('toupper', False), ('totitle', False)],
525 '''
526 “0AF1;GUJARATI RUPEE SIGN;Sc;0;ET;;;;;N;;;;;”
527 According to DerivedCoreProperties.txt (7.0.0) this is *not*
528 “Alphabetic”.'''
529 ],
530 [[(0x0B01, 0x0B03)],
531 [('combining', True), ('combining_level3', True),
532 ('alpha', True), ('lower', False), ('upper', False),
533 ('tolower', False), ('toupper', False), ('totitle', False)],
534 '''
535 “0B01;ORIYA SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;”
536 “0B02;ORIYA SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;”
537 “0B03;ORIYA SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
538 According to DerivedCoreProperties.txt (7.0.0) these are
539 “Alphabetic”.'''
540 ],
541 [[0x0B3C],
542 [('combining', True), ('combining_level3', True),
543 ('alpha', False), ('lower', False), ('upper', False),
544 ('tolower', False), ('toupper', False), ('totitle', False)],
545 '''
546 “0B3C;ORIYA SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;”
547 According to DerivedCoreProperties.txt (7.0.0) this is *not*
548 “Alphabetic”.'''
549 ],
550 [[(0x0B3E, 0x0B44), (0x0B47, 0x0B48), (0x0B4B, 0x0B4C)],
551 [('combining', True), ('combining_level3', True),
552 ('alpha', True), ('lower', False), ('upper', False),
553 ('tolower', False), ('toupper', False), ('totitle', False)],
554 '''
555 “0B3E;ORIYA VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
556 “0B3F;ORIYA VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;;”
557 “0B40;ORIYA VOWEL SIGN II;Mc;0;L;;;;;N;;;;;”
558 “0B41;ORIYA VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;”
559 “0B42;ORIYA VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;”
560 “0B43;ORIYA VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;”
561 “0B44;ORIYA VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;”
562 “0B47;ORIYA VOWEL SIGN E;Mc;0;L;;;;;N;;;;;”
563 “0B48;ORIYA VOWEL SIGN AI;Mc;0;L;0B47 0B56;;;;N;;;;;”
564 “0B4B;ORIYA VOWEL SIGN O;Mc;0;L;0B47 0B3E;;;;N;;;;;”
565 “0B4C;ORIYA VOWEL SIGN AU;Mc;0;L;0B47 0B57;;;;N;;;;;”
566 According to DerivedCoreProperties.txt (7.0.0) these are
567 “Alphabetic”.'''
568 ],
569 [[0x0B4D],
570 [('combining', True), ('combining_level3', True),
571 ('alpha', False), ('lower', False), ('upper', False),
572 ('tolower', False), ('toupper', False), ('totitle', False)],
573 '''
574 “0B4D;ORIYA SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
575 According to DerivedCoreProperties.txt (7.0.0) this is *not*
576 “Alphabetic”.'''
577 ],
578 [[(0x0B56, 0x0B57), (0x0B62, 0x0B63)],
579 [('combining', True), ('combining_level3', True),
580 ('alpha', True), ('lower', False), ('upper', False),
581 ('tolower', False), ('toupper', False), ('totitle', False)],
582 '''
583 “0B56;ORIYA AI LENGTH MARK;Mn;0;NSM;;;;;N;;;;;”
584 “0B57;ORIYA AU LENGTH MARK;Mc;0;L;;;;;N;;;;;”
585 “0B62;ORIYA VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;”
586 “0B63;ORIYA VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;”
587 According to DerivedCoreProperties.txt (7.0.0) these are
588 “Alphabetic”.'''
589 ],
590 [[0x0B70],
591 [('combining', False), ('combining_level3', False),
592 ('alpha', False), ('lower', False), ('upper', False),
593 ('tolower', False), ('toupper', False), ('totitle', False)],
594 '''
595 “0B70;ORIYA ISSHAR;So;0;L;;;;;N;;;;;”
596 According to DerivedCoreProperties.txt (7.0.0) this is *not*
597 “Alphabetic”.'''
598 ],
599 [[0x0B82],
600 [('combining', True), ('combining_level3', True),
601 ('alpha', True), ('lower', False), ('upper', False),
602 ('tolower', False), ('toupper', False), ('totitle', False)],
603 '''
604 “0B82;TAMIL SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;”
605 According to DerivedCoreProperties.txt (7.0.0) this is *not*
606 “Alphabetic”.'''
607 ],
608 [[(0x0BBE, 0x0BC2), (0x0BC6, 0x0BC8), (0x0BCA, 0x0BCC)],
609 [('combining', True), ('combining_level3', True),
610 ('alpha', True), ('lower', False), ('upper', False),
611 ('tolower', False), ('toupper', False), ('totitle', False)],
612 '''
613 “0BBE;TAMIL VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
614 “0BBF;TAMIL VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
615 “0BC0;TAMIL VOWEL SIGN II;Mn;0;NSM;;;;;N;;;;;”
616 “0BC1;TAMIL VOWEL SIGN U;Mc;0;L;;;;;N;;;;;”
617 “0BC2;TAMIL VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;”
618 “0BC6;TAMIL VOWEL SIGN E;Mc;0;L;;;;;N;;;;;”
619 “0BC7;TAMIL VOWEL SIGN EE;Mc;0;L;;;;;N;;;;;”
620 “0BC8;TAMIL VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;”
621 “0BCA;TAMIL VOWEL SIGN O;Mc;0;L;0BC6 0BBE;;;;N;;;;;”
622 “0BCB;TAMIL VOWEL SIGN OO;Mc;0;L;0BC7 0BBE;;;;N;;;;;”
623 “0BCC;TAMIL VOWEL SIGN AU;Mc;0;L;0BC6 0BD7;;;;N;;;;;”
624 According to DerivedCoreProperties.txt (7.0.0) these are
625 “Alphabetic”.'''
626 ],
627 [[0x0BCD],
628 [('combining', True), ('combining_level3', True),
629 ('alpha', False), ('lower', False), ('upper', False),
630 ('tolower', False), ('toupper', False), ('totitle', False)],
631 '''
632 “0BCD;TAMIL SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
633 According to DerivedCoreProperties.txt (7.0.0) this is *not*
634 “Alphabetic”.'''
635 ],
636 [[0x0BD7],
637 [('combining', True), ('combining_level3', True),
638 ('alpha', True), ('lower', False), ('upper', False),
639 ('tolower', False), ('toupper', False), ('totitle', False)],
640 '''
641 “0BD7;TAMIL AU LENGTH MARK;Mc;0;L;;;;;N;;;;;”
642 According to DerivedCoreProperties.txt (7.0.0) this is *not*
643 “Alphabetic”.'''
644 ],
645 [[(0x0BF0, 0x0BFA)],
646 [('combining', False), ('combining_level3', False),
647 ('alpha', False), ('lower', False), ('upper', False),
648 ('tolower', False), ('toupper', False), ('totitle', False)],
649 '''
650 “0BF0;TAMIL NUMBER TEN;No;0;L;;;;10;N;;;;;”
651 “0BF1;TAMIL NUMBER ONE HUNDRED;No;0;L;;;;100;N;;;;;”
652 “0BF2;TAMIL NUMBER ONE THOUSAND;No;0;L;;;;1000;N;;;;;”
653 “0BF3;TAMIL DAY SIGN;So;0;ON;;;;;N;;;;;”
654 “0BF4;TAMIL MONTH SIGN;So;0;ON;;;;;N;;;;;”
655 “0BF5;TAMIL YEAR SIGN;So;0;ON;;;;;N;;;;;”
656 “0BF6;TAMIL DEBIT SIGN;So;0;ON;;;;;N;;;;;”
657 “0BF7;TAMIL CREDIT SIGN;So;0;ON;;;;;N;;;;;”
658 “0BF8;TAMIL AS ABOVE SIGN;So;0;ON;;;;;N;;;;;”
659 “0BF9;TAMIL RUPEE SIGN;Sc;0;ET;;;;;N;;;;;”
660 “0BFA;TAMIL NUMBER SIGN;So;0;ON;;;;;N;;;;;”
661 According to DerivedCoreProperties.txt (7.0.0) this is *not*
662 “Alphabetic”.'''
663 ],
664 [[(0x0C01, 0x0C03)],
665 [('combining', True), ('combining_level3', True),
666 ('alpha', True), ('lower', False), ('upper', False),
667 ('tolower', False), ('toupper', False), ('totitle', False)],
668 '''
669 “0C01;TELUGU SIGN CANDRABINDU;Mc;0;L;;;;;N;;;;;”
670 “0C02;TELUGU SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;”
671 “0C03;TELUGU SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
672 According to DerivedCoreProperties.txt (7.0.0) these are
673 “Alphabetic”.'''
674 ],
675 [[(0x0C3E, 0x0C44), (0x0C46, 0x0C48), (0x0C4A, 0x0C4C)],
676 [('combining', True), ('combining_level3', True),
677 ('alpha', True), ('lower', False), ('upper', False),
678 ('tolower', False), ('toupper', False), ('totitle', False)],
679 '''
680 “0C3E;TELUGU VOWEL SIGN AA;Mn;0;NSM;;;;;N;;;;;”
681 “0C3F;TELUGU VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;;”
682 “0C40;TELUGU VOWEL SIGN II;Mn;0;NSM;;;;;N;;;;;”
683 “0C41;TELUGU VOWEL SIGN U;Mc;0;L;;;;;N;;;;;”
684 “0C42;TELUGU VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;”
685 “0C43;TELUGU VOWEL SIGN VOCALIC R;Mc;0;L;;;;;N;;;;;”
686 “0C44;TELUGU VOWEL SIGN VOCALIC RR;Mc;0;L;;;;;N;;;;;”
687 “0C46;TELUGU VOWEL SIGN E;Mn;0;NSM;;;;;N;;;;;”
688 “0C47;TELUGU VOWEL SIGN EE;Mn;0;NSM;;;;;N;;;;;”
689 “0C48;TELUGU VOWEL SIGN AI;Mn;0;NSM;0C46 0C56;;;;N;;;;;”
690 “0C4A;TELUGU VOWEL SIGN O;Mn;0;NSM;;;;;N;;;;;”
691 “0C4B;TELUGU VOWEL SIGN OO;Mn;0;NSM;;;;;N;;;;;”
692 “0C4C;TELUGU VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;”
693 According to DerivedCoreProperties.txt (7.0.0) these are
694 “Alphabetic”.'''
695 ],
696 [[0x0C4D],
697 [('combining', True), ('combining_level3', True),
698 ('alpha', False), ('lower', False), ('upper', False),
699 ('tolower', False), ('toupper', False), ('totitle', False)],
700 '''
701 “0C4D;TELUGU SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
702 According to DerivedCoreProperties.txt (7.0.0) these are *not*
703 “Alphabetic”.'''
704 ],
705 [[(0x0C55, 0x0C56), (0x0C62, 0x0C63)],
706 [('combining', True), ('combining_level3', True),
707 ('alpha', True), ('lower', False), ('upper', False),
708 ('tolower', False), ('toupper', False), ('totitle', False)],
709 '''
710 “0C55;TELUGU LENGTH MARK;Mn;84;NSM;;;;;N;;;;;”
711 “0C56;TELUGU AI LENGTH MARK;Mn;91;NSM;;;;;N;;;;;”
712 “0C62;TELUGU VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;”
713 “0C63;TELUGU VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;”
714 According to DerivedCoreProperties.txt (7.0.0) these are
715 “Alphabetic”.'''
716 ],
717 [[(0x0C78, 0x0C7F)],
718 [('combining', False), ('combining_level3', False),
719 ('alpha', False), ('lower', False), ('upper', False),
720 ('tolower', False), ('toupper', False), ('totitle', False)],
721 '''
722 “0C78;TELUGU FRACTION DIGIT ZERO FOR ODD POWERS OF FOUR;
723 No;0;ON;;;;0;N;;;;;”
724 “0C79;TELUGU FRACTION DIGIT ONE FOR ODD POWERS OF FOUR;
725 No;0;ON;;;;1;N;;;;;”
726 “0C7A;TELUGU FRACTION DIGIT TWO FOR ODD POWERS OF FOUR;
727 No;0;ON;;;;2;N;;;;;”
728 “0C7B;TELUGU FRACTION DIGIT THREE FOR ODD POWERS OF FOUR;
729 No;0;ON;;;;3;N;;;;;”
730 “0C7C;TELUGU FRACTION DIGIT ONE FOR EVEN POWERS OF FOUR;
731 No;0;ON;;;;1;N;;;;;”
732 “0C7D;TELUGU FRACTION DIGIT TWO FOR EVEN POWERS OF FOUR;
733 No;0;ON;;;;2;N;;;;;”
734 “0C7E;TELUGU FRACTION DIGIT THREE FOR EVEN POWERS OF FOUR;
735 No;0;ON;;;;3;N;;;;;”
736 “0C7F;TELUGU SIGN TUUMU;So;0;L;;;;;N;;;;;”
737 According to DerivedCoreProperties.txt (7.0.0) these are *not*
738 “Alphabetic”.'''
739 ],
740 [[(0x0C82, 0x0C83)],
741 [('combining', True), ('combining_level3', True),
742 ('alpha', True), ('lower', False), ('upper', False),
743 ('tolower', False), ('toupper', False), ('totitle', False)],
744 '''
745 “0C81;KANNADA SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;”
746 “0C82;KANNADA SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;”
747 “0C83;KANNADA SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
748 According to DerivedCoreProperties.txt (7.0.0) these are
749 “Alphabetic”.'''
750 ],
751 [[0x0CBC],
752 [('combining', True), ('combining_level3', True),
753 ('alpha', False), ('lower', False), ('upper', False),
754 ('tolower', False), ('toupper', False), ('totitle', False)],
755 '''
756 “0CBC;KANNADA SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;”
757 According to DerivedCoreProperties.txt (7.0.0) these are
758 “Alphabetic”.'''
759 ],
760 [[(0x0CBE, 0x0CC4), (0x0CC6, 0x0CC8), (0x0CCA, 0x0CCC)],
761 [('combining', True), ('combining_level3', True),
762 ('alpha', True), ('lower', False), ('upper', False),
763 ('tolower', False), ('toupper', False), ('totitle', False)],
764 '''
765 “0CBE;KANNADA VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
766 “0CBF;KANNADA VOWEL SIGN I;Mn;0;L;;;;;N;;;;;”
767 “0CC0;KANNADA VOWEL SIGN II;Mc;0;L;0CBF 0CD5;;;;N;;;;;”
768 “0CC1;KANNADA VOWEL SIGN U;Mc;0;L;;;;;N;;;;;”
769 “0CC2;KANNADA VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;”
770 “0CC3;KANNADA VOWEL SIGN VOCALIC R;Mc;0;L;;;;;N;;;;;”
771 “0CC4;KANNADA VOWEL SIGN VOCALIC RR;Mc;0;L;;;;;N;;;;;”
772 “0CC6;KANNADA VOWEL SIGN E;Mn;0;L;;;;;N;;;;;”
773 “0CC7;KANNADA VOWEL SIGN EE;Mc;0;L;0CC6 0CD5;;;;N;;;;;”
774 “0CC8;KANNADA VOWEL SIGN AI;Mc;0;L;0CC6 0CD6;;;;N;;;;;”
775 “0CCA;KANNADA VOWEL SIGN O;Mc;0;L;0CC6 0CC2;;;;N;;;;;”
776 “0CCB;KANNADA VOWEL SIGN OO;Mc;0;L;0CCA 0CD5;;;;N;;;;;”
777 “0CCC;KANNADA VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;”
778 According to DerivedCoreProperties.txt (7.0.0) these are
779 “Alphabetic”.'''
780 ],
781 [[0x0CCD],
782 [('combining', True), ('combining_level3', True),
783 ('alpha', False), ('lower', False), ('upper', False),
784 ('tolower', False), ('toupper', False), ('totitle', False)],
785 '''
786 “0CCD;KANNADA SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
787 According to DerivedCoreProperties.txt (7.0.0) these are *not*
788 “Alphabetic”.'''
789 ],
790 [[(0x0CD5, 0x0CD6), (0x0CE2, 0x0CE3)],
791 [('combining', True), ('combining_level3', True),
792 ('alpha', True), ('lower', False), ('upper', False),
793 ('tolower', False), ('toupper', False), ('totitle', False)],
794 '''
795 0CD5;KANNADA LENGTH MARK;Mc;0;L;;;;;N;;;;;
796 0CD6;KANNADA AI LENGTH MARK;Mc;0;L;;;;;N;;;;;
797 0CE2;KANNADA VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;
798 0CE3;KANNADA VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;
799 According to DerivedCoreProperties.txt (7.0.0) these are
800 “Alphabetic”.'''
801 ],
802 [[(0x0D02, 0x0D03), (0x0D3E, 0x0D44), (0x0D46, 0x0D48),
803 (0x0D4A, 0x0D4C)],
804 [('combining', True), ('combining_level3', True),
805 ('alpha', True), ('lower', False), ('upper', False),
806 ('tolower', False), ('toupper', False), ('totitle', False)],
807 '''
808 “0D02;MALAYALAM SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;”
809 “0D03;MALAYALAM SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
810 “0D3E;MALAYALAM VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
811 “0D3F;MALAYALAM VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
812 “0D40;MALAYALAM VOWEL SIGN II;Mc;0;L;;;;;N;;;;;”
813 “0D41;MALAYALAM VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;”
814 “0D42;MALAYALAM VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;”
815 “0D43;MALAYALAM VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;”
816 “0D44;MALAYALAM VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;”
817 “0D46;MALAYALAM VOWEL SIGN E;Mc;0;L;;;;;N;;;;;”
818 “0D47;MALAYALAM VOWEL SIGN EE;Mc;0;L;;;;;N;;;;;”
819 “0D48;MALAYALAM VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;”
820 “0D4A;MALAYALAM VOWEL SIGN O;Mc;0;L;0D46 0D3E;;;;N;;;;;”
821 “0D4B;MALAYALAM VOWEL SIGN OO;Mc;0;L;0D47 0D3E;;;;N;;;;;”
822 “0D4C;MALAYALAM VOWEL SIGN AU;Mc;0;L;0D46 0D57;;;;N;;;;;”
823 According to DerivedCoreProperties.txt (7.0.0) these are
824 “Alphabetic”.'''
825 ],
826 [[0x0D4D],
827 [('combining', True), ('combining_level3', True),
828 ('alpha', False), ('lower', False), ('upper', False),
829 ('tolower', False), ('toupper', False), ('totitle', False)],
830 '''
831 “0D4D;MALAYALAM SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
832 According to DerivedCoreProperties.txt (7.0.0) these are
833 “Alphabetic”.'''
834 ],
835 [[0x0D57, (0x0D62, 0x0D63)],
836 [('combining', True), ('combining_level3', True),
837 ('alpha', True), ('lower', False), ('upper', False),
838 ('tolower', False), ('toupper', False), ('totitle', False)],
839 '''
840 “0D57;MALAYALAM AU LENGTH MARK;Mc;0;L;;;;;N;;;;;”
841 “0D62;MALAYALAM VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;”
842 “0D63;MALAYALAM VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;”
843 According to DerivedCoreProperties.txt (7.0.0) these are
844 “Alphabetic”.'''
845 ],
846 [[(0x0D70, 0x0D79)],
847 [('combining', False), ('combining_level3', False),
848 ('alpha', False), ('lower', False), ('upper', False),
849 ('tolower', False), ('toupper', False), ('totitle', False)],
850 '''
851 “0D70;MALAYALAM NUMBER TEN;No;0;L;;;;10;N;;;;;”
852 “0D71;MALAYALAM NUMBER ONE HUNDRED;No;0;L;;;;100;N;;;;;”
853 “0D72;MALAYALAM NUMBER ONE THOUSAND;No;0;L;;;;1000;N;;;;;”
854 “0D73;MALAYALAM FRACTION ONE QUARTER;No;0;L;;;;1/4;N;;;;;”
855 “0D74;MALAYALAM FRACTION ONE HALF;No;0;L;;;;1/2;N;;;;;”
856 “0D75;MALAYALAM FRACTION THREE QUARTERS;No;0;L;;;;3/4;N;;;;;”
857 “0D79;MALAYALAM DATE MARK;So;0;L;;;;;N;;;;;”
858 According to DerivedCoreProperties.txt (7.0.0) these are *not*
859 “Alphabetic”.'''
860 ],
861 [[(0x0D82, 0x0D83)],
862 [('combining', True), ('combining_level3', True),
863 ('alpha', True), ('lower', False), ('upper', False),
864 ('tolower', False), ('toupper', False), ('totitle', False)],
865 '''
866 “0D82;SINHALA SIGN ANUSVARAYA;Mc;0;L;;;;;N;;;;;”
867 “0D83;SINHALA SIGN VISARGAYA;Mc;0;L;;;;;N;;;;;”
868 According to DerivedCoreProperties.txt (7.0.0) these are
869 “Alphabetic”.'''
870 ],
871 [[0x0DCA],
872 [('combining', True), ('combining_level3', True),
873 ('alpha', False), ('lower', False), ('upper', False),
874 ('tolower', False), ('toupper', False), ('totitle', False)],
875 '''
876 “0DCA;SINHALA SIGN AL-LAKUNA;Mn;9;NSM;;;;;N;;;;;”
877 According to DerivedCoreProperties.txt (7.0.0) these are *not*
878 “Alphabetic”.'''
879 ],
880 [[(0x0DCF, 0x0DD4), 0x0DD6, (0x0DD8, 0x0DDF), (0x0DF2, 0x0DF3)],
881 [('combining', True), ('combining_level3', True),
882 ('alpha', True), ('lower', False), ('upper', False),
883 ('tolower', False), ('toupper', False), ('totitle', False)],
884 '''
885 “0DCF;SINHALA VOWEL SIGN AELA-PILLA;Mc;0;L;;;;;N;;;;;”
886 “0DD0;SINHALA VOWEL SIGN KETTI AEDA-PILLA;Mc;0;L;;;;;N;;;;;”
887 “0DD1;SINHALA VOWEL SIGN DIGA AEDA-PILLA;Mc;0;L;;;;;N;;;;;”
888 “0DD2;SINHALA VOWEL SIGN KETTI IS-PILLA;Mn;0;NSM;;;;;N;;;;;”
889 “0DD3;SINHALA VOWEL SIGN DIGA IS-PILLA;Mn;0;NSM;;;;;N;;;;;”
890 “0DD4;SINHALA VOWEL SIGN KETTI PAA-PILLA;Mn;0;NSM;;;;;N;;;;;”
891 “0DD6;SINHALA VOWEL SIGN DIGA PAA-PILLA;Mn;0;NSM;;;;;N;;;;;”
892 “0DD8;SINHALA VOWEL SIGN GAETTA-PILLA;Mc;0;L;;;;;N;;;;;”
893 “0DD9;SINHALA VOWEL SIGN KOMBUVA;Mc;0;L;;;;;N;;;;;”
894 “0DDA;SINHALA VOWEL SIGN DIGA KOMBUVA;Mc;0;L;0DD9 0DCA;;;;N;;;;;”
895 “0DDB;SINHALA VOWEL SIGN KOMBU DEKA;Mc;0;L;;;;;N;;;;;”
896 “0DDC;SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA;
897 Mc;0;L;0DD9 0DCF;;;;N;;;;;”
898 “0DDD;SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA;
899 Mc;0;L;0DDC 0DCA;;;;N;;;;;”
900 “0DDE;SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA;
901 Mc;0;L;0DD9 0DDF;;;;N;;;;;”
902 “0DDF;SINHALA VOWEL SIGN GAYANUKITTA;Mc;0;L;;;;;N;;;;;”
903 “0DF2;SINHALA VOWEL SIGN DIGA GAETTA-PILLA;Mc;0;L;;;;;N;;;;;”
904 “0DF3;SINHALA VOWEL SIGN DIGA GAYANUKITTA;Mc;0;L;;;;;N;;;;;”
905 According to DerivedCoreProperties.txt (7.0.0) these are
906 “Alphabetic”.'''
907 ],
908 [[0x0DF4],
909 [('combining', False), ('combining_level3', False),
910 ('alpha', False), ('lower', False), ('upper', False),
911 ('tolower', False), ('toupper', False), ('totitle', False)],
912 '''
913 “0DF4;SINHALA PUNCTUATION KUNDDALIYA;Po;0;L;;;;;N;;;;;”
914 According to DerivedCoreProperties.txt (7.0.0) these are *not*
915 “Alphabetic”.'''
916 ],
917 [[(0xA789, 0xA78A)],
918 [('combining', False), ('combining_level3', False),
919 ('alpha', False), ('lower', False), ('upper', False),
920 ('tolower', False), ('toupper', False), ('totitle', False)],
921 '''
922 “A789;MODIFIER LETTER COLON;Sk;0;L;;;;;N;;;;;”
923 “A78A;MODIFIER LETTER SHORT EQUALS SIGN;Sk;0;L;;;;;N;;;;;”
924 According to DerivedCoreProperties.txt (7.0.0) these are *not*
925 “Alphabetic”.'''
926 ],
927 [[(0xA926, 0xA92A)],
928 [('combining', True), ('combining_level3', True),
929 ('alpha', True), ('lower', False), ('upper', False),
930 ('tolower', False), ('toupper', False), ('totitle', False)],
931 '''
932 “A926;KAYAH LI VOWEL UE;Mn;0;NSM;;;;;N;;;;;”
933 “A927;KAYAH LI VOWEL E;Mn;0;NSM;;;;;N;;;;;”
934 “A928;KAYAH LI VOWEL U;Mn;0;NSM;;;;;N;;;;;”
935 “A929;KAYAH LI VOWEL EE;Mn;0;NSM;;;;;N;;;;;”
936 “A92A;KAYAH LI VOWEL O;Mn;0;NSM;;;;;N;;;;;”
937 According to DerivedCoreProperties.txt (7.0.0) these are
938 “Alphabetic”.'''
939 ],
940 [[(0xA92B, 0xA92D)],
941 [('combining', True), ('combining_level3', False),
942 ('alpha', False), ('lower', False), ('upper', False),
943 ('tolower', False), ('toupper', False), ('totitle', False)],
944 '''
945 “A92B;KAYAH LI TONE PLOPHU;Mn;220;NSM;;;;;N;;;;;”
946 “A92C;KAYAH LI TONE CALYA;Mn;220;NSM;;;;;N;;;;;”
947 “A92D;KAYAH LI TONE CALYA PLOPHU;Mn;220;NSM;;;;;N;;;;;”
948 According to DerivedCoreProperties.txt (7.0.0) these are *not*
949 “Alphabetic”.'''
950 ]
951 ]