1# -*- coding: utf-8 -*-
2# Copyright (C) 2014-2021 Free Software Foundation, Inc.
3# This file is part of the GNU C Library.
4#
5# The GNU C Library is free software; you can redistribute it and/or
6# modify it under the terms of the GNU Lesser General Public
7# License as published by the Free Software Foundation; either
8# version 2.1 of the License, or (at your option) any later version.
9#
10# The GNU C Library is distributed in the hope that it will be useful,
11# but WITHOUT ANY WARRANTY; without even the implied warranty of
12# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13# Lesser General Public License for more details.
14#
15# You should have received a copy of the GNU Lesser General Public
16# License along with the GNU C Library; if not, see
17# <https://www.gnu.org/licenses/>.
18
19'''
20This file contains a list of test cases used by
21the ctype_compatibility.py script.
22'''
23
24TEST_CASES = [
25    [[0x0E2F, 0x0E46], [('alpha', True), ('punct', False)],
26     '''Theppitak Karoonboonyanan <thep@links.nectec.or.th> says
27     <U0E2F>, <U0E46> should belong to punct. DerivedCoreProperties.txt
28     says it is alpha. We trust DerivedCoreProperties.txt.'''
29    ],
30    [[0x0E31, (0x0E34, 0x0E3A)], [('alpha', True)],
31     '''gen-unicode-ctype.c: Theppitak Karoonboonyanan
32     <thep@links.nectec.or.th> says <U0E31>, <U0E34>..<U0E3A>
33     are alpha. DerivedCoreProperties.txt agrees.'''
34    ],
35    [[(0x0E47, 0x0E4C), 0x0E4E], [('alpha', False)],
36     '''gen-unicode-ctype.c: Theppitak Karoonboonyanan
37     <thep@links.nectec.or.th> says <U0E47>..<U0E4E> are
38     is_alpha. DerivedCoreProperties.txt says *only* <U0E4D>
39     in that range is alphabetic, the others are *not*. We
40     trust DerivedCoreProperties.txt.'''
41    ],
42    [[0x0E4D], [('alpha', True)],
43     '''gen-unicode-ctype.c: Theppitak Karoonboonyanan
44     <thep@links.nectec.or.th> says <U0E47>..<U0E4E> are
45     is_alpha. DerivedCoreProperties.txt says *only* <U0E4D>
46            in that range is alphabetic, the others are *not*. We
47            trust DerivedCoreProperties.txt.
48            '''
49    ],
50    [[0x0345], [('alpha', True), ('lower', True)],
51     '''COMBINING GREEK YPOGEGRAMMENI
52     According to DerivedCoreProperties.txt, this is “Alphabetic”
53     and “Lowercase”.'''
54    ],
55    [[(0x2160, 0x2188)], [('alpha', True)],
56     '''Roman Numerals are “Alphabetic” according to
57     DerivedCoreProperties.txt'''
58    ],
59    [[(0x24B6, 0x24E9)], [('alpha', True)],
60     '''Circled Latin letters are “Alphabetic” according to
61     DerivedCoreProperties.txt'''
62    ],
63    [[0x661], [('alpha', True), ('digit', False)],
64     '''gen-unicode-ctype.c: All non-ASCII digits should be alphabetic.
65     ISO C 99 forbids us to have them in category "digit", but we
66     want iswalnum to return true on them. Don’t forget to
67     have a look at all the other digits, 0x661 is just one
68     example tested here.'''
69    ],
70    [[(0x0030, 0x0039)], [('digit', True)],
71     '''gen-unicode-ctype.c: All ASCII digits should be digits.'''
72    ],
73    [[0x0009], [('blank', True)],
74     '''gen-unicode-ctype.c: CHARACTER TABULATION'''
75    ],
76    [[0x2007], [('blank', False), ('space', False)],
77     '''gen-unicode-ctype.c: FIGURE SPACE, because it has <noBreak>
78     in the description.'''
79    ],
80    [[0x0009, 0x000A, 0x000B, 0x000C, 0x000D], [('space', True)],
81     '''gen-unicode-ctype.c: CHARACTER TABULATION, LINE FEED (LF), LINE
82     TABULATION, FORM FEED (FF), CARRIAGE RETURN (CR)'''
83    ],
84    [[0x2028, 0x2029], [('cntrl', True)],
85     '''gen-unicode-ctype.c: LINE SEPARATOR and PARAGRAPH SEPARATOR
86     should be cntrl.'''
87    ],
88    [[(0x0030, 0x0039), (0x0041, 0x0046), (0x0061, 0x0066)],
89     [('xdigit', True)],
90     '''gen-unicode-ctype.c: ISO C 99 says (6.4.4.1): hexadecimal-digit:
91     one of 0 1 2 3 4 5 6 7 8 9 a b c d e f A B C D E F (nothing else
92     should be considered as a hexadecimal-digit)'''
93    ],
94    [[0x0330], [('combining', True), ('combining_level3', False)],
95     '''gen-unicode-ctype.c: COMBINING TILDE BELOW, canonical combining
96     class value >= 200, should be in combining but not in
97     combining_level3'''
98    ],
99    [[0x0250, 0x0251, 0x0271], [('lower', True)],
100     '''Should be lower in Unicode 7.0.0 (was not lower in
101     Unicode 5.0.0).
102     '''
103    ],
104    [[0x2184], [('lower', True)],
105     '''Should be lower both in Unicode 5.0.0 and 7.0.0'''
106    ],
107    [[0xA67F], [('punct', False), ('alpha', True)],
108     '''0xa67f CYRILLIC PAYEROK. Not in Unicode 5.0.0. In Unicode
109     7.0.0. General category Lm (Letter
110     modifier). DerivedCoreProperties.txt says it is
111     “Alphabetic”. Apparently added manually to punct by mistake in
112     glibc’s old LC_CTYPE.'''
113    ],
114    [[0xA60C], [('punct', False), ('alpha', True)],
115     '''0xa60c VAI SYLLABLE LENGTHENER. Not in Unicode 5.0.0.
116     In Unicode 7.0.0. General category Lm (Letter
117     modifier). DerivedCoreProperties.txt says it is
118     “Alphabetic”. Apparently added manually to punct by mistake in
119     glibc’s old LC_CTYPE.'''
120    ],
121    [[0x2E2F], [('punct', False), ('alpha', True)],
122     '''0x2E2F VERTICAL TILDE. Not in Unicode 5.0.0. In Unicode
123     7.0.0. General category Lm (Letter
124     modifier). DerivedCoreProperties.txt says it is
125     “Alphabetic”. Apparently added manually to punct by mistake in
126     glibc’s old LC_CTYPE.'''
127    ],
128    [[(0x1090, 0x1099)], [('punct', False), ('alpha', True)],
129     '''MYANMAR SHAN DIGIT ZERO - MYANMAR SHAN DIGIT NINE.
130     These are digits, but because ISO C 99 forbids to
131     put them into digit they should go into alpha.'''
132    ],
133    [[0x103F], [('punct', False), ('alpha', True)],
134     '''0x103F MYANMAR LETTER GREAT SA. Not in Unicode 5.0.0.
135     In Unicode 7.0.0. General category Lo
136     (Other_Letter). DerivedCoreProperties.txt says it is
137     “Alphabetic”. Apparently added manually to punct by
138     mistake in glibc’s old LC_CTYPE.'''
139    ],
140    [[0x0374], [('punct', False), ('alpha', True)],
141     '''0x0374 GREEK NUMERAL SIGN. Unicode 5.0.0: general category
142     Sk. Unicode 7.0.0: General category Lm
143     (Modifier_Letter). DerivedCoreProperties.txt says it is
144     “Alphabetic”.'''
145    ],
146    [[0x02EC], [('punct', False), ('alpha', True)],
147     '''0x02EC MODIFIER LETTER VOICING. Unicode 5.0.0: general category
148     Sk. Unicode 7.0.0: General category Lm
149     (Modifier_Letter). DerivedCoreProperties.txt says it is
150     “Alphabetic”.'''
151    ],
152    [[0x180E], [('space', False), ('blank', False)],
153     '''0x180e MONGOLIAN VOWEL SEPARATOR. Unicode 5.0.0: General
154     category Zs (Space_Separator) Unicode 7.0.0: General category Cf
155     (Format).'''
156    ],
157    [[0x1E9C, 0x1E9D, 0x1E9F],
158     [('lower', True), ('upper', False), ('tolower', False),
159      ('toupper', False), ('totitle', False)],
160     '''ẜ 0x1e9c LATIN SMALL LETTER LONG S WITH DIAGONAL STROKE,
161     ẝ 0x1e9d LATIN SMALL LETTER LONG S WITH HIGH STROKE,
162     ẟ 0x1e9f LATIN SMALL LETTER DELTA. These are “Lowercase”
163     according to DerivedCoreProperties.txt but no upper case versions
164     exist.'''
165    ],
166    [[0x1E9E],
167     [('lower', False), ('upper', True), ('tolower', True),
168      ('toupper', False), ('totitle', False)],
169     '''0x1E9E ẞ LATIN CAPITAL LETTER SHARP S This is “Uppercase”
170     according to DerivedCoreProperties.txt and the lower case
171     version is 0x00DF ß LATIN SMALL LETTER SHARP S.'''
172    ],
173    [[0x2188],
174     [('alpha', True), ('lower', False), ('upper', False),
175      ('tolower', False), ('toupper', False), ('totitle', False)],
176     '''0x2188 ROMAN NUMERAL ONE HUNDRED THOUSAND.  This is “Alphabetic”
177     according to DerivedCoreProperties.txt. In glibc’s old
178     LC_CTYPE, it was in “lower”, which seems to be a
179     mistake. It is not “Lowercase” in
180     DerivedCoreProperties.txt and does not have case mappings
181     in UnicodeData.txt either.'''
182    ],
183    [[0x2C71, 0x2C74, (0x2C77, 0x2C7A)],
184            [('alpha', True), ('lower', True), ('upper', False),
185             ('tolower', False), ('toupper', False), ('totitle', False)],
186            '''These are Latin small letters which were not in Unicode 5.0.0
187            but are in Unicode 7.0.0. According to
188            DerivedCoreProperties.txt they are “Lowercase”. But no
189            uppercase versions exist.  They have apparently been added
190            manually to glibc’s old LC_CTYPE.'''
191    ],
192    [[0xA730, 0xA731],
193            [('alpha', True), ('lower', True), ('upper', False),
194             ('tolower', False), ('toupper', False), ('totitle', False)],
195            '''These are Latin small “capital” letters which were not in
196            Unicode 5.0.0 but are in Unicode 7.0.0. According to
197            DerivedCoreProperties.txt they are “Lowercase”. But no
198            uppercase versions exist.  They have apparently been added
199            manually to glibc’s old LC_CTYPE.'''
200    ],
201    [[(0xA771, 0xA778)],
202     [('alpha', True), ('lower', True), ('upper', False),
203      ('tolower', False), ('toupper', False), ('totitle', False)],
204     '''These are Latin small (or small “capital”) letters which
205     were not in Unicode 5.0.0 but are in Unicode 7.0.0. According to
206     DerivedCoreProperties.txt they are “Lowercase”. But no
207     uppercase versions exist.  They have apparently been added
208     manually to glibc’s old LC_CTYPE.'''
209    ],
210    [[0x0375],
211     [('combining', False), ('combining_level3', False),
212      ('alpha', False), ('lower', False), ('upper', False),
213      ('tolower', False), ('toupper', False), ('totitle', False)],
214     '''“0375;GREEK LOWER NUMERAL SIGN;Sk;0;ON;;;;;N;;;;;”.  Has
215     apparently been added manually to glibc’s old LC_CTYPE as
216     “combining_level3”. That seems wrong, it is no combining
217     character because it does not have one of the general
218     categories Mn, Mc, or Me. According to
219     DerivedCoreProperties.txt it is not “Alphabetic”.'''
220    ],
221    [[0x108D],
222     [('combining', True), ('combining_level3', False),
223      ('alpha', True), ('lower', False), ('upper', False),
224      ('tolower', False), ('toupper', False), ('totitle', False)],
225     '''“108D;MYANMAR SIGN SHAN COUNCIL EMPHATIC
226     TONE;Mn;220;NSM;;;;;N;;;;;”.  Has apparently been added
227     manually to glibc’s old LC_CTYPE as
228     “combining_level3”. That seems wrong, although it is a
229     combining character because it has the general category
230     Mn, it is not “combining_level3” because the canonical
231     combining class value is 220 which is >= 200. According to
232     gen-unicode-ctype.c, “combining_level3” needs a
233     canonical combining class value < 200. According to
234     DerivedCoreProperties.txt it was not “Alphabetic”
235     until Unicode 11.0.0 but in 12.0.0 it became “Alphabetic”.'''
236    ],
237    [[0x06DE],
238     [('combining', False), ('combining_level3', False),
239      ('alpha', False), ('lower', False), ('upper', False),
240      ('tolower', False), ('toupper', False), ('totitle', False)],
241     ''' UnicodeData.txt 5.0.0: “06DE;ARABIC START OF RUB EL
242     HIZB;Me;0;NSM;;;;;N;;;;;”; UnicodeData.txt 7.0.0:
243     “06DE;ARABIC START OF RUB EL
244     HIZB;So;0;ON;;;;;N;;;;;”. I.e. this used to be a
245     combining character in Unicode 5.0.0 but not anymore in
246     7.0.0. According to DerivedCoreProperties.txt it is not
247     “Alphabetic”.'''
248    ],
249    [[0x0BD0],
250     [('combining', False), ('combining_level3', False),
251      ('alpha', True), ('lower', False), ('upper', False),
252      ('tolower', False), ('toupper', False), ('totitle', False)],
253     '''Not in UnicodeData.txt 5.0.0.  UnicodeData.txt 7.0.0:
254     “0BD0;TAMIL OM;Lo;0;L;;;;;N;;;;;”.  Apparently manually added to
255     “combining” and “combining_level3” in glibc’s old
256     LC_CTYPE. That seems wrong.  According to
257     DerivedCoreProperties.txt it is “Alphabetic”.'''
258    ],
259    [[0x103F],
260     [('combining', False), ('combining_level3', False),
261      ('alpha', True), ('lower', False), ('upper', False),
262      ('tolower', False), ('toupper', False), ('totitle', False)],
263     '''Not in UnicodeData.txt 5.0.0.  UnicodeData.txt 7.0.0:
264     “103F;MYANMAR LETTER GREAT SA;Lo;0;L;;;;;N;;;;;”.
265     Apparently manually added to “combining” and
266     “combining_level3” in glibc’s old LC_CTYPE. That seems
267     wrong.  According to DerivedCoreProperties.txt it is
268     “Alphabetic”.'''
269    ],
270    [[(0x0901, 0x0903)],
271     [('combining', True), ('combining_level3', True),
272      ('alpha', True), ('lower', False), ('upper', False),
273      ('tolower', False), ('toupper', False), ('totitle', False)],
274     '''These have general category “Mn” i.e. these are combining
275     characters (both in UnicodeData.txt 5.0.0 and 7.0.0):
276     “0901;DEVANAGARI SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;”,
277     “0902;DEVANAGARI SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;”,
278     “0903;DEVANAGARI SIGN VISARGA;Mc;0;L;;;;;N;;;;;”.
279     According to DerivedCoreProperties.txt (7.0.0) these are
280     “Alphabetic”.'''
281    ],
282    [[0x093C],
283     [('combining', True), ('combining_level3', True),
284      ('alpha', False), ('lower', False), ('upper', False),
285      ('tolower', False), ('toupper', False), ('totitle', False)],
286     '''UnicodeData.txt (5.0.0 and 7.0.0): “093C;DEVANAGARI SIGN
287     NUKTA;Mn;7;NSM;;;;;N;;;;;” According to
288     DerivedCoreProperties.txt (7.0.0) this is *not*
289     “Alphabetic”. glibc’s old LC_CTYPE has this in “alpha”.'''
290    ],
291    [[(0x093E, 0x093F)],
292     [('combining', True), ('combining_level3', True),
293      ('alpha', True), ('lower', False), ('upper', False),
294      ('tolower', False), ('toupper', False), ('totitle', False)],
295     '''These have general category “Mc” i.e. these are combining
296     characters (both in UnicodeData.txt 5.0.0 and 7.0.0):
297     “093E;DEVANAGARI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
298     “093F;DEVANAGARI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
299     According to DerivedCoreProperties.txt (7.0.0) these are
300     “Alphabetic”.'''
301    ],
302    [[(0x0940, 0x094C)],
303     [('combining', True), ('combining_level3', True),
304      ('alpha', True), ('lower', False), ('upper', False),
305      ('tolower', False), ('toupper', False), ('totitle', False)],
306     '''These are all combining
307     characters (“Mc” or “Mn” both in UnicodeData.txt 5.0.0 and 7.0.0).
308     According to DerivedCoreProperties.txt (7.0.0) these are
309     “Alphabetic”.'''
310    ],
311    [[0x094D],
312     [('combining', True), ('combining_level3', True),
313      ('alpha', False), ('lower', False), ('upper', False),
314      ('tolower', False), ('toupper', False), ('totitle', False)],
315     '''Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0.
316     “094D;DEVANAGARI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
317     According to DerivedCoreProperties.txt (7.0.0) it is *not*
318     “Alphabetic”.'''
319    ],
320    [[(0x0951, 0x0954)],
321     [('combining', True), ('combining_level3', False),
322      ('alpha', False), ('lower', False), ('upper', False),
323      ('tolower', False), ('toupper', False), ('totitle', False)],
324     '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0.
325     According to DerivedCoreProperties.txt (7.0.0) these are *not*
326     “Alphabetic”.'''
327    ],
328    [[(0x0962, 0x0963), (0x0981, 0x0983)],
329     [('combining', True), ('combining_level3', True),
330      ('alpha', True), ('lower', False), ('upper', False),
331      ('tolower', False), ('toupper', False), ('totitle', False)],
332     '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0.
333     According to DerivedCoreProperties.txt (7.0.0) these are
334     “Alphabetic”.'''
335    ],
336    [[0x09BC],
337     [('combining', True), ('combining_level3', True),
338      ('alpha', False), ('lower', False), ('upper', False),
339      ('tolower', False), ('toupper', False), ('totitle', False)],
340     '''
341     “09BC;BENGALI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;”
342     Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0.
343     According to DerivedCoreProperties.txt (7.0.0) it is *not*
344     “Alphabetic”.'''
345    ],
346    [[(0x09BE, 0x09BF), (0x09C0, 0x09C4), (0x09C7, 0x09C8),
347      (0x09CB, 0x09CC)],
348     [('combining', True), ('combining_level3', True),
349      ('alpha', True), ('lower', False), ('upper', False),
350      ('tolower', False), ('toupper', False), ('totitle', False)],
351     '''
352     “09BE;BENGALI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
353     “09BF;BENGALI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
354     “09C0;BENGALI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;”
355     “09C1;BENGALI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;”
356     “09C2;BENGALI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;”
357     “09C3;BENGALI VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;”
358     “09C4;BENGALI VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;”
359     “09C7;BENGALI VOWEL SIGN E;Mc;0;L;;;;;N;;;;;”
360     “09C8;BENGALI VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;”
361     “09CB;BENGALI VOWEL SIGN O;Mc;0;L;09C7 09BE;;;;N;;;;;”
362     “09CC;BENGALI VOWEL SIGN AU;Mc;0;L;09C7 09D7;;;;N;;;;;”
363     Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0.
364     According to DerivedCoreProperties.txt (7.0.0) these are
365     “Alphabetic”.'''
366    ],
367    [[0x09CD],
368     [('combining', True), ('combining_level3', True),
369      ('alpha', False), ('lower', False), ('upper', False),
370      ('tolower', False), ('toupper', False), ('totitle', False)],
371     '''
372     “09CD;BENGALI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
373     Combining character, both in UnicodeData.txt 5.0.0 and 7.0.0.
374     According to DerivedCoreProperties.txt (7.0.0) it is *not*
375     “Alphabetic”.'''
376    ],
377    [[0x09D7, (0x09E2, 0x09E3)],
378     [('combining', True), ('combining_level3', True),
379      ('alpha', True), ('lower', False), ('upper', False),
380      ('tolower', False), ('toupper', False), ('totitle', False)],
381     '''Combining characters, both in UnicodeData.txt 5.0.0 and 7.0.0.
382     According to DerivedCoreProperties.txt (7.0.0) these are
383     “Alphabetic”.'''
384    ],
385    [[0x09F2, 0x09F3],
386     [('combining', False), ('combining_level3', False),
387      ('alpha', False), ('lower', False), ('upper', False),
388      ('tolower', False), ('toupper', False), ('totitle', False)],
389     '''
390     “09F2;BENGALI RUPEE MARK;Sc;0;ET;;;;;N;;;;;”
391     “09F3;BENGALI RUPEE SIGN;Sc;0;ET;;;;;N;;;;;”
392     According to DerivedCoreProperties.txt (7.0.0) these are *not*
393     “Alphabetic”.'''
394    ],
395    [[(0x09F4, 0x09FA)],
396     [('combining', False), ('combining_level3', False),
397      ('alpha', False), ('lower', False), ('upper', False),
398      ('tolower', False), ('toupper', False), ('totitle', False)],
399     '''
400     “09F4;BENGALI CURRENCY NUMERATOR ONE;No;0;L;;;;1/16;N;;;;;”
401     “09F5;BENGALI CURRENCY NUMERATOR TWO;No;0;L;;;;1/8;N;;;;;”
402     “09F6;BENGALI CURRENCY NUMERATOR THREE;No;0;L;;;;3/16;N;;;;;”
403     “09F7;BENGALI CURRENCY NUMERATOR FOUR;No;0;L;;;;1/4;N;;;;;”
404     “09F8;BENGALI CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR;
405     No;0;L;;;;3/4;N;;;;;”
406     “09F9;BENGALI CURRENCY DENOMINATOR SIXTEEN;No;0;L;;;;16;N;;;;;”
407     “09FA;BENGALI ISSHAR;So;0;L;;;;;N;;;;;”
408     According to DerivedCoreProperties.txt (7.0.0) these are *not*
409     “Alphabetic”.'''
410    ],
411    [[(0x0A01, 0x0A03)],
412     [('combining', True), ('combining_level3', True),
413      ('alpha', True), ('lower', False), ('upper', False),
414      ('tolower', False), ('toupper', False), ('totitle', False)],
415     '''
416     “0A01;GURMUKHI SIGN ADAK BINDI;Mn;0;NSM;;;;;N;;;;;”
417     “0A02;GURMUKHI SIGN BINDI;Mn;0;NSM;;;;;N;;;;;”
418     “0A03;GURMUKHI SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
419     According to DerivedCoreProperties.txt (7.0.0) these are
420     “Alphabetic”.'''
421    ],
422    [[0x0A3C],
423     [('combining', True), ('combining_level3', True),
424      ('alpha', False), ('lower', False), ('upper', False),
425      ('tolower', False), ('toupper', False), ('totitle', False)],
426     '''
427     “0A3C;GURMUKHI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;”
428     According to DerivedCoreProperties.txt (7.0.0) this is *not*
429     “Alphabetic”.'''
430    ],
431    [[(0x0A3E, 0x0A40), (0x0A41, 0x0A42), (0x0A47, 0x0A48),
432      (0x0A4B, 0x0A4C)],
433     [('combining', True), ('combining_level3', True),
434      ('alpha', True), ('lower', False), ('upper', False),
435      ('tolower', False), ('toupper', False), ('totitle', False)],
436     '''
437     “0A3E;GURMUKHI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
438     “0A3F;GURMUKHI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
439     “0A40;GURMUKHI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;”
440     “0A41;GURMUKHI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;”
441     “0A42;GURMUKHI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;”
442     “0A47;GURMUKHI VOWEL SIGN EE;Mn;0;NSM;;;;;N;;;;;”
443     “0A48;GURMUKHI VOWEL SIGN AI;Mn;0;NSM;;;;;N;;;;;”
444     “0A4B;GURMUKHI VOWEL SIGN OO;Mn;0;NSM;;;;;N;;;;;”
445     “0A4C;GURMUKHI VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;”
446     According to DerivedCoreProperties.txt (7.0.0) these are
447     “Alphabetic”.'''
448    ],
449    [[0x0A4D],
450     [('combining', True), ('combining_level3', True),
451      ('alpha', False), ('lower', False), ('upper', False),
452      ('tolower', False), ('toupper', False), ('totitle', False)],
453     '''
454     “0A4D;GURMUKHI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
455     According to DerivedCoreProperties.txt (7.0.0) this is *not*
456     “Alphabetic”.'''
457    ],
458    [[0x0A51, (0x0A70, 0x0A71), 0x0A75, (0x0A81, 0x0A83)],
459     [('combining', True), ('combining_level3', True),
460      ('alpha', True), ('lower', False), ('upper', False),
461      ('tolower', False), ('toupper', False), ('totitle', False)],
462     '''
463     “0A51;GURMUKHI SIGN UDAAT;Mn;0;NSM;;;;;N;;;;;”
464     “0A70;GURMUKHI TIPPI;Mn;0;NSM;;;;;N;;;;;”
465     “0A71;GURMUKHI ADDAK;Mn;0;NSM;;;;;N;;;;;”
466     “0A75;GURMUKHI SIGN YAKASH;Mn;0;NSM;;;;;N;;;;;”
467     “0A81;GUJARATI SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;”
468     “0A82;GUJARATI SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;”
469     “0A83;GUJARATI SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
470     According to DerivedCoreProperties.txt (7.0.0) these are
471     “Alphabetic”.'''
472    ],
473    [[0x0ABC],
474     [('combining', True), ('combining_level3', True),
475      ('alpha', False), ('lower', False), ('upper', False),
476      ('tolower', False), ('toupper', False), ('totitle', False)],
477     '''
478     “0ABC;GUJARATI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;”
479     According to DerivedCoreProperties.txt (7.0.0) this is *not*
480     “Alphabetic”.'''
481    ],
482    [[(0x0ABE, 0x0AC5), (0x0AC7, 0x0AC9), (0x0ACB, 0x0ACC)],
483     [('combining', True), ('combining_level3', True),
484      ('alpha', True), ('lower', False), ('upper', False),
485      ('tolower', False), ('toupper', False), ('totitle', False)],
486     '''
487     “0ABE;GUJARATI VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
488     “0ABF;GUJARATI VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
489     “0AC0;GUJARATI VOWEL SIGN II;Mc;0;L;;;;;N;;;;;”
490     “0AC1;GUJARATI VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;”
491     “0AC2;GUJARATI VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;”
492     “0AC3;GUJARATI VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;”
493     “0AC4;GUJARATI VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;”
494     “0AC5;GUJARATI VOWEL SIGN CANDRA E;Mn;0;NSM;;;;;N;;;;;”
495     “0AC7;GUJARATI VOWEL SIGN E;Mn;0;NSM;;;;;N;;;;;”
496     “0AC8;GUJARATI VOWEL SIGN AI;Mn;0;NSM;;;;;N;;;;;”
497     “0AC9;GUJARATI VOWEL SIGN CANDRA O;Mc;0;L;;;;;N;;;;;”
498     “0ACB;GUJARATI VOWEL SIGN O;Mc;0;L;;;;;N;;;;;”
499     “0ACC;GUJARATI VOWEL SIGN AU;Mc;0;L;;;;;N;;;;;”
500     According to DerivedCoreProperties.txt (7.0.0) these are
501     “Alphabetic”.'''
502    ],
503    [[0x0ACD],
504     [('combining', True), ('combining_level3', True),
505      ('alpha', False), ('lower', False), ('upper', False),
506      ('tolower', False), ('toupper', False), ('totitle', False)],
507     '''
508     “0ACD;GUJARATI SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
509     According to DerivedCoreProperties.txt (7.0.0) this is *not*
510     “Alphabetic”.'''
511    ],
512    [[(0x0AE2, 0x0AE3)],
513     [('combining', True), ('combining_level3', True),
514      ('alpha', True), ('lower', False), ('upper', False),
515      ('tolower', False), ('toupper', False), ('totitle', False)],
516     '''
517     “0AE2;GUJARATI VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;”
518     “0AE3;GUJARATI VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;”
519     According to DerivedCoreProperties.txt (7.0.0) these are
520     “Alphabetic”.'''
521    ],
522    [[0x0AF1],
523     [('combining', False), ('combining_level3', False),
524      ('alpha', False), ('lower', False), ('upper', False),
525      ('tolower', False), ('toupper', False), ('totitle', False)],
526     '''
527     “0AF1;GUJARATI RUPEE SIGN;Sc;0;ET;;;;;N;;;;;”
528     According to DerivedCoreProperties.txt (7.0.0) this is *not*
529     “Alphabetic”.'''
530    ],
531    [[(0x0B01, 0x0B03)],
532     [('combining', True), ('combining_level3', True),
533      ('alpha', True), ('lower', False), ('upper', False),
534      ('tolower', False), ('toupper', False), ('totitle', False)],
535     '''
536     “0B01;ORIYA SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;”
537     “0B02;ORIYA SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;”
538     “0B03;ORIYA SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
539     According to DerivedCoreProperties.txt (7.0.0) these are
540     “Alphabetic”.'''
541    ],
542    [[0x0B3C],
543     [('combining', True), ('combining_level3', True),
544      ('alpha', False), ('lower', False), ('upper', False),
545      ('tolower', False), ('toupper', False), ('totitle', False)],
546     '''
547     “0B3C;ORIYA SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;”
548     According to DerivedCoreProperties.txt (7.0.0) this is *not*
549     “Alphabetic”.'''
550    ],
551    [[(0x0B3E, 0x0B44), (0x0B47, 0x0B48), (0x0B4B, 0x0B4C)],
552     [('combining', True), ('combining_level3', True),
553      ('alpha', True), ('lower', False), ('upper', False),
554      ('tolower', False), ('toupper', False), ('totitle', False)],
555     '''
556     “0B3E;ORIYA VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
557     “0B3F;ORIYA VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;;”
558     “0B40;ORIYA VOWEL SIGN II;Mc;0;L;;;;;N;;;;;”
559     “0B41;ORIYA VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;”
560     “0B42;ORIYA VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;”
561     “0B43;ORIYA VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;”
562     “0B44;ORIYA VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;”
563     “0B47;ORIYA VOWEL SIGN E;Mc;0;L;;;;;N;;;;;”
564     “0B48;ORIYA VOWEL SIGN AI;Mc;0;L;0B47 0B56;;;;N;;;;;”
565     “0B4B;ORIYA VOWEL SIGN O;Mc;0;L;0B47 0B3E;;;;N;;;;;”
566     “0B4C;ORIYA VOWEL SIGN AU;Mc;0;L;0B47 0B57;;;;N;;;;;”
567     According to DerivedCoreProperties.txt (7.0.0) these are
568     “Alphabetic”.'''
569    ],
570    [[0x0B4D],
571     [('combining', True), ('combining_level3', True),
572      ('alpha', False), ('lower', False), ('upper', False),
573      ('tolower', False), ('toupper', False), ('totitle', False)],
574     '''
575     “0B4D;ORIYA SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
576     According to DerivedCoreProperties.txt (7.0.0) this is *not*
577     “Alphabetic”.'''
578    ],
579    [[(0x0B56, 0x0B57), (0x0B62, 0x0B63)],
580     [('combining', True), ('combining_level3', True),
581      ('alpha', True), ('lower', False), ('upper', False),
582      ('tolower', False), ('toupper', False), ('totitle', False)],
583     '''
584     “0B56;ORIYA AI LENGTH MARK;Mn;0;NSM;;;;;N;;;;;”
585     “0B57;ORIYA AU LENGTH MARK;Mc;0;L;;;;;N;;;;;”
586     “0B62;ORIYA VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;”
587     “0B63;ORIYA VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;”
588     According to DerivedCoreProperties.txt (7.0.0) these are
589     “Alphabetic”.'''
590    ],
591    [[0x0B70],
592     [('combining', False), ('combining_level3', False),
593      ('alpha', False), ('lower', False), ('upper', False),
594      ('tolower', False), ('toupper', False), ('totitle', False)],
595     '''
596     “0B70;ORIYA ISSHAR;So;0;L;;;;;N;;;;;”
597     According to DerivedCoreProperties.txt (7.0.0) this is *not*
598     “Alphabetic”.'''
599    ],
600    [[0x0B82],
601     [('combining', True), ('combining_level3', True),
602      ('alpha', True), ('lower', False), ('upper', False),
603      ('tolower', False), ('toupper', False), ('totitle', False)],
604     '''
605     “0B82;TAMIL SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;;”
606     According to DerivedCoreProperties.txt (7.0.0) this is
607     “Alphabetic”.'''
608    ],
609    [[(0x0BBE, 0x0BC2), (0x0BC6, 0x0BC8), (0x0BCA, 0x0BCC)],
610     [('combining', True), ('combining_level3', True),
611      ('alpha', True), ('lower', False), ('upper', False),
612      ('tolower', False), ('toupper', False), ('totitle', False)],
613     '''
614     “0BBE;TAMIL VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
615     “0BBF;TAMIL VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
616     “0BC0;TAMIL VOWEL SIGN II;Mn;0;NSM;;;;;N;;;;;”
617     “0BC1;TAMIL VOWEL SIGN U;Mc;0;L;;;;;N;;;;;”
618     “0BC2;TAMIL VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;”
619     “0BC6;TAMIL VOWEL SIGN E;Mc;0;L;;;;;N;;;;;”
620     “0BC7;TAMIL VOWEL SIGN EE;Mc;0;L;;;;;N;;;;;”
621     “0BC8;TAMIL VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;”
622     “0BCA;TAMIL VOWEL SIGN O;Mc;0;L;0BC6 0BBE;;;;N;;;;;”
623     “0BCB;TAMIL VOWEL SIGN OO;Mc;0;L;0BC7 0BBE;;;;N;;;;;”
624     “0BCC;TAMIL VOWEL SIGN AU;Mc;0;L;0BC6 0BD7;;;;N;;;;;”
625     According to DerivedCoreProperties.txt (7.0.0) these are
626     “Alphabetic”.'''
627    ],
628    [[0x0BCD],
629     [('combining', True), ('combining_level3', True),
630      ('alpha', False), ('lower', False), ('upper', False),
631      ('tolower', False), ('toupper', False), ('totitle', False)],
632     '''
633     “0BCD;TAMIL SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
634     According to DerivedCoreProperties.txt (7.0.0) this is *not*
635     “Alphabetic”.'''
636    ],
637    [[0x0BD7],
638     [('combining', True), ('combining_level3', True),
639      ('alpha', True), ('lower', False), ('upper', False),
640      ('tolower', False), ('toupper', False), ('totitle', False)],
641     '''
642     “0BD7;TAMIL AU LENGTH MARK;Mc;0;L;;;;;N;;;;;”
643     According to DerivedCoreProperties.txt (7.0.0) this is
644     “Alphabetic”.'''
645    ],
646    [[(0x0BF0, 0x0BFA)],
647     [('combining', False), ('combining_level3', False),
648      ('alpha', False), ('lower', False), ('upper', False),
649      ('tolower', False), ('toupper', False), ('totitle', False)],
650     '''
651     “0BF0;TAMIL NUMBER TEN;No;0;L;;;;10;N;;;;;”
652     “0BF1;TAMIL NUMBER ONE HUNDRED;No;0;L;;;;100;N;;;;;”
653     “0BF2;TAMIL NUMBER ONE THOUSAND;No;0;L;;;;1000;N;;;;;”
654     “0BF3;TAMIL DAY SIGN;So;0;ON;;;;;N;;;;;”
655     “0BF4;TAMIL MONTH SIGN;So;0;ON;;;;;N;;;;;”
656     “0BF5;TAMIL YEAR SIGN;So;0;ON;;;;;N;;;;;”
657     “0BF6;TAMIL DEBIT SIGN;So;0;ON;;;;;N;;;;;”
658     “0BF7;TAMIL CREDIT SIGN;So;0;ON;;;;;N;;;;;”
659     “0BF8;TAMIL AS ABOVE SIGN;So;0;ON;;;;;N;;;;;”
660     “0BF9;TAMIL RUPEE SIGN;Sc;0;ET;;;;;N;;;;;”
661     “0BFA;TAMIL NUMBER SIGN;So;0;ON;;;;;N;;;;;”
662     According to DerivedCoreProperties.txt (7.0.0) these are *not*
663     “Alphabetic”.'''
664    ],
665    [[(0x0C01, 0x0C03)],
666     [('combining', True), ('combining_level3', True),
667      ('alpha', True), ('lower', False), ('upper', False),
668      ('tolower', False), ('toupper', False), ('totitle', False)],
669     '''
670     “0C01;TELUGU SIGN CANDRABINDU;Mc;0;L;;;;;N;;;;;”
671     “0C02;TELUGU SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;”
672     “0C03;TELUGU SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
673     According to DerivedCoreProperties.txt (7.0.0) these are
674     “Alphabetic”.'''
675    ],
676    [[(0x0C3E, 0x0C44), (0x0C46, 0x0C48), (0x0C4A, 0x0C4C)],
677     [('combining', True), ('combining_level3', True),
678      ('alpha', True), ('lower', False), ('upper', False),
679      ('tolower', False), ('toupper', False), ('totitle', False)],
680     '''
681     “0C3E;TELUGU VOWEL SIGN AA;Mn;0;NSM;;;;;N;;;;;”
682     “0C3F;TELUGU VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;;”
683     “0C40;TELUGU VOWEL SIGN II;Mn;0;NSM;;;;;N;;;;;”
684     “0C41;TELUGU VOWEL SIGN U;Mc;0;L;;;;;N;;;;;”
685     “0C42;TELUGU VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;”
686     “0C43;TELUGU VOWEL SIGN VOCALIC R;Mc;0;L;;;;;N;;;;;”
687     “0C44;TELUGU VOWEL SIGN VOCALIC RR;Mc;0;L;;;;;N;;;;;”
688     “0C46;TELUGU VOWEL SIGN E;Mn;0;NSM;;;;;N;;;;;”
689     “0C47;TELUGU VOWEL SIGN EE;Mn;0;NSM;;;;;N;;;;;”
690     “0C48;TELUGU VOWEL SIGN AI;Mn;0;NSM;0C46 0C56;;;;N;;;;;”
691     “0C4A;TELUGU VOWEL SIGN O;Mn;0;NSM;;;;;N;;;;;”
692     “0C4B;TELUGU VOWEL SIGN OO;Mn;0;NSM;;;;;N;;;;;”
693     “0C4C;TELUGU VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;”
694     According to DerivedCoreProperties.txt (7.0.0) these are
695     “Alphabetic”.'''
696    ],
697    [[0x0C4D],
698     [('combining', True), ('combining_level3', True),
699      ('alpha', False), ('lower', False), ('upper', False),
700      ('tolower', False), ('toupper', False), ('totitle', False)],
701     '''
702     “0C4D;TELUGU SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
703     According to DerivedCoreProperties.txt (7.0.0) this is *not*
704     “Alphabetic”.'''
705    ],
706    [[(0x0C55, 0x0C56), (0x0C62, 0x0C63)],
707     [('combining', True), ('combining_level3', True),
708      ('alpha', True), ('lower', False), ('upper', False),
709      ('tolower', False), ('toupper', False), ('totitle', False)],
710     '''
711     “0C55;TELUGU LENGTH MARK;Mn;84;NSM;;;;;N;;;;;”
712     “0C56;TELUGU AI LENGTH MARK;Mn;91;NSM;;;;;N;;;;;”
713     “0C62;TELUGU VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;”
714     “0C63;TELUGU VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;”
715     According to DerivedCoreProperties.txt (7.0.0) these are
716     “Alphabetic”.'''
717    ],
718    [[(0x0C78, 0x0C7F)],
719     [('combining', False), ('combining_level3', False),
720      ('alpha', False), ('lower', False), ('upper', False),
721      ('tolower', False), ('toupper', False), ('totitle', False)],
722     '''
723     “0C78;TELUGU FRACTION DIGIT ZERO FOR ODD POWERS OF FOUR;
724     No;0;ON;;;;0;N;;;;;”
725     “0C79;TELUGU FRACTION DIGIT ONE FOR ODD POWERS OF FOUR;
726     No;0;ON;;;;1;N;;;;;”
727     “0C7A;TELUGU FRACTION DIGIT TWO FOR ODD POWERS OF FOUR;
728     No;0;ON;;;;2;N;;;;;”
729     “0C7B;TELUGU FRACTION DIGIT THREE FOR ODD POWERS OF FOUR;
730     No;0;ON;;;;3;N;;;;;”
731     “0C7C;TELUGU FRACTION DIGIT ONE FOR EVEN POWERS OF FOUR;
732     No;0;ON;;;;1;N;;;;;”
733     “0C7D;TELUGU FRACTION DIGIT TWO FOR EVEN POWERS OF FOUR;
734     No;0;ON;;;;2;N;;;;;”
735     “0C7E;TELUGU FRACTION DIGIT THREE FOR EVEN POWERS OF FOUR;
736     No;0;ON;;;;3;N;;;;;”
737     “0C7F;TELUGU SIGN TUUMU;So;0;L;;;;;N;;;;;”
738     According to DerivedCoreProperties.txt (7.0.0) these are *not*
739     “Alphabetic”.'''
740    ],
741    [[(0x0C82, 0x0C83)],
742     [('combining', True), ('combining_level3', True),
743      ('alpha', True), ('lower', False), ('upper', False),
744      ('tolower', False), ('toupper', False), ('totitle', False)],
745     '''
746     “0C81;KANNADA SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;;”
747     “0C82;KANNADA SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;”
748     “0C83;KANNADA SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
749     According to DerivedCoreProperties.txt (7.0.0) these are
750     “Alphabetic”.'''
751    ],
752    [[0x0CBC],
753     [('combining', True), ('combining_level3', True),
754      ('alpha', False), ('lower', False), ('upper', False),
755      ('tolower', False), ('toupper', False), ('totitle', False)],
756     '''
757     “0CBC;KANNADA SIGN NUKTA;Mn;7;NSM;;;;;N;;;;;”
758     According to DerivedCoreProperties.txt (7.0.0) this is *not*
759     “Alphabetic”.'''
760    ],
761    [[(0x0CBE, 0x0CC4), (0x0CC6, 0x0CC8), (0x0CCA, 0x0CCC)],
762     [('combining', True), ('combining_level3', True),
763      ('alpha', True), ('lower', False), ('upper', False),
764      ('tolower', False), ('toupper', False), ('totitle', False)],
765     '''
766     “0CBE;KANNADA VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
767     “0CBF;KANNADA VOWEL SIGN I;Mn;0;L;;;;;N;;;;;”
768     “0CC0;KANNADA VOWEL SIGN II;Mc;0;L;0CBF 0CD5;;;;N;;;;;”
769     “0CC1;KANNADA VOWEL SIGN U;Mc;0;L;;;;;N;;;;;”
770     “0CC2;KANNADA VOWEL SIGN UU;Mc;0;L;;;;;N;;;;;”
771     “0CC3;KANNADA VOWEL SIGN VOCALIC R;Mc;0;L;;;;;N;;;;;”
772     “0CC4;KANNADA VOWEL SIGN VOCALIC RR;Mc;0;L;;;;;N;;;;;”
773     “0CC6;KANNADA VOWEL SIGN E;Mn;0;L;;;;;N;;;;;”
774     “0CC7;KANNADA VOWEL SIGN EE;Mc;0;L;0CC6 0CD5;;;;N;;;;;”
775     “0CC8;KANNADA VOWEL SIGN AI;Mc;0;L;0CC6 0CD6;;;;N;;;;;”
776     “0CCA;KANNADA VOWEL SIGN O;Mc;0;L;0CC6 0CC2;;;;N;;;;;”
777     “0CCB;KANNADA VOWEL SIGN OO;Mc;0;L;0CCA 0CD5;;;;N;;;;;”
778     “0CCC;KANNADA VOWEL SIGN AU;Mn;0;NSM;;;;;N;;;;;”
779     According to DerivedCoreProperties.txt (7.0.0) these are
780     “Alphabetic”.'''
781    ],
782    [[0x0CCD],
783     [('combining', True), ('combining_level3', True),
784      ('alpha', False), ('lower', False), ('upper', False),
785      ('tolower', False), ('toupper', False), ('totitle', False)],
786     '''
787     “0CCD;KANNADA SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
788     According to DerivedCoreProperties.txt (7.0.0) this is *not*
789     “Alphabetic”.'''
790    ],
791    [[(0x0CD5, 0x0CD6), (0x0CE2, 0x0CE3)],
792     [('combining', True), ('combining_level3', True),
793      ('alpha', True), ('lower', False), ('upper', False),
794      ('tolower', False), ('toupper', False), ('totitle', False)],
795     '''
796     0CD5;KANNADA LENGTH MARK;Mc;0;L;;;;;N;;;;;
797     0CD6;KANNADA AI LENGTH MARK;Mc;0;L;;;;;N;;;;;
798     0CE2;KANNADA VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;
799     0CE3;KANNADA VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;
800     According to DerivedCoreProperties.txt (7.0.0) these are
801     “Alphabetic”.'''
802    ],
803    [[(0x0D02, 0x0D03), (0x0D3E, 0x0D44), (0x0D46, 0x0D48),
804      (0x0D4A, 0x0D4C)],
805     [('combining', True), ('combining_level3', True),
806      ('alpha', True), ('lower', False), ('upper', False),
807      ('tolower', False), ('toupper', False), ('totitle', False)],
808     '''
809     “0D02;MALAYALAM SIGN ANUSVARA;Mc;0;L;;;;;N;;;;;”
810     “0D03;MALAYALAM SIGN VISARGA;Mc;0;L;;;;;N;;;;;”
811     “0D3E;MALAYALAM VOWEL SIGN AA;Mc;0;L;;;;;N;;;;;”
812     “0D3F;MALAYALAM VOWEL SIGN I;Mc;0;L;;;;;N;;;;;”
813     “0D40;MALAYALAM VOWEL SIGN II;Mc;0;L;;;;;N;;;;;”
814     “0D41;MALAYALAM VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;;”
815     “0D42;MALAYALAM VOWEL SIGN UU;Mn;0;NSM;;;;;N;;;;;”
816     “0D43;MALAYALAM VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;;”
817     “0D44;MALAYALAM VOWEL SIGN VOCALIC RR;Mn;0;NSM;;;;;N;;;;;”
818     “0D46;MALAYALAM VOWEL SIGN E;Mc;0;L;;;;;N;;;;;”
819     “0D47;MALAYALAM VOWEL SIGN EE;Mc;0;L;;;;;N;;;;;”
820     “0D48;MALAYALAM VOWEL SIGN AI;Mc;0;L;;;;;N;;;;;”
821     “0D4A;MALAYALAM VOWEL SIGN O;Mc;0;L;0D46 0D3E;;;;N;;;;;”
822     “0D4B;MALAYALAM VOWEL SIGN OO;Mc;0;L;0D47 0D3E;;;;N;;;;;”
823     “0D4C;MALAYALAM VOWEL SIGN AU;Mc;0;L;0D46 0D57;;;;N;;;;;”
824     According to DerivedCoreProperties.txt (7.0.0) these are
825     “Alphabetic”.'''
826    ],
827    [[0x0D4D],
828     [('combining', True), ('combining_level3', True),
829      ('alpha', False), ('lower', False), ('upper', False),
830      ('tolower', False), ('toupper', False), ('totitle', False)],
831     '''
832     “0D4D;MALAYALAM SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;;”
833     According to DerivedCoreProperties.txt (7.0.0) this is *not*
834     “Alphabetic”.'''
835    ],
836    [[0x0D57, (0x0D62, 0x0D63)],
837     [('combining', True), ('combining_level3', True),
838      ('alpha', True), ('lower', False), ('upper', False),
839      ('tolower', False), ('toupper', False), ('totitle', False)],
840     '''
841     “0D57;MALAYALAM AU LENGTH MARK;Mc;0;L;;;;;N;;;;;”
842     “0D62;MALAYALAM VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;;”
843     “0D63;MALAYALAM VOWEL SIGN VOCALIC LL;Mn;0;NSM;;;;;N;;;;;”
844     According to DerivedCoreProperties.txt (7.0.0) these are
845     “Alphabetic”.'''
846    ],
847    [[(0x0D70, 0x0D79)],
848     [('combining', False), ('combining_level3', False),
849      ('alpha', False), ('lower', False), ('upper', False),
850      ('tolower', False), ('toupper', False), ('totitle', False)],
851     '''
852     “0D70;MALAYALAM NUMBER TEN;No;0;L;;;;10;N;;;;;”
853     “0D71;MALAYALAM NUMBER ONE HUNDRED;No;0;L;;;;100;N;;;;;”
854     “0D72;MALAYALAM NUMBER ONE THOUSAND;No;0;L;;;;1000;N;;;;;”
855     “0D73;MALAYALAM FRACTION ONE QUARTER;No;0;L;;;;1/4;N;;;;;”
856     “0D74;MALAYALAM FRACTION ONE HALF;No;0;L;;;;1/2;N;;;;;”
857     “0D75;MALAYALAM FRACTION THREE QUARTERS;No;0;L;;;;3/4;N;;;;;”
858     “0D79;MALAYALAM DATE MARK;So;0;L;;;;;N;;;;;”
859     According to DerivedCoreProperties.txt (7.0.0) these are *not*
860     “Alphabetic”.'''
861    ],
862    [[(0x0D82, 0x0D83)],
863     [('combining', True), ('combining_level3', True),
864      ('alpha', True), ('lower', False), ('upper', False),
865      ('tolower', False), ('toupper', False), ('totitle', False)],
866     '''
867     “0D82;SINHALA SIGN ANUSVARAYA;Mc;0;L;;;;;N;;;;;”
868     “0D83;SINHALA SIGN VISARGAYA;Mc;0;L;;;;;N;;;;;”
869     According to DerivedCoreProperties.txt (7.0.0) these are
870     “Alphabetic”.'''
871    ],
872    [[0x0DCA],
873     [('combining', True), ('combining_level3', True),
874      ('alpha', False), ('lower', False), ('upper', False),
875      ('tolower', False), ('toupper', False), ('totitle', False)],
876     '''
877     “0DCA;SINHALA SIGN AL-LAKUNA;Mn;9;NSM;;;;;N;;;;;”
878     According to DerivedCoreProperties.txt (7.0.0) this is *not*
879     “Alphabetic”.'''
880    ],
881    [[(0x0DCF, 0x0DD4), 0x0DD6, (0x0DD8, 0x0DDF), (0x0DF2, 0x0DF3)],
882     [('combining', True), ('combining_level3', True),
883      ('alpha', True), ('lower', False), ('upper', False),
884      ('tolower', False), ('toupper', False), ('totitle', False)],
885     '''
886     “0DCF;SINHALA VOWEL SIGN AELA-PILLA;Mc;0;L;;;;;N;;;;;”
887     “0DD0;SINHALA VOWEL SIGN KETTI AEDA-PILLA;Mc;0;L;;;;;N;;;;;”
888     “0DD1;SINHALA VOWEL SIGN DIGA AEDA-PILLA;Mc;0;L;;;;;N;;;;;”
889     “0DD2;SINHALA VOWEL SIGN KETTI IS-PILLA;Mn;0;NSM;;;;;N;;;;;”
890     “0DD3;SINHALA VOWEL SIGN DIGA IS-PILLA;Mn;0;NSM;;;;;N;;;;;”
891     “0DD4;SINHALA VOWEL SIGN KETTI PAA-PILLA;Mn;0;NSM;;;;;N;;;;;”
892     “0DD6;SINHALA VOWEL SIGN DIGA PAA-PILLA;Mn;0;NSM;;;;;N;;;;;”
893     “0DD8;SINHALA VOWEL SIGN GAETTA-PILLA;Mc;0;L;;;;;N;;;;;”
894     “0DD9;SINHALA VOWEL SIGN KOMBUVA;Mc;0;L;;;;;N;;;;;”
895     “0DDA;SINHALA VOWEL SIGN DIGA KOMBUVA;Mc;0;L;0DD9 0DCA;;;;N;;;;;”
896     “0DDB;SINHALA VOWEL SIGN KOMBU DEKA;Mc;0;L;;;;;N;;;;;”
897     “0DDC;SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA;
898     Mc;0;L;0DD9 0DCF;;;;N;;;;;”
899     “0DDD;SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA;
900     Mc;0;L;0DDC 0DCA;;;;N;;;;;”
901     “0DDE;SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA;
902     Mc;0;L;0DD9 0DDF;;;;N;;;;;”
903     “0DDF;SINHALA VOWEL SIGN GAYANUKITTA;Mc;0;L;;;;;N;;;;;”
904     “0DF2;SINHALA VOWEL SIGN DIGA GAETTA-PILLA;Mc;0;L;;;;;N;;;;;”
905     “0DF3;SINHALA VOWEL SIGN DIGA GAYANUKITTA;Mc;0;L;;;;;N;;;;;”
906     According to DerivedCoreProperties.txt (7.0.0) these are
907     “Alphabetic”.'''
908    ],
909    [[0x0DF4],
910     [('combining', False), ('combining_level3', False),
911      ('alpha', False), ('lower', False), ('upper', False),
912      ('tolower', False), ('toupper', False), ('totitle', False)],
913     '''
914     “0DF4;SINHALA PUNCTUATION KUNDDALIYA;Po;0;L;;;;;N;;;;;”
915     According to DerivedCoreProperties.txt (7.0.0) this is *not*
916     “Alphabetic”.'''
917    ],
918    [[(0xA789, 0xA78A)],
919     [('combining', False), ('combining_level3', False),
920      ('alpha', False), ('lower', False), ('upper', False),
921      ('tolower', False), ('toupper', False), ('totitle', False)],
922     '''
923     “A789;MODIFIER LETTER COLON;Sk;0;L;;;;;N;;;;;”
924     “A78A;MODIFIER LETTER SHORT EQUALS SIGN;Sk;0;L;;;;;N;;;;;”
925     According to DerivedCoreProperties.txt (7.0.0) these are *not*
926     “Alphabetic”.'''
927    ],
928    [[(0xA926, 0xA92A)],
929     [('combining', True), ('combining_level3', True),
930      ('alpha', True), ('lower', False), ('upper', False),
931      ('tolower', False), ('toupper', False), ('totitle', False)],
932     '''
933     “A926;KAYAH LI VOWEL UE;Mn;0;NSM;;;;;N;;;;;”
934     “A927;KAYAH LI VOWEL E;Mn;0;NSM;;;;;N;;;;;”
935     “A928;KAYAH LI VOWEL U;Mn;0;NSM;;;;;N;;;;;”
936     “A929;KAYAH LI VOWEL EE;Mn;0;NSM;;;;;N;;;;;”
937     “A92A;KAYAH LI VOWEL O;Mn;0;NSM;;;;;N;;;;;”
938     According to DerivedCoreProperties.txt (7.0.0) these are
939     “Alphabetic”.'''
940    ],
941    [[(0xA92B, 0xA92D)],
942     [('combining', True), ('combining_level3', False),
943      ('alpha', False), ('lower', False), ('upper', False),
944      ('tolower', False), ('toupper', False), ('totitle', False)],
945     '''
946     “A92B;KAYAH LI TONE PLOPHU;Mn;220;NSM;;;;;N;;;;;”
947     “A92C;KAYAH LI TONE CALYA;Mn;220;NSM;;;;;N;;;;;”
948     “A92D;KAYAH LI TONE CALYA PLOPHU;Mn;220;NSM;;;;;N;;;;;”
949     According to DerivedCoreProperties.txt (7.0.0) these are *not*
950     “Alphabetic”.'''
951    ]
952]
953