1 # !!!!!!! DO NOT EDIT THIS FILE !!!!!!!
2 # This file is built by mktables.PL from e.g. Unicode.txt.
3 # Any changes made here will be lost!
31 'CANADIAN-ABORIGINAL' => 26,
46 'Latin-1 Supplement' => 41,
47 'Latin Extended-A' => 42,
48 'Latin Extended-B' => 43,
49 'IPA Extensions' => 44,
50 'Spacing Modifier Letters' => 45,
51 'Combining Diacritical Marks' => 46,
53 'Cyrillic Block' => 48,
54 'Armenian Block' => 49,
59 'Devanagari Block' => 54,
60 'Bengali Block' => 55,
61 'Gurmukhi Block' => 56,
62 'Gujarati Block' => 57,
66 'Kannada Block' => 61,
67 'Malayalam Block' => 62,
68 'Sinhala Block' => 63,
71 'Tibetan Block' => 66,
72 'Myanmar Block' => 67,
73 'Georgian Block' => 68,
75 'Ethiopic Block' => 70,
76 'Cherokee Block' => 71,
77 'Unified Canadian Aboriginal Syllabics' => 72,
81 'Mongolian Block' => 76,
82 'Latin Extended Additional' => 77,
83 'Greek Extended' => 78,
84 'General Punctuation' => 79,
85 'Superscripts and Subscripts' => 80,
86 'Currency Symbols' => 81,
87 'Combining Marks for Symbols' => 82,
88 'Letterlike Symbols' => 83,
91 'Mathematical Operators' => 86,
92 'Miscellaneous Technical' => 87,
93 'Control Pictures' => 88,
94 'Optical Character Recognition' => 89,
95 'Enclosed Alphanumerics' => 90,
97 'Block Elements' => 92,
98 'Geometric Shapes' => 93,
99 'Miscellaneous Symbols' => 94,
101 'Braille Patterns' => 96,
102 'CJK Radicals Supplement' => 97,
103 'Kangxi Radicals' => 98,
104 'Ideographic Description Characters' => 99,
105 'CJK Symbols and Punctuation' => 100,
106 'Hiragana Block' => 101,
107 'Katakana Block' => 102,
108 'Bopomofo Block' => 103,
109 'Hangul Compatibility Jamo' => 104,
111 'Bopomofo Extended' => 106,
112 'Enclosed CJK Letters and Months' => 107,
113 'CJK Compatibility' => 108,
114 'CJK Unified Ideographs Extension A' => 109,
115 'CJK Unified Ideographs' => 110,
116 'Yi Syllables' => 111,
117 'Yi Radicals' => 112,
118 'Hangul Syllables' => 113,
119 'High Surrogates' => 114,
120 'High Private Use Surrogates' => 115,
121 'Low Surrogates' => 116,
122 'Private Use' => 117,
123 'CJK Compatibility Ideographs' => 118,
124 'Alphabetic Presentation Forms' => 119,
125 'Arabic Presentation Forms-A' => 120,
126 'Combining Half Marks' => 121,
127 'CJK Compatibility Forms' => 122,
128 'Small Form Variants' => 123,
129 'Arabic Presentation Forms-B' => 124,
131 'Halfwidth and Fullwidth Forms' => 126,
133 'Gothic Block' => 128,
134 'Deseret Block' => 129,
135 'Byzantine Musical Symbols' => 130,
136 'Musical Symbols' => 131,
137 'Mathematical Alphanumeric Symbols' => 132,
138 'CJK Unified Ideographs Extension B' => 133,
139 'CJK Compatibility Ideographs Supplement' => 134,
144 'Alphabetic(?:[-_]|\s+)?Presentation(?:[-_]|\s+)?Forms' => 'Alphabetic Presentation Forms',
147 'ARABIC' => 'ARABIC',
148 'Arabic(?:[-_]|\s+)?Block' => 'Arabic Block',
149 'Arabic(?:[-_]|\s+)?Presentation(?:[-_]|\s+)?Forms(?:[-_]|\s+)?A' => 'Arabic Presentation Forms-A',
150 'Arabic(?:[-_]|\s+)?Presentation(?:[-_]|\s+)?Forms(?:[-_]|\s+)?B' => 'Arabic Presentation Forms-B',
153 'ARMENIAN' => 'ARMENIAN',
154 'Armenian(?:[-_]|\s+)?Block' => 'Armenian Block',
157 'Arrows' => 'Arrows',
160 'Basic(?:[-_]|\s+)?Latin' => 'Basic Latin',
163 'BENGALI' => 'BENGALI',
164 'Bengali(?:[-_]|\s+)?Block' => 'Bengali Block',
167 'Block(?:[-_]|\s+)?Elements' => 'Block Elements',
170 'BOPOMOFO' => 'BOPOMOFO',
171 'Bopomofo(?:[-_]|\s+)?Block' => 'Bopomofo Block',
172 'Bopomofo(?:[-_]|\s+)?Extended' => 'Bopomofo Extended',
175 'Box(?:[-_]|\s+)?Drawing' => 'Box Drawing',
178 'Braille(?:[-_]|\s+)?Patterns' => 'Braille Patterns',
181 'Byzantine(?:[-_]|\s+)?Musical(?:[-_]|\s+)?Symbols' => 'Byzantine Musical Symbols',
184 'CANADIAN(?:[-_]|\s+)?ABORIGINAL' => 'CANADIAN-ABORIGINAL',
187 'CHEROKEE' => 'CHEROKEE',
188 'Cherokee(?:[-_]|\s+)?Block' => 'Cherokee Block',
191 'CJK(?:[-_]|\s+)?Radicals(?:[-_]|\s+)?Supplement' => 'CJK Radicals Supplement',
192 'CJK(?:[-_]|\s+)?Symbols(?:[-_]|\s+)?and(?:[-_]|\s+)?Punctuation' => 'CJK Symbols and Punctuation',
193 'CJK(?:[-_]|\s+)?Compatibility' => 'CJK Compatibility',
194 'CJK(?:[-_]|\s+)?Unified(?:[-_]|\s+)?Ideographs(?:[-_]|\s+)?Extension(?:[-_]|\s+)?A' => 'CJK Unified Ideographs Extension A',
195 'CJK(?:[-_]|\s+)?Unified(?:[-_]|\s+)?Ideographs' => 'CJK Unified Ideographs',
196 'CJK(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Ideographs' => 'CJK Compatibility Ideographs',
197 'CJK(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Forms' => 'CJK Compatibility Forms',
198 'CJK(?:[-_]|\s+)?Unified(?:[-_]|\s+)?Ideographs(?:[-_]|\s+)?Extension(?:[-_]|\s+)?B' => 'CJK Unified Ideographs Extension B',
199 'CJK(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Ideographs(?:[-_]|\s+)?Supplement' => 'CJK Compatibility Ideographs Supplement',
202 'Combining(?:[-_]|\s+)?Diacritical(?:[-_]|\s+)?Marks' => 'Combining Diacritical Marks',
203 'Combining(?:[-_]|\s+)?Marks(?:[-_]|\s+)?for(?:[-_]|\s+)?Symbols' => 'Combining Marks for Symbols',
204 'Combining(?:[-_]|\s+)?Half(?:[-_]|\s+)?Marks' => 'Combining Half Marks',
207 'Control(?:[-_]|\s+)?Pictures' => 'Control Pictures',
210 'Currency(?:[-_]|\s+)?Symbols' => 'Currency Symbols',
213 'CYRILLIC' => 'CYRILLIC',
214 'Cyrillic(?:[-_]|\s+)?Block' => 'Cyrillic Block',
217 'DESERET' => 'DESERET',
218 'Deseret(?:[-_]|\s+)?Block' => 'Deseret Block',
221 'DEVANAGARI' => 'DEVANAGARI',
222 'Devanagari(?:[-_]|\s+)?Block' => 'Devanagari Block',
225 'Dingbats' => 'Dingbats',
228 'Enclosed(?:[-_]|\s+)?Alphanumerics' => 'Enclosed Alphanumerics',
229 'Enclosed(?:[-_]|\s+)?CJK(?:[-_]|\s+)?Letters(?:[-_]|\s+)?and(?:[-_]|\s+)?Months' => 'Enclosed CJK Letters and Months',
232 'ETHIOPIC' => 'ETHIOPIC',
233 'Ethiopic(?:[-_]|\s+)?Block' => 'Ethiopic Block',
236 'General(?:[-_]|\s+)?Punctuation' => 'General Punctuation',
239 'GEORGIAN' => 'GEORGIAN',
240 'Georgian(?:[-_]|\s+)?Block' => 'Georgian Block',
241 'Geometric(?:[-_]|\s+)?Shapes' => 'Geometric Shapes',
244 'GOTHIC' => 'GOTHIC',
245 'Gothic(?:[-_]|\s+)?Block' => 'Gothic Block',
249 'Greek(?:[-_]|\s+)?Block' => 'Greek Block',
250 'Greek(?:[-_]|\s+)?Extended' => 'Greek Extended',
253 'GUJARATI' => 'GUJARATI',
254 'Gujarati(?:[-_]|\s+)?Block' => 'Gujarati Block',
257 'GURMUKHI' => 'GURMUKHI',
258 'Gurmukhi(?:[-_]|\s+)?Block' => 'Gurmukhi Block',
261 'Halfwidth(?:[-_]|\s+)?and(?:[-_]|\s+)?Fullwidth(?:[-_]|\s+)?Forms' => 'Halfwidth and Fullwidth Forms',
264 'HANGUL' => 'HANGUL',
266 'Hangul(?:[-_]|\s+)?Jamo' => 'Hangul Jamo',
267 'Hangul(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Jamo' => 'Hangul Compatibility Jamo',
268 'Hangul(?:[-_]|\s+)?Syllables' => 'Hangul Syllables',
271 'HEBREW' => 'HEBREW',
272 'Hebrew(?:[-_]|\s+)?Block' => 'Hebrew Block',
275 'High(?:[-_]|\s+)?Surrogates' => 'High Surrogates',
276 'High(?:[-_]|\s+)?Private(?:[-_]|\s+)?Use(?:[-_]|\s+)?Surrogates' => 'High Private Use Surrogates',
279 'HIRAGANA' => 'HIRAGANA',
280 'Hiragana(?:[-_]|\s+)?Block' => 'Hiragana Block',
283 'Ideographic(?:[-_]|\s+)?Description(?:[-_]|\s+)?Characters' => 'Ideographic Description Characters',
286 'INHERITED' => 'INHERITED',
289 'IPA(?:[-_]|\s+)?Extensions' => 'IPA Extensions',
292 'KANNADA' => 'KANNADA',
293 'Kannada(?:[-_]|\s+)?Block' => 'Kannada Block',
294 'Kangxi(?:[-_]|\s+)?Radicals' => 'Kangxi Radicals',
295 'Kanbun' => 'Kanbun',
298 'KATAKANA' => 'KATAKANA',
299 'Katakana(?:[-_]|\s+)?Block' => 'Katakana Block',
303 'Khmer(?:[-_]|\s+)?Block' => 'Khmer Block',
307 'Lao(?:[-_]|\s+)?Block' => 'Lao Block',
311 'Latin(?:[-_]|\s+)?1(?:[-_]|\s+)?Supplement' => 'Latin-1 Supplement',
312 'Latin(?:[-_]|\s+)?Extended(?:[-_]|\s+)?A' => 'Latin Extended-A',
313 'Latin(?:[-_]|\s+)?Extended(?:[-_]|\s+)?B' => 'Latin Extended-B',
314 'Latin(?:[-_]|\s+)?Extended(?:[-_]|\s+)?Additional' => 'Latin Extended Additional',
317 'Letterlike(?:[-_]|\s+)?Symbols' => 'Letterlike Symbols',
320 'Low(?:[-_]|\s+)?Surrogates' => 'Low Surrogates',
323 'MALAYALAM' => 'MALAYALAM',
324 'Malayalam(?:[-_]|\s+)?Block' => 'Malayalam Block',
327 'Mathematical(?:[-_]|\s+)?Operators' => 'Mathematical Operators',
328 'Mathematical(?:[-_]|\s+)?Alphanumeric(?:[-_]|\s+)?Symbols' => 'Mathematical Alphanumeric Symbols',
331 'Miscellaneous(?:[-_]|\s+)?Technical' => 'Miscellaneous Technical',
332 'Miscellaneous(?:[-_]|\s+)?Symbols' => 'Miscellaneous Symbols',
335 'MONGOLIAN' => 'MONGOLIAN',
336 'Mongolian(?:[-_]|\s+)?Block' => 'Mongolian Block',
339 'Musical(?:[-_]|\s+)?Symbols' => 'Musical Symbols',
342 'MYANMAR' => 'MYANMAR',
343 'Myanmar(?:[-_]|\s+)?Block' => 'Myanmar Block',
346 'Number(?:[-_]|\s+)?Forms' => 'Number Forms',
350 'Ogham(?:[-_]|\s+)?Block' => 'Ogham Block',
353 'OLD(?:[-_]|\s+)?ITALIC' => 'OLD-ITALIC',
354 'Old(?:[-_]|\s+)?Italic' => 'Old Italic',
357 'Optical(?:[-_]|\s+)?Character(?:[-_]|\s+)?Recognition' => 'Optical Character Recognition',
361 'Oriya(?:[-_]|\s+)?Block' => 'Oriya Block',
364 'Private(?:[-_]|\s+)?Use' => 'Private Use',
368 'Runic(?:[-_]|\s+)?Block' => 'Runic Block',
371 'SINHALA' => 'SINHALA',
372 'Sinhala(?:[-_]|\s+)?Block' => 'Sinhala Block',
375 'Small(?:[-_]|\s+)?Form(?:[-_]|\s+)?Variants' => 'Small Form Variants',
378 'Spacing(?:[-_]|\s+)?Modifier(?:[-_]|\s+)?Letters' => 'Spacing Modifier Letters',
381 'Specials' => 'Specials',
384 'Superscripts(?:[-_]|\s+)?and(?:[-_]|\s+)?Subscripts' => 'Superscripts and Subscripts',
387 'SYRIAC' => 'SYRIAC',
388 'Syriac(?:[-_]|\s+)?Block' => 'Syriac Block',
395 'Tamil(?:[-_]|\s+)?Block' => 'Tamil Block',
398 'TELUGU' => 'TELUGU',
399 'Telugu(?:[-_]|\s+)?Block' => 'Telugu Block',
402 'THAANA' => 'THAANA',
404 'Thaana(?:[-_]|\s+)?Block' => 'Thaana Block',
405 'Thai(?:[-_]|\s+)?Block' => 'Thai Block',
408 'TIBETAN' => 'TIBETAN',
409 'Tibetan(?:[-_]|\s+)?Block' => 'Tibetan Block',
412 'Unified(?:[-_]|\s+)?Canadian(?:[-_]|\s+)?Aboriginal(?:[-_]|\s+)?Syllabics' => 'Unified Canadian Aboriginal Syllabics',
418 'Yi(?:[-_]|\s+)?Syllables' => 'Yi Syllables',
419 'Yi(?:[-_]|\s+)?Radicals' => 'Yi Radicals',