1 # !!!!!!! DO NOT EDIT THIS FILE !!!!!!!
2 # This file is built by ./mktables from e.g. Unicode.txt.
3 # Any changes made here will be lost!
6 ## Data in this file used by ../utf8_heavy.pl
9 ## Mapping from name to filename in ./In
13 ## Mappings from regex to filename in ./In/
16 'Alphabetic(?:[-_]|\s+)?Presentation(?:[-_]|\s+)?Forms' => 'Alphabet',
19 'Arabic(?:[-_]|\s+)?Presentation(?:[-_]|\s+)?Forms(?:[-_]|\s+)?A' => 'ArabicP2',
20 'Armenian' => 'Armenian',
23 'Arabic(?:[-_]|\s+)?Presentation(?:[-_]|\s+)?Forms(?:[-_]|\s+)?B' => 'ArabicPr',
26 'Basic(?:[-_]|\s+)?Latin' => 'BasicLat',
29 'Bengali' => 'Bengali',
32 'Block(?:[-_]|\s+)?Elements' => 'BlockEle',
35 'Bopomofo(?:[-_]|\s+)?Extended' => 'Bopomof2',
36 'Box(?:[-_]|\s+)?Drawing' => 'BoxDrawi',
37 'Bopomofo' => 'Bopomofo',
40 'Braille(?:[-_]|\s+)?Patterns' => 'BrailleP',
43 'Byzantine(?:[-_]|\s+)?Musical(?:[-_]|\s+)?Symbols' => 'Byzantin',
46 'Cherokee' => 'Cherokee',
49 'Cjk(?:[-_]|\s+)?Unified(?:[-_]|\s+)?Ideographs(?:[-_]|\s+)?Extension(?:[-_]|\s+)?A' => 'CjkUnif2',
50 'Cjk(?:[-_]|\s+)?Radicals(?:[-_]|\s+)?Supplement' => 'CjkRadic',
51 'Cjk(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Ideographs' => 'CjkComp3',
52 'Cjk(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Ideographs(?:[-_]|\s+)?Supplement' => 'CjkComp4',
53 'Cjk(?:[-_]|\s+)?Compatibility' => 'CjkCompa',
54 'Cjk(?:[-_]|\s+)?Unified(?:[-_]|\s+)?Ideographs' => 'CjkUnifi',
55 'Cjk(?:[-_]|\s+)?Symbols(?:[-_]|\s+)?And(?:[-_]|\s+)?Punctuation' => 'CjkSymbo',
56 'Cjk(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Forms' => 'CjkComp2',
57 'Cjk(?:[-_]|\s+)?Unified(?:[-_]|\s+)?Ideographs(?:[-_]|\s+)?Extension(?:[-_]|\s+)?B' => 'CjkUnif3',
60 'Combining(?:[-_]|\s+)?Diacritical(?:[-_]|\s+)?Marks' => 'Combini2',
61 'Combining(?:[-_]|\s+)?Half(?:[-_]|\s+)?Marks' => 'Combinin',
62 'Control(?:[-_]|\s+)?Pictures' => 'ControlP',
63 'Combining(?:[-_]|\s+)?Marks(?:[-_]|\s+)?For(?:[-_]|\s+)?Symbols' => 'Combini3',
66 'Currency(?:[-_]|\s+)?Symbols' => 'Currency',
69 'Cyrillic' => 'Cyrillic',
72 'Deseret' => 'Deseret',
73 'Devanagari' => 'Devanaga',
76 'Dingbats' => 'Dingbats',
79 'Enclosed(?:[-_]|\s+)?Alphanumerics' => 'Enclosed',
80 'Enclosed(?:[-_]|\s+)?Cjk(?:[-_]|\s+)?Letters(?:[-_]|\s+)?And(?:[-_]|\s+)?Months' => 'Enclose2',
83 'Ethiopic' => 'Ethiopic',
86 'Geometric(?:[-_]|\s+)?Shapes' => 'Geometri',
87 'General(?:[-_]|\s+)?Punctuation' => 'GeneralP',
88 'Georgian' => 'Georgian',
94 'Greek(?:[-_]|\s+)?Extended' => 'GreekExt',
98 'Gujarati' => 'Gujarati',
99 'Gurmukhi' => 'Gurmukhi',
102 'Hangul(?:[-_]|\s+)?Syllables' => 'HangulSy',
103 'Hangul(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Jamo' => 'HangulCo',
104 'Halfwidth(?:[-_]|\s+)?And(?:[-_]|\s+)?Fullwidth(?:[-_]|\s+)?Forms' => 'Halfwidt',
105 'Hangul(?:[-_]|\s+)?Jamo' => 'HangulJa',
108 'Hebrew' => 'Hebrew',
111 'High(?:[-_]|\s+)?Surrogates' => 'HighSurr',
112 'Hiragana' => 'Hiragana',
113 'High(?:[-_]|\s+)?Private(?:[-_]|\s+)?Use(?:[-_]|\s+)?Surrogates' => 'HighPriv',
116 'Ideographic(?:[-_]|\s+)?Description(?:[-_]|\s+)?Characters' => 'Ideograp',
119 'Ipa(?:[-_]|\s+)?Extensions' => 'IpaExten',
122 'Kannada' => 'Kannada',
123 'Kanbun' => 'Kanbun',
124 'Kangxi(?:[-_]|\s+)?Radicals' => 'KangxiRa',
125 'Katakana' => 'Katakana',
132 'Latin(?:[-_]|\s+)?Extended(?:[-_]|\s+)?B' => 'LatinExt',
133 'Latin(?:[-_]|\s+)?Extended(?:[-_]|\s+)?A' => 'LatinEx2',
134 'Latin(?:[-_]|\s+)?Extended(?:[-_]|\s+)?Additional' => 'LatinEx3',
135 'Latin(?:[-_]|\s+)?1(?:[-_]|\s+)?Supplement' => 'Latin1Su',
138 'Letterlike(?:[-_]|\s+)?Symbols' => 'Letterli',
141 'Low(?:[-_]|\s+)?Surrogates' => 'LowSurro',
144 'Mathematical(?:[-_]|\s+)?Operators' => 'Mathemat',
145 'Mathematical(?:[-_]|\s+)?Alphanumeric(?:[-_]|\s+)?Symbols' => 'Mathema2',
146 'Malayalam' => 'Malayala',
149 'Miscellaneous(?:[-_]|\s+)?Technical' => 'Miscell2',
150 'Miscellaneous(?:[-_]|\s+)?Symbols' => 'Miscella',
153 'Mongolian' => 'Mongolia',
156 'Musical(?:[-_]|\s+)?Symbols' => 'MusicalS',
159 'Myanmar' => 'Myanmar',
162 'Number(?:[-_]|\s+)?Forms' => 'NumberFo',
168 'Old(?:[-_]|\s+)?Italic' => 'OldItali',
171 'Optical(?:[-_]|\s+)?Character(?:[-_]|\s+)?Recognition' => 'OpticalC',
177 'Private(?:[-_]|\s+)?Use' => 'PrivateU',
183 'Sinhala' => 'Sinhala',
186 'Small(?:[-_]|\s+)?Form(?:[-_]|\s+)?Variants' => 'SmallFor',
189 'Spacing(?:[-_]|\s+)?Modifier(?:[-_]|\s+)?Letters' => 'SpacingM',
190 'Specials' => 'Specials',
193 'Superscripts(?:[-_]|\s+)?And(?:[-_]|\s+)?Subscripts' => 'Superscr',
196 'Syriac' => 'Syriac',
203 'Telugu' => 'Telugu',
206 'Thaana' => 'Thaana',
210 'Tibetan' => 'Tibetan',
213 'Unified(?:[-_]|\s+)?Canadian(?:[-_]|\s+)?Aboriginal(?:[-_]|\s+)?Syllabics' => 'UnifiedC',
216 'Yi(?:[-_]|\s+)?Syllables' => 'YiSyllab',
217 'Yi(?:[-_]|\s+)?Radicals' => 'YiRadica',