Commit | Line | Data |
9fdf68be |
1 | # !!!!!!! DO NOT EDIT THIS FILE !!!!!!! |
99598c8c |
2 | # This file is built by ./mktables from e.g. Unicode.txt. |
9fdf68be |
3 | # Any changes made here will be lost! |
cf25bb62 |
4 | |
5 | ## |
6 | ## Data in this file used by ../utf8_heavy.pl |
7 | ## |
71d929cb |
8 | |
cf25bb62 |
9 | ## Mapping from name to filename in ./In |
10 | %utf8::In = ( |
71d929cb |
11 | ); |
12 | |
cf25bb62 |
13 | ## Mappings from regex to filename in ./In/ |
14 | %utf8::InPat = ( |
15 | 'al' => { |
16 | 'Alphabetic(?:[-_]|\s+)?Presentation(?:[-_]|\s+)?Forms' => 'Alphabet', |
17 | }, |
18 | 'ar' => { |
99598c8c |
19 | 'Arabic(?:[-_]|\s+)?Presentation(?:[-_]|\s+)?Forms(?:[-_]|\s+)?A' => 'ArabicP2', |
cf25bb62 |
20 | 'Armenian' => 'Armenian', |
21 | 'Arabic' => 'Arabic', |
22 | 'Arrows' => 'Arrows', |
99598c8c |
23 | 'Arabic(?:[-_]|\s+)?Presentation(?:[-_]|\s+)?Forms(?:[-_]|\s+)?B' => 'ArabicPr', |
cf25bb62 |
24 | }, |
25 | 'ba' => { |
26 | 'Basic(?:[-_]|\s+)?Latin' => 'BasicLat', |
27 | }, |
28 | 'be' => { |
29 | 'Bengali' => 'Bengali', |
30 | }, |
31 | 'bl' => { |
32 | 'Block(?:[-_]|\s+)?Elements' => 'BlockEle', |
33 | }, |
34 | 'bo' => { |
99598c8c |
35 | 'Bopomofo(?:[-_]|\s+)?Extended' => 'Bopomof2', |
cf25bb62 |
36 | 'Box(?:[-_]|\s+)?Drawing' => 'BoxDrawi', |
99598c8c |
37 | 'Bopomofo' => 'Bopomofo', |
cf25bb62 |
38 | }, |
39 | 'br' => { |
40 | 'Braille(?:[-_]|\s+)?Patterns' => 'BrailleP', |
41 | }, |
42 | 'by' => { |
43 | 'Byzantine(?:[-_]|\s+)?Musical(?:[-_]|\s+)?Symbols' => 'Byzantin', |
44 | }, |
45 | 'ch' => { |
46 | 'Cherokee' => 'Cherokee', |
47 | }, |
48 | 'cj' => { |
99598c8c |
49 | 'Cjk(?:[-_]|\s+)?Unified(?:[-_]|\s+)?Ideographs(?:[-_]|\s+)?Extension(?:[-_]|\s+)?A' => 'CjkUnif2', |
cf25bb62 |
50 | 'Cjk(?:[-_]|\s+)?Radicals(?:[-_]|\s+)?Supplement' => 'CjkRadic', |
99598c8c |
51 | 'Cjk(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Ideographs' => 'CjkComp3', |
52 | 'Cjk(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Ideographs(?:[-_]|\s+)?Supplement' => 'CjkComp4', |
53 | 'Cjk(?:[-_]|\s+)?Compatibility' => 'CjkCompa', |
54 | 'Cjk(?:[-_]|\s+)?Unified(?:[-_]|\s+)?Ideographs' => 'CjkUnifi', |
cf25bb62 |
55 | 'Cjk(?:[-_]|\s+)?Symbols(?:[-_]|\s+)?And(?:[-_]|\s+)?Punctuation' => 'CjkSymbo', |
99598c8c |
56 | 'Cjk(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Forms' => 'CjkComp2', |
cf25bb62 |
57 | 'Cjk(?:[-_]|\s+)?Unified(?:[-_]|\s+)?Ideographs(?:[-_]|\s+)?Extension(?:[-_]|\s+)?B' => 'CjkUnif3', |
cf25bb62 |
58 | }, |
59 | 'co' => { |
99598c8c |
60 | 'Combining(?:[-_]|\s+)?Diacritical(?:[-_]|\s+)?Marks' => 'Combini2', |
61 | 'Combining(?:[-_]|\s+)?Half(?:[-_]|\s+)?Marks' => 'Combinin', |
cf25bb62 |
62 | 'Control(?:[-_]|\s+)?Pictures' => 'ControlP', |
99598c8c |
63 | 'Combining(?:[-_]|\s+)?Marks(?:[-_]|\s+)?For(?:[-_]|\s+)?Symbols' => 'Combini3', |
cf25bb62 |
64 | }, |
65 | 'cu' => { |
66 | 'Currency(?:[-_]|\s+)?Symbols' => 'Currency', |
67 | }, |
68 | 'cy' => { |
69 | 'Cyrillic' => 'Cyrillic', |
70 | }, |
71 | 'de' => { |
cf25bb62 |
72 | 'Deseret' => 'Deseret', |
99598c8c |
73 | 'Devanagari' => 'Devanaga', |
cf25bb62 |
74 | }, |
75 | 'di' => { |
76 | 'Dingbats' => 'Dingbats', |
77 | }, |
78 | 'en' => { |
99598c8c |
79 | 'Enclosed(?:[-_]|\s+)?Alphanumerics' => 'Enclosed', |
80 | 'Enclosed(?:[-_]|\s+)?Cjk(?:[-_]|\s+)?Letters(?:[-_]|\s+)?And(?:[-_]|\s+)?Months' => 'Enclose2', |
cf25bb62 |
81 | }, |
82 | 'et' => { |
83 | 'Ethiopic' => 'Ethiopic', |
84 | }, |
85 | 'ge' => { |
86 | 'Geometric(?:[-_]|\s+)?Shapes' => 'Geometri', |
87 | 'General(?:[-_]|\s+)?Punctuation' => 'GeneralP', |
88 | 'Georgian' => 'Georgian', |
89 | }, |
90 | 'go' => { |
91 | 'Gothic' => 'Gothic', |
92 | }, |
93 | 'gr' => { |
94 | 'Greek(?:[-_]|\s+)?Extended' => 'GreekExt', |
95 | 'Greek' => 'Greek', |
96 | }, |
97 | 'gu' => { |
cf25bb62 |
98 | 'Gujarati' => 'Gujarati', |
99598c8c |
99 | 'Gurmukhi' => 'Gurmukhi', |
cf25bb62 |
100 | }, |
101 | 'ha' => { |
cf25bb62 |
102 | 'Hangul(?:[-_]|\s+)?Syllables' => 'HangulSy', |
99598c8c |
103 | 'Hangul(?:[-_]|\s+)?Compatibility(?:[-_]|\s+)?Jamo' => 'HangulCo', |
cf25bb62 |
104 | 'Halfwidth(?:[-_]|\s+)?And(?:[-_]|\s+)?Fullwidth(?:[-_]|\s+)?Forms' => 'Halfwidt', |
105 | 'Hangul(?:[-_]|\s+)?Jamo' => 'HangulJa', |
106 | }, |
107 | 'he' => { |
108 | 'Hebrew' => 'Hebrew', |
109 | }, |
110 | 'hi' => { |
cf25bb62 |
111 | 'High(?:[-_]|\s+)?Surrogates' => 'HighSurr', |
99598c8c |
112 | 'Hiragana' => 'Hiragana', |
113 | 'High(?:[-_]|\s+)?Private(?:[-_]|\s+)?Use(?:[-_]|\s+)?Surrogates' => 'HighPriv', |
cf25bb62 |
114 | }, |
115 | 'id' => { |
116 | 'Ideographic(?:[-_]|\s+)?Description(?:[-_]|\s+)?Characters' => 'Ideograp', |
117 | }, |
118 | 'ip' => { |
119 | 'Ipa(?:[-_]|\s+)?Extensions' => 'IpaExten', |
120 | }, |
121 | 'ka' => { |
cf25bb62 |
122 | 'Kannada' => 'Kannada', |
123 | 'Kanbun' => 'Kanbun', |
99598c8c |
124 | 'Kangxi(?:[-_]|\s+)?Radicals' => 'KangxiRa', |
125 | 'Katakana' => 'Katakana', |
cf25bb62 |
126 | }, |
127 | 'kh' => { |
128 | 'Khmer' => 'Khmer', |
129 | }, |
130 | 'la' => { |
cf25bb62 |
131 | 'Lao' => 'Lao', |
99598c8c |
132 | 'Latin(?:[-_]|\s+)?Extended(?:[-_]|\s+)?B' => 'LatinExt', |
cf25bb62 |
133 | 'Latin(?:[-_]|\s+)?Extended(?:[-_]|\s+)?A' => 'LatinEx2', |
99598c8c |
134 | 'Latin(?:[-_]|\s+)?Extended(?:[-_]|\s+)?Additional' => 'LatinEx3', |
135 | 'Latin(?:[-_]|\s+)?1(?:[-_]|\s+)?Supplement' => 'Latin1Su', |
cf25bb62 |
136 | }, |
137 | 'le' => { |
138 | 'Letterlike(?:[-_]|\s+)?Symbols' => 'Letterli', |
139 | }, |
140 | 'lo' => { |
141 | 'Low(?:[-_]|\s+)?Surrogates' => 'LowSurro', |
142 | }, |
143 | 'ma' => { |
144 | 'Mathematical(?:[-_]|\s+)?Operators' => 'Mathemat', |
145 | 'Mathematical(?:[-_]|\s+)?Alphanumeric(?:[-_]|\s+)?Symbols' => 'Mathema2', |
146 | 'Malayalam' => 'Malayala', |
147 | }, |
148 | 'mi' => { |
99598c8c |
149 | 'Miscellaneous(?:[-_]|\s+)?Technical' => 'Miscell2', |
150 | 'Miscellaneous(?:[-_]|\s+)?Symbols' => 'Miscella', |
cf25bb62 |
151 | }, |
152 | 'mo' => { |
153 | 'Mongolian' => 'Mongolia', |
154 | }, |
155 | 'mu' => { |
156 | 'Musical(?:[-_]|\s+)?Symbols' => 'MusicalS', |
157 | }, |
158 | 'my' => { |
159 | 'Myanmar' => 'Myanmar', |
160 | }, |
161 | 'nu' => { |
162 | 'Number(?:[-_]|\s+)?Forms' => 'NumberFo', |
163 | }, |
164 | 'og' => { |
165 | 'Ogham' => 'Ogham', |
166 | }, |
167 | 'ol' => { |
168 | 'Old(?:[-_]|\s+)?Italic' => 'OldItali', |
169 | }, |
170 | 'op' => { |
171 | 'Optical(?:[-_]|\s+)?Character(?:[-_]|\s+)?Recognition' => 'OpticalC', |
172 | }, |
173 | 'or' => { |
174 | 'Oriya' => 'Oriya', |
175 | }, |
176 | 'pr' => { |
177 | 'Private(?:[-_]|\s+)?Use' => 'PrivateU', |
178 | }, |
179 | 'ru' => { |
180 | 'Runic' => 'Runic', |
181 | }, |
182 | 'si' => { |
183 | 'Sinhala' => 'Sinhala', |
184 | }, |
185 | 'sm' => { |
186 | 'Small(?:[-_]|\s+)?Form(?:[-_]|\s+)?Variants' => 'SmallFor', |
187 | }, |
188 | 'sp' => { |
cf25bb62 |
189 | 'Spacing(?:[-_]|\s+)?Modifier(?:[-_]|\s+)?Letters' => 'SpacingM', |
99598c8c |
190 | 'Specials' => 'Specials', |
cf25bb62 |
191 | }, |
192 | 'su' => { |
193 | 'Superscripts(?:[-_]|\s+)?And(?:[-_]|\s+)?Subscripts' => 'Superscr', |
194 | }, |
195 | 'sy' => { |
196 | 'Syriac' => 'Syriac', |
197 | }, |
198 | 'ta' => { |
cf25bb62 |
199 | 'Tamil' => 'Tamil', |
99598c8c |
200 | 'Tags' => 'Tags', |
cf25bb62 |
201 | }, |
202 | 'te' => { |
203 | 'Telugu' => 'Telugu', |
204 | }, |
205 | 'th' => { |
206 | 'Thaana' => 'Thaana', |
207 | 'Thai' => 'Thai', |
208 | }, |
209 | 'ti' => { |
210 | 'Tibetan' => 'Tibetan', |
211 | }, |
212 | 'un' => { |
213 | 'Unified(?:[-_]|\s+)?Canadian(?:[-_]|\s+)?Aboriginal(?:[-_]|\s+)?Syllabics' => 'UnifiedC', |
214 | }, |
215 | 'yi' => { |
cf25bb62 |
216 | 'Yi(?:[-_]|\s+)?Syllables' => 'YiSyllab', |
99598c8c |
217 | 'Yi(?:[-_]|\s+)?Radicals' => 'YiRadica', |
cf25bb62 |
218 | }, |
71d929cb |
219 | ); |