Commit | Line | Data |
d73e5302 |
1 | # !!!!!!! DO NOT EDIT THIS FILE !!!!!!! |
2 | # This file is built by mktables from e.g. Unicode.txt. |
3 | # Any changes made here will be lost! |
37fca15e |
4 | # Built Mon Jan 14 15:52:42 2002. |
5 | |
6 | ## |
7 | ## Data in this file used by ../utf8_heavy.pl |
8 | ## |
9 | |
10 | ## Mapping from name to filename in ./Is |
11 | %utf8::Is = ( |
12 | 'ASCII' => 'ASCII', |
13 | 'Alnum' => 'Alnum', |
14 | 'Alpha' => 'Alpha', |
15 | 'BidiAL' => 'BidiAL', |
16 | 'BidiAN' => 'BidiAN', |
17 | 'BidiB' => 'BidiB', |
18 | 'BidiBN' => 'BidiBN', |
19 | 'BidiCS' => 'BidiCS', |
20 | 'BidiEN' => 'BidiEN', |
21 | 'BidiES' => 'BidiES', |
22 | 'BidiET' => 'BidiET', |
23 | 'BidiL' => 'BidiL', |
24 | 'BidiLRE' => 'BidiLRE', |
25 | 'BidiLRO' => 'BidiLRO', |
26 | 'BidiNSM' => 'BidiNSM', |
27 | 'BidiON' => 'BidiON', |
28 | 'BidiPDF' => 'BidiPDF', |
29 | 'BidiR' => 'BidiR', |
30 | 'BidiRLE' => 'BidiRLE', |
31 | 'BidiRLO' => 'BidiRLO', |
32 | 'BidiS' => 'BidiS', |
33 | 'BidiWS' => 'BidiWS', |
34 | 'Blank' => 'Blank', |
35 | 'C' => 'C', |
36 | 'Canon' => 'Canon', |
37 | 'Cc' => 'Cc', |
38 | 'Cf' => 'Cf', |
39 | 'Cn' => 'Cn', |
40 | 'Cntrl' => 'Cntrl', |
41 | 'Co' => 'Co', |
42 | 'Compat' => 'Compat', |
43 | 'Cs' => 'Cs', |
44 | 'DCcircle' => 'DCcircle', |
45 | 'DCcompat' => 'DCcompat', |
46 | 'DCfinal' => 'DCfinal', |
47 | 'DCfont' => 'DCfont', |
48 | 'DCfraction' => 'DCfracti', |
49 | 'DCinitial' => 'DCinitia', |
50 | 'DCisolated' => 'DCisolat', |
51 | 'DCmedial' => 'DCmedial', |
52 | 'DCnarrow' => 'DCnarrow', |
53 | 'DCnoBreak' => 'DCnoBrea', |
54 | 'DCsmall' => 'DCsmall', |
55 | 'DCsquare' => 'DCsquare', |
56 | 'DCsub' => 'DCsub', |
57 | 'DCsuper' => 'DCsuper', |
58 | 'DCvertical' => 'DCvertic', |
59 | 'DCwide' => 'DCwide', |
60 | 'Digit' => 'Digit', |
61 | 'Graph' => 'Graph', |
62 | 'L' => '2', |
63 | 'L&' => 'L', |
64 | 'LbrkAI' => 'LbrkAI', |
65 | 'LbrkAL' => 'LbrkAL', |
66 | 'LbrkB2' => 'LbrkB2', |
67 | 'LbrkBA' => 'LbrkBA', |
68 | 'LbrkBB' => 'LbrkBB', |
69 | 'LbrkBK' => 'LbrkBK', |
70 | 'LbrkCB' => 'LbrkCB', |
71 | 'LbrkCL' => 'LbrkCL', |
72 | 'LbrkCM' => 'LbrkCM', |
73 | 'LbrkCR' => 'LbrkCR', |
74 | 'LbrkEX' => 'LbrkEX', |
75 | 'LbrkGL' => 'LbrkGL', |
76 | 'LbrkHY' => 'LbrkHY', |
77 | 'LbrkID' => 'LbrkID', |
78 | 'LbrkIN' => 'LbrkIN', |
79 | 'LbrkIS' => 'LbrkIS', |
80 | 'LbrkLF' => 'LbrkLF', |
81 | 'LbrkNS' => 'LbrkNS', |
82 | 'LbrkNU' => 'LbrkNU', |
83 | 'LbrkOP' => 'LbrkOP', |
84 | 'LbrkPO' => 'LbrkPO', |
85 | 'LbrkPR' => 'LbrkPR', |
86 | 'LbrkQU' => 'LbrkQU', |
87 | 'LbrkSA' => 'LbrkSA', |
88 | 'LbrkSG' => 'LbrkSG', |
89 | 'LbrkSP' => 'LbrkSP', |
90 | 'LbrkSY' => 'LbrkSY', |
91 | 'LbrkXX' => 'LbrkXX', |
92 | 'LbrkZW' => 'LbrkZW', |
93 | 'Ll' => 'Ll', |
94 | 'Lm' => 'Lm', |
95 | 'Lo' => 'Lo', |
96 | 'Lower' => 'Lower', |
97 | 'Lt' => 'Lt', |
98 | 'Lu' => 'Lu', |
99 | 'M' => 'M', |
100 | 'Mc' => 'Mc', |
101 | 'Me' => 'Me', |
102 | 'Mirrored' => 'Mirrored', |
103 | 'Mn' => 'Mn', |
104 | 'N' => 'N', |
105 | 'Nd' => 'Nd', |
106 | 'Nl' => 'Nl', |
107 | 'No' => 'No', |
108 | 'P' => 'P', |
109 | 'Pc' => 'Pc', |
110 | 'Pd' => 'Pd', |
111 | 'Pe' => 'Pe', |
112 | 'Pf' => 'Pf', |
113 | 'Pi' => 'Pi', |
114 | 'Po' => 'Po', |
115 | 'Print' => 'Print', |
116 | 'Ps' => 'Ps', |
117 | 'Punct' => 'Punct', |
118 | 'S' => 'S', |
119 | 'Sc' => 'Sc', |
120 | 'Sk' => 'Sk', |
121 | 'Sm' => 'Sm', |
122 | 'So' => 'So', |
123 | 'Space' => 'Space', |
124 | 'SpacePerl' => 'SpacePer', |
125 | 'Title' => 'Title', |
126 | 'Upper' => 'Upper', |
127 | 'Word' => 'Word', |
128 | 'XDigit' => 'XDigit', |
129 | 'Z' => 'Z', |
130 | 'Zl' => 'Zl', |
131 | 'Zp' => 'Zp', |
132 | 'Zs' => 'Zs', |
d73e5302 |
133 | ); |
37fca15e |
134 | |
135 | ## Mappings from regex to filename in ./Is/ |
136 | %utf8::IsPat = ( |
137 | 'al' => { |
138 | 'Alphabetic' => 'Alphabet', |
139 | 'All' => 'Any', |
140 | }, |
141 | 'an' => { |
142 | 'Any' => 'Any', |
143 | }, |
144 | 'ar' => { |
145 | 'Armenian' => 'Armenian', |
146 | 'Arabic' => 'Arabic', |
147 | }, |
148 | 'as' => { |
149 | 'ASCII(?:[-_]|\s+)?Hex(?:[-_]|\s+)?Digit' => 'ASCIIHex', |
150 | 'Assigned' => 'Assigned', |
151 | }, |
152 | 'be' => { |
153 | 'Bengali' => 'Bengali', |
154 | }, |
155 | 'bi' => { |
156 | 'Bidi(?:[-_]|\s+)?Control' => 'BidiCont', |
157 | }, |
158 | 'bo' => { |
159 | 'Bopomofo' => 'Bopomofo', |
160 | }, |
161 | 'ca' => { |
162 | 'Canadian(?:[-_]|\s+)?Aboriginal' => 'Canadian', |
163 | }, |
164 | 'ch' => { |
165 | 'Cherokee' => 'Cherokee', |
166 | }, |
167 | 'cl' => { |
d73e5302 |
168 | 'Close(?:[-_]|\s+)?Punctuation' => 'Pe', |
37fca15e |
169 | }, |
170 | 'co' => { |
d73e5302 |
171 | 'Connector(?:[-_]|\s+)?Punctuation' => 'Pc', |
172 | 'Control' => 'Cc', |
37fca15e |
173 | 'Common' => 'Common', |
174 | }, |
175 | 'cu' => { |
d73e5302 |
176 | 'Currency(?:[-_]|\s+)?Symbol' => 'Sc', |
37fca15e |
177 | }, |
178 | 'cy' => { |
179 | 'Cyrillic' => 'Cyrillic', |
180 | }, |
181 | 'da' => { |
d73e5302 |
182 | 'Dash(?:[-_]|\s+)?Punctuation' => 'Pd', |
37fca15e |
183 | 'Dash' => 'Dash', |
184 | }, |
185 | 'de' => { |
186 | 'Devanagari' => 'Devanaga', |
e150c829 |
187 | 'Decimal(?:[-_]|\s+)?Number' => 'Nd', |
37fca15e |
188 | 'Deseret' => 'Deseret', |
189 | }, |
190 | 'di' => { |
191 | 'Diacritic' => 'Diacriti', |
192 | }, |
193 | 'en' => { |
d73e5302 |
194 | 'Enclosing(?:[-_]|\s+)?Mark' => 'Me', |
37fca15e |
195 | }, |
196 | 'et' => { |
197 | 'Ethiopic' => 'Ethiopic', |
198 | }, |
199 | 'ex' => { |
200 | 'Extender' => 'Extender', |
201 | }, |
202 | 'fi' => { |
d73e5302 |
203 | 'Final(?:[-_]|\s+)?Punctuation' => 'Pf', |
37fca15e |
204 | }, |
205 | 'fo' => { |
d73e5302 |
206 | 'Format' => 'Cf', |
37fca15e |
207 | }, |
208 | 'ge' => { |
209 | 'Georgian' => 'Georgian', |
210 | }, |
211 | 'go' => { |
212 | 'Gothic' => 'Gothic', |
213 | }, |
214 | 'gr' => { |
215 | 'Greek' => 'Greek', |
216 | }, |
217 | 'gu' => { |
218 | 'Gurmukhi' => 'Gurmukhi', |
219 | 'Gujarati' => 'Gujarati', |
220 | }, |
221 | 'ha' => { |
222 | 'Han' => 'Han', |
223 | 'Hangul' => 'Hangul', |
224 | }, |
225 | 'he' => { |
226 | 'Hebrew' => 'Hebrew', |
227 | 'Hex(?:[-_]|\s+)?Digit' => 'HexDigit', |
228 | }, |
229 | 'hi' => { |
230 | 'Hiragana' => 'Hiragana', |
231 | }, |
232 | 'hy' => { |
233 | 'Hyphen' => 'Hyphen', |
234 | }, |
235 | 'id' => { |
236 | 'Ideographic' => 'Ideograp', |
237 | 'ID(?:[-_]|\s+)?Continue' => 'IDContin', |
238 | 'ID(?:[-_]|\s+)?Start' => 'IDStart', |
239 | }, |
240 | 'in' => { |
241 | 'Inherited' => 'Inherite', |
d73e5302 |
242 | 'Initial(?:[-_]|\s+)?Punctuation' => 'Pi', |
37fca15e |
243 | }, |
244 | 'jo' => { |
245 | 'Join(?:[-_]|\s+)?Control' => 'JoinCont', |
246 | }, |
247 | 'ka' => { |
248 | 'Katakana' => 'Katakana', |
249 | 'Kannada' => 'Kannada', |
250 | }, |
251 | 'kh' => { |
252 | 'Khmer' => 'Khmer', |
253 | }, |
254 | 'la' => { |
255 | 'Latin' => 'Latin', |
256 | 'Lao' => 'Lao', |
257 | }, |
258 | 'le' => { |
d73e5302 |
259 | 'Letter(?:[-_]|\s+)?Number' => 'Nl', |
37fca15e |
260 | 'Letter' => '2', |
261 | }, |
262 | 'li' => { |
d73e5302 |
263 | 'Line(?:[-_]|\s+)?Separator' => 'Zl', |
37fca15e |
264 | }, |
265 | 'lo' => { |
d73e5302 |
266 | 'Lowercase(?:[-_]|\s+)?Letter' => 'Ll', |
37fca15e |
267 | 'Lowercase' => 'Lowercas', |
268 | }, |
269 | 'ma' => { |
d73e5302 |
270 | 'Math(?:[-_]|\s+)?Symbol' => 'Sm', |
37fca15e |
271 | 'Mark' => 'M', |
272 | 'Math' => 'Math', |
273 | 'Malayalam' => 'Malayala', |
274 | }, |
275 | 'mo' => { |
d73e5302 |
276 | 'Modifier(?:[-_]|\s+)?Letter' => 'Lm', |
277 | 'Modifier(?:[-_]|\s+)?Symbol' => 'Sk', |
37fca15e |
278 | 'Mongolian' => 'Mongolia', |
279 | }, |
280 | 'my' => { |
281 | 'Myanmar' => 'Myanmar', |
282 | }, |
283 | 'no' => { |
d73e5302 |
284 | 'Non(?:[-_]|\s+)?Spacing(?:[-_]|\s+)?Mark' => 'Mn', |
37fca15e |
285 | 'Noncharacter(?:[-_]|\s+)?Code(?:[-_]|\s+)?Point' => 'Nonchara', |
286 | }, |
287 | 'nu' => { |
d73e5302 |
288 | 'Number' => 'N', |
37fca15e |
289 | }, |
290 | 'og' => { |
291 | 'Ogham' => 'Ogham', |
292 | }, |
293 | 'ol' => { |
294 | 'Old(?:[-_]|\s+)?Italic' => 'OldItali', |
295 | }, |
296 | 'op' => { |
d73e5302 |
297 | 'Open(?:[-_]|\s+)?Punctuation' => 'Ps', |
37fca15e |
298 | }, |
299 | 'or' => { |
300 | 'Oriya' => 'Oriya', |
301 | }, |
302 | 'ot' => { |
303 | 'Other(?:[-_]|\s+)?Math' => 'OtherMat', |
d73e5302 |
304 | 'Other(?:[-_]|\s+)?Punctuation' => 'Po', |
37fca15e |
305 | 'Other(?:[-_]|\s+)?Lowercase' => 'OtherLow', |
306 | 'Other(?:[-_]|\s+)?Uppercase' => 'OtherUpp', |
307 | 'Other(?:[-_]|\s+)?Letter' => 'Lo', |
308 | 'Other(?:[-_]|\s+)?Alphabetic' => 'OtherAlp', |
d73e5302 |
309 | 'Other(?:[-_]|\s+)?Symbol' => 'So', |
37fca15e |
310 | 'Other(?:[-_]|\s+)?Number' => 'No', |
311 | 'Other' => 'C', |
312 | }, |
313 | 'pa' => { |
d73e5302 |
314 | 'Paragraph(?:[-_]|\s+)?Separator' => 'Zp', |
37fca15e |
315 | }, |
316 | 'pr' => { |
d73e5302 |
317 | 'Private(?:[-_]|\s+)?Use' => 'Co', |
37fca15e |
318 | }, |
319 | 'pu' => { |
d73e5302 |
320 | 'Punctuation' => 'P', |
37fca15e |
321 | }, |
322 | 'qu' => { |
323 | 'Quotation(?:[-_]|\s+)?Mark' => 'Quotatio', |
324 | }, |
325 | 'ru' => { |
326 | 'Runic' => 'Runic', |
327 | }, |
328 | 'se' => { |
d73e5302 |
329 | 'Separator' => 'Z', |
37fca15e |
330 | }, |
331 | 'si' => { |
332 | 'Sinhala' => 'Sinhala', |
333 | }, |
334 | 'sp' => { |
d73e5302 |
335 | 'Space(?:[-_]|\s+)?Separator' => 'Zs', |
e150c829 |
336 | 'Spacing(?:[-_]|\s+)?Mark' => 'Mc', |
37fca15e |
337 | }, |
338 | 'su' => { |
d73e5302 |
339 | 'Surrogate' => 'Cs', |
37fca15e |
340 | }, |
341 | 'sy' => { |
342 | 'Syriac' => 'Syriac', |
d73e5302 |
343 | 'Symbol' => 'S', |
37fca15e |
344 | }, |
345 | 'ta' => { |
346 | 'Tamil' => 'Tamil', |
347 | }, |
348 | 'te' => { |
349 | 'Terminal(?:[-_]|\s+)?Punctuation' => 'Terminal', |
350 | 'Telugu' => 'Telugu', |
351 | }, |
352 | 'th' => { |
353 | 'Thaana' => 'Thaana', |
354 | 'Thai' => 'Thai', |
355 | }, |
356 | 'ti' => { |
d73e5302 |
357 | 'Titlecase(?:[-_]|\s+)?Letter' => 'Lt', |
37fca15e |
358 | 'Tibetan' => 'Tibetan', |
359 | }, |
360 | 'un' => { |
e150c829 |
361 | 'Unassigned' => 'Cn', |
37fca15e |
362 | }, |
363 | 'up' => { |
d73e5302 |
364 | 'Uppercase(?:[-_]|\s+)?Letter' => 'Lu', |
37fca15e |
365 | 'Uppercase' => 'Uppercas', |
366 | }, |
367 | 'wh' => { |
368 | 'White(?:[-_]|\s+)?space' => 'WhiteSpa', |
369 | }, |
370 | 'yi' => { |
371 | 'Yi' => 'Yi', |
372 | }, |
d73e5302 |
373 | ); |