Commit | Line | Data |
1911be83 |
1 | # PropertyValueAliases-4.0.0.txt |
2 | # Date: 2003-03-12, 23:46:08 GMT [MD] |
822ebcc8 |
3 | # |
4 | # This file contains aliases for property values used in the UCD. |
5 | # These names can be used for XML formats of UCD data, for regular-expression |
6 | # property tests, and other programmatic textual descriptions of Unicode data. |
1911be83 |
7 | # For information on which properties are normative, see UCD.html. |
822ebcc8 |
8 | # |
9 | # The names may be translated in appropriate environments, and additional |
10 | # aliases may be useful. |
11 | # |
12 | # FORMAT |
13 | # |
14 | # Each line describes a property value name. |
15 | # This consists of three fields, separated by semicolons. |
16 | # |
17 | # First Field: The first field describes the property for which that |
18 | # property value name is used. |
19 | # There is one special pseudo-property: "qc" stands for any quick-check property. |
20 | # |
21 | # Second Field: The second field is an abbreviated name. |
22 | # If there is no abbreviated name available, the field is marked with "n/a". |
23 | # |
24 | # Third Field: The third field is a long name. |
25 | # |
1911be83 |
26 | # In the case of ccc, there are 4 fields. The second field is numeric, third |
822ebcc8 |
27 | # is abbreviated, and fourth is long. |
28 | # |
29 | # With loose matching of property names, the case distinctions, whitespace, |
30 | # and '_' are ignored. |
31 | # |
822ebcc8 |
32 | # NOTE: Currently there is at most one abbreviated name and one long name for |
1911be83 |
33 | # each property value. However, in the future additional aliases may be added. |
34 | # In such a case, the first line for the property value would have |
35 | # the preferred alias for output. |
822ebcc8 |
36 | # |
37 | # NOTE: The property value names are NOT unique across properties, especially |
1911be83 |
38 | # with loose matches. For example: |
39 | # |
822ebcc8 |
40 | # AL means Arabic Letter for the Bidi_Class property, and |
41 | # AL means Above_Left for the Combining_Class property, and |
42 | # AL means Alphabetic for the Line_Break property. |
43 | # |
1911be83 |
44 | # In addition, some property names may be the same as some property value names. |
45 | # For example: |
46 | # |
47 | # cc means Combining_Class property, and |
48 | # cc means the General_Category property value Control (cc) |
822ebcc8 |
49 | # |
50 | # The combination of property value and property name is, however, unique. |
1911be83 |
51 | # For more information, see UTR #18: Regular Expression Guidelines |
822ebcc8 |
52 | # ================================================ |
53 | |
54 | |
55 | bc ; AL ; Arabic_Letter |
56 | bc ; AN ; Arabic_Number |
57 | bc ; B ; Paragraph_Separator |
58 | bc ; BN ; Boundary_Neutral |
59 | bc ; CS ; Common_Separator |
60 | bc ; EN ; European_Number |
61 | bc ; ES ; European_Separator |
62 | bc ; ET ; European_Terminator |
63 | bc ; L ; Left_To_Right |
64 | bc ; LRE ; Left_To_Right_Embedding |
65 | bc ; LRO ; Left_To_Right_Override |
66 | bc ; NSM ; Nonspacing_Mark |
67 | bc ; ON ; Other_Neutral |
68 | bc ; PDF ; Pop_Directional_Format |
69 | bc ; R ; Right_To_Left |
70 | bc ; RLE ; Right_To_Left_Embedding |
71 | bc ; RLO ; Right_To_Left_Override |
72 | bc ; S ; Segment_Separator |
73 | bc ; WS ; White_Space |
74 | |
1911be83 |
75 | blk; n/a ; Aegean_Numbers |
76 | blk; n/a ; Alphabetic_Presentation_Forms |
77 | blk; n/a ; Arabic |
78 | blk; n/a ; Arabic_Presentation_Forms-A |
79 | blk; n/a ; Arabic_Presentation_Forms-B |
80 | blk; n/a ; Armenian |
81 | blk; n/a ; Arrows |
82 | blk; n/a ; Basic_Latin |
83 | blk; n/a ; Bengali |
84 | blk; n/a ; Block_Elements |
85 | blk; n/a ; Bopomofo |
86 | blk; n/a ; Bopomofo_Extended |
87 | blk; n/a ; Box_Drawing |
88 | blk; n/a ; Braille_Patterns |
89 | blk; n/a ; Buhid |
90 | blk; n/a ; Byzantine_Musical_Symbols |
91 | blk; n/a ; Cherokee |
92 | blk; n/a ; CJK_Compatibility |
93 | blk; n/a ; CJK_Compatibility_Forms |
94 | blk; n/a ; CJK_Compatibility_Ideographs |
95 | blk; n/a ; CJK_Compatibility_Ideographs_Supplement |
96 | blk; n/a ; CJK_Radicals_Supplement |
97 | blk; n/a ; CJK_Symbols_and_Punctuation |
98 | blk; n/a ; CJK_Unified_Ideographs |
99 | blk; n/a ; CJK_Unified_Ideographs_Extension_A |
100 | blk; n/a ; CJK_Unified_Ideographs_Extension_B |
101 | blk; n/a ; Combining_Diacritical_Marks |
102 | blk; n/a ; Combining_Diacritical_Marks_for_Symbols |
103 | blk; n/a ; Combining_Half_Marks |
104 | blk; n/a ; Control_Pictures |
105 | blk; n/a ; Currency_Symbols |
106 | blk; n/a ; Cypriot_Syllabary |
107 | blk; n/a ; Cyrillic |
108 | blk; n/a ; Cyrillic_Supplementary |
109 | blk; n/a ; Deseret |
110 | blk; n/a ; Devanagari |
111 | blk; n/a ; Dingbats |
112 | blk; n/a ; Enclosed_Alphanumerics |
113 | blk; n/a ; Enclosed_CJK_Letters_and_Months |
114 | blk; n/a ; Ethiopic |
115 | blk; n/a ; General_Punctuation |
116 | blk; n/a ; Geometric_Shapes |
117 | blk; n/a ; Georgian |
118 | blk; n/a ; Gothic |
119 | blk; n/a ; Greek_and_Coptic |
120 | blk; n/a ; Greek_Extended |
121 | blk; n/a ; Gujarati |
122 | blk; n/a ; Gurmukhi |
123 | blk; n/a ; Halfwidth_and_Fullwidth_Forms |
124 | blk; n/a ; Hangul_Compatibility_Jamo |
125 | blk; n/a ; Hangul_Jamo |
126 | blk; n/a ; Hangul_Syllables |
127 | blk; n/a ; Hanunoo |
128 | blk; n/a ; Hebrew |
129 | blk; n/a ; High_Private_Use_Surrogates |
130 | blk; n/a ; High_Surrogates |
131 | blk; n/a ; Hiragana |
132 | blk; n/a ; Ideographic_Description_Characters |
133 | blk; n/a ; IPA_Extensions |
134 | blk; n/a ; Kanbun |
135 | blk; n/a ; Kangxi_Radicals |
136 | blk; n/a ; Kannada |
137 | blk; n/a ; Katakana |
138 | blk; n/a ; Katakana_Phonetic_Extensions |
139 | blk; n/a ; Khmer |
140 | blk; n/a ; Khmer_Symbols |
141 | blk; n/a ; Lao |
142 | blk; n/a ; Latin_Extended_Additional |
143 | blk; n/a ; Latin_Extended-A |
144 | blk; n/a ; Latin_Extended-B |
145 | blk; n/a ; Latin-1_Supplement |
146 | blk; n/a ; Letterlike_Symbols |
147 | blk; n/a ; Limbu |
148 | blk; n/a ; Linear_B_Ideograms |
149 | blk; n/a ; Linear_B_Syllabary |
150 | blk; n/a ; Low_Surrogates |
151 | blk; n/a ; Malayalam |
152 | blk; n/a ; Mathematical_Alphanumeric_Symbols |
153 | blk; n/a ; Mathematical_Operators |
154 | blk; n/a ; Miscellaneous_Mathematical_Symbols-A |
155 | blk; n/a ; Miscellaneous_Mathematical_Symbols-B |
156 | blk; n/a ; Miscellaneous_Symbols |
157 | blk; n/a ; Miscellaneous_Symbols_and_Arrows |
158 | blk; n/a ; Miscellaneous_Technical |
159 | blk; n/a ; Mongolian |
160 | blk; n/a ; Musical_Symbols |
161 | blk; n/a ; Myanmar |
162 | blk; n/a ; No_Block |
163 | blk; n/a ; Number_Forms |
164 | blk; n/a ; Ogham |
165 | blk; n/a ; Old_Italic |
166 | blk; n/a ; Optical_Character_Recognition |
167 | blk; n/a ; Oriya |
168 | blk; n/a ; Osmanya |
169 | blk; n/a ; Phonetic_Extensions |
170 | blk; n/a ; Private_Use_Area |
171 | blk; n/a ; Runic |
172 | blk; n/a ; Shavian |
173 | blk; n/a ; Sinhala |
174 | blk; n/a ; Small_Form_Variants |
175 | blk; n/a ; Spacing_Modifier_Letters |
176 | blk; n/a ; Specials |
177 | blk; n/a ; Superscripts_and_Subscripts |
178 | blk; n/a ; Supplemental_Arrows-A |
179 | blk; n/a ; Supplemental_Arrows-B |
180 | blk; n/a ; Supplemental_Mathematical_Operators |
181 | blk; n/a ; Supplementary_Private_Use_Area-A |
182 | blk; n/a ; Supplementary_Private_Use_Area-B |
183 | blk; n/a ; Syriac |
184 | blk; n/a ; Tagalog |
185 | blk; n/a ; Tagbanwa |
186 | blk; n/a ; Tags |
187 | blk; n/a ; Tai_Le |
188 | blk; n/a ; Tai_Xuan_Jing_Symbols |
189 | blk; n/a ; Tamil |
190 | blk; n/a ; Telugu |
191 | blk; n/a ; Thaana |
192 | blk; n/a ; Thai |
193 | blk; n/a ; Tibetan |
194 | blk; n/a ; Ugaritic |
195 | blk; n/a ; Unified_Canadian_Aboriginal_Syllabics |
196 | blk; n/a ; Variation_Selectors |
197 | blk; n/a ; Variation_Selectors_Supplement |
198 | blk; n/a ; Yi_Radicals |
199 | blk; n/a ; Yi_Syllables |
200 | blk; n/a ; Yijing_Hexagram_Symbols |
201 | |
822ebcc8 |
202 | ccc; 0; NR ; Not_Reordered |
203 | ccc; 1; OV ; Overlay |
1911be83 |
204 | ccc; 202; ATB ; Attached_Below |
822ebcc8 |
205 | ccc; 216; ATAR ; Attached_Above_Right |
206 | ccc; 218; BL ; Below_Left |
207 | ccc; 220; B ; Below |
208 | ccc; 222; BR ; Below_Right |
209 | ccc; 224; L ; Left |
210 | ccc; 226; R ; Right |
211 | ccc; 228; AL ; Above_Left |
212 | ccc; 230; A ; Above |
213 | ccc; 232; AR ; Above_Right |
214 | ccc; 233; DB ; Double_Below |
215 | ccc; 234; DA ; Double_Above |
216 | ccc; 240; IS ; Iota_Subscript |
217 | ccc; 7; NK ; Nukta |
218 | ccc; 8; KV ; Kana_Voicing |
219 | ccc; 9; VR ; Virama |
220 | |
221 | dt ; can ; canonical |
222 | dt ; com ; compat |
223 | dt ; enc ; circle |
224 | dt ; fin ; final |
225 | dt ; font ; font |
226 | dt ; fra ; fraction |
227 | dt ; init ; initial |
228 | dt ; iso ; isolated |
229 | dt ; med ; medial |
230 | dt ; n/a ; none |
231 | dt ; nar ; narrow |
232 | dt ; nb ; noBreak |
233 | dt ; sml ; small |
234 | dt ; sqr ; square |
235 | dt ; sub ; sub |
236 | dt ; sup ; super |
237 | dt ; vert ; vertical |
238 | dt ; wide ; wide |
239 | |
240 | ea ; A ; Ambiguous |
241 | ea ; F ; Fullwidth |
242 | ea ; H ; Halfwidth |
243 | ea ; N ; Neutral |
244 | ea ; Na ; Narrow |
245 | ea ; W ; Wide |
246 | |
247 | gc ; C ; Other # Cc | Cf | Cn | Co | Cs |
248 | gc ; Cc ; Control |
249 | gc ; Cf ; Format |
250 | gc ; Cn ; Unassigned |
251 | gc ; Co ; Private_Use |
252 | gc ; Cs ; Surrogate |
253 | gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu |
254 | gc ; LC ; Cased_Letter # Ll | Lt | Lu |
255 | gc ; Ll ; Lowercase_Letter |
256 | gc ; Lm ; Modifier_Letter |
257 | gc ; Lo ; Other_Letter |
258 | gc ; Lt ; Titlecase_Letter |
259 | gc ; Lu ; Uppercase_Letter |
260 | gc ; M ; Mark # Mc | Me | Mn |
261 | gc ; Mc ; Spacing_Mark |
262 | gc ; Me ; Enclosing_Mark |
263 | gc ; Mn ; Nonspacing_Mark |
264 | gc ; N ; Number # Nd | Nl | No |
265 | gc ; Nd ; Decimal_Number |
266 | gc ; Nl ; Letter_Number |
267 | gc ; No ; Other_Number |
268 | gc ; P ; Punctuation # Pc | Pd | Pe | Pf | Pi | Po | Ps |
269 | gc ; Pc ; Connector_Punctuation |
270 | gc ; Pd ; Dash_Punctuation |
271 | gc ; Pe ; Close_Punctuation |
272 | gc ; Pf ; Final_Punctuation |
273 | gc ; Pi ; Initial_Punctuation |
274 | gc ; Po ; Other_Punctuation |
275 | gc ; Ps ; Open_Punctuation |
276 | gc ; S ; Symbol # Sc | Sk | Sm | So |
277 | gc ; Sc ; Currency_Symbol |
278 | gc ; Sk ; Modifier_Symbol |
279 | gc ; Sm ; Math_Symbol |
280 | gc ; So ; Other_Symbol |
281 | gc ; Z ; Separator # Zl | Zp | Zs |
282 | gc ; Zl ; Line_Separator |
283 | gc ; Zp ; Paragraph_Separator |
284 | gc ; Zs ; Space_Separator |
285 | |
1911be83 |
286 | hst; L ; Leading_Jamo |
287 | hst; LV ; LV_Syllable |
288 | hst; LVT ; LVT_Syllable |
289 | hst; NA ; Not_Applicable |
290 | hst; T ; Trailing_Jamo |
291 | hst; V ; Vowel_Jamo |
292 | |
822ebcc8 |
293 | jg ; n/a ; AIN |
294 | jg ; n/a ; ALAPH |
295 | jg ; n/a ; ALEF |
296 | jg ; n/a ; BEH |
297 | jg ; n/a ; BETH |
298 | jg ; n/a ; DAL |
299 | jg ; n/a ; DALATH_RISH |
300 | jg ; n/a ; E |
1911be83 |
301 | jg ; n/a ; FE |
822ebcc8 |
302 | jg ; n/a ; FEH |
303 | jg ; n/a ; FINAL_SEMKATH |
304 | jg ; n/a ; GAF |
305 | jg ; n/a ; GAMAL |
306 | jg ; n/a ; HAH |
307 | jg ; n/a ; HAMZA_ON_HEH_GOAL |
308 | jg ; n/a ; HE |
309 | jg ; n/a ; HEH |
310 | jg ; n/a ; HEH_GOAL |
311 | jg ; n/a ; HETH |
312 | jg ; n/a ; KAF |
313 | jg ; n/a ; KAPH |
1911be83 |
314 | jg ; n/a ; KHAPH |
822ebcc8 |
315 | jg ; n/a ; KNOTTED_HEH |
316 | jg ; n/a ; LAM |
317 | jg ; n/a ; LAMADH |
318 | jg ; n/a ; MEEM |
319 | jg ; n/a ; MIM |
320 | jg ; n/a ; NO_JOINING_GROUP |
321 | jg ; n/a ; NOON |
322 | jg ; n/a ; NUN |
323 | jg ; n/a ; PE |
324 | jg ; n/a ; QAF |
325 | jg ; n/a ; QAPH |
326 | jg ; n/a ; REH |
327 | jg ; n/a ; REVERSED_PE |
328 | jg ; n/a ; SAD |
329 | jg ; n/a ; SADHE |
330 | jg ; n/a ; SEEN |
331 | jg ; n/a ; SEMKATH |
332 | jg ; n/a ; SHIN |
333 | jg ; n/a ; SWASH_KAF |
334 | jg ; n/a ; SYRIAC_WAW |
335 | jg ; n/a ; TAH |
336 | jg ; n/a ; TAW |
337 | jg ; n/a ; TEH_MARBUTA |
338 | jg ; n/a ; TETH |
339 | jg ; n/a ; WAW |
340 | jg ; n/a ; YEH |
341 | jg ; n/a ; YEH_BARREE |
342 | jg ; n/a ; YEH_WITH_TAIL |
343 | jg ; n/a ; YUDH |
344 | jg ; n/a ; YUDH_HE |
345 | jg ; n/a ; ZAIN |
1911be83 |
346 | jg ; n/a ; ZHAIN |
822ebcc8 |
347 | |
348 | jt ; C ; Join_Causing |
349 | jt ; D ; Dual_Joining |
350 | jt ; L ; Left_Joining |
351 | jt ; R ; Right_Joining |
352 | jt ; T ; Transparent |
353 | jt ; U ; Non_Joining |
354 | |
355 | lb ; AI ; Ambiguous |
356 | lb ; AL ; Alphabetic |
357 | lb ; B2 ; Break_Both |
358 | lb ; BA ; Break_After |
359 | lb ; BB ; Break_Before |
360 | lb ; BK ; Mandatory_Break |
361 | lb ; CB ; Contingent_Break |
362 | lb ; CL ; Close_Punctuation |
363 | lb ; CM ; Combining_Mark |
364 | lb ; CR ; Carriage_Return |
365 | lb ; EX ; Exclamation |
366 | lb ; GL ; Glue |
367 | lb ; HY ; Hyphen |
368 | lb ; ID ; Ideographic |
369 | lb ; IN ; Inseperable |
370 | lb ; IS ; Infix_Numeric |
371 | lb ; LF ; Line_Feed |
1911be83 |
372 | lb ; NL ; Next_Line |
822ebcc8 |
373 | lb ; NS ; Nonstarter |
374 | lb ; NU ; Numeric |
375 | lb ; OP ; Open_Punctuation |
376 | lb ; PO ; Postfix_Numeric |
377 | lb ; PR ; Prefix_Numeric |
378 | lb ; QU ; Quotation |
379 | lb ; SA ; Complex_Context |
380 | lb ; SG ; Surrogate |
381 | lb ; SP ; Space |
382 | lb ; SY ; Break_Symbols |
1911be83 |
383 | lb ; WJ ; Word_Joiner |
822ebcc8 |
384 | lb ; XX ; Unknown |
385 | lb ; ZW ; ZWSpace |
386 | |
387 | nt ; de ; Decimal |
388 | nt ; di ; Digit |
389 | nt ; n/a ; None |
390 | nt ; nu ; Numeric |
391 | |
392 | qc ; M ; Maybe |
393 | qc ; N ; No |
394 | qc ; Y ; Yes |
395 | |
396 | sc ; Arab ; Arabic |
397 | sc ; Armn ; Armenian |
398 | sc ; Beng ; Bengali |
399 | sc ; Bopo ; Bopomofo |
1911be83 |
400 | sc ; Brai ; Braille |
822ebcc8 |
401 | sc ; Buhd ; Buhid |
402 | sc ; Cans ; Canadian_Aboriginal |
403 | sc ; Cher ; Cherokee |
1911be83 |
404 | sc ; Cprt ; Cypriot |
822ebcc8 |
405 | sc ; Cyrl ; Cyrillic |
406 | sc ; Deva ; Devanagari |
407 | sc ; Dsrt ; Deseret |
408 | sc ; Ethi ; Ethiopic |
409 | sc ; Geor ; Georgian |
410 | sc ; Goth ; Gothic |
411 | sc ; Grek ; Greek |
412 | sc ; Gujr ; Gujarati |
413 | sc ; Guru ; Gurmukhi |
414 | sc ; Hang ; Hangul |
415 | sc ; Hani ; Han |
416 | sc ; Hano ; Hanunoo |
417 | sc ; Hebr ; Hebrew |
418 | sc ; Hira ; Hiragana |
419 | sc ; Ital ; Old_Italic |
420 | sc ; Kana ; Katakana |
421 | sc ; Khmr ; Khmer |
422 | sc ; Knda ; Kannada |
423 | sc ; Laoo ; Lao |
424 | sc ; Latn ; Latin |
1911be83 |
425 | sc ; Limb ; Limbu |
426 | sc ; Linb ; Linear_B |
822ebcc8 |
427 | sc ; Mlym ; Malayalam |
428 | sc ; Mong ; Mongolian |
429 | sc ; Mymr ; Myanmar |
430 | sc ; Ogam ; Ogham |
431 | sc ; Orya ; Oriya |
1911be83 |
432 | sc ; Osma ; Osmanya |
822ebcc8 |
433 | sc ; Qaai ; Inherited |
434 | sc ; Runr ; Runic |
1911be83 |
435 | sc ; Shaw ; Shavian |
822ebcc8 |
436 | sc ; Sinh ; Sinhala |
437 | sc ; Syrc ; Syriac |
438 | sc ; Tagb ; Tagbanwa |
1911be83 |
439 | sc ; Tale ; Tai_Le |
822ebcc8 |
440 | sc ; Taml ; Tamil |
441 | sc ; Telu ; Telugu |
442 | sc ; Tglg ; Tagalog |
443 | sc ; Thaa ; Thaana |
444 | sc ; Thai ; Thai |
445 | sc ; Tibt ; Tibetan |
1911be83 |
446 | sc ; Ugar ; Ugaritic |
822ebcc8 |
447 | sc ; Yiii ; Yi |
448 | sc ; Zyyy ; Common |