1 # PropertyValueAliases-5.1.0.txt
2 # Date: 2008-03-03, 21:58:08 GMT [MD]
4 # Unicode Character Database
5 # Copyright (c) 1991-2008 Unicode, Inc.
6 # For terms of use, see http://www.unicode.org/terms_of_use.html
7 # For documentation, see UCD.html
9 # This file contains aliases for property values used in the UCD.
10 # These names can be used for XML formats of UCD data, for regular-expression
11 # property tests, and other programmatic textual descriptions of Unicode data.
12 # For information on which properties are normative, see UCD.html.
14 # The names may be translated in appropriate environments, and additional
15 # aliases may be useful.
19 # Each line describes a property value name.
20 # This consists of three or more fields, separated by semicolons.
22 # First Field: The first field describes the property for which that
23 # property value name is used.
25 # Second Field: The second field is an abbreviated name.
26 # If there is no abbreviated name available, the field is marked with "n/a".
28 # Third Field: The third field is a long name.
30 # In the case of ccc, there are 4 fields. The second field is numeric, third
31 # is abbreviated, and fourth is long.
33 # The above are the preferred aliases. Other aliases may be listed in additional fields.
35 # Loose matching should be applied to all property names and property values, with
36 # the exception of String Property values. With loose matching of property names and
37 # values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property
38 # values, numeric equivalencies are applied: thus "01.00" is equivalent to "1".
40 # NOTE: Property value names are NOT unique across properties. For example:
42 # AL means Arabic Letter for the Bidi_Class property, and
43 # AL means Above_Left for the Canonical_Combining_Class property, and
44 # AL means Alphabetic for the Line_Break property.
46 # In addition, some property names may be the same as some property value names. For example:
49 # sc means the Script property, and
50 # Sc means the General_Category property value Currency_Symbol (Sc)
52 # The combination of property value and property name is, however, unique.
54 # For more information, see UTS #18: Regular Expression Guidelines
55 # ================================================
58 # ASCII_Hex_Digit (AHex)
60 AHex; N ; No ; F ; False
61 AHex; Y ; Yes ; T ; True
79 Alpha; N ; No ; F ; False
80 Alpha; Y ; Yes ; T ; True
84 bc ; AL ; Arabic_Letter
85 bc ; AN ; Arabic_Number
86 bc ; B ; Paragraph_Separator
87 bc ; BN ; Boundary_Neutral
88 bc ; CS ; Common_Separator
89 bc ; EN ; European_Number
90 bc ; ES ; European_Separator
91 bc ; ET ; European_Terminator
92 bc ; L ; Left_To_Right
93 bc ; LRE ; Left_To_Right_Embedding
94 bc ; LRO ; Left_To_Right_Override
95 bc ; NSM ; Nonspacing_Mark
96 bc ; ON ; Other_Neutral
97 bc ; PDF ; Pop_Directional_Format
98 bc ; R ; Right_To_Left
99 bc ; RLE ; Right_To_Left_Embedding
100 bc ; RLO ; Right_To_Left_Override
101 bc ; S ; Segment_Separator
102 bc ; WS ; White_Space
104 # Bidi_Control (Bidi_C)
106 Bidi_C; N ; No ; F ; False
107 Bidi_C; Y ; Yes ; T ; True
109 # Bidi_Mirrored (Bidi_M)
111 Bidi_M; N ; No ; F ; False
112 Bidi_M; Y ; Yes ; T ; True
114 # Bidi_Mirroring_Glyph (bmg)
116 # @missing: 0000..10FFFF; Bidi_Mirroring_Glyph; <none>
120 blk; n/a ; Aegean_Numbers
121 blk; n/a ; Alphabetic_Presentation_Forms
122 blk; n/a ; Ancient_Greek_Musical_Notation
123 blk; n/a ; Ancient_Greek_Numbers
124 blk; n/a ; Ancient_Symbols
126 blk; n/a ; Arabic_Presentation_Forms_A ; Arabic_Presentation_Forms-A
127 blk; n/a ; Arabic_Presentation_Forms_B
128 blk; n/a ; Arabic_Supplement
132 blk; n/a ; Basic_Latin ; ASCII
134 blk; n/a ; Block_Elements
136 blk; n/a ; Bopomofo_Extended
137 blk; n/a ; Box_Drawing
138 blk; n/a ; Braille_Patterns
141 blk; n/a ; Byzantine_Musical_Symbols
145 blk; n/a ; CJK_Compatibility
146 blk; n/a ; CJK_Compatibility_Forms
147 blk; n/a ; CJK_Compatibility_Ideographs
148 blk; n/a ; CJK_Compatibility_Ideographs_Supplement
149 blk; n/a ; CJK_Radicals_Supplement
150 blk; n/a ; CJK_Strokes
151 blk; n/a ; CJK_Symbols_And_Punctuation
152 blk; n/a ; CJK_Unified_Ideographs
153 blk; n/a ; CJK_Unified_Ideographs_Extension_A
154 blk; n/a ; CJK_Unified_Ideographs_Extension_B
155 blk; n/a ; Combining_Diacritical_Marks
156 blk; n/a ; Combining_Diacritical_Marks_For_Symbols; Combining_Marks_For_Symbols
157 blk; n/a ; Combining_Diacritical_Marks_Supplement
158 blk; n/a ; Combining_Half_Marks
159 blk; n/a ; Control_Pictures
161 blk; n/a ; Counting_Rod_Numerals
163 blk; n/a ; Cuneiform_Numbers_And_Punctuation
164 blk; n/a ; Currency_Symbols
165 blk; n/a ; Cypriot_Syllabary
167 blk; n/a ; Cyrillic_Extended_A
168 blk; n/a ; Cyrillic_Extended_B
169 blk; n/a ; Cyrillic_Supplement ; Cyrillic_Supplementary
171 blk; n/a ; Devanagari
173 blk; n/a ; Domino_Tiles
174 blk; n/a ; Enclosed_Alphanumerics
175 blk; n/a ; Enclosed_CJK_Letters_And_Months
177 blk; n/a ; Ethiopic_Extended
178 blk; n/a ; Ethiopic_Supplement
179 blk; n/a ; General_Punctuation
180 blk; n/a ; Geometric_Shapes
182 blk; n/a ; Georgian_Supplement
183 blk; n/a ; Glagolitic
185 blk; n/a ; Greek_And_Coptic ; Greek
186 blk; n/a ; Greek_Extended
189 blk; n/a ; Halfwidth_And_Fullwidth_Forms
190 blk; n/a ; Hangul_Compatibility_Jamo
191 blk; n/a ; Hangul_Jamo
192 blk; n/a ; Hangul_Syllables
195 blk; n/a ; High_Private_Use_Surrogates
196 blk; n/a ; High_Surrogates
198 blk; n/a ; Ideographic_Description_Characters
199 blk; n/a ; IPA_Extensions
201 blk; n/a ; Kangxi_Radicals
204 blk; n/a ; Katakana_Phonetic_Extensions
206 blk; n/a ; Kharoshthi
208 blk; n/a ; Khmer_Symbols
210 blk; n/a ; Latin_1_Supplement ; Latin_1
211 blk; n/a ; Latin_Extended_A
212 blk; n/a ; Latin_Extended_Additional
213 blk; n/a ; Latin_Extended_B
214 blk; n/a ; Latin_Extended_C
215 blk; n/a ; Latin_Extended_D
217 blk; n/a ; Letterlike_Symbols
219 blk; n/a ; Linear_B_Ideograms
220 blk; n/a ; Linear_B_Syllabary
221 blk; n/a ; Low_Surrogates
224 blk; n/a ; Mahjong_Tiles
226 blk; n/a ; Mathematical_Alphanumeric_Symbols
227 blk; n/a ; Mathematical_Operators
228 blk; n/a ; Miscellaneous_Mathematical_Symbols_A
229 blk; n/a ; Miscellaneous_Mathematical_Symbols_B
230 blk; n/a ; Miscellaneous_Symbols
231 blk; n/a ; Miscellaneous_Symbols_And_Arrows
232 blk; n/a ; Miscellaneous_Technical
233 blk; n/a ; Modifier_Tone_Letters
235 blk; n/a ; Musical_Symbols
237 blk; n/a ; New_Tai_Lue
240 blk; n/a ; Number_Forms
243 blk; n/a ; Old_Italic
244 blk; n/a ; Old_Persian
245 blk; n/a ; Optical_Character_Recognition
249 blk; n/a ; Phaistos_Disc
250 blk; n/a ; Phoenician
251 blk; n/a ; Phonetic_Extensions
252 blk; n/a ; Phonetic_Extensions_Supplement
253 blk; n/a ; Private_Use_Area ; Private_Use
256 blk; n/a ; Saurashtra
259 blk; n/a ; Small_Form_Variants
260 blk; n/a ; Spacing_Modifier_Letters
263 blk; n/a ; Superscripts_And_Subscripts
264 blk; n/a ; Supplemental_Arrows_A
265 blk; n/a ; Supplemental_Arrows_B
266 blk; n/a ; Supplemental_Mathematical_Operators
267 blk; n/a ; Supplemental_Punctuation
268 blk; n/a ; Supplementary_Private_Use_Area_A
269 blk; n/a ; Supplementary_Private_Use_Area_B
270 blk; n/a ; Syloti_Nagri
276 blk; n/a ; Tai_Xuan_Jing_Symbols
284 blk; n/a ; Unified_Canadian_Aboriginal_Syllabics; Canadian_Syllabics
286 blk; n/a ; Variation_Selectors
287 blk; n/a ; Variation_Selectors_Supplement
288 blk; n/a ; Vertical_Forms
289 blk; n/a ; Yi_Radicals
290 blk; n/a ; Yi_Syllables
291 blk; n/a ; Yijing_Hexagram_Symbols
293 # Canonical_Combining_Class (ccc)
295 ccc; 0; NR ; Not_Reordered
298 ccc; 8; KV ; Kana_Voicing
300 ccc; 200; ATBL ; Attached_Below_Left
301 ccc; 202; ATB ; Attached_Below
302 ccc; 216; ATAR ; Attached_Above_Right
303 ccc; 218; BL ; Below_Left
305 ccc; 222; BR ; Below_Right
308 ccc; 228; AL ; Above_Left
310 ccc; 232; AR ; Above_Right
311 ccc; 233; DB ; Double_Below
312 ccc; 234; DA ; Double_Above
313 ccc; 240; IS ; Iota_Subscript
317 # @missing: 0000..10FFFF; Case_Folding; <code point>
319 # Composition_Exclusion (CE)
321 CE ; N ; No ; F ; False
322 CE ; Y ; Yes ; T ; True
326 Dash; N ; No ; F ; False
327 Dash; Y ; Yes ; T ; True
329 # Decomposition_Mapping (dm)
331 # @missing: 0000..10FFFF; Decomposition_Mapping; <code point>
333 # Decomposition_Type (dt)
335 dt ; Can ; Canonical ; can
336 dt ; Com ; Compat ; com
337 dt ; Enc ; Circle ; enc
338 dt ; Fin ; Final ; fin
340 dt ; Fra ; Fraction ; fra
341 dt ; Init ; Initial ; init
342 dt ; Iso ; Isolated ; iso
343 dt ; Med ; Medial ; med
344 dt ; Nar ; Narrow ; nar
345 dt ; Nb ; Nobreak ; nb
347 dt ; Sml ; Small ; sml
348 dt ; Sqr ; Square ; sqr
350 dt ; Sup ; Super ; sup
351 dt ; Vert ; Vertical ; vert
354 # Default_Ignorable_Code_Point (DI)
356 DI ; N ; No ; F ; False
357 DI ; Y ; Yes ; T ; True
361 Dep; N ; No ; F ; False
362 Dep; Y ; Yes ; T ; True
366 Dia; N ; No ; F ; False
367 Dia; Y ; Yes ; T ; True
369 # East_Asian_Width (ea)
378 # Expands_On_NFC (XO_NFC)
380 XO_NFC; N ; No ; F ; False
381 XO_NFC; Y ; Yes ; T ; True
383 # Expands_On_NFD (XO_NFD)
385 XO_NFD; N ; No ; F ; False
386 XO_NFD; Y ; Yes ; T ; True
388 # Expands_On_NFKC (XO_NFKC)
390 XO_NFKC; N ; No ; F ; False
391 XO_NFKC; Y ; Yes ; T ; True
393 # Expands_On_NFKD (XO_NFKD)
395 XO_NFKD; N ; No ; F ; False
396 XO_NFKD; Y ; Yes ; T ; True
400 Ext; N ; No ; F ; False
401 Ext; Y ; Yes ; T ; True
403 # FC_NFKC_Closure (FC_NFKC)
405 # @missing: 0000..10FFFF; FC_NFKC_Closure; <code point>
407 # Full_Composition_Exclusion (Comp_Ex)
409 Comp_Ex; N ; No ; F ; False
410 Comp_Ex; Y ; Yes ; T ; True
412 # General_Category (gc)
414 gc ; C ; Other # Cc | Cf | Cn | Co | Cs
415 gc ; Cc ; Control ; cntrl
418 gc ; Co ; Private_Use
420 gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu
421 gc ; LC ; Cased_Letter # Ll | Lt | Lu
422 gc ; Ll ; Lowercase_Letter
423 gc ; Lm ; Modifier_Letter
424 gc ; Lo ; Other_Letter
425 gc ; Lt ; Titlecase_Letter
426 gc ; Lu ; Uppercase_Letter
427 gc ; M ; Mark # Mc | Me | Mn
428 gc ; Mc ; Spacing_Mark
429 gc ; Me ; Enclosing_Mark
430 gc ; Mn ; Nonspacing_Mark
431 gc ; N ; Number # Nd | Nl | No
432 gc ; Nd ; Decimal_Number ; digit
433 gc ; Nl ; Letter_Number
434 gc ; No ; Other_Number
435 gc ; P ; Punctuation ; punct # Pc | Pd | Pe | Pf | Pi | Po | Ps
436 gc ; Pc ; Connector_Punctuation
437 gc ; Pd ; Dash_Punctuation
438 gc ; Pe ; Close_Punctuation
439 gc ; Pf ; Final_Punctuation
440 gc ; Pi ; Initial_Punctuation
441 gc ; Po ; Other_Punctuation
442 gc ; Ps ; Open_Punctuation
443 gc ; S ; Symbol # Sc | Sk | Sm | So
444 gc ; Sc ; Currency_Symbol
445 gc ; Sk ; Modifier_Symbol
446 gc ; Sm ; Math_Symbol
447 gc ; So ; Other_Symbol
448 gc ; Z ; Separator # Zl | Zp | Zs
449 gc ; Zl ; Line_Separator
450 gc ; Zp ; Paragraph_Separator
451 gc ; Zs ; Space_Separator
453 # Grapheme_Base (Gr_Base)
455 Gr_Base; N ; No ; F ; False
456 Gr_Base; Y ; Yes ; T ; True
458 # Grapheme_Cluster_Break (GCB)
468 GCB; SM ; SpacingMark
473 # Grapheme_Extend (Gr_Ext)
475 Gr_Ext; N ; No ; F ; False
476 Gr_Ext; Y ; Yes ; T ; True
478 # Grapheme_Link (Gr_Link)
480 Gr_Link; N ; No ; F ; False
481 Gr_Link; Y ; Yes ; T ; True
483 # Hangul_Syllable_Type (hst)
485 hst; L ; Leading_Jamo
486 hst; LV ; LV_Syllable
487 hst; LVT ; LVT_Syllable
488 hst; NA ; Not_Applicable
489 hst; T ; Trailing_Jamo
494 Hex; N ; No ; F ; False
495 Hex; Y ; Yes ; T ; True
499 Hyphen; N ; No ; F ; False
500 Hyphen; Y ; Yes ; T ; True
502 # IDS_Binary_Operator (IDSB)
504 IDSB; N ; No ; F ; False
505 IDSB; Y ; Yes ; T ; True
507 # IDS_Trinary_Operator (IDST)
509 IDST; N ; No ; F ; False
510 IDST; Y ; Yes ; T ; True
514 IDC; N ; No ; F ; False
515 IDC; Y ; Yes ; T ; True
519 IDS; N ; No ; F ; False
520 IDS; Y ; Yes ; T ; True
524 # @missing: 0000..10FFFF; ISO_Comment; <none>
528 Ideo; N ; No ; F ; False
529 Ideo; Y ; Yes ; T ; True
531 # Jamo_Short_Name (JSN)
533 # @missing: 0000..10FFFF; Jamo_Short_Name; <none>
587 # Join_Control (Join_C)
589 Join_C; N ; No ; F ; False
590 Join_C; Y ; Yes ; T ; True
599 jg ; n/a ; Burushaski_Yeh_Barree
601 jg ; n/a ; Dalath_Rish
605 jg ; n/a ; Final_Semkath
609 jg ; n/a ; Hamza_On_Heh_Goal
617 jg ; n/a ; Knotted_Heh
622 jg ; n/a ; No_Joining_Group
629 jg ; n/a ; Reversed_Pe
636 jg ; n/a ; Syriac_Waw
639 jg ; n/a ; Teh_Marbuta
643 jg ; n/a ; Yeh_Barree
644 jg ; n/a ; Yeh_With_Tail
652 jt ; C ; Join_Causing
653 jt ; D ; Dual_Joining
654 jt ; L ; Left_Joining
655 jt ; R ; Right_Joining
664 lb ; BA ; Break_After
665 lb ; BB ; Break_Before
666 lb ; BK ; Mandatory_Break
667 lb ; CB ; Contingent_Break
668 lb ; CL ; Close_Punctuation
669 lb ; CM ; Combining_Mark
670 lb ; CR ; Carriage_Return
671 lb ; EX ; Exclamation
676 lb ; ID ; Ideographic
677 lb ; IN ; Inseparable ; Inseperable
678 lb ; IS ; Infix_Numeric
686 lb ; OP ; Open_Punctuation
687 lb ; PO ; Postfix_Numeric
688 lb ; PR ; Prefix_Numeric
690 lb ; SA ; Complex_Context
693 lb ; SY ; Break_Symbols
694 lb ; WJ ; Word_Joiner
698 # Logical_Order_Exception (LOE)
700 LOE; N ; No ; F ; False
701 LOE; Y ; Yes ; T ; True
705 Lower; N ; No ; F ; False
706 Lower; Y ; Yes ; T ; True
708 # Lowercase_Mapping (lc)
710 # @missing: 0000..10FFFF; Lowercase_Mapping; <code point>
714 Math; N ; No ; F ; False
715 Math; Y ; Yes ; T ; True
717 # NFC_Quick_Check (NFC_QC)
723 # NFD_Quick_Check (NFD_QC)
728 # NFKC_Quick_Check (NFKC_QC)
734 # NFKD_Quick_Check (NFKD_QC)
741 # @missing: 0000..10FFFF; Name; <none>
743 # Noncharacter_Code_Point (NChar)
745 NChar; N ; No ; F ; False
746 NChar; Y ; Yes ; T ; True
757 # @missing: 0000..10FFFF; Numeric_Value; NaN
759 # Other_Alphabetic (OAlpha)
761 OAlpha; N ; No ; F ; False
762 OAlpha; Y ; Yes ; T ; True
764 # Other_Default_Ignorable_Code_Point (ODI)
766 ODI; N ; No ; F ; False
767 ODI; Y ; Yes ; T ; True
769 # Other_Grapheme_Extend (OGr_Ext)
771 OGr_Ext; N ; No ; F ; False
772 OGr_Ext; Y ; Yes ; T ; True
774 # Other_ID_Continue (OIDC)
776 OIDC; N ; No ; F ; False
777 OIDC; Y ; Yes ; T ; True
779 # Other_ID_Start (OIDS)
781 OIDS; N ; No ; F ; False
782 OIDS; Y ; Yes ; T ; True
784 # Other_Lowercase (OLower)
786 OLower; N ; No ; F ; False
787 OLower; Y ; Yes ; T ; True
791 OMath; N ; No ; F ; False
792 OMath; Y ; Yes ; T ; True
794 # Other_Uppercase (OUpper)
796 OUpper; N ; No ; F ; False
797 OUpper; Y ; Yes ; T ; True
799 # Pattern_Syntax (Pat_Syn)
801 Pat_Syn; N ; No ; F ; False
802 Pat_Syn; Y ; Yes ; T ; True
804 # Pattern_White_Space (Pat_WS)
806 Pat_WS; N ; No ; F ; False
807 Pat_WS; Y ; Yes ; T ; True
809 # Quotation_Mark (QMark)
811 QMark; N ; No ; F ; False
812 QMark; Y ; Yes ; T ; True
816 Radical; N ; No ; F ; False
817 Radical; Y ; Yes ; T ; True
821 STerm; N ; No ; F ; False
822 STerm; Y ; Yes ; T ; True
834 sc ; Cans ; Canadian_Aboriginal
838 sc ; Copt ; Coptic ; Qaac
841 sc ; Deva ; Devanagari
845 sc ; Glag ; Glagolitic
855 sc ; Hrkt ; Katakana_Or_Hiragana
856 sc ; Ital ; Old_Italic
859 sc ; Khar ; Kharoshthi
869 sc ; Mlym ; Malayalam
870 sc ; Mong ; Mongolian
878 sc ; Phnx ; Phoenician
879 sc ; Qaai ; Inherited
882 sc ; Saur ; Saurashtra
885 sc ; Sund ; Sundanese
886 sc ; Sylo ; Syloti_Nagri
890 sc ; Talu ; New_Tai_Lue
900 sc ; Xpeo ; Old_Persian
901 sc ; Xsux ; Cuneiform
906 # Sentence_Break (SB)
924 # Simple_Case_Folding (scf)
926 # @missing: 0000..10FFFF; Simple_Case_Folding; <code point>
928 # Simple_Lowercase_Mapping (slc)
930 # @missing: 0000..10FFFF; Simple_Lowercase_Mapping; <code point>
932 # Simple_Titlecase_Mapping (stc)
934 # @missing: 0000..10FFFF; Simple_Titlecase_Mapping; <code point>
936 # Simple_Uppercase_Mapping (suc)
938 # @missing: 0000..10FFFF; Simple_Uppercase_Mapping; <code point>
942 SD ; N ; No ; F ; False
943 SD ; Y ; Yes ; T ; True
945 # Terminal_Punctuation (Term)
947 Term; N ; No ; F ; False
948 Term; Y ; Yes ; T ; True
950 # Titlecase_Mapping (tc)
952 # @missing: 0000..10FFFF; Titlecase_Mapping; <code point>
954 # Unicode_1_Name (na1)
956 # @missing: 0000..10FFFF; Unicode_1_Name; <none>
958 # Unicode_Radical_Stroke (URS)
960 # @missing: 0000..10FFFF; Unicode_Radical_Stroke; <none>
962 # Unified_Ideograph (UIdeo)
964 UIdeo; N ; No ; F ; False
965 UIdeo; Y ; Yes ; T ; True
969 Upper; N ; No ; F ; False
970 Upper; Y ; Yes ; T ; True
972 # Uppercase_Mapping (uc)
974 # @missing: 0000..10FFFF; Uppercase_Mapping; <code point>
976 # Variation_Selector (VS)
978 VS ; N ; No ; F ; False
979 VS ; Y ; Yes ; T ; True
981 # White_Space (WSpace)
983 WSpace; N ; No ; F ; False
984 WSpace; Y ; Yes ; T ; True
989 WB ; EX ; ExtendNumLet
1002 # XID_Continue (XIDC)
1004 XIDC; N ; No ; F ; False
1005 XIDC; Y ; Yes ; T ; True
1009 XIDS; N ; No ; F ; False
1010 XIDS; Y ; Yes ; T ; True