[p5sagit/p5-mst-13.2.git] / lib / unicore / PropValueAliases.txt

# PropertyValueAliases-4.0.0.txt
# Date: 2003-03-12, 23:46:08 GMT [MD]
#
# This file contains aliases for property values used in the UCD.
# These names can be used for XML formats of UCD data, for regular-expression
# property tests, and other programmatic textual descriptions of Unicode data.
# For information on which properties are normative, see UCD.html.
#
# The names may be translated in appropriate environments, and additional
# aliases may be useful.
#
# FORMAT
#
# Each line describes a property value name.
# This consists of three fields, separated by semicolons.
#
# First Field: The first field describes the property for which that
# property value name is used.
# There is one special pseudo-property: "qc" stands for any quick-check property.
#
# Second Field: The second field is an abbreviated name.
# If there is no abbreviated name available, the field is marked with "n/a".
#
# Third Field: The third field is a long name.
#
# In the case of ccc, there are 4 fields. The second field is numeric, third
# is abbreviated, and fourth is long.
#
# With loose matching of property names, the case distinctions, whitespace,
# and '_' are ignored.
#
# NOTE: Currently there is at most one abbreviated name and one long name for
# each property value. However, in the future additional aliases may be added.
# In such a case, the first line for the property value would have
# the preferred alias for output.
#
# NOTE: The property value names are NOT unique across properties, especially
# with loose matches. For example:
#
# AL means Arabic_Letter for the Bidi_Class property, and
# AL means Above_Left for the Combining_Class property, and
# AL means Alphabetic for the Line_Break property.
#
# In addition, some property names may be the same as some property value names.
# For example:
#
#   sc means the Script property, and
#   Sc means the General_Category property value Currency_Symbol (Sc)
#
# The combination of property value and property name is, however, unique.
# For more information, see UTR #18: Regular Expression Guidelines
# ================================================


bc ; AL        ; Arabic_Letter
bc ; AN        ; Arabic_Number
bc ; B         ; Paragraph_Separator
bc ; BN        ; Boundary_Neutral
bc ; CS        ; Common_Separator
bc ; EN        ; European_Number
bc ; ES        ; European_Separator
bc ; ET        ; European_Terminator
bc ; L         ; Left_To_Right
bc ; LRE       ; Left_To_Right_Embedding
bc ; LRO       ; Left_To_Right_Override
bc ; NSM       ; Nonspacing_Mark
bc ; ON        ; Other_Neutral
bc ; PDF       ; Pop_Directional_Format
bc ; R         ; Right_To_Left
bc ; RLE       ; Right_To_Left_Embedding
bc ; RLO       ; Right_To_Left_Override
bc ; S         ; Segment_Separator
bc ; WS        ; White_Space

blk; n/a       ; Aegean_Numbers
blk; n/a       ; Alphabetic_Presentation_Forms
blk; n/a       ; Arabic
blk; n/a       ; Arabic_Presentation_Forms-A
blk; n/a       ; Arabic_Presentation_Forms-B
blk; n/a       ; Armenian
blk; n/a       ; Arrows
blk; n/a       ; Basic_Latin
blk; n/a       ; Bengali
blk; n/a       ; Block_Elements
blk; n/a       ; Bopomofo
blk; n/a       ; Bopomofo_Extended
blk; n/a       ; Box_Drawing
blk; n/a       ; Braille_Patterns
blk; n/a       ; Buhid
blk; n/a       ; Byzantine_Musical_Symbols
blk; n/a       ; Cherokee
blk; n/a       ; CJK_Compatibility
blk; n/a       ; CJK_Compatibility_Forms
blk; n/a       ; CJK_Compatibility_Ideographs
blk; n/a       ; CJK_Compatibility_Ideographs_Supplement
blk; n/a       ; CJK_Radicals_Supplement
blk; n/a       ; CJK_Symbols_and_Punctuation
blk; n/a       ; CJK_Unified_Ideographs
blk; n/a       ; CJK_Unified_Ideographs_Extension_A
blk; n/a       ; CJK_Unified_Ideographs_Extension_B
blk; n/a       ; Combining_Diacritical_Marks
blk; n/a       ; Combining_Diacritical_Marks_for_Symbols
blk; n/a       ; Combining_Half_Marks
blk; n/a       ; Control_Pictures
blk; n/a       ; Currency_Symbols
blk; n/a       ; Cypriot_Syllabary
blk; n/a       ; Cyrillic
blk; n/a       ; Cyrillic_Supplementary
blk; n/a       ; Deseret
blk; n/a       ; Devanagari
blk; n/a       ; Dingbats
blk; n/a       ; Enclosed_Alphanumerics
blk; n/a       ; Enclosed_CJK_Letters_and_Months
blk; n/a       ; Ethiopic
blk; n/a       ; General_Punctuation
blk; n/a       ; Geometric_Shapes
blk; n/a       ; Georgian
blk; n/a       ; Gothic
blk; n/a       ; Greek_and_Coptic
blk; n/a       ; Greek_Extended
blk; n/a       ; Gujarati
blk; n/a       ; Gurmukhi
blk; n/a       ; Halfwidth_and_Fullwidth_Forms
blk; n/a       ; Hangul_Compatibility_Jamo
blk; n/a       ; Hangul_Jamo
blk; n/a       ; Hangul_Syllables
blk; n/a       ; Hanunoo
blk; n/a       ; Hebrew
blk; n/a       ; High_Private_Use_Surrogates
blk; n/a       ; High_Surrogates
blk; n/a       ; Hiragana
blk; n/a       ; Ideographic_Description_Characters
blk; n/a       ; IPA_Extensions
blk; n/a       ; Kanbun
blk; n/a       ; Kangxi_Radicals
blk; n/a       ; Kannada
blk; n/a       ; Katakana
blk; n/a       ; Katakana_Phonetic_Extensions
blk; n/a       ; Khmer
blk; n/a       ; Khmer_Symbols
blk; n/a       ; Lao
blk; n/a       ; Latin_Extended_Additional
blk; n/a       ; Latin_Extended-A
blk; n/a       ; Latin_Extended-B
blk; n/a       ; Latin-1_Supplement
blk; n/a       ; Letterlike_Symbols
blk; n/a       ; Limbu
blk; n/a       ; Linear_B_Ideograms
blk; n/a       ; Linear_B_Syllabary
blk; n/a       ; Low_Surrogates
blk; n/a       ; Malayalam
blk; n/a       ; Mathematical_Alphanumeric_Symbols
blk; n/a       ; Mathematical_Operators
blk; n/a       ; Miscellaneous_Mathematical_Symbols-A
blk; n/a       ; Miscellaneous_Mathematical_Symbols-B
blk; n/a       ; Miscellaneous_Symbols
blk; n/a       ; Miscellaneous_Symbols_and_Arrows
blk; n/a       ; Miscellaneous_Technical
blk; n/a       ; Mongolian
blk; n/a       ; Musical_Symbols
blk; n/a       ; Myanmar
blk; n/a       ; No_Block
blk; n/a       ; Number_Forms
blk; n/a       ; Ogham
blk; n/a       ; Old_Italic
blk; n/a       ; Optical_Character_Recognition
blk; n/a       ; Oriya
blk; n/a       ; Osmanya
blk; n/a       ; Phonetic_Extensions
blk; n/a       ; Private_Use_Area
blk; n/a       ; Runic
blk; n/a       ; Shavian
blk; n/a       ; Sinhala
blk; n/a       ; Small_Form_Variants
blk; n/a       ; Spacing_Modifier_Letters
blk; n/a       ; Specials
blk; n/a       ; Superscripts_and_Subscripts
blk; n/a       ; Supplemental_Arrows-A
blk; n/a       ; Supplemental_Arrows-B
blk; n/a       ; Supplemental_Mathematical_Operators
blk; n/a       ; Supplementary_Private_Use_Area-A
blk; n/a       ; Supplementary_Private_Use_Area-B
blk; n/a       ; Syriac
blk; n/a       ; Tagalog
blk; n/a       ; Tagbanwa
blk; n/a       ; Tags
blk; n/a       ; Tai_Le
blk; n/a       ; Tai_Xuan_Jing_Symbols
blk; n/a       ; Tamil
blk; n/a       ; Telugu
blk; n/a       ; Thaana
blk; n/a       ; Thai
blk; n/a       ; Tibetan
blk; n/a       ; Ugaritic
blk; n/a       ; Unified_Canadian_Aboriginal_Syllabics
blk; n/a       ; Variation_Selectors
blk; n/a       ; Variation_Selectors_Supplement
blk; n/a       ; Yi_Radicals
blk; n/a       ; Yi_Syllables
blk; n/a       ; Yijing_Hexagram_Symbols

ccc;   0; NR   ; Not_Reordered
ccc;   1; OV   ; Overlay
ccc; 202; ATB  ; Attached_Below
ccc; 216; ATAR ; Attached_Above_Right
ccc; 218; BL   ; Below_Left
ccc; 220; B    ; Below
ccc; 222; BR   ; Below_Right
ccc; 224; L    ; Left
ccc; 226; R    ; Right
ccc; 228; AL   ; Above_Left
ccc; 230; A    ; Above
ccc; 232; AR   ; Above_Right
ccc; 233; DB   ; Double_Below
ccc; 234; DA   ; Double_Above
ccc; 240; IS   ; Iota_Subscript
ccc;   7; NK   ; Nukta
ccc;   8; KV   ; Kana_Voicing
ccc;   9; VR   ; Virama

dt ; can       ; canonical
dt ; com       ; compat
dt ; enc       ; circle
dt ; fin       ; final
dt ; font      ; font
dt ; fra       ; fraction
dt ; init      ; initial
dt ; iso       ; isolated
dt ; med       ; medial
dt ; n/a       ; none
dt ; nar       ; narrow
dt ; nb        ; noBreak
dt ; sml       ; small
dt ; sqr       ; square
dt ; sub       ; sub
dt ; sup       ; super
dt ; vert      ; vertical
dt ; wide      ; wide

ea ; A         ; Ambiguous
ea ; F         ; Fullwidth
ea ; H         ; Halfwidth
ea ; N         ; Neutral
ea ; Na        ; Narrow
ea ; W         ; Wide

gc ; C         ; Other                            # Cc | Cf | Cn | Co | Cs
gc ; Cc        ; Control
gc ; Cf        ; Format
gc ; Cn        ; Unassigned
gc ; Co        ; Private_Use
gc ; Cs        ; Surrogate
gc ; L         ; Letter                           # Ll | Lm | Lo | Lt | Lu
gc ; LC        ; Cased_Letter                     # Ll | Lt | Lu
gc ; Ll        ; Lowercase_Letter
gc ; Lm        ; Modifier_Letter
gc ; Lo        ; Other_Letter
gc ; Lt        ; Titlecase_Letter
gc ; Lu        ; Uppercase_Letter
gc ; M         ; Mark                             # Mc | Me | Mn
gc ; Mc        ; Spacing_Mark
gc ; Me        ; Enclosing_Mark
gc ; Mn        ; Nonspacing_Mark
gc ; N         ; Number                           # Nd | Nl | No
gc ; Nd        ; Decimal_Number
gc ; Nl        ; Letter_Number
gc ; No        ; Other_Number
gc ; P         ; Punctuation                      # Pc | Pd | Pe | Pf | Pi | Po | Ps
gc ; Pc        ; Connector_Punctuation
gc ; Pd        ; Dash_Punctuation
gc ; Pe        ; Close_Punctuation
gc ; Pf        ; Final_Punctuation
gc ; Pi        ; Initial_Punctuation
gc ; Po        ; Other_Punctuation
gc ; Ps        ; Open_Punctuation
gc ; S         ; Symbol                           # Sc | Sk | Sm | So
gc ; Sc        ; Currency_Symbol
gc ; Sk        ; Modifier_Symbol
gc ; Sm        ; Math_Symbol
gc ; So        ; Other_Symbol
gc ; Z         ; Separator                        # Zl | Zp | Zs
gc ; Zl        ; Line_Separator
gc ; Zp        ; Paragraph_Separator
gc ; Zs        ; Space_Separator

hst; L         ; Leading_Jamo
hst; LV        ; LV_Syllable
hst; LVT       ; LVT_Syllable
hst; NA        ; Not_Applicable
hst; T         ; Trailing_Jamo
hst; V         ; Vowel_Jamo

jg ; n/a       ; AIN
jg ; n/a       ; ALAPH
jg ; n/a       ; ALEF
jg ; n/a       ; BEH
jg ; n/a       ; BETH
jg ; n/a       ; DAL
jg ; n/a       ; DALATH_RISH
jg ; n/a       ; E
jg ; n/a       ; FE
jg ; n/a       ; FEH
jg ; n/a       ; FINAL_SEMKATH
jg ; n/a       ; GAF
jg ; n/a       ; GAMAL
jg ; n/a       ; HAH
jg ; n/a       ; HAMZA_ON_HEH_GOAL
jg ; n/a       ; HE
jg ; n/a       ; HEH
jg ; n/a       ; HEH_GOAL
jg ; n/a       ; HETH
jg ; n/a       ; KAF
jg ; n/a       ; KAPH
jg ; n/a       ; KHAPH
jg ; n/a       ; KNOTTED_HEH
jg ; n/a       ; LAM
jg ; n/a       ; LAMADH
jg ; n/a       ; MEEM
jg ; n/a       ; MIM
jg ; n/a       ; NO_JOINING_GROUP
jg ; n/a       ; NOON
jg ; n/a       ; NUN
jg ; n/a       ; PE
jg ; n/a       ; QAF
jg ; n/a       ; QAPH
jg ; n/a       ; REH
jg ; n/a       ; REVERSED_PE
jg ; n/a       ; SAD
jg ; n/a       ; SADHE
jg ; n/a       ; SEEN
jg ; n/a       ; SEMKATH
jg ; n/a       ; SHIN
jg ; n/a       ; SWASH_KAF
jg ; n/a       ; SYRIAC_WAW
jg ; n/a       ; TAH
jg ; n/a       ; TAW
jg ; n/a       ; TEH_MARBUTA
jg ; n/a       ; TETH
jg ; n/a       ; WAW
jg ; n/a       ; YEH
jg ; n/a       ; YEH_BARREE
jg ; n/a       ; YEH_WITH_TAIL
jg ; n/a       ; YUDH
jg ; n/a       ; YUDH_HE
jg ; n/a       ; ZAIN
jg ; n/a       ; ZHAIN

jt ; C         ; Join_Causing
jt ; D         ; Dual_Joining
jt ; L         ; Left_Joining
jt ; R         ; Right_Joining
jt ; T         ; Transparent
jt ; U         ; Non_Joining

lb ; AI        ; Ambiguous
lb ; AL        ; Alphabetic
lb ; B2        ; Break_Both
lb ; BA        ; Break_After
lb ; BB        ; Break_Before
lb ; BK        ; Mandatory_Break
lb ; CB        ; Contingent_Break
lb ; CL        ; Close_Punctuation
lb ; CM        ; Combining_Mark
lb ; CR        ; Carriage_Return
lb ; EX        ; Exclamation
lb ; GL        ; Glue
lb ; HY        ; Hyphen
lb ; ID        ; Ideographic
lb ; IN        ; Inseperable
lb ; IS        ; Infix_Numeric
lb ; LF        ; Line_Feed
lb ; NL        ; Next_Line
lb ; NS        ; Nonstarter
lb ; NU        ; Numeric
lb ; OP        ; Open_Punctuation
lb ; PO        ; Postfix_Numeric
lb ; PR        ; Prefix_Numeric
lb ; QU        ; Quotation
lb ; SA        ; Complex_Context
lb ; SG        ; Surrogate
lb ; SP        ; Space
lb ; SY        ; Break_Symbols
lb ; WJ        ; Word_Joiner
lb ; XX        ; Unknown
lb ; ZW        ; ZWSpace

nt ; de        ; Decimal
nt ; di        ; Digit
nt ; n/a       ; None
nt ; nu        ; Numeric

qc ; M         ; Maybe
qc ; N         ; No
qc ; Y         ; Yes

sc ; Arab      ; Arabic
sc ; Armn      ; Armenian
sc ; Beng      ; Bengali
sc ; Bopo      ; Bopomofo
sc ; Brai      ; Braille
sc ; Buhd      ; Buhid
sc ; Cans      ; Canadian_Aboriginal
sc ; Cher      ; Cherokee
sc ; Cprt      ; Cypriot
sc ; Cyrl      ; Cyrillic
sc ; Deva      ; Devanagari
sc ; Dsrt      ; Deseret
sc ; Ethi      ; Ethiopic
sc ; Geor      ; Georgian
sc ; Goth      ; Gothic
sc ; Grek      ; Greek
sc ; Gujr      ; Gujarati
sc ; Guru      ; Gurmukhi
sc ; Hang      ; Hangul
sc ; Hani      ; Han
sc ; Hano      ; Hanunoo
sc ; Hebr      ; Hebrew
sc ; Hira      ; Hiragana
sc ; Ital      ; Old_Italic
sc ; Kana      ; Katakana
sc ; Khmr      ; Khmer
sc ; Knda      ; Kannada
sc ; Laoo      ; Lao
sc ; Latn      ; Latin
sc ; Limb      ; Limbu
sc ; Linb      ; Linear_B
sc ; Mlym      ; Malayalam
sc ; Mong      ; Mongolian
sc ; Mymr      ; Myanmar
sc ; Ogam      ; Ogham
sc ; Orya      ; Oriya
sc ; Osma      ; Osmanya
sc ; Qaai      ; Inherited
sc ; Runr      ; Runic
sc ; Shaw      ; Shavian
sc ; Sinh      ; Sinhala
sc ; Syrc      ; Syriac
sc ; Tagb      ; Tagbanwa
sc ; Tale      ; Tai_Le
sc ; Taml      ; Tamil
sc ; Telu      ; Telugu
sc ; Tglg      ; Tagalog
sc ; Thaa      ; Thaana
sc ; Thai      ; Thai
sc ; Tibt      ; Tibetan
sc ; Ugar      ; Ugaritic
sc ; Yiii      ; Yi
sc ; Zyyy      ; Common
Commit	Line	Data
1911be83	1	# PropertyValueAliases-4.0.0.txt
1911be83	2	# Date: 2003-03-12, 23:46:08 GMT [MD]
822ebcc8	3	#
	4	# This file contains aliases for property values used in the UCD.
	5	# These names can be used for XML formats of UCD data, for regular-expression
	6	# property tests, and other programmatic textual descriptions of Unicode data.
1911be83	7	# For information on which properties are normative, see UCD.html.
822ebcc8	8	#
	9	# The names may be translated in appropriate environments, and additional
	10	# aliases may be useful.
	11	#
	12	# FORMAT
	13	#
	14	# Each line describes a property value name.
	15	# This consists of three fields, separated by semicolons.
	16	#
	17	# First Field: The first field describes the property for which that
	18	# property value name is used.
	19	# There is one special pseudo-property: "qc" stands for any quick-check property
	20	#
	21	# Second Field: The second field is an abbreviated name.
	22	# If there is no abbreviated name available, the field is marked with "n/a".
	23	#
	24	# Third Field: The third field is a long name.
	25	#
1911be83	26	# In the case of ccc, there are 4 fields. The second field is numeric, third
822ebcc8	27	# is abbreviated, and fourth is long.
	28	#
	29	# With loose matching of property names, the case distinctions, whitespace,
	30	# and '_' are ignored.
	31	#
822ebcc8	32	# NOTE: Currently there is at most one abbreviated name and one long name for
1911be83	33	# property value. However, in the future additional aliases may be added.
	34	# In such a case, the first line for the property value would have
	35	# the preferred alias for output.
822ebcc8	36	#
822ebcc8	37	# NOTE: The property value names are NOT unique across properties, especially
1911be83	38	# with loose matches. For example:
1911be83	39	#
822ebcc8	40	# AL means Arabic Letter for the Bidi_Class property, and
	41	# AL means Alpha_Left for the Combining_Class property, and
	42	# AL means Alphabetic for the Line_Break property.
	43	#
1911be83	44	# In addition, some property names may be the same as some property value names.
	45	# For example:
	46	#
	47	# cc means Combining_Class property, and
	48	# cc means the General_Category property value Control (cc)
822ebcc8	49	#
822ebcc8	50	# The combination of property value and property name is, however, unique.
1911be83	51	# For more information, see UTR #18: Regular Expression Guidelines
822ebcc8	52	# ================================================
	53
	54
	55	bc ; AL ; Arabic_Letter
	56	bc ; AN ; Arabic_Number
	57	bc ; B ; Paragraph_Separator
	58	bc ; BN ; Boundary_Neutral
	59	bc ; CS ; Common_Separator
	60	bc ; EN ; European_Number
	61	bc ; ES ; European_Separator
	62	bc ; ET ; European_Terminator
	63	bc ; L ; Left_To_Right
	64	bc ; LRE ; Left_To_Right_Embedding
	65	bc ; LRO ; Left_To_Right_Override
	66	bc ; NSM ; Nonspacing_Mark
	67	bc ; ON ; Other_Neutral
	68	bc ; PDF ; Pop_Directional_Format
	69	bc ; R ; Right_To_Left
	70	bc ; RLE ; Right_To_Left_Embedding
	71	bc ; RLO ; Right_To_Left_Override
	72	bc ; S ; Segment_Separator
	73	bc ; WS ; White_Space
	74
1911be83	75	blk; n/a ; Aegean_Numbers
	76	blk; n/a ; Alphabetic_Presentation_Forms
	77	blk; n/a ; Arabic
	78	blk; n/a ; Arabic_Presentation_Forms-A
	79	blk; n/a ; Arabic_Presentation_Forms-B
	80	blk; n/a ; Armenian
	81	blk; n/a ; Arrows
	82	blk; n/a ; Basic_Latin
	83	blk; n/a ; Bengali
	84	blk; n/a ; Block_Elements
	85	blk; n/a ; Bopomofo
	86	blk; n/a ; Bopomofo_Extended
	87	blk; n/a ; Box_Drawing
	88	blk; n/a ; Braille_Patterns
	89	blk; n/a ; Buhid
	90	blk; n/a ; Byzantine_Musical_Symbols
	91	blk; n/a ; Cherokee
	92	blk; n/a ; CJK_Compatibility
	93	blk; n/a ; CJK_Compatibility_Forms
	94	blk; n/a ; CJK_Compatibility_Ideographs
	95	blk; n/a ; CJK_Compatibility_Ideographs_Supplement
	96	blk; n/a ; CJK_Radicals_Supplement
	97	blk; n/a ; CJK_Symbols_and_Punctuation
	98	blk; n/a ; CJK_Unified_Ideographs
	99	blk; n/a ; CJK_Unified_Ideographs_Extension_A
	100	blk; n/a ; CJK_Unified_Ideographs_Extension_B
	101	blk; n/a ; Combining_Diacritical_Marks
	102	blk; n/a ; Combining_Diacritical_Marks_for_Symbols
	103	blk; n/a ; Combining_Half_Marks
	104	blk; n/a ; Control_Pictures
	105	blk; n/a ; Currency_Symbols
	106	blk; n/a ; Cypriot_Syllabary
	107	blk; n/a ; Cyrillic
	108	blk; n/a ; Cyrillic_Supplementary
	109	blk; n/a ; Deseret
	110	blk; n/a ; Devanagari
	111	blk; n/a ; Dingbats
	112	blk; n/a ; Enclosed_Alphanumerics
	113	blk; n/a ; Enclosed_CJK_Letters_and_Months
	114	blk; n/a ; Ethiopic
	115	blk; n/a ; General_Punctuation
	116	blk; n/a ; Geometric_Shapes
	117	blk; n/a ; Georgian
	118	blk; n/a ; Gothic
	119	blk; n/a ; Greek_and_Coptic
	120	blk; n/a ; Greek_Extended
	121	blk; n/a ; Gujarati
	122	blk; n/a ; Gurmukhi
	123	blk; n/a ; Halfwidth_and_Fullwidth_Forms
	124	blk; n/a ; Hangul_Compatibility_Jamo
	125	blk; n/a ; Hangul_Jamo
	126	blk; n/a ; Hangul_Syllables
	127	blk; n/a ; Hanunoo
	128	blk; n/a ; Hebrew
	129	blk; n/a ; High_Private_Use_Surrogates
	130	blk; n/a ; High_Surrogates
	131	blk; n/a ; Hiragana
	132	blk; n/a ; Ideographic_Description_Characters
	133	blk; n/a ; IPA_Extensions
	134	blk; n/a ; Kanbun
	135	blk; n/a ; Kangxi_Radicals
	136	blk; n/a ; Kannada
	137	blk; n/a ; Katakana
	138	blk; n/a ; Katakana_Phonetic_Extensions
139	blk; n/a ; Khmer
140	blk; n/a ; Khmer_Symbols
141	blk; n/a ; Lao
142	blk; n/a ; Latin_Extended_Additional
143	blk; n/a ; Latin_Extended-A
144	blk; n/a ; Latin_Extended-B
145	blk; n/a ; Latin-1_Supplement
146	blk; n/a ; Letterlike_Symbols
147	blk; n/a ; Limbu
148	blk; n/a ; Linear_B_Ideograms
149	blk; n/a ; Linear_B_Syllabary
150	blk; n/a ; Low_Surrogates
151	blk; n/a ; Malayalam
152	blk; n/a ; Mathematical_Alphanumeric_Symbols
153	blk; n/a ; Mathematical_Operators
154	blk; n/a ; Miscellaneous_Mathematical_Symbols-A
155	blk; n/a ; Miscellaneous_Mathematical_Symbols-B
156	blk; n/a ; Miscellaneous_Symbols
157	blk; n/a ; Miscellaneous_Symbols_and_Arrows
158	blk; n/a ; Miscellaneous_Technical
159	blk; n/a ; Mongolian
160	blk; n/a ; Musical_Symbols
161	blk; n/a ; Myanmar
162	blk; n/a ; No_Block
163	blk; n/a ; Number_Forms
164	blk; n/a ; Ogham
165	blk; n/a ; Old_Italic
166	blk; n/a ; Optical_Character_Recognition
167	blk; n/a ; Oriya
168	blk; n/a ; Osmanya
169	blk; n/a ; Phonetic_Extensions
170	blk; n/a ; Private_Use_Area
171	blk; n/a ; Runic
172	blk; n/a ; Shavian
173	blk; n/a ; Sinhala
174	blk; n/a ; Small_Form_Variants
175	blk; n/a ; Spacing_Modifier_Letters
176	blk; n/a ; Specials
177	blk; n/a ; Superscripts_and_Subscripts
178	blk; n/a ; Supplemental_Arrows-A
179	blk; n/a ; Supplemental_Arrows-B
180	blk; n/a ; Supplemental_Mathematical_Operators
181	blk; n/a ; Supplementary_Private_Use_Area-A
182	blk; n/a ; Supplementary_Private_Use_Area-B
183	blk; n/a ; Syriac
184	blk; n/a ; Tagalog
185	blk; n/a ; Tagbanwa
186	blk; n/a ; Tags
187	blk; n/a ; Tai_Le
188	blk; n/a ; Tai_Xuan_Jing_Symbols
189	blk; n/a ; Tamil
190	blk; n/a ; Telugu
191	blk; n/a ; Thaana
192	blk; n/a ; Thai
193	blk; n/a ; Tibetan
194	blk; n/a ; Ugaritic
195	blk; n/a ; Unified_Canadian_Aboriginal_Syllabics
196	blk; n/a ; Variation_Selectors
197	blk; n/a ; Variation_Selectors_Supplement
198	blk; n/a ; Yi_Radicals
199	blk; n/a ; Yi_Syllables
200	blk; n/a ; Yijing_Hexagram_Symbols
201
822ebcc8	202	ccc; 0; NR ; Not_Reordered
822ebcc8	203	ccc; 1; OV ; Overlay
1911be83	204	ccc; 202; ATB ; Attached_Below
822ebcc8	205	ccc; 216; ATAR ; Attached_Above_Right
	206	ccc; 218; BL ; Below_Left
	207	ccc; 220; B ; Below
	208	ccc; 222; BR ; Below_Right
	209	ccc; 224; L ; Left
	210	ccc; 226; R ; Right
	211	ccc; 228; AL ; Above_Left
	212	ccc; 230; A ; Above
	213	ccc; 232; AR ; Above_Right
	214	ccc; 233; DB ; Double_Below
	215	ccc; 234; DA ; Double_Above
	216	ccc; 240; IS ; Iota_Subscript
	217	ccc; 7; NK ; Nukta
	218	ccc; 8; KV ; Kana_Voicing
	219	ccc; 9; VR ; Virama
	220
	221	dt ; can ; canonical
	222	dt ; com ; compat
	223	dt ; enc ; circle
	224	dt ; fin ; final
	225	dt ; font ; font
	226	dt ; fra ; fraction
	227	dt ; init ; initial
	228	dt ; iso ; isolated
	229	dt ; med ; medial
	230	dt ; n/a ; none
	231	dt ; nar ; narrow
	232	dt ; nb ; noBreak
	233	dt ; sml ; small
	234	dt ; sqr ; square
	235	dt ; sub ; sub
	236	dt ; sup ; super
	237	dt ; vert ; vertical
	238	dt ; wide ; wide
	239
	240	ea ; A ; Ambiguous
	241	ea ; F ; Fullwidth
	242	ea ; H ; Halfwidth
	243	ea ; N ; Neutral
	244	ea ; Na ; Narrow
	245	ea ; W ; Wide
	246
	247	gc ; C ; Other # Cc \| Cf \| Cn \| Co \| Cs
	248	gc ; Cc ; Control
	249	gc ; Cf ; Format
	250	gc ; Cn ; Unassigned
	251	gc ; Co ; Private_Use
	252	gc ; Cs ; Surrogate
	253	gc ; L ; Letter # Ll \| Lm \| Lo \| Lt \| Lu
	254	gc ; LC ; Cased_Letter # Ll \| Lt \| Lu
	255	gc ; Ll ; Lowercase_Letter
	256	gc ; Lm ; Modifier_Letter
	257	gc ; Lo ; Other_Letter
	258	gc ; Lt ; Titlecase_Letter
	259	gc ; Lu ; Uppercase_Letter
	260	gc ; M ; Mark # Mc \| Me \| Mn
	261	gc ; Mc ; Spacing_Mark
	262	gc ; Me ; Enclosing_Mark
	263	gc ; Mn ; Nonspacing_Mark
	264	gc ; N ; Number # Nd \| Nl \| No
	265	gc ; Nd ; Decimal_Number
	266	gc ; Nl ; Letter_Number
	267	gc ; No ; Other_Number
	268	gc ; P ; Punctuation # Pc \| Pd \| Pe \| Pf \| Pi \| Po \| Ps
269	gc ; Pc ; Connector_Punctuation
270	gc ; Pd ; Dash_Punctuation
271	gc ; Pe ; Close_Punctuation
272	gc ; Pf ; Final_Punctuation
273	gc ; Pi ; Initial_Punctuation
274	gc ; Po ; Other_Punctuation
275	gc ; Ps ; Open_Punctuation
276	gc ; S ; Symbol # Sc \| Sk \| Sm \| So
277	gc ; Sc ; Currency_Symbol
278	gc ; Sk ; Modifier_Symbol
279	gc ; Sm ; Math_Symbol
280	gc ; So ; Other_Symbol
281	gc ; Z ; Separator # Zl \| Zp \| Zs
282	gc ; Zl ; Line_Separator
283	gc ; Zp ; Paragraph_Separator
284	gc ; Zs ; Space_Separator
285
1911be83	286	hst; L ; Leading_Jamo
	287	hst; LV ; LV_Syllable
	288	hst; LVT ; LVT_Syllable
	289	hst; NA ; Not_Applicable
	290	hst; T ; Trailing_Jamo
	291	hst; V ; Vowel_Jamo
	292
822ebcc8	293	jg ; n/a ; AIN
	294	jg ; n/a ; ALAPH
	295	jg ; n/a ; ALEF
	296	jg ; n/a ; BEH
	297	jg ; n/a ; BETH
	298	jg ; n/a ; DAL
	299	jg ; n/a ; DALATH_RISH
	300	jg ; n/a ; E
1911be83	301	jg ; n/a ; FE
822ebcc8	302	jg ; n/a ; FEH
	303	jg ; n/a ; FINAL_SEMKATH
	304	jg ; n/a ; GAF
	305	jg ; n/a ; GAMAL
	306	jg ; n/a ; HAH
	307	jg ; n/a ; HAMZA_ON_HEH_GOAL
	308	jg ; n/a ; HE
	309	jg ; n/a ; HEH
	310	jg ; n/a ; HEH_GOAL
	311	jg ; n/a ; HETH
	312	jg ; n/a ; KAF
	313	jg ; n/a ; KAPH
1911be83	314	jg ; n/a ; KHAPH
822ebcc8	315	jg ; n/a ; KNOTTED_HEH
	316	jg ; n/a ; LAM
	317	jg ; n/a ; LAMADH
	318	jg ; n/a ; MEEM
	319	jg ; n/a ; MIM
	320	jg ; n/a ; NO_JOINING_GROUP
	321	jg ; n/a ; NOON
	322	jg ; n/a ; NUN
	323	jg ; n/a ; PE
	324	jg ; n/a ; QAF
	325	jg ; n/a ; QAPH
	326	jg ; n/a ; REH
	327	jg ; n/a ; REVERSED_PE
	328	jg ; n/a ; SAD
	329	jg ; n/a ; SADHE
	330	jg ; n/a ; SEEN
	331	jg ; n/a ; SEMKATH
	332	jg ; n/a ; SHIN
	333	jg ; n/a ; SWASH_KAF
	334	jg ; n/a ; SYRIAC_WAW
	335	jg ; n/a ; TAH
	336	jg ; n/a ; TAW
	337	jg ; n/a ; TEH_MARBUTA
	338	jg ; n/a ; TETH
	339	jg ; n/a ; WAW
	340	jg ; n/a ; YEH
	341	jg ; n/a ; YEH_BARREE
	342	jg ; n/a ; YEH_WITH_TAIL
	343	jg ; n/a ; YUDH
	344	jg ; n/a ; YUDH_HE
	345	jg ; n/a ; ZAIN
1911be83	346	jg ; n/a ; ZHAIN
822ebcc8	347
	348	jt ; C ; Join_Causing
	349	jt ; D ; Dual_Joining
	350	jt ; L ; Left_Joining
	351	jt ; R ; Right_Joining
	352	jt ; T ; Transparent
	353	jt ; U ; Non_Joining
	354
	355	lb ; AI ; Ambiguous
	356	lb ; AL ; Alphabetic
	357	lb ; B2 ; Break_Both
	358	lb ; BA ; Break_After
	359	lb ; BB ; Break_Before
	360	lb ; BK ; Mandatory_Break
	361	lb ; CB ; Contingent_Break
	362	lb ; CL ; Close_Punctuation
	363	lb ; CM ; Combining_Mark
	364	lb ; CR ; Carriage_Return
	365	lb ; EX ; Exclamation
	366	lb ; GL ; Glue
	367	lb ; HY ; Hyphen
	368	lb ; ID ; Ideographic
	369	lb ; IN ; Inseperable
	370	lb ; IS ; Infix_Numeric
	371	lb ; LF ; Line_Feed
1911be83	372	lb ; NL ; Next_Line
822ebcc8	373	lb ; NS ; Nonstarter
	374	lb ; NU ; Numeric
	375	lb ; OP ; Open_Punctuation
	376	lb ; PO ; Postfix_Numeric
	377	lb ; PR ; Prefix_Numeric
	378	lb ; QU ; Quotation
	379	lb ; SA ; Complex_Context
	380	lb ; SG ; Surrogate
	381	lb ; SP ; Space
	382	lb ; SY ; Break_Symbols
1911be83	383	lb ; WJ ; Word_Joiner
822ebcc8	384	lb ; XX ; Unknown
	385	lb ; ZW ; ZWSpace
	386
	387	nt ; de ; Decimal
	388	nt ; di ; Digit
	389	nt ; n/a ; None
	390	nt ; nu ; Numeric
	391
	392	qc ; M ; Maybe
	393	qc ; N ; No
	394	qc ; Y ; Yes
	395
	396	sc ; Arab ; Arabic
	397	sc ; Armn ; Armenian
	398	sc ; Beng ; Bengali
	399	sc ; Bopo ; Bopomofo
1911be83	400	sc ; Brai ; Braille
822ebcc8	401	sc ; Buhd ; Buhid
	402	sc ; Cans ; Canadian_Aboriginal
	403	sc ; Cher ; Cherokee
1911be83	404	sc ; Cprt ; Cypriot
822ebcc8	405	sc ; Cyrl ; Cyrillic
	406	sc ; Deva ; Devanagari
	407	sc ; Dsrt ; Deseret
	408	sc ; Ethi ; Ethiopic
	409	sc ; Geor ; Georgian
	410	sc ; Goth ; Gothic
	411	sc ; Grek ; Greek
	412	sc ; Gujr ; Gujarati
	413	sc ; Guru ; Gurmukhi
	414	sc ; Hang ; Hangul
	415	sc ; Hani ; Han
	416	sc ; Hano ; Hanunoo
	417	sc ; Hebr ; Hebrew
	418	sc ; Hira ; Hiragana
	419	sc ; Ital ; Old_Italic
	420	sc ; Kana ; Katakana
	421	sc ; Khmr ; Khmer
	422	sc ; Knda ; Kannada
	423	sc ; Laoo ; Lao
	424	sc ; Latn ; Latin
1911be83	425	sc ; Limb ; Limbu
1911be83	426	sc ; Linb ; Linear_B
822ebcc8	427	sc ; Mlym ; Malayalam
	428	sc ; Mong ; Mongolian
	429	sc ; Mymr ; Myanmar
	430	sc ; Ogam ; Ogham
	431	sc ; Orya ; Oriya
1911be83	432	sc ; Osma ; Osmanya
822ebcc8	433	sc ; Qaai ; Inherited
822ebcc8	434	sc ; Runr ; Runic
1911be83	435	sc ; Shaw ; Shavian
822ebcc8	436	sc ; Sinh ; Sinhala
	437	sc ; Syrc ; Syriac
	438	sc ; Tagb ; Tagbanwa
1911be83	439	sc ; Tale ; Tai_Le
822ebcc8	440	sc ; Taml ; Tamil
	441	sc ; Telu ; Telugu
	442	sc ; Tglg ; Tagalog
	443	sc ; Thaa ; Thaana
	444	sc ; Thai ; Thai
	445	sc ; Tibt ; Tibetan
1911be83	446	sc ; Ugar ; Ugaritic
822ebcc8	447	sc ; Yiii ; Yi
822ebcc8	448	sc ; Zyyy ; Common