1 # CompositionExclusions-4.0.0.txt
2 # Date: 2003-02-14,16:49:03 GMT [MD]
4 # This file lists the characters from the UAX #15 Composition Exclusion Table.
6 # For more information, see
7 # http://www.unicode.org/unicode/reports/tr15/#Primary Exclusion List Table
8 # ================================================
10 # (1) Script Specifics
11 # This list of characters cannot be derived from the UnicodeData file.
12 # ================================================
14 0958 # DEVANAGARI LETTER QA
15 0959 # DEVANAGARI LETTER KHHA
16 095A # DEVANAGARI LETTER GHHA
17 095B # DEVANAGARI LETTER ZA
18 095C # DEVANAGARI LETTER DDDHA
19 095D # DEVANAGARI LETTER RHA
20 095E # DEVANAGARI LETTER FA
21 095F # DEVANAGARI LETTER YYA
22 09DC # BENGALI LETTER RRA
23 09DD # BENGALI LETTER RHA
24 09DF # BENGALI LETTER YYA
25 0A33 # GURMUKHI LETTER LLA
26 0A36 # GURMUKHI LETTER SHA
27 0A59 # GURMUKHI LETTER KHHA
28 0A5A # GURMUKHI LETTER GHHA
29 0A5B # GURMUKHI LETTER ZA
30 0A5E # GURMUKHI LETTER FA
31 0B5C # ORIYA LETTER RRA
32 0B5D # ORIYA LETTER RHA
33 0F43 # TIBETAN LETTER GHA
34 0F4D # TIBETAN LETTER DDHA
35 0F52 # TIBETAN LETTER DHA
36 0F57 # TIBETAN LETTER BHA
37 0F5C # TIBETAN LETTER DZHA
38 0F69 # TIBETAN LETTER KSSA
39 0F76 # TIBETAN VOWEL SIGN VOCALIC R
40 0F78 # TIBETAN VOWEL SIGN VOCALIC L
41 0F93 # TIBETAN SUBJOINED LETTER GHA
42 0F9D # TIBETAN SUBJOINED LETTER DDHA
43 0FA2 # TIBETAN SUBJOINED LETTER DHA
44 0FA7 # TIBETAN SUBJOINED LETTER BHA
45 0FAC # TIBETAN SUBJOINED LETTER DZHA
46 0FB9 # TIBETAN SUBJOINED LETTER KSSA
47 FB1D # HEBREW LETTER YOD WITH HIRIQ
48 FB1F # HEBREW LIGATURE YIDDISH YOD YOD PATAH
49 FB2A # HEBREW LETTER SHIN WITH SHIN DOT
50 FB2B # HEBREW LETTER SHIN WITH SIN DOT
51 FB2C # HEBREW LETTER SHIN WITH DAGESH AND SHIN DOT
52 FB2D # HEBREW LETTER SHIN WITH DAGESH AND SIN DOT
53 FB2E # HEBREW LETTER ALEF WITH PATAH
54 FB2F # HEBREW LETTER ALEF WITH QAMATS
55 FB30 # HEBREW LETTER ALEF WITH MAPIQ
56 FB31 # HEBREW LETTER BET WITH DAGESH
57 FB32 # HEBREW LETTER GIMEL WITH DAGESH
58 FB33 # HEBREW LETTER DALET WITH DAGESH
59 FB34 # HEBREW LETTER HE WITH MAPIQ
60 FB35 # HEBREW LETTER VAV WITH DAGESH
61 FB36 # HEBREW LETTER ZAYIN WITH DAGESH
62 FB38 # HEBREW LETTER TET WITH DAGESH
63 FB39 # HEBREW LETTER YOD WITH DAGESH
64 FB3A # HEBREW LETTER FINAL KAF WITH DAGESH
65 FB3B # HEBREW LETTER KAF WITH DAGESH
66 FB3C # HEBREW LETTER LAMED WITH DAGESH
67 FB3E # HEBREW LETTER MEM WITH DAGESH
68 FB40 # HEBREW LETTER NUN WITH DAGESH
69 FB41 # HEBREW LETTER SAMEKH WITH DAGESH
70 FB43 # HEBREW LETTER FINAL PE WITH DAGESH
71 FB44 # HEBREW LETTER PE WITH DAGESH
72 FB46 # HEBREW LETTER TSADI WITH DAGESH
73 FB47 # HEBREW LETTER QOF WITH DAGESH
74 FB48 # HEBREW LETTER RESH WITH DAGESH
75 FB49 # HEBREW LETTER SHIN WITH DAGESH
76 FB4A # HEBREW LETTER TAV WITH DAGESH
77 FB4B # HEBREW LETTER VAV WITH HOLAM
78 FB4C # HEBREW LETTER BET WITH RAFE
79 FB4D # HEBREW LETTER KAF WITH RAFE
80 FB4E # HEBREW LETTER PE WITH RAFE
82 # Total code points: 67
84 # ================================================
85 # (2) Post Composition Version precomposed characters
86 # These characters cannot be derived solely from the UnicodeData.txt file
87 # in this version of Unicode.
88 # ================================================
90 2ADC # FORKING
91 1D15E # MUSICAL SYMBOL HALF NOTE
92 1D15F # MUSICAL SYMBOL QUARTER NOTE
93 1D160 # MUSICAL SYMBOL EIGHTH NOTE
94 1D161 # MUSICAL SYMBOL SIXTEENTH NOTE
95 1D162 # MUSICAL SYMBOL THIRTY-SECOND NOTE
96 1D163 # MUSICAL SYMBOL SIXTY-FOURTH NOTE
97 1D164 # MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE
98 1D1BB # MUSICAL SYMBOL MINIMA
99 1D1BC # MUSICAL SYMBOL MINIMA BLACK
100 1D1BD # MUSICAL SYMBOL SEMIMINIMA WHITE
101 1D1BE # MUSICAL SYMBOL SEMIMINIMA BLACK
102 1D1BF # MUSICAL SYMBOL FUSA WHITE
103 1D1C0 # MUSICAL SYMBOL FUSA BLACK
105 # Total code points: 14
107 # ================================================
108 # (3) Singleton Decompositions
109 # These characters can be derived from the UnicodeData file
110 # by including all characters whose canonical decomposition
111 # consists of a single character.
112 # These characters are simply quoted here for reference.
113 # ================================================
115 # 0340..0341 [2] COMBINING GRAVE TONE MARK..COMBINING ACUTE TONE MARK
116 # 0343 COMBINING GREEK KORONIS
117 # 0374 GREEK NUMERAL SIGN
118 # 037E GREEK QUESTION MARK
119 # 0387 GREEK ANO TELEIA
120 # 1F71 GREEK SMALL LETTER ALPHA WITH OXIA
121 # 1F73 GREEK SMALL LETTER EPSILON WITH OXIA
122 # 1F75 GREEK SMALL LETTER ETA WITH OXIA
123 # 1F77 GREEK SMALL LETTER IOTA WITH OXIA
124 # 1F79 GREEK SMALL LETTER OMICRON WITH OXIA
125 # 1F7B GREEK SMALL LETTER UPSILON WITH OXIA
126 # 1F7D GREEK SMALL LETTER OMEGA WITH OXIA
127 # 1FBB GREEK CAPITAL LETTER ALPHA WITH OXIA
128 # 1FBE GREEK PROSGEGRAMMENI
129 # 1FC9 GREEK CAPITAL LETTER EPSILON WITH OXIA
130 # 1FCB GREEK CAPITAL LETTER ETA WITH OXIA
131 # 1FD3 GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA
132 # 1FDB GREEK CAPITAL LETTER IOTA WITH OXIA
133 # 1FE3 GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA
134 # 1FEB GREEK CAPITAL LETTER UPSILON WITH OXIA
135 # 1FEE..1FEF [2] GREEK DIALYTIKA AND OXIA..GREEK VARIA
136 # 1FF9 GREEK CAPITAL LETTER OMICRON WITH OXIA
137 # 1FFB GREEK CAPITAL LETTER OMEGA WITH OXIA
138 # 1FFD GREEK OXIA
139 # 2000..2001 [2] EN QUAD..EM QUAD
140 # 2126 OHM SIGN
141 # 212A..212B [2] KELVIN SIGN..ANGSTROM SIGN
142 # 2329 LEFT-POINTING ANGLE BRACKET
143 # 232A RIGHT-POINTING ANGLE BRACKET
144 # F900..FA0D [270] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA0D
145 # FA10 CJK COMPATIBILITY IDEOGRAPH-FA10
146 # FA12 CJK COMPATIBILITY IDEOGRAPH-FA12
147 # FA15..FA1E [10] CJK COMPATIBILITY IDEOGRAPH-FA15..CJK COMPATIBILITY IDEOGRAPH-FA1E
148 # FA20 CJK COMPATIBILITY IDEOGRAPH-FA20
149 # FA22 CJK COMPATIBILITY IDEOGRAPH-FA22
150 # FA25..FA26 [2] CJK COMPATIBILITY IDEOGRAPH-FA25..CJK COMPATIBILITY IDEOGRAPH-FA26
151 # FA2A..FA2D [4] CJK COMPATIBILITY IDEOGRAPH-FA2A..CJK COMPATIBILITY IDEOGRAPH-FA2D
152 # FA30..FA6A [59] CJK COMPATIBILITY IDEOGRAPH-FA30..CJK COMPATIBILITY IDEOGRAPH-FA6A
153 # 2F800..2FA1D [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
155 # Total code points: 924
157 # ================================================
158 # (4) Non-Starter Decompositions
159 # These characters can be derived from the UnicodeData file
160 # by including all characters whose canonical decomposition consists
161 # of a sequence of characters, the first of which has a non-zero
162 # combining class.
163 # These characters are simply quoted here for reference.
164 # ================================================
166 # 0344 COMBINING GREEK DIALYTIKA TONOS
167 # 0F73 TIBETAN VOWEL SIGN II
168 # 0F75 TIBETAN VOWEL SIGN UU
169 # 0F81 TIBETAN VOWEL SIGN REVERSED II
171 # Total code points: 4