Commit | Line | Data |
3e2f796a |
1 | # CompositionExclusions-3.txt |
8836d2a5 |
2 | # |
d357d9fe |
3 | # Composition Exclusions |
3e2f796a |
4 | # This file lists the characters from the UAX #15 Composition Exclusion Table. |
d357d9fe |
5 | # |
6 | # For more information, see |
7 | # http://www.unicode.org/unicode/reports/tr15/#Primary_Exclusion_List_Table |
8 | |
9 | # (1) Script Specifics |
10 | # This list of characters cannot be derived from the UnicodeData file. |
11 | |
12 | 0958 # DEVANAGARI LETTER QA |
13 | 0959 # DEVANAGARI LETTER KHHA |
14 | 095A # DEVANAGARI LETTER GHHA |
15 | 095B # DEVANAGARI LETTER ZA |
16 | 095C # DEVANAGARI LETTER DDDHA |
17 | 095D # DEVANAGARI LETTER RHA |
18 | 095E # DEVANAGARI LETTER FA |
19 | 095F # DEVANAGARI LETTER YYA |
20 | 09DC # BENGALI LETTER RRA |
21 | 09DD # BENGALI LETTER RHA |
22 | 09DF # BENGALI LETTER YYA |
23 | 0A33 # GURMUKHI LETTER LLA |
24 | 0A36 # GURMUKHI LETTER SHA |
25 | 0A59 # GURMUKHI LETTER KHHA |
26 | 0A5A # GURMUKHI LETTER GHHA |
27 | 0A5B # GURMUKHI LETTER ZA |
28 | 0A5E # GURMUKHI LETTER FA |
29 | 0B5C # ORIYA LETTER RRA |
30 | 0B5D # ORIYA LETTER RHA |
31 | 0F43 # TIBETAN LETTER GHA |
32 | 0F4D # TIBETAN LETTER DDHA |
33 | 0F52 # TIBETAN LETTER DHA |
34 | 0F57 # TIBETAN LETTER BHA |
35 | 0F5C # TIBETAN LETTER DZHA |
36 | 0F69 # TIBETAN LETTER KSSA |
37 | 0F76 # TIBETAN VOWEL SIGN VOCALIC R |
38 | 0F78 # TIBETAN VOWEL SIGN VOCALIC L |
39 | 0F93 # TIBETAN SUBJOINED LETTER GHA |
40 | 0F9D # TIBETAN SUBJOINED LETTER DDHA |
41 | 0FA2 # TIBETAN SUBJOINED LETTER DHA |
42 | 0FA7 # TIBETAN SUBJOINED LETTER BHA |
43 | 0FAC # TIBETAN SUBJOINED LETTER DZHA |
44 | 0FB9 # TIBETAN SUBJOINED LETTER KSSA |
3e2f796a |
45 | FB1D # HEBREW LETTER YOD WITH HIRIQ |
d357d9fe |
46 | FB1F # HEBREW LIGATURE YIDDISH YOD YOD PATAH |
47 | FB2A # HEBREW LETTER SHIN WITH SHIN DOT |
48 | FB2B # HEBREW LETTER SHIN WITH SIN DOT |
49 | FB2C # HEBREW LETTER SHIN WITH DAGESH AND SHIN DOT |
50 | FB2D # HEBREW LETTER SHIN WITH DAGESH AND SIN DOT |
51 | FB2E # HEBREW LETTER ALEF WITH PATAH |
52 | FB2F # HEBREW LETTER ALEF WITH QAMATS |
53 | FB30 # HEBREW LETTER ALEF WITH MAPIQ |
54 | FB31 # HEBREW LETTER BET WITH DAGESH |
55 | FB32 # HEBREW LETTER GIMEL WITH DAGESH |
56 | FB33 # HEBREW LETTER DALET WITH DAGESH |
57 | FB34 # HEBREW LETTER HE WITH MAPIQ |
58 | FB35 # HEBREW LETTER VAV WITH DAGESH |
59 | FB36 # HEBREW LETTER ZAYIN WITH DAGESH |
60 | FB38 # HEBREW LETTER TET WITH DAGESH |
61 | FB39 # HEBREW LETTER YOD WITH DAGESH |
62 | FB3A # HEBREW LETTER FINAL KAF WITH DAGESH |
63 | FB3B # HEBREW LETTER KAF WITH DAGESH |
64 | FB3C # HEBREW LETTER LAMED WITH DAGESH |
65 | FB3E # HEBREW LETTER MEM WITH DAGESH |
66 | FB40 # HEBREW LETTER NUN WITH DAGESH |
67 | FB41 # HEBREW LETTER SAMEKH WITH DAGESH |
68 | FB43 # HEBREW LETTER FINAL PE WITH DAGESH |
69 | FB44 # HEBREW LETTER PE WITH DAGESH |
70 | FB46 # HEBREW LETTER TSADI WITH DAGESH |
71 | FB47 # HEBREW LETTER QOF WITH DAGESH |
72 | FB48 # HEBREW LETTER RESH WITH DAGESH |
73 | FB49 # HEBREW LETTER SHIN WITH DAGESH |
74 | FB4A # HEBREW LETTER TAV WITH DAGESH |
75 | FB4B # HEBREW LETTER VAV WITH HOLAM |
76 | FB4C # HEBREW LETTER BET WITH RAFE |
77 | FB4D # HEBREW LETTER KAF WITH RAFE |
78 | FB4E # HEBREW LETTER PE WITH RAFE |
79 | |
3e2f796a |
80 | # (2) Post Composition Version precomposed characters |
d357d9fe |
81 | # These characters cannot be derived from the UnicodeData file. |
3e2f796a |
82 | |
83 | 1D15E # MUSICAL SYMBOL HALF NOTE |
84 | 1D15F # MUSICAL SYMBOL QUARTER NOTE |
85 | 1D160 # MUSICAL SYMBOL EIGHTH NOTE |
86 | 1D161 # MUSICAL SYMBOL SIXTEENTH NOTE |
87 | 1D162 # MUSICAL SYMBOL THIRTY-SECOND NOTE |
88 | 1D163 # MUSICAL SYMBOL SIXTY-FOURTH NOTE |
89 | 1D164 # MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE |
90 | 1D1BB # MUSICAL SYMBOL MINIMA |
91 | 1D1BC # MUSICAL SYMBOL MINIMA BLACK |
92 | 1D1BD # MUSICAL SYMBOL SEMIMINIMA WHITE |
93 | 1D1BE # MUSICAL SYMBOL SEMIMINIMA BLACK |
94 | 1D1BF # MUSICAL SYMBOL FUSA WHITE |
95 | 1D1C0 # MUSICAL SYMBOL FUSA BLACK |
d357d9fe |
96 | |
97 | # (3) Singleton Decompositions |
98 | # These characters can be derived from the UnicodeData file |
99 | # by including all characters whose canonical decomposition |
100 | # consists of a single character. |
101 | # These characters are simply quoted here for reference. |
102 | |
103 | # 0340 COMBINING GRAVE TONE MARK |
104 | # 0341 COMBINING ACUTE TONE MARK |
105 | # 0343 COMBINING GREEK KORONIS |
106 | # 0374 GREEK NUMERAL SIGN |
107 | # 037E GREEK QUESTION MARK |
108 | # 0387 GREEK ANO TELEIA |
109 | # 1F71 GREEK SMALL LETTER ALPHA WITH OXIA |
110 | # 1F73 GREEK SMALL LETTER EPSILON WITH OXIA |
111 | # 1F75 GREEK SMALL LETTER ETA WITH OXIA |
112 | # 1F77 GREEK SMALL LETTER IOTA WITH OXIA |
113 | # 1F79 GREEK SMALL LETTER OMICRON WITH OXIA |
114 | # 1F7B GREEK SMALL LETTER UPSILON WITH OXIA |
115 | # 1F7D GREEK SMALL LETTER OMEGA WITH OXIA |
116 | # 1FBB GREEK CAPITAL LETTER ALPHA WITH OXIA |
117 | # 1FBE GREEK PROSGEGRAMMENI |
118 | # 1FC9 GREEK CAPITAL LETTER EPSILON WITH OXIA |
119 | # 1FCB GREEK CAPITAL LETTER ETA WITH OXIA |
120 | # 1FD3 GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA |
121 | # 1FDB GREEK CAPITAL LETTER IOTA WITH OXIA |
122 | # 1FE3 GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA |
123 | # 1FEB GREEK CAPITAL LETTER UPSILON WITH OXIA |
124 | # 1FEE GREEK DIALYTIKA AND OXIA |
125 | # 1FEF GREEK VARIA |
126 | # 1FF9 GREEK CAPITAL LETTER OMICRON WITH OXIA |
127 | # 1FFB GREEK CAPITAL LETTER OMEGA WITH OXIA |
128 | # 1FFD GREEK OXIA |
129 | # 2000 EN QUAD |
130 | # 2001 EM QUAD |
131 | # 2126 OHM SIGN |
132 | # 212A KELVIN SIGN |
133 | # 212B ANGSTROM SIGN |
134 | # 2329 LEFT-POINTING ANGLE BRACKET |
135 | # 232A RIGHT-POINTING ANGLE BRACKET |
136 | # F900 CJK COMPATIBILITY IDEOGRAPH-F900 |
137 | #.. FA0D CJK COMPATIBILITY IDEOGRAPH-FA0D |
138 | # FA10 CJK COMPATIBILITY IDEOGRAPH-FA10 |
139 | # FA12 CJK COMPATIBILITY IDEOGRAPH-FA12 |
140 | # FA15 CJK COMPATIBILITY IDEOGRAPH-FA15 |
141 | #.. FA1E CJK COMPATIBILITY IDEOGRAPH-FA1E |
142 | # FA20 CJK COMPATIBILITY IDEOGRAPH-FA20 |
143 | # FA22 CJK COMPATIBILITY IDEOGRAPH-FA22 |
144 | # FA25 CJK COMPATIBILITY IDEOGRAPH-FA25 |
145 | # FA26 CJK COMPATIBILITY IDEOGRAPH-FA26 |
146 | # FA2A CJK COMPATIBILITY IDEOGRAPH-FA2A |
147 | #.. FA2D CJK COMPATIBILITY IDEOGRAPH-FA2D |
3e2f796a |
148 | # 2F800 CJK COMPATIBILITY IDEOGRAPH-2F800 |
149 | #.. 2FA1D CJK COMPATIBILITY IDEOGRAPH-2FA1D |
d357d9fe |
150 | |
151 | # (4) Non-Starter Decompositions |
152 | # These characters can be derived from the UnicodeData file |
153 | # by including all characters whose canonical decomposition consists |
8836d2a5 |
154 | # of a sequence of characters, the first of which has a non-zero |
155 | # combining class. |
d357d9fe |
156 | # These characters are simply quoted here for reference. |
157 | |
158 | # 0344 COMBINING GREEK DIALYTIKA TONOS |
159 | # 0F73 TIBETAN VOWEL SIGN II |
160 | # 0F75 TIBETAN VOWEL SIGN UU |
161 | # 0F81 TIBETAN VOWEL SIGN REVERSED II |