|
1 # CompositionExclusions-5.0.0.txt |
|
2 # Date: 2006-05-23, 12:42:00 PST [KW] |
|
3 # |
|
4 # This file lists the characters for the Composition Exclusion Table |
|
5 # defined in UAX #15, Unicode Normalization Forms. |
|
6 # |
|
7 # This file is a normative contributory data file in the |
|
8 # Unicode Character Database. |
|
9 # |
|
10 # Copyright (c) 1991-2006 Unicode, Inc. |
|
11 # For terms of use, see http://www.unicode.org/terms_of_use.html |
|
12 # |
|
13 # For more information, see |
|
14 # http://www.unicode.org/unicode/reports/tr15/#Primary Exclusion List Table |
|
15 # |
|
16 # For a full derivation of composition exclusions, see the derived property |
|
17 # Full_Composition_Exclusion in DerivedNormalizationProps.txt |
|
18 # |
|
19 |
|
20 # ================================================ |
|
21 # (1) Script Specifics |
|
22 # |
|
23 # This list of characters cannot be derived from the UnicodeData.txt file. |
|
24 # ================================================ |
|
25 |
|
26 0958 # DEVANAGARI LETTER QA |
|
27 0959 # DEVANAGARI LETTER KHHA |
|
28 095A # DEVANAGARI LETTER GHHA |
|
29 095B # DEVANAGARI LETTER ZA |
|
30 095C # DEVANAGARI LETTER DDDHA |
|
31 095D # DEVANAGARI LETTER RHA |
|
32 095E # DEVANAGARI LETTER FA |
|
33 095F # DEVANAGARI LETTER YYA |
|
34 09DC # BENGALI LETTER RRA |
|
35 09DD # BENGALI LETTER RHA |
|
36 09DF # BENGALI LETTER YYA |
|
37 0A33 # GURMUKHI LETTER LLA |
|
38 0A36 # GURMUKHI LETTER SHA |
|
39 0A59 # GURMUKHI LETTER KHHA |
|
40 0A5A # GURMUKHI LETTER GHHA |
|
41 0A5B # GURMUKHI LETTER ZA |
|
42 0A5E # GURMUKHI LETTER FA |
|
43 0B5C # ORIYA LETTER RRA |
|
44 0B5D # ORIYA LETTER RHA |
|
45 0F43 # TIBETAN LETTER GHA |
|
46 0F4D # TIBETAN LETTER DDHA |
|
47 0F52 # TIBETAN LETTER DHA |
|
48 0F57 # TIBETAN LETTER BHA |
|
49 0F5C # TIBETAN LETTER DZHA |
|
50 0F69 # TIBETAN LETTER KSSA |
|
51 0F76 # TIBETAN VOWEL SIGN VOCALIC R |
|
52 0F78 # TIBETAN VOWEL SIGN VOCALIC L |
|
53 0F93 # TIBETAN SUBJOINED LETTER GHA |
|
54 0F9D # TIBETAN SUBJOINED LETTER DDHA |
|
55 0FA2 # TIBETAN SUBJOINED LETTER DHA |
|
56 0FA7 # TIBETAN SUBJOINED LETTER BHA |
|
57 0FAC # TIBETAN SUBJOINED LETTER DZHA |
|
58 0FB9 # TIBETAN SUBJOINED LETTER KSSA |
|
59 FB1D # HEBREW LETTER YOD WITH HIRIQ |
|
60 FB1F # HEBREW LIGATURE YIDDISH YOD YOD PATAH |
|
61 FB2A # HEBREW LETTER SHIN WITH SHIN DOT |
|
62 FB2B # HEBREW LETTER SHIN WITH SIN DOT |
|
63 FB2C # HEBREW LETTER SHIN WITH DAGESH AND SHIN DOT |
|
64 FB2D # HEBREW LETTER SHIN WITH DAGESH AND SIN DOT |
|
65 FB2E # HEBREW LETTER ALEF WITH PATAH |
|
66 FB2F # HEBREW LETTER ALEF WITH QAMATS |
|
67 FB30 # HEBREW LETTER ALEF WITH MAPIQ |
|
68 FB31 # HEBREW LETTER BET WITH DAGESH |
|
69 FB32 # HEBREW LETTER GIMEL WITH DAGESH |
|
70 FB33 # HEBREW LETTER DALET WITH DAGESH |
|
71 FB34 # HEBREW LETTER HE WITH MAPIQ |
|
72 FB35 # HEBREW LETTER VAV WITH DAGESH |
|
73 FB36 # HEBREW LETTER ZAYIN WITH DAGESH |
|
74 FB38 # HEBREW LETTER TET WITH DAGESH |
|
75 FB39 # HEBREW LETTER YOD WITH DAGESH |
|
76 FB3A # HEBREW LETTER FINAL KAF WITH DAGESH |
|
77 FB3B # HEBREW LETTER KAF WITH DAGESH |
|
78 FB3C # HEBREW LETTER LAMED WITH DAGESH |
|
79 FB3E # HEBREW LETTER MEM WITH DAGESH |
|
80 FB40 # HEBREW LETTER NUN WITH DAGESH |
|
81 FB41 # HEBREW LETTER SAMEKH WITH DAGESH |
|
82 FB43 # HEBREW LETTER FINAL PE WITH DAGESH |
|
83 FB44 # HEBREW LETTER PE WITH DAGESH |
|
84 FB46 # HEBREW LETTER TSADI WITH DAGESH |
|
85 FB47 # HEBREW LETTER QOF WITH DAGESH |
|
86 FB48 # HEBREW LETTER RESH WITH DAGESH |
|
87 FB49 # HEBREW LETTER SHIN WITH DAGESH |
|
88 FB4A # HEBREW LETTER TAV WITH DAGESH |
|
89 FB4B # HEBREW LETTER VAV WITH HOLAM |
|
90 FB4C # HEBREW LETTER BET WITH RAFE |
|
91 FB4D # HEBREW LETTER KAF WITH RAFE |
|
92 FB4E # HEBREW LETTER PE WITH RAFE |
|
93 |
|
94 # Total code points: 67 |
|
95 |
|
96 # ================================================ |
|
97 # (2) Post Composition Version precomposed characters |
|
98 # |
|
99 # These characters cannot be derived solely from the UnicodeData.txt file |
|
100 # in this version of Unicode. |
|
101 # |
|
102 # Note that characters added to the standard after the |
|
103 # Composition Version and which have canonical decomposition mappings |
|
104 # are not automatically added to this list of Post Composition |
|
105 # Version precomposed characters. |
|
106 # ================================================ |
|
107 |
|
108 2ADC # FORKING |
|
109 1D15E # MUSICAL SYMBOL HALF NOTE |
|
110 1D15F # MUSICAL SYMBOL QUARTER NOTE |
|
111 1D160 # MUSICAL SYMBOL EIGHTH NOTE |
|
112 1D161 # MUSICAL SYMBOL SIXTEENTH NOTE |
|
113 1D162 # MUSICAL SYMBOL THIRTY-SECOND NOTE |
|
114 1D163 # MUSICAL SYMBOL SIXTY-FOURTH NOTE |
|
115 1D164 # MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE |
|
116 1D1BB # MUSICAL SYMBOL MINIMA |
|
117 1D1BC # MUSICAL SYMBOL MINIMA BLACK |
|
118 1D1BD # MUSICAL SYMBOL SEMIMINIMA WHITE |
|
119 1D1BE # MUSICAL SYMBOL SEMIMINIMA BLACK |
|
120 1D1BF # MUSICAL SYMBOL FUSA WHITE |
|
121 1D1C0 # MUSICAL SYMBOL FUSA BLACK |
|
122 |
|
123 # Total code points: 14 |
|
124 |
|
125 # ================================================ |
|
126 # (3) Singleton Decompositions |
|
127 # |
|
128 # These characters can be derived from the UnicodeData.txt file |
|
129 # by including all characters whose canonical decomposition |
|
130 # consists of a single character. |
|
131 # |
|
132 # These characters are simply quoted here for reference. |
|
133 # See also Full_Composition_Exclusion in DerivedNormalizationProps.txt |
|
134 # ================================================ |
|
135 |
|
136 # 0340..0341 [2] COMBINING GRAVE TONE MARK..COMBINING ACUTE TONE MARK |
|
137 # 0343 COMBINING GREEK KORONIS |
|
138 # 0374 GREEK NUMERAL SIGN |
|
139 # 037E GREEK QUESTION MARK |
|
140 # 0387 GREEK ANO TELEIA |
|
141 # 1F71 GREEK SMALL LETTER ALPHA WITH OXIA |
|
142 # 1F73 GREEK SMALL LETTER EPSILON WITH OXIA |
|
143 # 1F75 GREEK SMALL LETTER ETA WITH OXIA |
|
144 # 1F77 GREEK SMALL LETTER IOTA WITH OXIA |
|
145 # 1F79 GREEK SMALL LETTER OMICRON WITH OXIA |
|
146 # 1F7B GREEK SMALL LETTER UPSILON WITH OXIA |
|
147 # 1F7D GREEK SMALL LETTER OMEGA WITH OXIA |
|
148 # 1FBB GREEK CAPITAL LETTER ALPHA WITH OXIA |
|
149 # 1FBE GREEK PROSGEGRAMMENI |
|
150 # 1FC9 GREEK CAPITAL LETTER EPSILON WITH OXIA |
|
151 # 1FCB GREEK CAPITAL LETTER ETA WITH OXIA |
|
152 # 1FD3 GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA |
|
153 # 1FDB GREEK CAPITAL LETTER IOTA WITH OXIA |
|
154 # 1FE3 GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA |
|
155 # 1FEB GREEK CAPITAL LETTER UPSILON WITH OXIA |
|
156 # 1FEE..1FEF [2] GREEK DIALYTIKA AND OXIA..GREEK VARIA |
|
157 # 1FF9 GREEK CAPITAL LETTER OMICRON WITH OXIA |
|
158 # 1FFB GREEK CAPITAL LETTER OMEGA WITH OXIA |
|
159 # 1FFD GREEK OXIA |
|
160 # 2000..2001 [2] EN QUAD..EM QUAD |
|
161 # 2126 OHM SIGN |
|
162 # 212A..212B [2] KELVIN SIGN..ANGSTROM SIGN |
|
163 # 2329 LEFT-POINTING ANGLE BRACKET |
|
164 # 232A RIGHT-POINTING ANGLE BRACKET |
|
165 # F900..FA0D [270] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA0D |
|
166 # FA10 CJK COMPATIBILITY IDEOGRAPH-FA10 |
|
167 # FA12 CJK COMPATIBILITY IDEOGRAPH-FA12 |
|
168 # FA15..FA1E [10] CJK COMPATIBILITY IDEOGRAPH-FA15..CJK COMPATIBILITY IDEOGRAPH-FA1E |
|
169 # FA20 CJK COMPATIBILITY IDEOGRAPH-FA20 |
|
170 # FA22 CJK COMPATIBILITY IDEOGRAPH-FA22 |
|
171 # FA25..FA26 [2] CJK COMPATIBILITY IDEOGRAPH-FA25..CJK COMPATIBILITY IDEOGRAPH-FA26 |
|
172 # FA2A..FA2D [4] CJK COMPATIBILITY IDEOGRAPH-FA2A..CJK COMPATIBILITY IDEOGRAPH-FA2D |
|
173 # FA30..FA6A [59] CJK COMPATIBILITY IDEOGRAPH-FA30..CJK COMPATIBILITY IDEOGRAPH-FA6A |
|
174 # FA70..FAD9 [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COMPATIBILITY IDEOGRAPH-FAD9 |
|
175 # 2F800..2FA1D [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D |
|
176 |
|
177 # Total code points: 924 |
|
178 |
|
179 # ================================================ |
|
180 # (4) Non-Starter Decompositions |
|
181 # |
|
182 # These characters can be derived from the UnicodeData file |
|
183 # by including all characters whose canonical decomposition consists |
|
184 # of a sequence of characters, the first of which has a non-zero |
|
185 # combining class. |
|
186 # |
|
187 # These characters are simply quoted here for reference. |
|
188 # See also Full_Composition_Exclusion in DerivedNormalizationProps.txt |
|
189 # ================================================ |
|
190 |
|
191 # 0344 COMBINING GREEK DIALYTIKA TONOS |
|
192 # 0F73 TIBETAN VOWEL SIGN II |
|
193 # 0F75 TIBETAN VOWEL SIGN UU |
|
194 # 0F81 TIBETAN VOWEL SIGN REVERSED II |
|
195 |
|
196 # Total code points: 4 |
|
197 |