1 # CompositionExclusions-4.1.0.txt
\r
2 # Date: 2005-03-17, 15:21:00 PST [KW]
\r
4 # This file lists the characters from the UAX #15 Composition Exclusion Table.
\r
6 # This file is a normative contributory data file in the
\r
7 # Unicode Character Database.
\r
9 # Copyright (c) 1991-2005 Unicode, Inc.
\r
10 # For terms of use, see http://www.unicode.org/terms_of_use.html
\r
12 # For more information, see
\r
13 # http://www.unicode.org/unicode/reports/tr15/#Primary Exclusion List Table
\r
14 # ================================================
\r
16 # (1) Script Specifics
\r
17 # This list of characters cannot be derived from the UnicodeData file.
\r
18 # ================================================
\r
20 0958 # DEVANAGARI LETTER QA
\r
21 0959 # DEVANAGARI LETTER KHHA
\r
22 095A # DEVANAGARI LETTER GHHA
\r
23 095B # DEVANAGARI LETTER ZA
\r
24 095C # DEVANAGARI LETTER DDDHA
\r
25 095D # DEVANAGARI LETTER RHA
\r
26 095E # DEVANAGARI LETTER FA
\r
27 095F # DEVANAGARI LETTER YYA
\r
28 09DC # BENGALI LETTER RRA
\r
29 09DD # BENGALI LETTER RHA
\r
30 09DF # BENGALI LETTER YYA
\r
31 0A33 # GURMUKHI LETTER LLA
\r
32 0A36 # GURMUKHI LETTER SHA
\r
33 0A59 # GURMUKHI LETTER KHHA
\r
34 0A5A # GURMUKHI LETTER GHHA
\r
35 0A5B # GURMUKHI LETTER ZA
\r
36 0A5E # GURMUKHI LETTER FA
\r
37 0B5C # ORIYA LETTER RRA
\r
38 0B5D # ORIYA LETTER RHA
\r
39 0F43 # TIBETAN LETTER GHA
\r
40 0F4D # TIBETAN LETTER DDHA
\r
41 0F52 # TIBETAN LETTER DHA
\r
42 0F57 # TIBETAN LETTER BHA
\r
43 0F5C # TIBETAN LETTER DZHA
\r
44 0F69 # TIBETAN LETTER KSSA
\r
45 0F76 # TIBETAN VOWEL SIGN VOCALIC R
\r
46 0F78 # TIBETAN VOWEL SIGN VOCALIC L
\r
47 0F93 # TIBETAN SUBJOINED LETTER GHA
\r
48 0F9D # TIBETAN SUBJOINED LETTER DDHA
\r
49 0FA2 # TIBETAN SUBJOINED LETTER DHA
\r
50 0FA7 # TIBETAN SUBJOINED LETTER BHA
\r
51 0FAC # TIBETAN SUBJOINED LETTER DZHA
\r
52 0FB9 # TIBETAN SUBJOINED LETTER KSSA
\r
53 FB1D # HEBREW LETTER YOD WITH HIRIQ
\r
54 FB1F # HEBREW LIGATURE YIDDISH YOD YOD PATAH
\r
55 FB2A # HEBREW LETTER SHIN WITH SHIN DOT
\r
56 FB2B # HEBREW LETTER SHIN WITH SIN DOT
\r
57 FB2C # HEBREW LETTER SHIN WITH DAGESH AND SHIN DOT
\r
58 FB2D # HEBREW LETTER SHIN WITH DAGESH AND SIN DOT
\r
59 FB2E # HEBREW LETTER ALEF WITH PATAH
\r
60 FB2F # HEBREW LETTER ALEF WITH QAMATS
\r
61 FB30 # HEBREW LETTER ALEF WITH MAPIQ
\r
62 FB31 # HEBREW LETTER BET WITH DAGESH
\r
63 FB32 # HEBREW LETTER GIMEL WITH DAGESH
\r
64 FB33 # HEBREW LETTER DALET WITH DAGESH
\r
65 FB34 # HEBREW LETTER HE WITH MAPIQ
\r
66 FB35 # HEBREW LETTER VAV WITH DAGESH
\r
67 FB36 # HEBREW LETTER ZAYIN WITH DAGESH
\r
68 FB38 # HEBREW LETTER TET WITH DAGESH
\r
69 FB39 # HEBREW LETTER YOD WITH DAGESH
\r
70 FB3A # HEBREW LETTER FINAL KAF WITH DAGESH
\r
71 FB3B # HEBREW LETTER KAF WITH DAGESH
\r
72 FB3C # HEBREW LETTER LAMED WITH DAGESH
\r
73 FB3E # HEBREW LETTER MEM WITH DAGESH
\r
74 FB40 # HEBREW LETTER NUN WITH DAGESH
\r
75 FB41 # HEBREW LETTER SAMEKH WITH DAGESH
\r
76 FB43 # HEBREW LETTER FINAL PE WITH DAGESH
\r
77 FB44 # HEBREW LETTER PE WITH DAGESH
\r
78 FB46 # HEBREW LETTER TSADI WITH DAGESH
\r
79 FB47 # HEBREW LETTER QOF WITH DAGESH
\r
80 FB48 # HEBREW LETTER RESH WITH DAGESH
\r
81 FB49 # HEBREW LETTER SHIN WITH DAGESH
\r
82 FB4A # HEBREW LETTER TAV WITH DAGESH
\r
83 FB4B # HEBREW LETTER VAV WITH HOLAM
\r
84 FB4C # HEBREW LETTER BET WITH RAFE
\r
85 FB4D # HEBREW LETTER KAF WITH RAFE
\r
86 FB4E # HEBREW LETTER PE WITH RAFE
\r
88 # Total code points: 67
\r
90 # ================================================
\r
91 # (2) Post Composition Version precomposed characters
\r
92 # These characters cannot be derived solely from the UnicodeData.txt file
\r
93 # in this version of Unicode.
\r
94 # ================================================
\r
96 2ADC # FORKING
\r
97 1D15E # MUSICAL SYMBOL HALF NOTE
\r
98 1D15F # MUSICAL SYMBOL QUARTER NOTE
\r
99 1D160 # MUSICAL SYMBOL EIGHTH NOTE
\r
100 1D161 # MUSICAL SYMBOL SIXTEENTH NOTE
\r
101 1D162 # MUSICAL SYMBOL THIRTY-SECOND NOTE
\r
102 1D163 # MUSICAL SYMBOL SIXTY-FOURTH NOTE
\r
103 1D164 # MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE
\r
104 1D1BB # MUSICAL SYMBOL MINIMA
\r
105 1D1BC # MUSICAL SYMBOL MINIMA BLACK
\r
106 1D1BD # MUSICAL SYMBOL SEMIMINIMA WHITE
\r
107 1D1BE # MUSICAL SYMBOL SEMIMINIMA BLACK
\r
108 1D1BF # MUSICAL SYMBOL FUSA WHITE
\r
109 1D1C0 # MUSICAL SYMBOL FUSA BLACK
\r
111 # Total code points: 14
\r
113 # ================================================
\r
114 # (3) Singleton Decompositions
\r
115 # These characters can be derived from the UnicodeData file
\r
116 # by including all characters whose canonical decomposition
\r
117 # consists of a single character.
\r
118 # These characters are simply quoted here for reference.
\r
119 # ================================================
\r
121 # 0340..0341 [2] COMBINING GRAVE TONE MARK..COMBINING ACUTE TONE MARK
\r
122 # 0343 COMBINING GREEK KORONIS
\r
123 # 0374 GREEK NUMERAL SIGN
\r
124 # 037E GREEK QUESTION MARK
\r
125 # 0387 GREEK ANO TELEIA
\r
126 # 1F71 GREEK SMALL LETTER ALPHA WITH OXIA
\r
127 # 1F73 GREEK SMALL LETTER EPSILON WITH OXIA
\r
128 # 1F75 GREEK SMALL LETTER ETA WITH OXIA
\r
129 # 1F77 GREEK SMALL LETTER IOTA WITH OXIA
\r
130 # 1F79 GREEK SMALL LETTER OMICRON WITH OXIA
\r
131 # 1F7B GREEK SMALL LETTER UPSILON WITH OXIA
\r
132 # 1F7D GREEK SMALL LETTER OMEGA WITH OXIA
\r
133 # 1FBB GREEK CAPITAL LETTER ALPHA WITH OXIA
\r
134 # 1FBE GREEK PROSGEGRAMMENI
\r
135 # 1FC9 GREEK CAPITAL LETTER EPSILON WITH OXIA
\r
136 # 1FCB GREEK CAPITAL LETTER ETA WITH OXIA
\r
137 # 1FD3 GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA
\r
138 # 1FDB GREEK CAPITAL LETTER IOTA WITH OXIA
\r
139 # 1FE3 GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA
\r
140 # 1FEB GREEK CAPITAL LETTER UPSILON WITH OXIA
\r
141 # 1FEE..1FEF [2] GREEK DIALYTIKA AND OXIA..GREEK VARIA
\r
142 # 1FF9 GREEK CAPITAL LETTER OMICRON WITH OXIA
\r
143 # 1FFB GREEK CAPITAL LETTER OMEGA WITH OXIA
\r
144 # 1FFD GREEK OXIA
\r
145 # 2000..2001 [2] EN QUAD..EM QUAD
\r
146 # 2126 OHM SIGN
\r
147 # 212A..212B [2] KELVIN SIGN..ANGSTROM SIGN
\r
148 # 2329 LEFT-POINTING ANGLE BRACKET
\r
149 # 232A RIGHT-POINTING ANGLE BRACKET
\r
150 # F900..FA0D [270] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA0D
\r
151 # FA10 CJK COMPATIBILITY IDEOGRAPH-FA10
\r
152 # FA12 CJK COMPATIBILITY IDEOGRAPH-FA12
\r
153 # FA15..FA1E [10] CJK COMPATIBILITY IDEOGRAPH-FA15..CJK COMPATIBILITY IDEOGRAPH-FA1E
\r
154 # FA20 CJK COMPATIBILITY IDEOGRAPH-FA20
\r
155 # FA22 CJK COMPATIBILITY IDEOGRAPH-FA22
\r
156 # FA25..FA26 [2] CJK COMPATIBILITY IDEOGRAPH-FA25..CJK COMPATIBILITY IDEOGRAPH-FA26
\r
157 # FA2A..FA2D [4] CJK COMPATIBILITY IDEOGRAPH-FA2A..CJK COMPATIBILITY IDEOGRAPH-FA2D
\r
158 # FA30..FA6A [59] CJK COMPATIBILITY IDEOGRAPH-FA30..CJK COMPATIBILITY IDEOGRAPH-FA6A
\r
159 # FA70..FAD9 [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COMPATIBILITY IDEOGRAPH-FAD9
\r
160 # 2F800..2FA1D [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
\r
162 # Total code points: 1030
\r
164 # ================================================
\r
165 # (4) Non-Starter Decompositions
\r
166 # These characters can be derived from the UnicodeData file
\r
167 # by including all characters whose canonical decomposition consists
\r
168 # of a sequence of characters, the first of which has a non-zero
\r
169 # combining class.
\r
170 # These characters are simply quoted here for reference.
\r
171 # ================================================
\r
173 # 0344 COMBINING GREEK DIALYTIKA TONOS
\r
174 # 0F73 TIBETAN VOWEL SIGN II
\r
175 # 0F75 TIBETAN VOWEL SIGN UU
\r
176 # 0F81 TIBETAN VOWEL SIGN REVERSED II
\r
178 # Total code points: 4
\r