/[cmucl]/src/i18n/CompositionExclusions.txt
ViewVC logotype

Contents of /src/i18n/CompositionExclusions.txt

Parent Directory Parent Directory | Revision Log Revision Log


Revision 1.1.2.1 - (hide annotations)
Fri May 29 14:37:41 2009 UTC (4 years, 10 months ago) by rtoy
Branch: unicode-utf16-extfmt-branch
CVS Tags: unicode-snapshot-2009-06, unicode-utf16-extfmt-2009-06-11
Changes since 1.1: +197 -0 lines
File MIME type: text/plain
Initial version from Unicode 5.1.0.
1 rtoy 1.1.2.1 # CompositionExclusions-5.1.0.txt
2     # Date: 2008-03-20, 17:45:00 PDT [KW]
3     #
4     # This file lists the characters for the Composition Exclusion Table
5     # defined in UAX #15, Unicode Normalization Forms.
6     #
7     # This file is a normative contributory data file in the
8     # Unicode Character Database.
9     #
10     # Copyright (c) 1991-2008 Unicode, Inc.
11     # For terms of use, see http://www.unicode.org/terms_of_use.html
12     #
13     # For more information, see
14     # http://www.unicode.org/unicode/reports/tr15/#Primary Exclusion List Table
15     #
16     # For a full derivation of composition exclusions, see the derived property
17     # Full_Composition_Exclusion in DerivedNormalizationProps.txt
18     #
19    
20     # ================================================
21     # (1) Script Specifics
22     #
23     # This list of characters cannot be derived from the UnicodeData.txt file.
24     # ================================================
25    
26     0958 # DEVANAGARI LETTER QA
27     0959 # DEVANAGARI LETTER KHHA
28     095A # DEVANAGARI LETTER GHHA
29     095B # DEVANAGARI LETTER ZA
30     095C # DEVANAGARI LETTER DDDHA
31     095D # DEVANAGARI LETTER RHA
32     095E # DEVANAGARI LETTER FA
33     095F # DEVANAGARI LETTER YYA
34     09DC # BENGALI LETTER RRA
35     09DD # BENGALI LETTER RHA
36     09DF # BENGALI LETTER YYA
37     0A33 # GURMUKHI LETTER LLA
38     0A36 # GURMUKHI LETTER SHA
39     0A59 # GURMUKHI LETTER KHHA
40     0A5A # GURMUKHI LETTER GHHA
41     0A5B # GURMUKHI LETTER ZA
42     0A5E # GURMUKHI LETTER FA
43     0B5C # ORIYA LETTER RRA
44     0B5D # ORIYA LETTER RHA
45     0F43 # TIBETAN LETTER GHA
46     0F4D # TIBETAN LETTER DDHA
47     0F52 # TIBETAN LETTER DHA
48     0F57 # TIBETAN LETTER BHA
49     0F5C # TIBETAN LETTER DZHA
50     0F69 # TIBETAN LETTER KSSA
51     0F76 # TIBETAN VOWEL SIGN VOCALIC R
52     0F78 # TIBETAN VOWEL SIGN VOCALIC L
53     0F93 # TIBETAN SUBJOINED LETTER GHA
54     0F9D # TIBETAN SUBJOINED LETTER DDHA
55     0FA2 # TIBETAN SUBJOINED LETTER DHA
56     0FA7 # TIBETAN SUBJOINED LETTER BHA
57     0FAC # TIBETAN SUBJOINED LETTER DZHA
58     0FB9 # TIBETAN SUBJOINED LETTER KSSA
59     FB1D # HEBREW LETTER YOD WITH HIRIQ
60     FB1F # HEBREW LIGATURE YIDDISH YOD YOD PATAH
61     FB2A # HEBREW LETTER SHIN WITH SHIN DOT
62     FB2B # HEBREW LETTER SHIN WITH SIN DOT
63     FB2C # HEBREW LETTER SHIN WITH DAGESH AND SHIN DOT
64     FB2D # HEBREW LETTER SHIN WITH DAGESH AND SIN DOT
65     FB2E # HEBREW LETTER ALEF WITH PATAH
66     FB2F # HEBREW LETTER ALEF WITH QAMATS
67     FB30 # HEBREW LETTER ALEF WITH MAPIQ
68     FB31 # HEBREW LETTER BET WITH DAGESH
69     FB32 # HEBREW LETTER GIMEL WITH DAGESH
70     FB33 # HEBREW LETTER DALET WITH DAGESH
71     FB34 # HEBREW LETTER HE WITH MAPIQ
72     FB35 # HEBREW LETTER VAV WITH DAGESH
73     FB36 # HEBREW LETTER ZAYIN WITH DAGESH
74     FB38 # HEBREW LETTER TET WITH DAGESH
75     FB39 # HEBREW LETTER YOD WITH DAGESH
76     FB3A # HEBREW LETTER FINAL KAF WITH DAGESH
77     FB3B # HEBREW LETTER KAF WITH DAGESH
78     FB3C # HEBREW LETTER LAMED WITH DAGESH
79     FB3E # HEBREW LETTER MEM WITH DAGESH
80     FB40 # HEBREW LETTER NUN WITH DAGESH
81     FB41 # HEBREW LETTER SAMEKH WITH DAGESH
82     FB43 # HEBREW LETTER FINAL PE WITH DAGESH
83     FB44 # HEBREW LETTER PE WITH DAGESH
84     FB46 # HEBREW LETTER TSADI WITH DAGESH
85     FB47 # HEBREW LETTER QOF WITH DAGESH
86     FB48 # HEBREW LETTER RESH WITH DAGESH
87     FB49 # HEBREW LETTER SHIN WITH DAGESH
88     FB4A # HEBREW LETTER TAV WITH DAGESH
89     FB4B # HEBREW LETTER VAV WITH HOLAM
90     FB4C # HEBREW LETTER BET WITH RAFE
91     FB4D # HEBREW LETTER KAF WITH RAFE
92     FB4E # HEBREW LETTER PE WITH RAFE
93    
94     # Total code points: 67
95    
96     # ================================================
97     # (2) Post Composition Version precomposed characters
98     #
99     # These characters cannot be derived solely from the UnicodeData.txt file
100     # in this version of Unicode.
101     #
102     # Note that characters added to the standard after the
103     # Composition Version and which have canonical decomposition mappings
104     # are not automatically added to this list of Post Composition
105     # Version precomposed characters.
106     # ================================================
107    
108     2ADC # FORKING
109     1D15E # MUSICAL SYMBOL HALF NOTE
110     1D15F # MUSICAL SYMBOL QUARTER NOTE
111     1D160 # MUSICAL SYMBOL EIGHTH NOTE
112     1D161 # MUSICAL SYMBOL SIXTEENTH NOTE
113     1D162 # MUSICAL SYMBOL THIRTY-SECOND NOTE
114     1D163 # MUSICAL SYMBOL SIXTY-FOURTH NOTE
115     1D164 # MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE
116     1D1BB # MUSICAL SYMBOL MINIMA
117     1D1BC # MUSICAL SYMBOL MINIMA BLACK
118     1D1BD # MUSICAL SYMBOL SEMIMINIMA WHITE
119     1D1BE # MUSICAL SYMBOL SEMIMINIMA BLACK
120     1D1BF # MUSICAL SYMBOL FUSA WHITE
121     1D1C0 # MUSICAL SYMBOL FUSA BLACK
122    
123     # Total code points: 14
124    
125     # ================================================
126     # (3) Singleton Decompositions
127     #
128     # These characters can be derived from the UnicodeData.txt file
129     # by including all characters whose canonical decomposition
130     # consists of a single character.
131     #
132     # These characters are simply quoted here for reference.
133     # See also Full_Composition_Exclusion in DerivedNormalizationProps.txt
134     # ================================================
135    
136     # 0340..0341 [2] COMBINING GRAVE TONE MARK..COMBINING ACUTE TONE MARK
137     # 0343 COMBINING GREEK KORONIS
138     # 0374 GREEK NUMERAL SIGN
139     # 037E GREEK QUESTION MARK
140     # 0387 GREEK ANO TELEIA
141     # 1F71 GREEK SMALL LETTER ALPHA WITH OXIA
142     # 1F73 GREEK SMALL LETTER EPSILON WITH OXIA
143     # 1F75 GREEK SMALL LETTER ETA WITH OXIA
144     # 1F77 GREEK SMALL LETTER IOTA WITH OXIA
145     # 1F79 GREEK SMALL LETTER OMICRON WITH OXIA
146     # 1F7B GREEK SMALL LETTER UPSILON WITH OXIA
147     # 1F7D GREEK SMALL LETTER OMEGA WITH OXIA
148     # 1FBB GREEK CAPITAL LETTER ALPHA WITH OXIA
149     # 1FBE GREEK PROSGEGRAMMENI
150     # 1FC9 GREEK CAPITAL LETTER EPSILON WITH OXIA
151     # 1FCB GREEK CAPITAL LETTER ETA WITH OXIA
152     # 1FD3 GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA
153     # 1FDB GREEK CAPITAL LETTER IOTA WITH OXIA
154     # 1FE3 GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA
155     # 1FEB GREEK CAPITAL LETTER UPSILON WITH OXIA
156     # 1FEE..1FEF [2] GREEK DIALYTIKA AND OXIA..GREEK VARIA
157     # 1FF9 GREEK CAPITAL LETTER OMICRON WITH OXIA
158     # 1FFB GREEK CAPITAL LETTER OMEGA WITH OXIA
159     # 1FFD GREEK OXIA
160     # 2000..2001 [2] EN QUAD..EM QUAD
161     # 2126 OHM SIGN
162     # 212A..212B [2] KELVIN SIGN..ANGSTROM SIGN
163     # 2329 LEFT-POINTING ANGLE BRACKET
164     # 232A RIGHT-POINTING ANGLE BRACKET
165     # F900..FA0D [270] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA0D
166     # FA10 CJK COMPATIBILITY IDEOGRAPH-FA10
167     # FA12 CJK COMPATIBILITY IDEOGRAPH-FA12
168     # FA15..FA1E [10] CJK COMPATIBILITY IDEOGRAPH-FA15..CJK COMPATIBILITY IDEOGRAPH-FA1E
169     # FA20 CJK COMPATIBILITY IDEOGRAPH-FA20
170     # FA22 CJK COMPATIBILITY IDEOGRAPH-FA22
171     # FA25..FA26 [2] CJK COMPATIBILITY IDEOGRAPH-FA25..CJK COMPATIBILITY IDEOGRAPH-FA26
172     # FA2A..FA2D [4] CJK COMPATIBILITY IDEOGRAPH-FA2A..CJK COMPATIBILITY IDEOGRAPH-FA2D
173     # FA30..FA6A [59] CJK COMPATIBILITY IDEOGRAPH-FA30..CJK COMPATIBILITY IDEOGRAPH-FA6A
174     # FA70..FAD9 [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COMPATIBILITY IDEOGRAPH-FAD9
175     # 2F800..2FA1D [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
176    
177     # Total code points: 1030
178    
179     # ================================================
180     # (4) Non-Starter Decompositions
181     #
182     # These characters can be derived from the UnicodeData file
183     # by including all characters whose canonical decomposition consists
184     # of a sequence of characters, the first of which has a non-zero
185     # combining class.
186     #
187     # These characters are simply quoted here for reference.
188     # See also Full_Composition_Exclusion in DerivedNormalizationProps.txt
189     # ================================================
190    
191     # 0344 COMBINING GREEK DIALYTIKA TONOS
192     # 0F73 TIBETAN VOWEL SIGN II
193     # 0F75 TIBETAN VOWEL SIGN UU
194     # 0F81 TIBETAN VOWEL SIGN REVERSED II
195    
196     # Total code points: 4
197    

  ViewVC Help
Powered by ViewVC 1.1.5