os/kernelhwsrv/kernel/eka/euser/unicode/perl/CompositionExclusions-5_0_0.txt
author sl
Tue, 10 Jun 2014 14:32:02 +0200
changeset 1 260cb5ec6c19
permissions -rw-r--r--
Update contrib.
sl@0
     1
# CompositionExclusions-5.0.0.txt
sl@0
     2
# Date: 2006-05-23, 12:42:00 PST [KW]
sl@0
     3
#
sl@0
     4
# This file lists the characters for the Composition Exclusion Table
sl@0
     5
# defined in UAX #15, Unicode Normalization Forms.
sl@0
     6
#
sl@0
     7
# This file is a normative contributory data file in the
sl@0
     8
# Unicode Character Database.
sl@0
     9
#
sl@0
    10
# Copyright (c) 1991-2006 Unicode, Inc.
sl@0
    11
# For terms of use, see http://www.unicode.org/terms_of_use.html
sl@0
    12
#
sl@0
    13
# For more information, see
sl@0
    14
# http://www.unicode.org/unicode/reports/tr15/#Primary Exclusion List Table
sl@0
    15
#
sl@0
    16
# For a full derivation of composition exclusions, see the derived property
sl@0
    17
# Full_Composition_Exclusion in DerivedNormalizationProps.txt
sl@0
    18
#
sl@0
    19
sl@0
    20
# ================================================
sl@0
    21
# (1) Script Specifics
sl@0
    22
#
sl@0
    23
# This list of characters cannot be derived from the UnicodeData.txt file.
sl@0
    24
# ================================================
sl@0
    25
sl@0
    26
0958    #  DEVANAGARI LETTER QA
sl@0
    27
0959    #  DEVANAGARI LETTER KHHA
sl@0
    28
095A    #  DEVANAGARI LETTER GHHA
sl@0
    29
095B    #  DEVANAGARI LETTER ZA
sl@0
    30
095C    #  DEVANAGARI LETTER DDDHA
sl@0
    31
095D    #  DEVANAGARI LETTER RHA
sl@0
    32
095E    #  DEVANAGARI LETTER FA
sl@0
    33
095F    #  DEVANAGARI LETTER YYA
sl@0
    34
09DC    #  BENGALI LETTER RRA
sl@0
    35
09DD    #  BENGALI LETTER RHA
sl@0
    36
09DF    #  BENGALI LETTER YYA
sl@0
    37
0A33    #  GURMUKHI LETTER LLA
sl@0
    38
0A36    #  GURMUKHI LETTER SHA
sl@0
    39
0A59    #  GURMUKHI LETTER KHHA
sl@0
    40
0A5A    #  GURMUKHI LETTER GHHA
sl@0
    41
0A5B    #  GURMUKHI LETTER ZA
sl@0
    42
0A5E    #  GURMUKHI LETTER FA
sl@0
    43
0B5C    #  ORIYA LETTER RRA
sl@0
    44
0B5D    #  ORIYA LETTER RHA
sl@0
    45
0F43    #  TIBETAN LETTER GHA
sl@0
    46
0F4D    #  TIBETAN LETTER DDHA
sl@0
    47
0F52    #  TIBETAN LETTER DHA
sl@0
    48
0F57    #  TIBETAN LETTER BHA
sl@0
    49
0F5C    #  TIBETAN LETTER DZHA
sl@0
    50
0F69    #  TIBETAN LETTER KSSA
sl@0
    51
0F76    #  TIBETAN VOWEL SIGN VOCALIC R
sl@0
    52
0F78    #  TIBETAN VOWEL SIGN VOCALIC L
sl@0
    53
0F93    #  TIBETAN SUBJOINED LETTER GHA
sl@0
    54
0F9D    #  TIBETAN SUBJOINED LETTER DDHA
sl@0
    55
0FA2    #  TIBETAN SUBJOINED LETTER DHA
sl@0
    56
0FA7    #  TIBETAN SUBJOINED LETTER BHA
sl@0
    57
0FAC    #  TIBETAN SUBJOINED LETTER DZHA
sl@0
    58
0FB9    #  TIBETAN SUBJOINED LETTER KSSA
sl@0
    59
FB1D    #  HEBREW LETTER YOD WITH HIRIQ
sl@0
    60
FB1F    #  HEBREW LIGATURE YIDDISH YOD YOD PATAH
sl@0
    61
FB2A    #  HEBREW LETTER SHIN WITH SHIN DOT
sl@0
    62
FB2B    #  HEBREW LETTER SHIN WITH SIN DOT
sl@0
    63
FB2C    #  HEBREW LETTER SHIN WITH DAGESH AND SHIN DOT
sl@0
    64
FB2D    #  HEBREW LETTER SHIN WITH DAGESH AND SIN DOT
sl@0
    65
FB2E    #  HEBREW LETTER ALEF WITH PATAH
sl@0
    66
FB2F    #  HEBREW LETTER ALEF WITH QAMATS
sl@0
    67
FB30    #  HEBREW LETTER ALEF WITH MAPIQ
sl@0
    68
FB31    #  HEBREW LETTER BET WITH DAGESH
sl@0
    69
FB32    #  HEBREW LETTER GIMEL WITH DAGESH
sl@0
    70
FB33    #  HEBREW LETTER DALET WITH DAGESH
sl@0
    71
FB34    #  HEBREW LETTER HE WITH MAPIQ
sl@0
    72
FB35    #  HEBREW LETTER VAV WITH DAGESH
sl@0
    73
FB36    #  HEBREW LETTER ZAYIN WITH DAGESH
sl@0
    74
FB38    #  HEBREW LETTER TET WITH DAGESH
sl@0
    75
FB39    #  HEBREW LETTER YOD WITH DAGESH
sl@0
    76
FB3A    #  HEBREW LETTER FINAL KAF WITH DAGESH
sl@0
    77
FB3B    #  HEBREW LETTER KAF WITH DAGESH
sl@0
    78
FB3C    #  HEBREW LETTER LAMED WITH DAGESH
sl@0
    79
FB3E    #  HEBREW LETTER MEM WITH DAGESH
sl@0
    80
FB40    #  HEBREW LETTER NUN WITH DAGESH
sl@0
    81
FB41    #  HEBREW LETTER SAMEKH WITH DAGESH
sl@0
    82
FB43    #  HEBREW LETTER FINAL PE WITH DAGESH
sl@0
    83
FB44    #  HEBREW LETTER PE WITH DAGESH
sl@0
    84
FB46    #  HEBREW LETTER TSADI WITH DAGESH
sl@0
    85
FB47    #  HEBREW LETTER QOF WITH DAGESH
sl@0
    86
FB48    #  HEBREW LETTER RESH WITH DAGESH
sl@0
    87
FB49    #  HEBREW LETTER SHIN WITH DAGESH
sl@0
    88
FB4A    #  HEBREW LETTER TAV WITH DAGESH
sl@0
    89
FB4B    #  HEBREW LETTER VAV WITH HOLAM
sl@0
    90
FB4C    #  HEBREW LETTER BET WITH RAFE
sl@0
    91
FB4D    #  HEBREW LETTER KAF WITH RAFE
sl@0
    92
FB4E    #  HEBREW LETTER PE WITH RAFE
sl@0
    93
sl@0
    94
# Total code points: 67
sl@0
    95
sl@0
    96
# ================================================
sl@0
    97
# (2) Post Composition Version precomposed characters
sl@0
    98
#
sl@0
    99
# These characters cannot be derived solely from the UnicodeData.txt file
sl@0
   100
# in this version of Unicode.
sl@0
   101
#
sl@0
   102
# Note that characters added to the standard after the
sl@0
   103
# Composition Version and which have canonical decomposition mappings
sl@0
   104
# are not automatically added to this list of Post Composition
sl@0
   105
# Version precomposed characters.
sl@0
   106
# ================================================
sl@0
   107
sl@0
   108
2ADC    #  FORKING
sl@0
   109
1D15E   #  MUSICAL SYMBOL HALF NOTE
sl@0
   110
1D15F   #  MUSICAL SYMBOL QUARTER NOTE
sl@0
   111
1D160   #  MUSICAL SYMBOL EIGHTH NOTE
sl@0
   112
1D161   #  MUSICAL SYMBOL SIXTEENTH NOTE
sl@0
   113
1D162   #  MUSICAL SYMBOL THIRTY-SECOND NOTE
sl@0
   114
1D163   #  MUSICAL SYMBOL SIXTY-FOURTH NOTE
sl@0
   115
1D164   #  MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE
sl@0
   116
1D1BB   #  MUSICAL SYMBOL MINIMA
sl@0
   117
1D1BC   #  MUSICAL SYMBOL MINIMA BLACK
sl@0
   118
1D1BD   #  MUSICAL SYMBOL SEMIMINIMA WHITE
sl@0
   119
1D1BE   #  MUSICAL SYMBOL SEMIMINIMA BLACK
sl@0
   120
1D1BF   #  MUSICAL SYMBOL FUSA WHITE
sl@0
   121
1D1C0   #  MUSICAL SYMBOL FUSA BLACK
sl@0
   122
sl@0
   123
# Total code points: 14
sl@0
   124
sl@0
   125
# ================================================
sl@0
   126
# (3) Singleton Decompositions
sl@0
   127
#
sl@0
   128
# These characters can be derived from the UnicodeData.txt file
sl@0
   129
# by including all characters whose canonical decomposition
sl@0
   130
# consists of a single character.
sl@0
   131
#
sl@0
   132
# These characters are simply quoted here for reference.
sl@0
   133
# See also Full_Composition_Exclusion in DerivedNormalizationProps.txt
sl@0
   134
# ================================================
sl@0
   135
sl@0
   136
# 0340..0341       [2] COMBINING GRAVE TONE MARK..COMBINING ACUTE TONE MARK
sl@0
   137
# 0343                 COMBINING GREEK KORONIS
sl@0
   138
# 0374                 GREEK NUMERAL SIGN
sl@0
   139
# 037E                 GREEK QUESTION MARK
sl@0
   140
# 0387                 GREEK ANO TELEIA
sl@0
   141
# 1F71                 GREEK SMALL LETTER ALPHA WITH OXIA
sl@0
   142
# 1F73                 GREEK SMALL LETTER EPSILON WITH OXIA
sl@0
   143
# 1F75                 GREEK SMALL LETTER ETA WITH OXIA
sl@0
   144
# 1F77                 GREEK SMALL LETTER IOTA WITH OXIA
sl@0
   145
# 1F79                 GREEK SMALL LETTER OMICRON WITH OXIA
sl@0
   146
# 1F7B                 GREEK SMALL LETTER UPSILON WITH OXIA
sl@0
   147
# 1F7D                 GREEK SMALL LETTER OMEGA WITH OXIA
sl@0
   148
# 1FBB                 GREEK CAPITAL LETTER ALPHA WITH OXIA
sl@0
   149
# 1FBE                 GREEK PROSGEGRAMMENI
sl@0
   150
# 1FC9                 GREEK CAPITAL LETTER EPSILON WITH OXIA
sl@0
   151
# 1FCB                 GREEK CAPITAL LETTER ETA WITH OXIA
sl@0
   152
# 1FD3                 GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA
sl@0
   153
# 1FDB                 GREEK CAPITAL LETTER IOTA WITH OXIA
sl@0
   154
# 1FE3                 GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA
sl@0
   155
# 1FEB                 GREEK CAPITAL LETTER UPSILON WITH OXIA
sl@0
   156
# 1FEE..1FEF       [2] GREEK DIALYTIKA AND OXIA..GREEK VARIA
sl@0
   157
# 1FF9                 GREEK CAPITAL LETTER OMICRON WITH OXIA
sl@0
   158
# 1FFB                 GREEK CAPITAL LETTER OMEGA WITH OXIA
sl@0
   159
# 1FFD                 GREEK OXIA
sl@0
   160
# 2000..2001       [2] EN QUAD..EM QUAD
sl@0
   161
# 2126                 OHM SIGN
sl@0
   162
# 212A..212B       [2] KELVIN SIGN..ANGSTROM SIGN
sl@0
   163
# 2329                 LEFT-POINTING ANGLE BRACKET
sl@0
   164
# 232A                 RIGHT-POINTING ANGLE BRACKET
sl@0
   165
# F900..FA0D     [270] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA0D
sl@0
   166
# FA10                 CJK COMPATIBILITY IDEOGRAPH-FA10
sl@0
   167
# FA12                 CJK COMPATIBILITY IDEOGRAPH-FA12
sl@0
   168
# FA15..FA1E      [10] CJK COMPATIBILITY IDEOGRAPH-FA15..CJK COMPATIBILITY IDEOGRAPH-FA1E
sl@0
   169
# FA20                 CJK COMPATIBILITY IDEOGRAPH-FA20
sl@0
   170
# FA22                 CJK COMPATIBILITY IDEOGRAPH-FA22
sl@0
   171
# FA25..FA26       [2] CJK COMPATIBILITY IDEOGRAPH-FA25..CJK COMPATIBILITY IDEOGRAPH-FA26
sl@0
   172
# FA2A..FA2D       [4] CJK COMPATIBILITY IDEOGRAPH-FA2A..CJK COMPATIBILITY IDEOGRAPH-FA2D
sl@0
   173
# FA30..FA6A      [59] CJK COMPATIBILITY IDEOGRAPH-FA30..CJK COMPATIBILITY IDEOGRAPH-FA6A
sl@0
   174
# FA70..FAD9     [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COMPATIBILITY IDEOGRAPH-FAD9
sl@0
   175
# 2F800..2FA1D   [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
sl@0
   176
sl@0
   177
# Total code points: 1030
sl@0
   178
sl@0
   179
# ================================================
sl@0
   180
# (4) Non-Starter Decompositions
sl@0
   181
#
sl@0
   182
# These characters can be derived from the UnicodeData.txt file
sl@0
   183
# by including all characters whose canonical decomposition consists
sl@0
   184
# of a sequence of characters, the first of which has a non-zero
sl@0
   185
# combining class.
sl@0
   186
#
sl@0
   187
# These characters are simply quoted here for reference.
sl@0
   188
# See also Full_Composition_Exclusion in DerivedNormalizationProps.txt
sl@0
   189
# ================================================
sl@0
   190
sl@0
   191
# 0344                 COMBINING GREEK DIALYTIKA TONOS
sl@0
   192
# 0F73                 TIBETAN VOWEL SIGN II
sl@0
   193
# 0F75                 TIBETAN VOWEL SIGN UU
sl@0
   194
# 0F81                 TIBETAN VOWEL SIGN REVERSED II
sl@0
   195
sl@0
   196
# Total code points: 4
sl@0
   197