os/textandloc/textandlocutils/sortutil/src/SortUtilJapan.cpp
author sl
Tue, 10 Jun 2014 14:32:02 +0200
changeset 1 260cb5ec6c19
permissions -rw-r--r--
Update contrib.
     1 /*
     2 * Copyright (c) 2002-2004 Nokia Corporation and/or its subsidiary(-ies). 
     3 * All rights reserved.
     4 * This component and the accompanying materials are made available
     5 * under the terms of the License "Eclipse Public License v1.0"
     6 * which accompanies this distribution, and is available
     7 * at the URL "http://www.eclipse.org/legal/epl-v10.html".
     8 *
     9 * Initial Contributors:
    10 * Nokia Corporation - initial contribution.
    11 *
    12 * Contributors:
    13 *
    14 * Description:     
    15 *
    16 */
    17 
    18 
    19 
    20 
    21 
    22 
    23 // INCLUDE FILES
    24 #include "SortUtilJapan.h"
    25 #include "SortUtilImpl.h"
    26 #include "SortUtilImplExport.h"
    27 #include <jplangutil.h>
    28 
    29 // Unnamed namespace for local definitions
    30 namespace
    31     {
    32 
    33     /**
    34      * Character classes for Japanese sorting, in sorting order.
    35      */
    36     enum TJapaneseCharClass
    37         {
    38         ECharClassKana,
    39         ECharClassLatin,
    40         ECharClassDigit,
    41         ECharClassKanji,
    42         ECharClassSpecial
    43         };
    44 
    45     /**
    46      * Returns the Japanese character class of aChar.
    47      */
    48     TJapaneseCharClass CharClass(TUint aChar)
    49         {
    50         const TChar ch(aChar);
    51         // Special characters
    52         if (ch.IsSpace() || ch.IsPunctuation() || ch.IsControl()
    53             || aChar >= 0xF0000 && aChar <= 0xFFFD)
    54             {
    55             return ECharClassSpecial;
    56             }
    57         // Digit
    58         else if (aChar >= '0' && aChar <= '9' ||
    59             aChar >= 0xFF10 && aChar <= 0xFF19)
    60             {
    61             return ECharClassDigit;
    62             }
    63         // Latin
    64         else if (aChar >= 'A' && aChar <= 'Z' ||
    65             aChar >= 'a' && aChar <= 'z' ||
    66             aChar >= 0x00C0 && aChar <= 0x1EF3 && aChar != 0x00D7 && aChar != 0x00F7 ||
    67             aChar >= 0xFF21 && aChar <= 0xFF3A ||
    68             aChar >= 0xFF41 && aChar <= 0xFF5A)
    69             {
    70             return ECharClassLatin;
    71             }
    72         // Kana
    73         else if (JPLangUtil::IsKatakana(static_cast<TText>(aChar)) ||
    74             JPLangUtil::IsHiragana(static_cast<TText>(aChar)))
    75             {
    76             return ECharClassKana;
    77             }
    78         // Kanji
    79         else if (JPLangUtil::IsKanji(static_cast<TText>(aChar)))
    80             {
    81             return ECharClassKanji;
    82             }
    83         // All other charcters are "special"
    84         else
    85             {
    86             return ECharClassSpecial;
    87             }
    88         }
    89 
    90     /**
    91      * Compares two characters with Japanese comparison rules.
    92      */
    93     TInt JapaneseCompareC(TUint aLhs, TUint aRhs)
    94         {
    95         // First compare character classes
    96         const TInt lhsCls = CharClass(aLhs);
    97         const TInt rhsCls = CharClass(aRhs);
    98         return lhsCls - rhsCls;
    99         }
   100 
   101     /**
   102      * Compares two strings with Japanese comparison rules.
   103      */
   104     TInt JapaneseCompareS(const TDesC& aLhs, const TDesC& aRhs)
   105         {
   106         TInt result = 0;
   107 
   108         const TInt minLen = Min(aLhs.Length(), aRhs.Length());
   109         TInt i;
   110         TInt prevCompPos(0);
   111         for (i = 0; i < minLen && result == 0; ++i)
   112             {
   113             result = JapaneseCompareC(aLhs[i], aRhs[i]);
   114             if (result == 0)
   115                 {
   116                 TInt orgClass = CharClass(aLhs[i]);
   117                 TPtrC lPart;
   118                 TPtrC rPart;
   119                 if (orgClass == ECharClassKana)
   120                     {
   121                     int j = i;
   122                     for (; j < aLhs.Length(); ++j)
   123                         {
   124                         if (orgClass != CharClass(aLhs[j]))
   125                             {
   126                             break;
   127                             }
   128                         }
   129                     lPart.Set(aLhs.Mid(prevCompPos, j - prevCompPos));
   130                     for (j = i; j < aRhs.Length(); ++j)
   131                         {
   132                         if (orgClass != CharClass(aRhs[j]))
   133                             {
   134                             break;
   135                             }
   136                         }
   137                     rPart.Set(aRhs.Mid(prevCompPos, j - prevCompPos));
   138                     result = lPart.CompareC(rPart);
   139                     if (result != 0)
   140                         {
   141                         const TInt minKanaLen = Min(lPart.Length(), rPart.Length());
   142                         TPtrC lKanaPart(lPart.Left(minKanaLen));
   143                         TPtrC rKanaPart(rPart.Left(minKanaLen));
   144                         TInt resultKana = lKanaPart.MatchC(rKanaPart);
   145                         if (resultKana == 0)
   146                             {
   147                             TInt maxKanaLen = i+minKanaLen;
   148                             if (i+minKanaLen+1 >= minLen)
   149                                 {
   150                                 if (maxKanaLen < aLhs.Length()
   151                                  || maxKanaLen < aRhs.Length())
   152                                     {
   153                                     result = 0;
   154                                     i += (minKanaLen-1);
   155                                     }
   156                                 else
   157                                     {
   158                                     result = lKanaPart.CompareC(rKanaPart);;
   159                                     }
   160                                 }
   161                             else
   162                                 {
   163                                 result = 0;
   164                                 i += (minKanaLen-1);
   165                                 }
   166                             }
   167                         }
   168 
   169                     }
   170                 else
   171                     {
   172                     lPart.Set(aLhs.Mid(i, 1));
   173                     rPart.Set(aRhs.Mid(i, 1));
   174                     result = lPart.CompareC(rPart);
   175                     }
   176                 }
   177             else
   178                 {
   179                 prevCompPos = i;
   180                 }
   181             }
   182         if (result == 0)
   183             {
   184             if (i < aLhs.Length())
   185                 {
   186                 // aLhs is longer than aRhs
   187                 result += User::Collate(aLhs[i]);
   188                 }
   189             if (i < aRhs.Length())
   190                 {
   191                 // aRhs is longer that aLhs
   192                 result -= User::Collate(aRhs[i]);
   193                 }
   194             }
   195         return result;
   196         }
   197     }  // namespace
   198 
   199 // Only export in DLL
   200 EXPORT_C MSortUtil* SortUtilFactoryFunctionL()
   201     {
   202     MSortUtil* util = new (ELeave) TSortUtilJapan;
   203     return util;
   204     }
   205 
   206 inline TSortUtilJapan::TSortUtilJapan()
   207     {
   208     }
   209 
   210 TSortUtilJapan::~TSortUtilJapan()
   211     {
   212     }
   213 
   214 TInt TSortUtilJapan::CompareItems
   215         (const MSortKeyArray& aLhs,
   216         const MSortKeyArray& aRhs) const
   217     {
   218     TInt result(0);
   219     TInt lhsIndex(0);
   220     TInt rhsIndex(0);
   221 
   222     // Compare only pronounciation keys in the first pass
   223     do
   224         {
   225         const TDesC& lhsText =
   226             SortUtilImpl::FindNextNonEmptyKey(aLhs, ESortKeyPronounciation, lhsIndex);
   227         const TDesC& rhsText =
   228             SortUtilImpl::FindNextNonEmptyKey(aRhs, ESortKeyPronounciation, rhsIndex);
   229         if (lhsText.Length() > 0)
   230             {
   231             // lhs has pronounciation key
   232             if (rhsText.Length() > 0)
   233                 {
   234                 // Both lhs and rhs have pronounciation key: compare the key texts
   235                 result = JapaneseCompareS(lhsText, rhsText);
   236                 }
   237             else
   238                 {
   239                 // Only lhs has pronounciation key
   240                 result = -1;
   241                 }
   242             }
   243         else
   244             {
   245             // lhs does not have pronounciation key
   246             if (rhsText.Length() > 0)
   247                 {
   248                 // Only rhs has pronounciation key
   249                 result = 1;
   250                 }
   251             }
   252 
   253         if (result != 0)
   254             {
   255             return result;
   256             }
   257         }
   258     while (lhsIndex <= aLhs.SortKeyCount() && rhsIndex < aRhs.SortKeyCount());
   259 
   260     // No difference found with pronounciation keys: compare basic keys
   261     lhsIndex = 0;
   262     rhsIndex = 0;
   263     do
   264         {
   265         const TDesC& lhsText =
   266             SortUtilImpl::FindNextNonEmptyKey(aLhs, ESortKeyBasic, lhsIndex);
   267         const TDesC& rhsText =
   268             SortUtilImpl::FindNextNonEmptyKey(aRhs, ESortKeyBasic, rhsIndex);
   269         result = JapaneseCompareS(lhsText, rhsText);
   270         if (result != 0)
   271             {
   272             return result;
   273             }
   274         }
   275     while (lhsIndex <= aLhs.SortKeyCount() && rhsIndex < aRhs.SortKeyCount());
   276 
   277     return result;
   278     }
   279 
   280 // End of file