os/textandloc/textandlocutils/jplangutil/src/jplangutil.cpp
author sl
Tue, 10 Jun 2014 14:32:02 +0200
changeset 1 260cb5ec6c19
permissions -rw-r--r--
Update contrib.
sl@0
     1
/*
sl@0
     2
* Copyright (c) 2002 Nokia Corporation and/or its subsidiary(-ies).
sl@0
     3
* All rights reserved.
sl@0
     4
* This component and the accompanying materials are made available
sl@0
     5
* under the terms of the License "Eclipse Public License v1.0"
sl@0
     6
* which accompanies this distribution, and is available
sl@0
     7
* at the URL "http://www.eclipse.org/legal/epl-v10.html".
sl@0
     8
*
sl@0
     9
* Initial Contributors:
sl@0
    10
* Nokia Corporation - initial contribution.
sl@0
    11
*
sl@0
    12
* Contributors:
sl@0
    13
*
sl@0
    14
* Description: 
sl@0
    15
*     A utility for providing Japanese Language-specific (UNICODE) functions.
sl@0
    16
*
sl@0
    17
*
sl@0
    18
*/
sl@0
    19
sl@0
    20
sl@0
    21
// INCLUDES FILES
sl@0
    22
#include "jplangutil.h"
sl@0
    23
#include "jplangutil.tables.h"
sl@0
    24
sl@0
    25
// LOCAL DEFINES
sl@0
    26
sl@0
    27
// LOCAL CONSTANTS AND ENUMS
sl@0
    28
sl@0
    29
#if defined(_DEBUG)
sl@0
    30
_LIT( KJPLangUtilPanic, "JPLangUtil" );
sl@0
    31
enum TJPLangUtilPanicCodes
sl@0
    32
    {
sl@0
    33
    EErrNotKatakana = 0x777,
sl@0
    34
    EErrNotVoicedKatakana
sl@0
    35
    };
sl@0
    36
#endif
sl@0
    37
sl@0
    38
enum TConvDirection
sl@0
    39
    {
sl@0
    40
    EHalfToFullWidth,
sl@0
    41
    EFullToHalfWidth
sl@0
    42
    };
sl@0
    43
sl@0
    44
const TInt KHalfWidthKatakanaRange = 59;
sl@0
    45
const TInt KHalfWidthIndex = 0;
sl@0
    46
const TInt KFullWidthIndex = 1;
sl@0
    47
const TInt KFullWidthVoicableKatakanaRange = 23;
sl@0
    48
const TInt KFullWidthSemiVoicableKatakanaRange = 5;
sl@0
    49
const TInt KHalfWidthSpecialCharRange = 21;
sl@0
    50
sl@0
    51
const TText KHalfWidthKatakanaVoicedSoundMark     = 0xff9e;
sl@0
    52
const TText KHalfWidthKatakanaSemiVoicedSoundMark = 0xff9f;
sl@0
    53
sl@0
    54
// The following Full-width (semi-)voiced markers are
sl@0
    55
// *also* considered Hiragana, per Unicode spec.
sl@0
    56
const TText KFullWidthKatakanaVoicedSoundMark     = 0x309b;
sl@0
    57
const TText KFullWidthKatakanaSemiVoicedSoundMark = 0x309c;
sl@0
    58
sl@0
    59
const TText KHalfWidthKatakanaLowerBound = 0xff65;
sl@0
    60
const TText KHalfWidthKatakanaUpperBound = 0xff9f;
sl@0
    61
const TText KFullWidthKatakanaLowerBound = 0x30a0;
sl@0
    62
const TText KFullWidthKatakanaUpperBound = 0x30ff;
sl@0
    63
sl@0
    64
const TText KCJKUnifiedIdiographLowerBound = 0x4e00;
sl@0
    65
const TText KCJKUnifiedIdiographUpperBound = 0x9fa5;
sl@0
    66
const TText KCJKUnifiedIdeographExtALowerBound = 0x3400;
sl@0
    67
const TText KCJKUnifiedIdeographExtAUpperBound = 0x4dbf;
sl@0
    68
sl@0
    69
const TText KHalfToFullWidthASCIIOffset = 0xfee0;
sl@0
    70
const TText KHalfWidthASCIILowerBound = 0x0021; // Leaves out space (0x0020)
sl@0
    71
const TText KHalfWidthASCIIUpperBound = 0x007e;
sl@0
    72
const TText KFullWidthASCIILowerBound = 0xff01;
sl@0
    73
const TText KFullWidthASCIIUpperBound = 0xff5e;
sl@0
    74
sl@0
    75
const TUint KFullWidthHiraganaSmallA = 0x3041;
sl@0
    76
const TUint KFullWidthHiraganaVU = 0x3094;
sl@0
    77
const TUint KFullWidthHiraganaU = 0x3046;
sl@0
    78
const TUint KFullWidthHiraganaVoicedSound = 0x309B;
sl@0
    79
const TUint KFullWidthKatakanaSmallA = 0x30a1;
sl@0
    80
const TUint KFullWidthKatakanaSmallVU = 0x30F4;
sl@0
    81
sl@0
    82
sl@0
    83
// ============================== LOCAL CLASSES ================================
sl@0
    84
sl@0
    85
/**
sl@0
    86
 *  This is an internal utility class used by the JPLangUtil class
sl@0
    87
 *  and is intended for encapsulation only.
sl@0
    88
 *
sl@0
    89
 *  @lib JPLangUtil.lib
sl@0
    90
 *  @since 2.6
sl@0
    91
 */
sl@0
    92
class UnicodeTextUtil
sl@0
    93
    {
sl@0
    94
    public: // Query Functions
sl@0
    95
sl@0
    96
        /**
sl@0
    97
        * Determines if aUnicodeChar is a base Katakana that is capable
sl@0
    98
        * of being converted into either a Vioced or Semi-voiced Full-width
sl@0
    99
        * Katakana character.
sl@0
   100
        * If aSemiVoiced is true, then the check is only performed
sl@0
   101
        * for Semi-voiced conversion capability.
sl@0
   102
        *
sl@0
   103
        * @param aUnicodeChar The character to be tested.
sl@0
   104
        * @param aSemiVoiced  Whether or not the character is to be tested
sl@0
   105
        *                     as convertable to a Semi-voiced Full-width
sl@0
   106
        *                     Katakana, rather than just voiced.
sl@0
   107
        *
sl@0
   108
        * @return ETrue is the character is in fact convertable to either
sl@0
   109
        *         a voiced or semi-voiced fullwidth katakana character,
sl@0
   110
        *         depending on the aSemiVoiced flag.
sl@0
   111
        */
sl@0
   112
        static TBool IsFullWidthVoicedConvertableHalfWidthBaseKatakana
sl@0
   113
                             ( TText aUnicodeChar, TBool aSemiVoiced = EFalse );
sl@0
   114
sl@0
   115
        /**
sl@0
   116
        * Determines if aUnicodeChar is a  Vioced or Semi-voiced Full-width
sl@0
   117
        * Katakana character.
sl@0
   118
        * If aSemiVoiced is true, then the check is only performed
sl@0
   119
        * for Semi-voiced.
sl@0
   120
        *
sl@0
   121
        * @param aUnicodeChar The character to be tested.
sl@0
   122
        * @param aSemiVoiced  Whether or not the character is a Semi-voiced
sl@0
   123
        *                     Full-width Katakana, rather than just voiced.
sl@0
   124
        *
sl@0
   125
        * @return ETrue is the character is in fact a voiced or semi-voiced
sl@0
   126
        *         fullwidth katakana character, depending on the aSemiVoiced
sl@0
   127
        *         flag.
sl@0
   128
        */
sl@0
   129
        static TBool IsFullWidthVoicedKatakana( TText aUnicodeChar,
sl@0
   130
                                                TBool aSemiVoiced = EFalse);
sl@0
   131
sl@0
   132
    public: // Conversion Functions
sl@0
   133
sl@0
   134
        /**
sl@0
   135
        * Converts one Katakana character from either Half to Full-width
sl@0
   136
        * or vice versa, depending on the direction specified by aDirection
sl@0
   137
        *
sl@0
   138
        * @param aDirection Direction to convert.
sl@0
   139
        * @param aKatakanaChar The character to convert.
sl@0
   140
        *
sl@0
   141
        * @return The opposite width Katakana character.
sl@0
   142
        */
sl@0
   143
        static TChar ConvertKatakanaChar( TConvDirection aDirection,
sl@0
   144
                                          TText aKatakanaChar );
sl@0
   145
sl@0
   146
        /**
sl@0
   147
        * Converts one voiced Katakana character from either Half to Full-width
sl@0
   148
        * or vice versa, depending on the direction specified by aDirection,
sl@0
   149
        * and appends the converted character to the descriptor aTarget.
sl@0
   150
        * In the case that it is from Full to Half-width, it is necessary to
sl@0
   151
        * convert it into a base-katakana + (semi-)voiced mark pair, thus
sl@0
   152
        * the necessity for passing in the TDes reference return type.
sl@0
   153
        * In the case of converting from Half to Full-width, it is only
sl@0
   154
        * necessary to pass in a base-katakana that has a (semi-)voiced
sl@0
   155
        * Full-width counterpart.
sl@0
   156
        *
sl@0
   157
        * @param aDirection Direction to convert.
sl@0
   158
        * @param aVoicedKatakana The character to convert.
sl@0
   159
        * @param aTarget The descriptor to append the converted character(s) to.
sl@0
   160
        * @param aSemiVoiced ETrue if performing a Semi-voiced conversion.
sl@0
   161
        *                    Default is EFalse.
sl@0
   162
        */
sl@0
   163
        static void ConvertVoicedKatakanaCharAndAppendToTarget(
sl@0
   164
                                                   TConvDirection aDirection,
sl@0
   165
                                                   TText aVoicedKatakana,
sl@0
   166
                                                   TDes& aTarget,
sl@0
   167
                                                   TBool aSemiVoiced = EFalse );
sl@0
   168
sl@0
   169
        /**
sl@0
   170
        * Converts all special characters *in-place* from either Half to
sl@0
   171
        * Full-width or vice versa, depending on the direction specified
sl@0
   172
        * by aDirection
sl@0
   173
        *
sl@0
   174
        * @param aDirection Direction to convert.
sl@0
   175
        * @param aUnicodeText The character to convert.
sl@0
   176
        *
sl@0
   177
        * @return The number of converted special characters.
sl@0
   178
        */
sl@0
   179
        static TInt ConvertSpecialCharactersInPlace( TConvDirection aDirection,
sl@0
   180
                                                     TDes16& aUnicodeText );
sl@0
   181
sl@0
   182
        /**
sl@0
   183
        * Converts all ASCII *in-place* from either Half to
sl@0
   184
        * Full-width or vice versa, depending on the direction specified
sl@0
   185
        * by aDirection
sl@0
   186
        *
sl@0
   187
        * @param aDirection Direction to convert.
sl@0
   188
        * @param aUnicodeText The character to convert.
sl@0
   189
        *
sl@0
   190
        * @return The number of converted ASCII-range characters.
sl@0
   191
        */
sl@0
   192
        static TInt ConvertASCIIInPlace( TConvDirection aDirection,
sl@0
   193
                                         TDes16& aUnicodeText );
sl@0
   194
    };
sl@0
   195
sl@0
   196
// ============================= LOCAL FUNCTIONS ===============================
sl@0
   197
sl@0
   198
// -----------------------------------------------------------------------------
sl@0
   199
// UnicodeTextUtil::IsFullWidthVoicedConvertableHalfWidthBaseKatakana
sl@0
   200
// Determines if aUnicodeChar is a base Katakana that is capable
sl@0
   201
// of being converted into either a Vioced or Semi-voiced
sl@0
   202
// Full-width character.
sl@0
   203
// If aSemiVoiced is true, then the check is only performed
sl@0
   204
// for Semi-voiced conversion capability.
sl@0
   205
// Returns: ETrue if it is convertable.
sl@0
   206
// -----------------------------------------------------------------------------
sl@0
   207
//
sl@0
   208
TBool UnicodeTextUtil::IsFullWidthVoicedConvertableHalfWidthBaseKatakana
sl@0
   209
                                       ( TText aUnicodeChar, TBool aSemiVoiced )
sl@0
   210
    {
sl@0
   211
    if( aSemiVoiced )
sl@0
   212
        {
sl@0
   213
        return ( aUnicodeChar >= 0xff8a && aUnicodeChar <= 0xff8e );
sl@0
   214
        }
sl@0
   215
    else
sl@0
   216
        {
sl@0
   217
        return ( ( aUnicodeChar == 0xff73 ) ||
sl@0
   218
                 ( aUnicodeChar >= 0xff76 && aUnicodeChar <= 0xff7f ) ||
sl@0
   219
                 ( aUnicodeChar >= 0xff80 && aUnicodeChar <= 0xff84 ) ||
sl@0
   220
                 ( aUnicodeChar >= 0xff8a && aUnicodeChar <= 0xff8e ) ||
sl@0
   221
                 ( aUnicodeChar == 0xff9c ) ||
sl@0
   222
                 ( aUnicodeChar == 0xff66 ) );
sl@0
   223
        }
sl@0
   224
    }
sl@0
   225
sl@0
   226
// -----------------------------------------------------------------------------
sl@0
   227
// UnicodeTextUtil::IsFullWidthVoicedKatakana
sl@0
   228
// Determines if aUnicodeChar is Full-width Katakana.
sl@0
   229
// Returns: ETrue if it is Full-width Katakana.
sl@0
   230
// -----------------------------------------------------------------------------
sl@0
   231
//
sl@0
   232
TBool UnicodeTextUtil::IsFullWidthVoicedKatakana( TText aUnicodeChar,
sl@0
   233
                                                  TBool aSemiVoiced )
sl@0
   234
    {
sl@0
   235
    const TInt voicableRange( aSemiVoiced ?
sl@0
   236
                              KFullWidthSemiVoicableKatakanaRange :
sl@0
   237
                              KFullWidthVoicableKatakanaRange );
sl@0
   238
    const TText* const (*voicedTable) = aSemiVoiced ?
sl@0
   239
                              KHalfWidthBaseToFullWidthSemiVoicedKatakanaTable :
sl@0
   240
                              KHalfWidthBaseToFullWidthVoicedKatakanaTable;
sl@0
   241
    for( TInt i( 0 ); i < voicableRange; ++i )
sl@0
   242
        {
sl@0
   243
        if( aUnicodeChar == voicedTable[i][KFullWidthIndex] )
sl@0
   244
            {
sl@0
   245
            return ETrue;
sl@0
   246
            }
sl@0
   247
        }
sl@0
   248
    return EFalse;
sl@0
   249
    }
sl@0
   250
sl@0
   251
// -----------------------------------------------------------------------------
sl@0
   252
// UnicodeTextUtil::ConvertKatakanaChar
sl@0
   253
// Converts one Katakana Char in the direction specified by aDirection.
sl@0
   254
// Assumes aKatakanaChar is within range.
sl@0
   255
// Returns: A TText containing either the varient character or the character
sl@0
   256
//          itself, in the case there is no conversion.
sl@0
   257
// -----------------------------------------------------------------------------
sl@0
   258
//
sl@0
   259
TChar UnicodeTextUtil::ConvertKatakanaChar( TConvDirection aDirection,
sl@0
   260
                                            TText aKatakanaChar )
sl@0
   261
    {
sl@0
   262
    __ASSERT_DEBUG(
sl@0
   263
        JPLangUtil::IsKatakana( aKatakanaChar ) &&
sl@0
   264
        !IsFullWidthVoicedKatakana( aKatakanaChar ),
sl@0
   265
        User::Panic( KJPLangUtilPanic, EErrNotKatakana )
sl@0
   266
    );
sl@0
   267
    TChar convChar( aKatakanaChar );
sl@0
   268
    const TInt directionIndex( ( aDirection == EHalfToFullWidth ) ?
sl@0
   269
                                   KHalfWidthIndex : KFullWidthIndex );
sl@0
   270
    for( TInt i( 0 ); i < KHalfWidthKatakanaRange; ++i )
sl@0
   271
        {
sl@0
   272
        if( aKatakanaChar ==
sl@0
   273
                KHalfToFullWidthKatakanaCharTable[i][directionIndex] )
sl@0
   274
            {
sl@0
   275
            convChar = KHalfToFullWidthKatakanaCharTable[i][!directionIndex];
sl@0
   276
            break;
sl@0
   277
            }
sl@0
   278
        }
sl@0
   279
    return convChar;
sl@0
   280
    }
sl@0
   281
sl@0
   282
// -----------------------------------------------------------------------------
sl@0
   283
// UnicodeTextUtil::ConvertVoicedKatakanaChar
sl@0
   284
// Converts one Voiced Katakana Char in the direction specified by aDirection,
sl@0
   285
// and appends to the descriptor, aTarget.
sl@0
   286
// If aSemiVoiced is ETrue, then the code point is converted to the Semi-voiced
sl@0
   287
// variant.
sl@0
   288
// Assumes aVoicedKatakana is within range.
sl@0
   289
// -----------------------------------------------------------------------------
sl@0
   290
//
sl@0
   291
void UnicodeTextUtil::ConvertVoicedKatakanaCharAndAppendToTarget(
sl@0
   292
                                                      TConvDirection aDirection,
sl@0
   293
                                                      TText aVoicedKatakana,
sl@0
   294
                                                      TDes& aTarget,
sl@0
   295
                                                      TBool aSemiVoiced )
sl@0
   296
    {
sl@0
   297
    __ASSERT_DEBUG(
sl@0
   298
        IsFullWidthVoicedConvertableHalfWidthBaseKatakana( aVoicedKatakana ) ||
sl@0
   299
        IsFullWidthVoicedKatakana( aVoicedKatakana, aSemiVoiced ),
sl@0
   300
        User::Panic( KJPLangUtilPanic, EErrNotVoicedKatakana )
sl@0
   301
    );
sl@0
   302
sl@0
   303
    const TInt  voicableRange( aSemiVoiced ?
sl@0
   304
                               KFullWidthSemiVoicableKatakanaRange :
sl@0
   305
                               KFullWidthVoicableKatakanaRange );
sl@0
   306
    const TText* const (*voicedTable) = aSemiVoiced ?
sl@0
   307
                              KHalfWidthBaseToFullWidthSemiVoicedKatakanaTable :
sl@0
   308
                              KHalfWidthBaseToFullWidthVoicedKatakanaTable;
sl@0
   309
    if( aDirection == EHalfToFullWidth )
sl@0
   310
        {
sl@0
   311
        // In the case of Half Width, only the base character is needed for
sl@0
   312
        // the conversion
sl@0
   313
        for( TInt i( 0 ); i < voicableRange; ++i )
sl@0
   314
            {
sl@0
   315
            if( aVoicedKatakana == voicedTable[i][KHalfWidthIndex] )
sl@0
   316
                {
sl@0
   317
                const TChar uniChar( voicedTable[i][KFullWidthIndex] );
sl@0
   318
                aTarget.Append( uniChar );
sl@0
   319
                break;
sl@0
   320
                }
sl@0
   321
            }
sl@0
   322
        }
sl@0
   323
    else
sl@0
   324
        {
sl@0
   325
        for( TInt i( 0 ); i < voicableRange; ++i )
sl@0
   326
            {
sl@0
   327
            if( aVoicedKatakana == voicedTable[i][KFullWidthIndex] )
sl@0
   328
                {
sl@0
   329
                const TChar uniChar( voicedTable[i][KHalfWidthIndex] );
sl@0
   330
                aTarget.Append( uniChar );
sl@0
   331
                break;
sl@0
   332
                }
sl@0
   333
            }
sl@0
   334
        const TChar voicedSoundMark( aSemiVoiced ?
sl@0
   335
                                     KHalfWidthKatakanaSemiVoicedSoundMark :
sl@0
   336
                                     KHalfWidthKatakanaVoicedSoundMark );
sl@0
   337
        aTarget.Append( voicedSoundMark );
sl@0
   338
        }
sl@0
   339
    }
sl@0
   340
sl@0
   341
// -----------------------------------------------------------------------------
sl@0
   342
// UnicodeTextUtil::ConvertSpecialCharactersInPlace
sl@0
   343
// Converts all special characters in the aUnicodeText descriptor in-place
sl@0
   344
// that have both Full and Half-width variants.
sl@0
   345
// Conversion occurs in the direction specified by aDirection.
sl@0
   346
// Returns: The total number of characters converted.
sl@0
   347
// -----------------------------------------------------------------------------
sl@0
   348
//
sl@0
   349
TInt UnicodeTextUtil::ConvertSpecialCharactersInPlace
sl@0
   350
                             ( TConvDirection aDirection, TDes16& aUnicodeText )
sl@0
   351
    {
sl@0
   352
    TInt totalConverted( 0 );
sl@0
   353
    const TInt directionIndex( ( aDirection == EHalfToFullWidth ) ?
sl@0
   354
                                 KHalfWidthIndex : KFullWidthIndex );
sl@0
   355
    for( TInt i( 0 ); i < aUnicodeText.Length(); ++i )
sl@0
   356
        {
sl@0
   357
        const TText uniChar( aUnicodeText[i] );
sl@0
   358
        for( TInt j( 0 ); j < KHalfWidthSpecialCharRange; ++j )
sl@0
   359
            {
sl@0
   360
            if( uniChar == KHalfToFullWidthSpecialCharTable[j][directionIndex] )
sl@0
   361
                {
sl@0
   362
                aUnicodeText[i] =
sl@0
   363
                    KHalfToFullWidthSpecialCharTable[j][!directionIndex];
sl@0
   364
                totalConverted++;
sl@0
   365
                break;
sl@0
   366
                }
sl@0
   367
            }
sl@0
   368
        }
sl@0
   369
    return totalConverted;
sl@0
   370
    }
sl@0
   371
sl@0
   372
// -----------------------------------------------------------------------------
sl@0
   373
// UnicodeTextUtil::ConvertASCIIInPlace
sl@0
   374
// Converts all ASCII *in-place* from either Half to Full-width or vice versa,
sl@0
   375
// depending on the direction specified by aDirection.
sl@0
   376
// Returns: The total number of characters converted.
sl@0
   377
// -----------------------------------------------------------------------------
sl@0
   378
//
sl@0
   379
TInt UnicodeTextUtil::ConvertASCIIInPlace( TConvDirection aDirection,
sl@0
   380
                                           TDes16& aUnicodeText )
sl@0
   381
    {
sl@0
   382
    TInt totalConverted( 0 );
sl@0
   383
    TText lowerBound( ( aDirection == EHalfToFullWidth ) ?
sl@0
   384
                        KHalfWidthASCIILowerBound :
sl@0
   385
                        KFullWidthASCIILowerBound );
sl@0
   386
    TText upperBound( ( aDirection == EHalfToFullWidth ) ?
sl@0
   387
                        KHalfWidthASCIIUpperBound :
sl@0
   388
                        KFullWidthASCIIUpperBound );
sl@0
   389
    TInt offset( ( aDirection == EHalfToFullWidth ) ?
sl@0
   390
                   KHalfToFullWidthASCIIOffset :
sl@0
   391
                   -KHalfToFullWidthASCIIOffset );
sl@0
   392
    for( TInt i( 0 ); i < aUnicodeText.Length(); ++i )
sl@0
   393
        {
sl@0
   394
        const TText uniChar( aUnicodeText[i] );
sl@0
   395
        if( uniChar >= lowerBound && uniChar <= upperBound )
sl@0
   396
            {
sl@0
   397
            TText convertedChar( static_cast<TText>( uniChar + offset ) );
sl@0
   398
            aUnicodeText[i] = convertedChar;
sl@0
   399
            totalConverted++;
sl@0
   400
            }
sl@0
   401
        }
sl@0
   402
    return totalConverted;
sl@0
   403
    }
sl@0
   404
sl@0
   405
// EXPORTED FUNCTIONS
sl@0
   406
sl@0
   407
// ============================ MEMBER FUNCTIONS ===============================
sl@0
   408
sl@0
   409
// -----------------------------------------------------------------------------
sl@0
   410
// JPLangUtil::ConvertHalfToFullWidth
sl@0
   411
// Converts all Half-width conformant text (including ASCII, Special Characters
sl@0
   412
// and Katakana) found in aUnicodeSource to their Full-width counterparts and
sl@0
   413
// places the resulting text into aUnicodeTarget.
sl@0
   414
// (detailed information about the parameters and return values can be found
sl@0
   415
//  in the header file)
sl@0
   416
// -----------------------------------------------------------------------------
sl@0
   417
//
sl@0
   418
EXPORT_C TInt JPLangUtil::ConvertHalfToFullWidth( const TDesC16& aUnicodeSource,
sl@0
   419
                                                  TDes16& aUnicodeTarget )
sl@0
   420
    {
sl@0
   421
    TInt totalConverted( 0 );
sl@0
   422
    // Special Characters are handled in the Katakana conversion...
sl@0
   423
    totalConverted =  ConvertHalfToFullWidthKatakana( aUnicodeSource,
sl@0
   424
                                                      aUnicodeTarget );
sl@0
   425
    totalConverted += UnicodeTextUtil::ConvertASCIIInPlace( EHalfToFullWidth,
sl@0
   426
                                                            aUnicodeTarget );
sl@0
   427
    return totalConverted;
sl@0
   428
    }
sl@0
   429
sl@0
   430
// -----------------------------------------------------------------------------
sl@0
   431
// JPLangUtil::ConvertFullToHalfWidth
sl@0
   432
// Converts all Full-width conformant text found in aUnicodeSource to their
sl@0
   433
// Full-width counterparts and places the resulting text into aUnicodeTarget.
sl@0
   434
// Only those characters with existing Half-width variants are converted. There
sl@0
   435
// will be a 2-for-1 conversion for each Full-width Voiced and Semi-voiced
sl@0
   436
// Katakana character.
sl@0
   437
// (detailed information about the parameters and return values can be found in
sl@0
   438
// the header file)
sl@0
   439
// -----------------------------------------------------------------------------
sl@0
   440
//
sl@0
   441
EXPORT_C TInt JPLangUtil::ConvertFullToHalfWidth( const TDesC16& aUnicodeSource,
sl@0
   442
                                                  TDes16& aUnicodeTarget )
sl@0
   443
    {
sl@0
   444
    TInt totalConverted( 0 );
sl@0
   445
    // Special Characters are handled in the Katakana conversion...
sl@0
   446
    totalConverted =  ConvertFullToHalfWidthKatakana( aUnicodeSource,
sl@0
   447
                                                      aUnicodeTarget );
sl@0
   448
    totalConverted += UnicodeTextUtil::ConvertASCIIInPlace( EFullToHalfWidth,
sl@0
   449
                                                            aUnicodeTarget );
sl@0
   450
    return totalConverted;
sl@0
   451
    }
sl@0
   452
sl@0
   453
// -----------------------------------------------------------------------------
sl@0
   454
// JPLangUtil::ConvertHalfToFullWidthKatakana
sl@0
   455
// Converts Half-width Katakana and Special Character text found in
sl@0
   456
// aUnicodeSource to their Full-width counterparts and places the resulting text
sl@0
   457
// into aUnicodeTarget.
sl@0
   458
// (detailed information about the parameters and return values can be found in
sl@0
   459
// the header file)
sl@0
   460
// -----------------------------------------------------------------------------
sl@0
   461
//
sl@0
   462
EXPORT_C TInt JPLangUtil::ConvertHalfToFullWidthKatakana
sl@0
   463
                       ( const TDesC16& aUnicodeSource, TDes16& aUnicodeTarget )
sl@0
   464
    {
sl@0
   465
    TInt totalConverted( 0 );
sl@0
   466
    const TInt length( aUnicodeSource.Length() );
sl@0
   467
    if( length > aUnicodeTarget.MaxLength() )
sl@0
   468
        {
sl@0
   469
        return KErrTooBig;
sl@0
   470
        }
sl@0
   471
    aUnicodeTarget.Zero();
sl@0
   472
    for( TInt i( 0 ); i < length; ++i )
sl@0
   473
        {
sl@0
   474
        const TText uniChar( aUnicodeSource[i] );
sl@0
   475
        // Check if the next character is a Half Width Katakana (Semi-)Voiced
sl@0
   476
        // Sound Mark and if the current character + the voiced sound mark have
sl@0
   477
        // a Full Width counterpart
sl@0
   478
        if( i + 1 < length )
sl@0
   479
            {
sl@0
   480
            const TBool isVoiced(
sl@0
   481
            ( UnicodeTextUtil::IsFullWidthVoicedConvertableHalfWidthBaseKatakana
sl@0
   482
                  ( uniChar ) &&
sl@0
   483
              ( aUnicodeSource[i + 1] == KHalfWidthKatakanaVoicedSoundMark )
sl@0
   484
            ) );
sl@0
   485
sl@0
   486
            const TBool isSemiVoiced(
sl@0
   487
            ( UnicodeTextUtil::IsFullWidthVoicedConvertableHalfWidthBaseKatakana
sl@0
   488
                  ( uniChar, ETrue ) &&
sl@0
   489
              ( aUnicodeSource[i + 1] == KHalfWidthKatakanaSemiVoicedSoundMark )
sl@0
   490
            ) );
sl@0
   491
sl@0
   492
            if( isVoiced || isSemiVoiced )
sl@0
   493
                {
sl@0
   494
                UnicodeTextUtil::ConvertVoicedKatakanaCharAndAppendToTarget(
sl@0
   495
                    EHalfToFullWidth,
sl@0
   496
                    uniChar,
sl@0
   497
                    aUnicodeTarget,
sl@0
   498
                    isSemiVoiced
sl@0
   499
                );
sl@0
   500
                i++; // Skip the (semi-)voice marker
sl@0
   501
                totalConverted++;
sl@0
   502
                continue;
sl@0
   503
                }
sl@0
   504
            }
sl@0
   505
        // If not, then just convert directly if in range
sl@0
   506
        if( uniChar >= KHalfWidthKatakanaLowerBound &&
sl@0
   507
            uniChar <= KHalfWidthKatakanaUpperBound )
sl@0
   508
            {
sl@0
   509
            aUnicodeTarget.Append(
sl@0
   510
                UnicodeTextUtil::ConvertKatakanaChar( EHalfToFullWidth,
sl@0
   511
                                                      uniChar )
sl@0
   512
            );
sl@0
   513
            totalConverted++;
sl@0
   514
            }
sl@0
   515
        // Else this is not Half Width Katakana, so copy directly...
sl@0
   516
        else
sl@0
   517
            {
sl@0
   518
            const TChar uniCharacter( uniChar );
sl@0
   519
            aUnicodeTarget.Append( uniCharacter );
sl@0
   520
            }
sl@0
   521
        }
sl@0
   522
sl@0
   523
    // Now handle special characters
sl@0
   524
    // This logic may be moved into this function to avoid another
sl@0
   525
    // loop over the text.
sl@0
   526
    totalConverted +=
sl@0
   527
        UnicodeTextUtil::ConvertSpecialCharactersInPlace( EHalfToFullWidth,
sl@0
   528
                                                          aUnicodeTarget );
sl@0
   529
sl@0
   530
    return totalConverted;
sl@0
   531
    }
sl@0
   532
sl@0
   533
// -----------------------------------------------------------------------------
sl@0
   534
// JPLangUtil::ConvertFullToHalfWidthKatakana
sl@0
   535
// Converts Full-width Katakana and Special Character text found in
sl@0
   536
// aUnicodeSource to their Half-width counterparts and places the resulting text
sl@0
   537
// into aUnicodeTarget. There will be a 2-for-1 conversion for each Full-width
sl@0
   538
// Voiced and Semi-voiced Katakana character.
sl@0
   539
// (detailed information about the parameters and return values can be found in
sl@0
   540
// the header file)
sl@0
   541
// -----------------------------------------------------------------------------
sl@0
   542
//
sl@0
   543
EXPORT_C TInt JPLangUtil::ConvertFullToHalfWidthKatakana
sl@0
   544
                       ( const TDesC16& aUnicodeSource, TDes16& aUnicodeTarget )
sl@0
   545
    {
sl@0
   546
    TInt totalConverted( 0 );
sl@0
   547
    const TInt length( aUnicodeSource.Length() );
sl@0
   548
    const TInt maxLength( aUnicodeTarget.MaxLength() );
sl@0
   549
    if( length > maxLength )
sl@0
   550
        {
sl@0
   551
        return KErrTooBig;
sl@0
   552
        }
sl@0
   553
    aUnicodeTarget.Zero();
sl@0
   554
    for( TInt i( 0 ); i < length; ++i )
sl@0
   555
        {
sl@0
   556
        const TText uniChar( aUnicodeSource[i] );
sl@0
   557
        // First check if this is this Full Width Katakana
sl@0
   558
        if( ( uniChar >= KFullWidthKatakanaLowerBound &&
sl@0
   559
              uniChar <= KFullWidthKatakanaUpperBound ) ||
sl@0
   560
            ( uniChar == KFullWidthKatakanaVoicedSoundMark ||
sl@0
   561
              uniChar == KFullWidthKatakanaSemiVoicedSoundMark ) )
sl@0
   562
            {
sl@0
   563
            // Then check if it is (Semi-)Voiced and convert it properly
sl@0
   564
            const TBool isVoiced(
sl@0
   565
                UnicodeTextUtil::IsFullWidthVoicedKatakana( uniChar )
sl@0
   566
            );
sl@0
   567
            const TBool isSemiVoiced(
sl@0
   568
                UnicodeTextUtil::IsFullWidthVoicedKatakana( uniChar, ETrue )
sl@0
   569
            );
sl@0
   570
            if( isVoiced || isSemiVoiced )
sl@0
   571
                {
sl@0
   572
                if( aUnicodeTarget.Length() + 2 > maxLength )
sl@0
   573
                    {
sl@0
   574
                    // This descriptor can't hold the new data
sl@0
   575
                    aUnicodeTarget.Zero();
sl@0
   576
                    return KErrTooBig;
sl@0
   577
                    }
sl@0
   578
                UnicodeTextUtil::ConvertVoicedKatakanaCharAndAppendToTarget(
sl@0
   579
                    EFullToHalfWidth,
sl@0
   580
                    uniChar,
sl@0
   581
                    aUnicodeTarget,
sl@0
   582
                    isSemiVoiced
sl@0
   583
                );
sl@0
   584
                totalConverted++;
sl@0
   585
                }
sl@0
   586
            else
sl@0
   587
                {
sl@0
   588
                if( aUnicodeTarget.Length() + 1 > maxLength )
sl@0
   589
                    {
sl@0
   590
                    // This descriptor can't hold the new data
sl@0
   591
                    aUnicodeTarget.Zero();
sl@0
   592
                    return KErrTooBig;
sl@0
   593
                    }
sl@0
   594
                aUnicodeTarget.Append(
sl@0
   595
                    UnicodeTextUtil::ConvertKatakanaChar(
sl@0
   596
                        EFullToHalfWidth,
sl@0
   597
                        uniChar
sl@0
   598
                    )
sl@0
   599
                );
sl@0
   600
                totalConverted++;
sl@0
   601
                }
sl@0
   602
            }
sl@0
   603
        // This is not Full Width Katakana, so copy directly...
sl@0
   604
        else
sl@0
   605
            {
sl@0
   606
            if( aUnicodeTarget.Length() + 1 > maxLength )
sl@0
   607
                {
sl@0
   608
                // This descriptor can't hold the new data
sl@0
   609
                aUnicodeTarget.Zero();
sl@0
   610
                return KErrTooBig;
sl@0
   611
                }
sl@0
   612
            const TChar uniCharacter( uniChar );
sl@0
   613
            aUnicodeTarget.Append( uniCharacter );
sl@0
   614
            }
sl@0
   615
        }
sl@0
   616
sl@0
   617
    // Now handle special characters
sl@0
   618
    // This logic may be moved into this function to avoid another loop over
sl@0
   619
    // the text
sl@0
   620
    totalConverted +=
sl@0
   621
        UnicodeTextUtil::ConvertSpecialCharactersInPlace( EFullToHalfWidth,
sl@0
   622
                                                          aUnicodeTarget );
sl@0
   623
sl@0
   624
    return totalConverted;
sl@0
   625
    }
sl@0
   626
sl@0
   627
// -----------------------------------------------------------------------------
sl@0
   628
// JPLangUtil::ConvertFullHiragnaToFullKatakana
sl@0
   629
// Converts Full-width Hiragana and Special Character text found in
sl@0
   630
// aUnicodeSource to their Full-width counterparts and places the
sl@0
   631
// resulting text into aUnicodeTarget.
sl@0
   632
// -----------------------------------------------------------------------------
sl@0
   633
//
sl@0
   634
EXPORT_C TInt JPLangUtil::ConvertFullHiragnaToFullKatakana
sl@0
   635
                       ( const TDesC16& aUnicodeSource, TDes16& aUnicodeTarget )
sl@0
   636
    {
sl@0
   637
    TInt totalConverted( 0 );
sl@0
   638
    const TInt length( aUnicodeSource.Length() );
sl@0
   639
    const TInt maxLength( aUnicodeTarget.MaxLength() );
sl@0
   640
    if( length > maxLength )
sl@0
   641
        {
sl@0
   642
        return KErrTooBig;
sl@0
   643
        }
sl@0
   644
sl@0
   645
    const TUint comp = KFullWidthKatakanaSmallA - KFullWidthHiraganaSmallA;
sl@0
   646
sl@0
   647
    aUnicodeTarget.Zero();
sl@0
   648
    for( TInt i( 0 ); i < length; ++i )
sl@0
   649
        {
sl@0
   650
        const TText uniChar( aUnicodeSource[i] );
sl@0
   651
        TText uniChar2(0);
sl@0
   652
        if (i + 1 < length)
sl@0
   653
            {
sl@0
   654
            uniChar2 = aUnicodeSource[i+1];
sl@0
   655
            }
sl@0
   656
        // First check if this is this Full Width Katakana
sl@0
   657
        if (KFullWidthHiraganaSmallA <= uniChar && uniChar <= KFullWidthHiraganaVU)
sl@0
   658
            {
sl@0
   659
            if (uniChar == KFullWidthHiraganaU
sl@0
   660
             && uniChar2 == KFullWidthHiraganaVoicedSound)
sl@0
   661
                {
sl@0
   662
                aUnicodeTarget.Append(KFullWidthKatakanaSmallVU);
sl@0
   663
                totalConverted++;
sl@0
   664
                i++;
sl@0
   665
                }
sl@0
   666
            else
sl@0
   667
                {
sl@0
   668
                TUint katakana = uniChar + comp;
sl@0
   669
                if (IsKatakana(katakana))
sl@0
   670
                    {
sl@0
   671
                    aUnicodeTarget.Append(katakana);
sl@0
   672
                    totalConverted++;
sl@0
   673
                    }
sl@0
   674
                }
sl@0
   675
            }
sl@0
   676
        else
sl@0
   677
            {
sl@0
   678
            aUnicodeTarget.Append(uniChar);
sl@0
   679
            totalConverted++;
sl@0
   680
            }
sl@0
   681
        }
sl@0
   682
sl@0
   683
    // Now handle special characters
sl@0
   684
    // This logic may be moved into this function to avoid another loop over
sl@0
   685
    // the text
sl@0
   686
    totalConverted +=
sl@0
   687
        UnicodeTextUtil::ConvertSpecialCharactersInPlace( EFullToHalfWidth,
sl@0
   688
                                                          aUnicodeTarget );
sl@0
   689
sl@0
   690
    return totalConverted;
sl@0
   691
    }
sl@0
   692
sl@0
   693
// -----------------------------------------------------------------------------
sl@0
   694
// JPLangUtil::IsKatakana
sl@0
   695
// Determines whether or not the character is Katakana
sl@0
   696
// (detailed information about the parameters and return values can be found in
sl@0
   697
// the header file)
sl@0
   698
// -----------------------------------------------------------------------------
sl@0
   699
//
sl@0
   700
EXPORT_C TBool JPLangUtil::IsKatakana( const TText aUnicodeChar )
sl@0
   701
    {
sl@0
   702
    return ( ( aUnicodeChar >= KFullWidthKatakanaLowerBound &&
sl@0
   703
               aUnicodeChar <= KFullWidthKatakanaUpperBound ) ||
sl@0
   704
             ( aUnicodeChar >= KHalfWidthKatakanaLowerBound &&
sl@0
   705
               aUnicodeChar <= KHalfWidthKatakanaUpperBound ) ||
sl@0
   706
             ( aUnicodeChar == KFullWidthKatakanaVoicedSoundMark ||
sl@0
   707
               aUnicodeChar == KFullWidthKatakanaSemiVoicedSoundMark ) );
sl@0
   708
    }
sl@0
   709
sl@0
   710
// -----------------------------------------------------------------------------
sl@0
   711
// JPLangUtil::IsHiragana
sl@0
   712
// Determines whether or not the character is Hiragana
sl@0
   713
// (detailed information about the parameters and return values can be found in
sl@0
   714
// the header file)
sl@0
   715
// -----------------------------------------------------------------------------
sl@0
   716
//
sl@0
   717
EXPORT_C TBool JPLangUtil::IsHiragana( const TText aUnicodeChar )
sl@0
   718
    {
sl@0
   719
    return ( ( aUnicodeChar >= 0x3041 && aUnicodeChar <= 0x3096 ) ||
sl@0
   720
             ( aUnicodeChar >= 0x3099 && aUnicodeChar <= 0x309f ) );
sl@0
   721
    }
sl@0
   722
sl@0
   723
// -----------------------------------------------------------------------------
sl@0
   724
// JPLangUtil::IsKanji
sl@0
   725
// Determines whether or not the character is a CJK Unified Ideograph (ExtA)
sl@0
   726
// (detailed information about the parameters and return values can be found in
sl@0
   727
// the header file)
sl@0
   728
// -----------------------------------------------------------------------------
sl@0
   729
//
sl@0
   730
EXPORT_C TBool JPLangUtil::IsKanji( const TText aUnicodeChar )
sl@0
   731
    {
sl@0
   732
    return( ( aUnicodeChar >= KCJKUnifiedIdiographLowerBound &&
sl@0
   733
              aUnicodeChar <= KCJKUnifiedIdiographUpperBound ) ||
sl@0
   734
            ( aUnicodeChar >= KCJKUnifiedIdeographExtALowerBound &&
sl@0
   735
              aUnicodeChar <= KCJKUnifiedIdeographExtAUpperBound ) );
sl@0
   736
    }
sl@0
   737
sl@0
   738
// -----------------------------------------------------------------------------
sl@0
   739
// JPLangUtil::IsHalfWidth
sl@0
   740
// Determines whether or not the character is UNICODE defined Half-width.
sl@0
   741
// (detailed information about the parameters and return values can be found in
sl@0
   742
// the header file)
sl@0
   743
// -----------------------------------------------------------------------------
sl@0
   744
//
sl@0
   745
EXPORT_C TBool JPLangUtil::IsHalfWidth( const TText aUnicodeChar )
sl@0
   746
    {
sl@0
   747
    return // HW Katakana
sl@0
   748
           ( ( aUnicodeChar >= 0xff61 && aUnicodeChar <= 0xff9f ) ||
sl@0
   749
           // ASCII
sl@0
   750
             ( aUnicodeChar >= 0x0020 && aUnicodeChar <= 0x007e ) ||
sl@0
   751
           // Special Characters
sl@0
   752
             ( aUnicodeChar == 0x00a2 || aUnicodeChar == 0x00a3 ||
sl@0
   753
               aUnicodeChar == 0x00a5 || aUnicodeChar == 0x00a6 ||
sl@0
   754
               aUnicodeChar == 0x00a9 || aUnicodeChar == 0x00ac ||
sl@0
   755
               aUnicodeChar == 0x00af || aUnicodeChar == 0x2985 ||
sl@0
   756
               aUnicodeChar == 0x2986 ) ||
sl@0
   757
           // HW Symbol Variants
sl@0
   758
             ( aUnicodeChar >= 0xffe8 && aUnicodeChar <= 0xffee ) );
sl@0
   759
    }
sl@0
   760
sl@0
   761
// -----------------------------------------------------------------------------
sl@0
   762
// JPLangUtil::IsFullWidth
sl@0
   763
// Determines whether or not the character is UNICODE defined Full-width.
sl@0
   764
// Essentially, all code values that are not Half-width.
sl@0
   765
// (detailed information about the parameters and return values can be found in
sl@0
   766
// the header file)
sl@0
   767
// -----------------------------------------------------------------------------
sl@0
   768
//
sl@0
   769
EXPORT_C TBool JPLangUtil::IsFullWidth( const TText aUnicodeChar )
sl@0
   770
    {
sl@0
   771
        return !IsHalfWidth( aUnicodeChar );
sl@0
   772
    }
sl@0
   773
sl@0
   774
// End of File