Update contrib.
2 * Copyright (c) 2005-2009 Nokia Corporation and/or its subsidiary(-ies).
4 * This component and the accompanying materials are made available
5 * under the terms of "Eclipse Public License v1.0"
6 * which accompanies this distribution, and is available
7 * at the URL "http://www.eclipse.org/legal/epl-v10.html".
9 * Initial Contributors:
10 * Nokia Corporation - initial contribution.
21 #include <convgeneratedcpp.h>
23 #include <ecom/implementationproxy.h>
24 #include <charactersetconverter.h>
26 class CUCS2ConverterImpl : public CCharacterSetConverterPluginInterface
30 virtual const TDesC8& ReplacementForUnconvertibleUnicodeCharacters();
32 virtual TInt ConvertFromUnicode(
33 CCnvCharacterSetConverter::TEndianness aDefaultEndiannessOfForeignCharacters,
34 const TDesC8& aReplacementForUnconvertibleUnicodeCharacters,
36 const TDesC16& aUnicode,
37 CCnvCharacterSetConverter::TArrayOfAscendingIndices& aIndicesOfUnconvertibleCharacters);
39 virtual TInt ConvertToUnicode(
40 CCnvCharacterSetConverter::TEndianness aDefaultEndiannessOfForeignCharacters,
42 const TDesC8& aForeign,
44 TInt& aNumberOfUnconvertibleCharacters,
45 TInt& aIndexOfFirstByteOfFirstUnconvertibleCharacter);
47 virtual TBool IsInThisCharacterSetL(
49 TInt& aConfidenceLevel,
50 const TDesC8& aSample);
52 static CUCS2ConverterImpl* NewL();
53 virtual ~CUCS2ConverterImpl();
62 // The following code has been copied and modified from the plugin computer generated code
63 // that is generated from the charconv/data/???.cpl && /???.txt files
64 // *** code begins ***
65 #define ARRAY_LENGTH(aArray) (sizeof(aArray)/sizeof((aArray)[0]))
67 #pragma warning (disable: 4049) // compiler limit : terminating line number emission
69 _LIT8(KLit8ReplacementForUnconvertibleUnicodeCharacters, "\xff\xfd");
71 GLDEF_C const TDesC8& ReplacementForUnconvertibleUnicodeCharacters_internal()
73 return KLit8ReplacementForUnconvertibleUnicodeCharacters;
76 GLDEF_D const SCnvConversionData conversionData=
78 SCnvConversionData::EUnspecified,
87 const TInt KByteOrderMark = 0xfeff;
88 const TInt KStateOffset = 0x1000;
91 const TDesC8& CUCS2ConverterImpl::ReplacementForUnconvertibleUnicodeCharacters()
93 return ReplacementForUnconvertibleUnicodeCharacters_internal();
98 * Takes a 16 bit UCS2 descriptor with or without BOM and translates it to an
99 * eight bit descriptor in Big Endian format.
101 * Note aDefaultEndiannessOfForeignCharacters is not used by this converter
103 * @param CCnvCharacterSetConverter::TEndianness aDefaultEndiannessOfForeignCharacters
104 * @param const TDesC8&
105 * @param TDes8& aForeign
106 * @param const TDesC16& aUnicode
107 * @param CCnvCharacterSetConverter::TArrayOfAscendingIndices&
109 * returns number of converted characters
111 TInt CUCS2ConverterImpl::ConvertFromUnicode(CCnvCharacterSetConverter::TEndianness /*aDefaultEndiannessOfForeignCharacters*/,
112 const TDesC8& /*aReplacementForUnconvertibleUnicodeCharacters*/,
114 const TDesC16& aUnicode,
115 CCnvCharacterSetConverter::TArrayOfAscendingIndices& /*aIndicesOfUnconvertibleCharacters*/)
117 TInt numberOfUnicodeCharacters =0;
120 // start at the begining of the output buffer
123 // while there is unicode data to convert and space in the output buffer
124 while ( (aForeign.Length() + 1 < aForeign.MaxLength()) && (numberOfUnicodeCharacters < aUnicode.Length()) )
126 nextChar = aUnicode[numberOfUnicodeCharacters];
128 // Note - this always converts to EBigEndian
129 aForeign.Append((nextChar & 0xff00) >> 8);
130 aForeign.Append(nextChar & 0xff );
132 numberOfUnicodeCharacters++;
135 // returns the number of unconverted characters left at the end of the input descriptor
136 return aUnicode.Length() - numberOfUnicodeCharacters;
140 * Takes an 8 bit descriptor with or without a BOM and translates it to unicode
141 * Input endiness is determined by Byte Order Markers (BOM) in the source text.
142 * If no BOM is present aDefaultEndiannessOfForeignCharacters is used.
144 * When the data is too large to fit in the output buffer, the endiness is saved in the state
145 * variable between conversions
147 * @param aDefaultEndiannessOfForeignCharacters Default endiness if no BOMs present in the source
148 * @param aUnicode Contains the converted text in the Unicode character set
149 * @param aForeign The non-Unicode source text to be converted
150 * @param aState Not used by this converter
151 * @param aNumberOfUnconvertibleCharacters Contains the number of bytes which could not be converted to unicode
152 * @param aIndexOfFirstByteOfFirstUnconvertibleCharacter The index of the first unconvertable byte or -1 if all converted.
154 * @return aNumberOfUnconvertibleCharacters The number of unconverted bytes left at the end of the input
155 * descriptor (e.g. because the output descriptor is not long enough to hold all the text), or one of the
156 * error values defined in TError.
157 * @internalTechnology
159 TInt CUCS2ConverterImpl::ConvertToUnicode(CCnvCharacterSetConverter::TEndianness aDefaultEndiannessOfForeignCharacters,
161 const TDesC8& aForeign,
163 TInt& aNumberOfUnconvertibleCharacters,
164 TInt& aIndexOfFirstByteOfFirstUnconvertibleCharacter)
166 TInt numberOfBytesConverted = 0;
167 TInt numberOfUnicodeCharacters =0;
170 // work out what byte order to use
171 CCnvCharacterSetConverter::TEndianness byteOrderMark;
172 if ( aState==CCnvCharacterSetConverter::KStateDefault )
174 // this is the first call so use the default or BOM for byte order
175 byteOrderMark = aDefaultEndiannessOfForeignCharacters;
179 // this is not the first call so use the saved byte order
180 byteOrderMark = STATIC_CAST( CCnvCharacterSetConverter::TEndianness, aState - KStateOffset );
183 if ( aForeign.Length() < 2)
184 { // too small to do anything with
187 // If the state is KStateDefault (this is the first call) check for BOM markers
188 else if (aState==CCnvCharacterSetConverter::KStateDefault)
190 // is there a Little Endian BOM
191 if (aForeign[0]==0xff && aForeign[1]==0xfe )
193 byteOrderMark = CCnvCharacterSetConverter::ELittleEndian;
195 else if (aForeign[0]==0xfe && aForeign[1]==0xff )
197 byteOrderMark = CCnvCharacterSetConverter::EBigEndian;
199 // remember the detected state
200 aState = byteOrderMark + KStateOffset;
203 // start at begining of the output buffer provided
206 // while there is at least 2 bytes of data to convert and space in the output buffer
207 while ( (numberOfBytesConverted+1 < aForeign.Size()) && (numberOfUnicodeCharacters < aUnicode.MaxLength()) )
209 if (byteOrderMark == CCnvCharacterSetConverter::ELittleEndian )
211 // ELittleEndian 0x??00
212 nextChar = aForeign[numberOfBytesConverted] + ( aForeign[numberOfBytesConverted+1] << 8);
217 nextChar = ( aForeign[numberOfBytesConverted] <<8 ) + aForeign[numberOfBytesConverted+1];
220 // save the unicode character extracted unless it's a BOM
221 if ( nextChar != KByteOrderMark )
223 aUnicode.Append( nextChar );
224 numberOfUnicodeCharacters++;
227 numberOfBytesConverted+=2;
230 // there are no uncovertable characters with UCS2,
231 aNumberOfUnconvertibleCharacters = 0;
232 // a negative value indicates that all characters converted
233 aIndexOfFirstByteOfFirstUnconvertibleCharacter = -1;
235 // returns the number of unconverted bytes left at the end of the input descriptor
236 // Note there could be 1 byte left over if an odd number of bytes provided for conversion
237 return aForeign.Size() - numberOfBytesConverted;
242 * This converter does not support autodetect so always returns a confidence value of 0.
243 * @internalTechnology
245 TBool CUCS2ConverterImpl::IsInThisCharacterSetL(TBool& aSetToTrue, TInt& aConfidenceLevel, const TDesC8&)
252 CUCS2ConverterImpl* CUCS2ConverterImpl::NewL()
254 CUCS2ConverterImpl* self = new(ELeave) CUCS2ConverterImpl();
258 CUCS2ConverterImpl::~CUCS2ConverterImpl()
262 CUCS2ConverterImpl::CUCS2ConverterImpl()
266 const TImplementationProxy ImplementationTable[] =
268 IMPLEMENTATION_PROXY_ENTRY(0x101FF492, CUCS2ConverterImpl::NewL)
271 EXPORT_C const TImplementationProxy* ImplementationGroupProxy(TInt& aTableCount)
273 aTableCount = sizeof(ImplementationTable) / sizeof(TImplementationProxy);
275 return ImplementationTable;