First public contribution.
2 * Copyright (c) 1997-2009 Nokia Corporation and/or its subsidiary(-ies).
4 * This component and the accompanying materials are made available
5 * under the terms of "Eclipse Public License v1.0"
6 * which accompanies this distribution, and is available
7 * at the URL "http://www.eclipse.org/legal/epl-v10.html".
9 * Initial Contributors:
10 * Nokia Corporation - initial contribution.
25 #include <ecom/ecom.h>
26 #include <charactersetconverter.h>
27 #include "chcnvpanic.h"
28 #include "charconv_tls.h"
29 #include "OstTraceDefinitions.h"
30 #ifdef OST_TRACE_COMPILER_IN_USE
31 #include "charconvTraces.h"
36 #define NON_DEBUG_INLINE
38 #define NON_DEBUG_INLINE inline
41 GLREF_D const SCnvConversionData codePage1252ConversionData;
42 GLREF_D const SCnvConversionData iso88591ConversionData;
43 GLREF_D const SCnvConversionData asciiConversionData;
44 GLREF_D const SCnvConversionData sms7BitConversionData;
45 GLREF_D const SCnvConversionData unicodeConversionDataLittle;
46 GLREF_D const SCnvConversionData unicodeConversionDataBig;
48 GLREF_C void IsCharacterSetAscii(TInt& aConfidenceLevel, const TDesC8& aSample);
49 GLREF_C void IsCharacterSetSMS7Bit(TInt& aConfidenceLevel, const TDesC8& aSample);
50 GLREF_C void IsCharacterSetISO88591(TInt& aConfidenceLevel, const TDesC8& aSample);
51 GLREF_C void IsCharacterSetCP1252(TInt& aConfidenceLevel, const TDesC8& aSample);
52 GLREF_C void IsCharacterSetUTF8(TInt& aConfidenceLevel, const TDesC8& aSample);
53 GLREF_C void IsCharacterSetUTF7(TInt& aConfidenceLevel, const TDesC8& aSample);
54 GLREF_C void IsCharacterSetUnicodeLittle(TInt& aConfidenceLevel, const TDesC8& aSample);
55 GLREF_C void IsCharacterSetUnicodeBig(TInt& aConfidenceLevel, const TDesC8& aSample);
57 _LIT(KLitWildCard, "*");
59 _LIT(KLitSystemCharconvDirectory, "\\resource\\charconv\\");
60 _LIT(KLitROMSystemCharconvDirectory, "z:\\resource\\charconv\\");
62 _LIT(KLitCharacterSetNameUtf7, "UTF-7");
63 _LIT(KLitCharacterSetNameUtf8, "UTF-8");
64 _LIT(KLitCharacterSetNameImapUtf7, "IMAP UTF-7");
65 _LIT(KLitCharacterSetNameJavaConformantUtf8, "Java UTF-8");
66 _LIT(KLitCharacterSetNameCodePage1252, "Code Page 1252");
67 _LIT(KLitCharacterSetNameIso88591, "ISO-8859-1");
68 _LIT(KLitCharacterSetNameAscii, "ASCII");
69 _LIT(KLitCharacterSetNameUnicodeLittle, "Little-Endian UNICODE");
70 _LIT(KLitCharacterSetNameUnicodeBig, "Big-Endian UNICODE");
71 _LIT(KLitCharacterSetNameSms7Bit, "SMS 7-bit");
72 _LIT8(KLit8AsciiSubstituteCharacter, "\x1a");
73 _LIT8(KLit8Sms7BitSubstituteCharacter, "\x3f");
75 const TUint KNoConversionAvailable=KMaxTUint;
77 const TUint KCharacterSetIdentifierWin1252=0x101F873B; // same as built-in cp1252, just to be compliance with S60 CP1252
81 EConversionDataFilePositionOfName=24,
82 EConversionDataFileMaximumLengthOfName=KMaxTUint8
85 LOCAL_C TBool StandardNamesMatch(const TDesC8& aStandardName1, const TDesC8& aStandardName2)
87 return aStandardName1.CompareF(aStandardName2)==0; // "no distinction is made between use of upper and lower case letters" as stated by ftp.isi.edu/in-notes/iana/assignments/character-sets
90 LOCAL_C void ResetAndDestroyRImplInfoPtrArray(TAny* aPtr)
92 RImplInfoPtrArray* array = reinterpret_cast <RImplInfoPtrArray*> (aPtr);
93 array->ResetAndDestroy();
96 LOCAL_C void CloseECOMSession(TAny*)
98 REComSession::FinalClose();
101 static void IsBuiltInCharacterSet(const TUint& aCharacterSetIdentifier,
102 TInt& aConfidenceLevel,
103 const TDesC8& aSample)
105 switch(aCharacterSetIdentifier)
107 case KCharacterSetIdentifierUtf7:
108 IsCharacterSetUTF7(aConfidenceLevel,aSample);
110 case KCharacterSetIdentifierUtf8:
111 IsCharacterSetUTF8(aConfidenceLevel,aSample);
113 case KCharacterSetIdentifierImapUtf7:
114 case KCharacterSetIdentifierJavaConformantUtf8:
116 case KCharacterSetIdentifierCodePage1252:
117 case KCharacterSetIdentifierWin1252:
118 IsCharacterSetCP1252(aConfidenceLevel,aSample);
120 case KCharacterSetIdentifierIso88591:
121 IsCharacterSetISO88591(aConfidenceLevel,aSample);
123 case KCharacterSetIdentifierAscii:
124 IsCharacterSetAscii(aConfidenceLevel,aSample);
126 case KCharacterSetIdentifierSms7Bit:
127 IsCharacterSetSMS7Bit(aConfidenceLevel,aSample);
129 case KCharacterSetIdentifierUnicodeLittle:
130 IsCharacterSetUnicodeLittle(aConfidenceLevel,aSample);
132 case KCharacterSetIdentifierUnicodeBig:
133 IsCharacterSetUnicodeBig(aConfidenceLevel,aSample);
137 OstTraceExt3( TRACE_DUMP, _ISBUILTINCHARACTERSET, "::IsBuiltInCharacterSet;aCharacterSetIdentifier=%u;aConfidenceLevel=%d;aSample=%x", aCharacterSetIdentifier, aConfidenceLevel, ( TUint )&( aSample ) );
138 Panic(EPanicCharacterSetNotPresent);
145 void TTlsData::CharacterSetConverterIsBeingCreatedL()
147 TTlsData* tlsData=STATIC_CAST(TTlsData*, Dll::Tls());
150 ++tlsData->iReferenceCount;
154 tlsData=new(ELeave) TTlsData;
155 CleanupStack::PushL(tlsData);
156 User::LeaveIfError(Dll::SetTls(tlsData));
157 CleanupStack::Pop(); // tlsData
161 void TTlsData::CharacterSetConverterIsBeingDestroyed()
163 TTlsData* tlsData=STATIC_CAST(TTlsData*, Dll::Tls());
166 if ( tlsData->iCurrentCharacterSetConverter!=NULL )
168 OstTrace0( TRACE_DUMP, TTLSDATA_CHARACTERSETCONVERTERISBEINGDESTROYED, "EPanicDestructionDuringConversion" );
170 __ASSERT_DEBUG(tlsData->iCurrentCharacterSetConverter==NULL, Panic(EPanicDestructionDuringConversion));
171 --tlsData->iReferenceCount;
172 if ( tlsData->iReferenceCount < 0 )
174 OstTrace0( TRACE_DUMP, DUP1_TTLSDATA_CHARACTERSETCONVERTERISBEINGDESTROYED, "EPanicBadTlsDataReferenceCount" );
176 __ASSERT_DEBUG(tlsData->iReferenceCount>=0, Panic(EPanicBadTlsDataReferenceCount));
177 if (tlsData->iReferenceCount<=0)
185 void TTlsData::SetCurrentCharacterSetConverter(const CCnvCharacterSetConverter* aCharacterSetConverter)
187 TTlsData* tlsData=STATIC_CAST(TTlsData*, Dll::Tls());
190 OstTrace0( TRACE_FATAL, DUP1_TTLSDATA_SETCURRENTCHARACTERSETCONVERTER, "No Tls Data in TTlsData::SetCurrentCharacterSetConverter" );
192 __ASSERT_ALWAYS(tlsData!=NULL, Panic(EPanicNoTlsData));
193 if ( (tlsData->iCurrentCharacterSetConverter==NULL)==(aCharacterSetConverter==NULL) )
195 OstTrace0( TRACE_FATAL, TTLSDATA_SETCURRENTCHARACTERSETCONVERTER, "Bad Toggle of current characater set converter in TTlsData::SetCurrentCharacterSetConverter" );
197 __ASSERT_ALWAYS((tlsData->iCurrentCharacterSetConverter==NULL)!=(aCharacterSetConverter==NULL), Panic(EPanicBadToggleOfCurrentCharacterSetConverter));
198 tlsData->iCurrentCharacterSetConverter=aCharacterSetConverter;
201 EXPORT_C const CCnvCharacterSetConverter* TTlsData::CurrentCharacterSetConverter()
203 TTlsData* tlsData=STATIC_CAST(TTlsData*, Dll::Tls());
204 return (tlsData!=NULL)? tlsData->iCurrentCharacterSetConverter: NULL;
207 // CDeepDestructingArrayOfCharactersSets
209 NONSHARABLE_CLASS(CDeepDestructingArrayOfCharactersSets) : public CArrayFixFlat<CCnvCharacterSetConverter::SCharacterSet>
212 static CDeepDestructingArrayOfCharactersSets* NewLC(TInt aGranularity);
213 virtual ~CDeepDestructingArrayOfCharactersSets();
215 CDeepDestructingArrayOfCharactersSets(TInt aGranularity);
218 CDeepDestructingArrayOfCharactersSets* CDeepDestructingArrayOfCharactersSets::NewLC(TInt aGranularity)
220 CDeepDestructingArrayOfCharactersSets* deepDestructingArrayOfCharactersSets=new(ELeave) CDeepDestructingArrayOfCharactersSets(aGranularity);
221 CleanupStack::PushL(deepDestructingArrayOfCharactersSets);
222 return deepDestructingArrayOfCharactersSets;
225 CDeepDestructingArrayOfCharactersSets::~CDeepDestructingArrayOfCharactersSets()
227 for (TInt i=Count()-1; i>=0; --i)
229 delete (*this)[i].iName;
233 CDeepDestructingArrayOfCharactersSets::CDeepDestructingArrayOfCharactersSets(TInt aGranularity)
234 :CArrayFixFlat<CCnvCharacterSetConverter::SCharacterSet>(aGranularity)
240 NONSHARABLE_CLASS(CFileReader) : public CBase
243 static CFileReader* NewLC(RFile& aFile);
244 static CFileReader* NewLC(const TUint8* aRomFile, TInt aLengthOfRomFile);
245 virtual ~CFileReader();
246 void SkipL(TInt aNumberOfBytes);
250 TInt ReadPositiveIntegerCompacted15L();
251 TInt ReadPositiveIntegerCompacted30L();
252 TInt ReadSignedIntegerCompacted29L();
253 void ReadBufferL(TDes8& aBuffer, TInt aBufferLength);
254 HBufC8* ReadBufferL(TInt aBufferLength);
255 HBufC8* ReadBufferLC(TInt aBufferLength);
256 inline TBool IsEndOfFile() const {if ( iNextByteToConsume>iOnePastEndOfBuffer ) {OstTrace0( TRACE_DUMP, _NONSHARABLE_CLASS, "EPanicPastEndOfFile" );}__ASSERT_DEBUG(iNextByteToConsume<=iOnePastEndOfBuffer, Panic(EPanicPastEndOfFile)); return iNextByteToConsume>=iOnePastEndOfBuffer;}
258 enum {ENumberOfBytesToConsumeBetweenEachReAllocation=1000};
261 CFileReader(const TUint8* aRomFile, TInt aLengthOfRomFile);
262 void ConstructForNonRomFileL(RFile& aFile);
263 NON_DEBUG_INLINE void ReAllocateTheBuffer();
265 inline void CheckPointers(TPanic aPanic) {__ASSERT_DEBUG((iNextByteToConsume!=NULL) && (iOnePastEndOfBuffer!=NULL) && (iNextByteToConsume<=iOnePastEndOfBuffer), Panic(aPanic)); if (iBuffer==NULL) {__ASSERT_DEBUG(iFlagPoleForReAllocation==NULL, Panic(aPanic));} else {__ASSERT_DEBUG(iNextByteToConsume<iFlagPoleForReAllocation, Panic(aPanic));}}
267 inline void CheckPointers(TPanic) {}
271 const TUint8* iNextByteToConsume;
272 const TUint8* iOnePastEndOfBuffer;
273 const TUint8* iFlagPoleForReAllocation;
276 void CFileReader::ReAllocateTheBuffer() // put this function first so that the compiler does actually inline it for non-DEBUG builds
278 if ( (iBuffer==NULL) || (iNextByteToConsume<iFlagPoleForReAllocation ) )
280 OstTrace0( TRACE_DUMP, CFILEREADER_REALLOCATETHEBUFFER, "EPanicNotPastFlagPoleForReAllocation" );
283 __ASSERT_DEBUG((iBuffer!=NULL) && (iNextByteToConsume>=iFlagPoleForReAllocation), Panic(EPanicNotPastFlagPoleForReAllocation));
284 const TInt lengthOfBuffer=iOnePastEndOfBuffer-iNextByteToConsume;
285 Mem::Copy(STATIC_CAST(TAny*, iBuffer), iNextByteToConsume, lengthOfBuffer);
286 const TAny* reAllocatedCell=
287 User::ReAlloc(STATIC_CAST(TAny*, iBuffer), lengthOfBuffer);
288 if ( reAllocatedCell!=iBuffer )
290 OstTrace0( TRACE_DUMP, DUP1_CFILEREADER_REALLOCATETHEBUFFER, "EPanicReAllocatedCellMoved" );
292 __ASSERT_DEBUG(reAllocatedCell==iBuffer, Panic(EPanicReAllocatedCellMoved));
293 iNextByteToConsume=iBuffer;
294 iOnePastEndOfBuffer=iBuffer+lengthOfBuffer;
295 // iFlagPoleForReAllocation can stay as it is
298 CFileReader* CFileReader::NewLC(RFile& aFile)
300 CFileReader* fileReader=new(ELeave) CFileReader;
301 CleanupStack::PushL(fileReader);
302 fileReader->ConstructForNonRomFileL(aFile);
306 CFileReader* CFileReader::NewLC(const TUint8* aRomFile, TInt aLengthOfRomFile)
308 CFileReader* fileReader=new(ELeave) CFileReader(aRomFile, aLengthOfRomFile);
309 CleanupStack::PushL(fileReader);
313 CFileReader::~CFileReader()
318 void CFileReader::SkipL(TInt aNumberOfBytes)
320 if ( aNumberOfBytes<0 )
322 OstTrace0( TRACE_DUMP, CFILEREADER_SKIPL, "EPanicNegativeNumberOfBytes" );
324 __ASSERT_DEBUG(aNumberOfBytes>=0, Panic(EPanicNegativeNumberOfBytes));
325 CheckPointers(EPanicInconsistentFileReader1);
326 const TUint8* newNextByteToConsume=iNextByteToConsume+aNumberOfBytes;
327 if (newNextByteToConsume>iOnePastEndOfBuffer)
329 OstTrace0( TRACE_FATAL, DUP2_CFILEREADER_SKIPL, "KErrCorrupt" );
330 User::Leave(KErrCorrupt);
332 iNextByteToConsume=newNextByteToConsume;
333 if ((iBuffer!=NULL) && (iNextByteToConsume>=iFlagPoleForReAllocation))
335 ReAllocateTheBuffer();
337 CheckPointers(EPanicInconsistentFileReader2);
340 TInt CFileReader::ReadUint8L()
342 CheckPointers(EPanicInconsistentFileReader3);
343 const TUint8* newNextByteToConsume=iNextByteToConsume+sizeof(TUint8);
344 if (newNextByteToConsume>iOnePastEndOfBuffer)
346 User::Leave(KErrCorrupt);
348 const TInt integer=*iNextByteToConsume;
349 iNextByteToConsume=newNextByteToConsume;
350 if ((iBuffer!=NULL) && (iNextByteToConsume>=iFlagPoleForReAllocation))
352 ReAllocateTheBuffer();
354 CheckPointers(EPanicInconsistentFileReader4);
358 TInt CFileReader::ReadUint16L() // little-endian
360 CheckPointers(EPanicInconsistentFileReader5);
361 const TUint8* newNextByteToConsume=iNextByteToConsume+sizeof(TUint16);
362 if (newNextByteToConsume>iOnePastEndOfBuffer)
364 OstTrace0( TRACE_FATAL, CFILEREADER_READUINT16L, "KErrCorrupt" );
365 User::Leave(KErrCorrupt);
367 const TInt integer=(*iNextByteToConsume|(*(iNextByteToConsume+1)<<8));
368 iNextByteToConsume=newNextByteToConsume;
369 if ((iBuffer!=NULL) && (iNextByteToConsume>=iFlagPoleForReAllocation))
371 ReAllocateTheBuffer();
373 CheckPointers(EPanicInconsistentFileReader6);
377 TUint CFileReader::ReadUint32L() // little-endian
379 CheckPointers(EPanicInconsistentFileReader7);
380 const TUint8* newNextByteToConsume=iNextByteToConsume+sizeof(TUint32);
381 if (newNextByteToConsume>iOnePastEndOfBuffer)
383 User::Leave(KErrCorrupt);
385 const TInt integer=(*iNextByteToConsume|(*(iNextByteToConsume+1)<<8)|(*(iNextByteToConsume+2)<<16)|(*(iNextByteToConsume+3)<<24));
386 iNextByteToConsume=newNextByteToConsume;
387 if ((iBuffer!=NULL) && (iNextByteToConsume>=iFlagPoleForReAllocation))
389 ReAllocateTheBuffer();
391 CheckPointers(EPanicInconsistentFileReader8);
395 TInt CFileReader::ReadPositiveIntegerCompacted15L() // big-endian
397 CheckPointers(EPanicInconsistentFileReader9);
398 const TUint8* bytePointer=iNextByteToConsume;
399 if (bytePointer>=iOnePastEndOfBuffer)
401 User::Leave(KErrCorrupt);
403 TInt integer=*bytePointer;
404 if (integer&0x00000080)
406 integer&=~0x00000080;
408 if (bytePointer>=iOnePastEndOfBuffer)
410 User::Leave(KErrCorrupt);
413 integer|=*bytePointer;
416 iNextByteToConsume=bytePointer;
417 if ((iBuffer!=NULL) && (iNextByteToConsume>=iFlagPoleForReAllocation))
419 ReAllocateTheBuffer();
421 CheckPointers(EPanicInconsistentFileReader10);
425 TInt CFileReader::ReadPositiveIntegerCompacted30L() // big-endian
427 CheckPointers(EPanicInconsistentFileReader11);
428 const TUint8* bytePointer=iNextByteToConsume;
429 if (bytePointer>=iOnePastEndOfBuffer)
431 OstTrace0( TRACE_FATAL, CFILEREADER_READPOSITIVEINTEGERCOMPACTED30L, "KErrCorrupt" );
432 User::Leave(KErrCorrupt);
434 TInt integer=*bytePointer;
435 if (integer&0x00000080)
437 integer&=~0x00000080;
439 if (bytePointer>=iOnePastEndOfBuffer)
441 OstTrace0( TRACE_FATAL, DUP1_CFILEREADER_READPOSITIVEINTEGERCOMPACTED30L, "KErrCorrupt" );
442 User::Leave(KErrCorrupt);
445 integer|=*bytePointer;
446 if (integer&0x00004000)
448 integer&=~0x00004000;
449 if (bytePointer+2>=iOnePastEndOfBuffer)
451 OstTrace0( TRACE_FATAL, DUP2_CFILEREADER_READPOSITIVEINTEGERCOMPACTED30L, "KErrCorrupt" );
452 User::Leave(KErrCorrupt);
456 integer|=*bytePointer;
459 integer|=*bytePointer;
463 iNextByteToConsume=bytePointer;
464 if ((iBuffer!=NULL) && (iNextByteToConsume>=iFlagPoleForReAllocation))
466 ReAllocateTheBuffer();
468 CheckPointers(EPanicInconsistentFileReader12);
472 TInt CFileReader::ReadSignedIntegerCompacted29L() // big-endian
474 CheckPointers(EPanicInconsistentFileReader13);
475 const TUint8* bytePointer=iNextByteToConsume;
476 if (bytePointer>=iOnePastEndOfBuffer)
478 OstTrace0( TRACE_FATAL, CFILEREADER_READSIGNEDINTEGERCOMPACTED29L, "KErrCorrupt" );
479 User::Leave(KErrCorrupt);
481 TInt integer=*bytePointer;
482 const TBool isNegative=(integer&0x00000080);
483 integer&=~0x00000080;
484 if (integer&0x00000040)
486 integer&=~0x00000040;
488 if (bytePointer>=iOnePastEndOfBuffer)
490 OstTrace0( TRACE_FATAL, DUP1_CFILEREADER_READSIGNEDINTEGERCOMPACTED29L, "KErrCorrupt" );
491 User::Leave(KErrCorrupt);
494 integer|=*bytePointer;
495 if (integer&0x00002000)
497 integer&=~0x00002000;
498 if (bytePointer+2>=iOnePastEndOfBuffer)
500 OstTrace0( TRACE_FATAL, DUP2_CFILEREADER_READSIGNEDINTEGERCOMPACTED29L, "KErrCorrupt" );
501 User::Leave(KErrCorrupt);
505 integer|=*bytePointer;
508 integer|=*bytePointer;
516 iNextByteToConsume=bytePointer;
517 if ((iBuffer!=NULL) && (iNextByteToConsume>=iFlagPoleForReAllocation))
519 ReAllocateTheBuffer();
521 CheckPointers(EPanicInconsistentFileReader14);
522 return isNegative? -integer: integer;
525 void CFileReader::ReadBufferL(TDes8& aBuffer, TInt aBufferLength)
527 if ( aBufferLength<0 )
529 OstTrace0( TRACE_DUMP, CFILEREADER_READBUFFERL, "EPanicNegativeBufferLength1" );
531 __ASSERT_DEBUG(aBufferLength>=0, Panic(EPanicNegativeBufferLength1));
532 CheckPointers(EPanicInconsistentFileReader15);
533 const TUint8* newNextByteToConsume=iNextByteToConsume+aBufferLength;
534 if (newNextByteToConsume>iOnePastEndOfBuffer)
536 OstTrace0( TRACE_FATAL, DUP1_CFILEREADER_READBUFFERL, "KErrCorrupt" );
537 User::Leave(KErrCorrupt);
539 aBuffer=TPtrC8(iNextByteToConsume, aBufferLength);
540 iNextByteToConsume=newNextByteToConsume;
541 if ((iBuffer!=NULL) && (iNextByteToConsume>=iFlagPoleForReAllocation))
543 ReAllocateTheBuffer();
545 CheckPointers(EPanicInconsistentFileReader16);
548 HBufC8* CFileReader::ReadBufferL(TInt aBufferLength)
550 if ( aBufferLength<0 )
552 OstTrace0( TRACE_DUMP, DUP2_CFILEREADER_READBUFFERL, "EPanicNegativeBufferLength2" );
554 __ASSERT_DEBUG(aBufferLength>=0, Panic(EPanicNegativeBufferLength2));
555 CheckPointers(EPanicInconsistentFileReader17);
556 const TUint8* newNextByteToConsume=iNextByteToConsume+aBufferLength;
557 if (newNextByteToConsume>iOnePastEndOfBuffer)
559 OstTrace0( TRACE_FATAL, DUP3_CFILEREADER_READBUFFERL, "KErrCorrupt" );
560 User::Leave(KErrCorrupt);
562 HBufC8* buffer=TPtrC8(iNextByteToConsume, aBufferLength).AllocL();
563 iNextByteToConsume=newNextByteToConsume;
564 if ((iBuffer!=NULL) && (iNextByteToConsume>=iFlagPoleForReAllocation))
566 ReAllocateTheBuffer();
568 CheckPointers(EPanicInconsistentFileReader18);
572 HBufC8* CFileReader::ReadBufferLC(TInt aBufferLength)
574 HBufC8* buffer=ReadBufferL(aBufferLength);
575 CleanupStack::PushL(buffer);
579 CFileReader::CFileReader()
581 iNextByteToConsume(NULL),
582 iOnePastEndOfBuffer(NULL),
583 iFlagPoleForReAllocation(NULL)
587 CFileReader::CFileReader(const TUint8* aRomFile, TInt aLengthOfRomFile)
589 iNextByteToConsume(aRomFile),
590 iOnePastEndOfBuffer(aRomFile+aLengthOfRomFile),
591 iFlagPoleForReAllocation(NULL)
595 void CFileReader::ConstructForNonRomFileL(RFile& aFile)
598 if ( aFile.Size(lengthOfBuffer) < 0 )
600 OstTrace0( TRACE_FATAL, DUP1_CFILEREADER_CONSTRUCTFORNONROMFILEL, "aFile.Size(lengthOfBuffer) < 0" );
602 User::LeaveIfError(aFile.Size(lengthOfBuffer));
603 iBuffer=STATIC_CAST(TUint8*, User::AllocL(lengthOfBuffer+1));
604 TPtr8 buffer(iBuffer, 0, lengthOfBuffer);
605 User::LeaveIfError(aFile.Read(buffer));
606 if ((buffer.Length()!=lengthOfBuffer) || (lengthOfBuffer<=0))
608 OstTrace0( TRACE_FATAL, CFILEREADER_CONSTRUCTFORNONROMFILEL, "KErrCorrupt" );
609 User::Leave(KErrCorrupt);
611 iNextByteToConsume=iBuffer;
612 iOnePastEndOfBuffer=iBuffer+lengthOfBuffer;
613 iFlagPoleForReAllocation=iBuffer+ENumberOfBytesToConsumeBetweenEachReAllocation;
616 // CStandardNamesAndMibEnums
618 NONSHARABLE_CLASS(CStandardNamesAndMibEnums) : public CBase
621 static CStandardNamesAndMibEnums* NewLC();
622 virtual ~CStandardNamesAndMibEnums();
623 void AddFromFileL(RFs& aFileServerSession, const TDesC& aFileName);
624 TUint Identifier(const TDesC8& aStandardName) const;
625 TUint Identifier(TInt aMibEnum) const;
626 HBufC8* StandardNameL(TUint aIdentifier) const;
627 TInt MibEnum(TUint aIdentifier) const;
629 /** Stores information about a non-Unicode character set. The information
630 is used to locate the conversion information required by ConvertFromUnicode()
631 and ConvertToUnicode().
633 An array of these structs, which contains all available character sets,
634 can be generated by CreateArrayOfCharacterSetsAvailableLC() and
635 CreateArrayOfCharacterSetsAvailableL(),
636 and is used by one of the overloads of PrepareToConvertToOrFromL(). */
639 inline SCharacterSet(TUint aIdentifier, TInt aNumberOfStandardNames, TInt aNumberOfMibEnums) :iIdentifier(aIdentifier), iArrayOfStandardNames(Max(aNumberOfStandardNames, 1)), iArrayOfMibEnums(Max(aNumberOfMibEnums, 1)) {}
640 const TUint iIdentifier;
641 RPointerArray<HBufC8> iArrayOfStandardNames;
642 RArray<TInt> iArrayOfMibEnums;
645 CStandardNamesAndMibEnums();
646 TBool CharacterSetExists(TUint aIdentifier, TInt& aIndex) const;
647 static TInt CompareFunction(const SCharacterSet& aCharacterSet1, const SCharacterSet& aCharacterSet2);
649 RArray<SCharacterSet> iArrayOfCharacterSets;
652 CStandardNamesAndMibEnums* CStandardNamesAndMibEnums::NewLC()
654 CStandardNamesAndMibEnums* standardNamesAndMibEnums=new(ELeave) CStandardNamesAndMibEnums;
655 CleanupStack::PushL(standardNamesAndMibEnums);
656 return standardNamesAndMibEnums;
659 CStandardNamesAndMibEnums::~CStandardNamesAndMibEnums()
661 for (TInt i=iArrayOfCharacterSets.Count()-1; i>=0; --i)
663 SCharacterSet& characterSet=iArrayOfCharacterSets[i];
664 characterSet.iArrayOfStandardNames.ResetAndDestroy();
665 characterSet.iArrayOfStandardNames.Close();
666 characterSet.iArrayOfMibEnums.Close();
668 iArrayOfCharacterSets.Close();
671 void CStandardNamesAndMibEnums::AddFromFileL(RFs& aFileServerSession, const TDesC& aFileName)
673 const TUint8* const romFile=aFileServerSession.IsFileInRom(aFileName);
675 CFileReader* fileReader=NULL;
679 User::LeaveIfError(aFileServerSession.Entry(aFileName, entry));
680 fileReader=CFileReader::NewLC(romFile, entry.iSize);
684 CleanupClosePushL(file);
685 User::LeaveIfError(file.Open(aFileServerSession, aFileName, EFileShareReadersOnly|EFileStream|EFileRead));
686 fileReader=CFileReader::NewLC(file);
688 fileReader->SkipL(16); // skip the UIDs
689 while (!fileReader->IsEndOfFile())
691 const TUint identifier=fileReader->ReadUint32L();
692 const TInt numberOfStandardNames=fileReader->ReadPositiveIntegerCompacted15L();
693 const TInt numberOfMibEnums=fileReader->ReadPositiveIntegerCompacted15L();
694 SCharacterSet* characterSet=NULL;
695 TInt indexOfCharacterSet;
696 if (CharacterSetExists(identifier, indexOfCharacterSet))
698 characterSet=&iArrayOfCharacterSets[indexOfCharacterSet];
702 User::LeaveIfError(iArrayOfCharacterSets.Insert(SCharacterSet(identifier, numberOfStandardNames, numberOfMibEnums), indexOfCharacterSet));
703 characterSet=&iArrayOfCharacterSets[indexOfCharacterSet];
706 for (i=0; i<numberOfStandardNames; ++i)
708 const TInt lengthOfStandardName=fileReader->ReadPositiveIntegerCompacted15L();
709 User::LeaveIfError(characterSet->iArrayOfStandardNames.Append(fileReader->ReadBufferLC(lengthOfStandardName)));
710 CleanupStack::Pop(); // fileReader->ReadBufferLC(lengthOfStandardName)
712 for (i=0; i<numberOfMibEnums; ++i)
714 User::LeaveIfError(characterSet->iArrayOfMibEnums.Append(fileReader->ReadPositiveIntegerCompacted30L()));
717 CleanupStack::PopAndDestroy((romFile!=NULL)? 1: 2); // fileReader and (possibly) file
721 TUint CStandardNamesAndMibEnums::Identifier(const TDesC8& aStandardName) const
723 for (TInt i=iArrayOfCharacterSets.Count()-1; i>=0; --i)
725 const SCharacterSet& characterSet=iArrayOfCharacterSets[i];
726 for (TInt j=characterSet.iArrayOfStandardNames.Count()-1; j>=0; --j)
728 if (StandardNamesMatch(*characterSet.iArrayOfStandardNames[j], aStandardName))
730 return characterSet.iIdentifier;
737 TUint CStandardNamesAndMibEnums::Identifier(TInt aMibEnum) const
739 for (TInt i=iArrayOfCharacterSets.Count()-1; i>=0; --i)
741 const SCharacterSet& characterSet=iArrayOfCharacterSets[i];
742 for (TInt j=characterSet.iArrayOfMibEnums.Count()-1; j>=0; --j)
744 if (characterSet.iArrayOfMibEnums[j]==aMibEnum)
746 return characterSet.iIdentifier;
753 HBufC8* CStandardNamesAndMibEnums::StandardNameL(TUint aIdentifier) const
755 TInt indexOfCharacterSet;
756 if (CharacterSetExists(aIdentifier, indexOfCharacterSet))
758 const RPointerArray<HBufC8>& arrayOfStandardNames=iArrayOfCharacterSets[indexOfCharacterSet].iArrayOfStandardNames;
759 if (arrayOfStandardNames.Count()>0)
761 return arrayOfStandardNames[0]->AllocL();
767 TInt CStandardNamesAndMibEnums::MibEnum(TUint aIdentifier) const
769 TInt indexOfCharacterSet;
770 if (CharacterSetExists(aIdentifier, indexOfCharacterSet))
772 const RArray<TInt>& arrayOfMibEnums=iArrayOfCharacterSets[indexOfCharacterSet].iArrayOfMibEnums;
773 if (arrayOfMibEnums.Count()>0)
775 return arrayOfMibEnums[0];
781 CStandardNamesAndMibEnums::CStandardNamesAndMibEnums()
782 :iArrayOfCharacterSets(5)
786 TBool CStandardNamesAndMibEnums::CharacterSetExists(TUint aIdentifier, TInt& aIndex) const
788 TUint characterSet[sizeof(SCharacterSet)/sizeof(TUint)]; // use this as a pretend SCharacterSet object (the only field of it that will be used is iIdentifier)
789 characterSet[_FOFF(SCharacterSet, iIdentifier)/sizeof(TUint)]=aIdentifier;
791 for (TInt i=iArrayOfCharacterSets.Count()-1; i>0; --i) // i>0 (rather than i>=0) is correct as we are comparing the character set identifier at [i] with the one at [i-1]
793 __ASSERT_DEBUG(CompareFunction(iArrayOfCharacterSets[i-1], iArrayOfCharacterSets[i])<0, Panic(EPanicCharacterSetsNotSorted));
796 return iArrayOfCharacterSets.FindInOrder(*REINTERPRET_CAST(const SCharacterSet*, characterSet), aIndex, TLinearOrder<SCharacterSet>(CompareFunction))==KErrNone;
799 TInt CStandardNamesAndMibEnums::CompareFunction(const SCharacterSet& aCharacterSet1, const SCharacterSet& aCharacterSet2)
801 return aCharacterSet2.iIdentifier-aCharacterSet1.iIdentifier;
804 ///////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
805 // class CCharsetCnvCache
808 CCharsetCnvCache is used to accelerate the access to character set converter implementations.
809 On a client request the CCharsetCnvCache instance will load the required character set converter
810 implementation if it is not loaded yet and give it to the client. If the requested
811 character set converter is in the cache, it will be used and no time will be spend for loading it.
812 The type of the used caching algorithm is LRU.
813 The implementation UID of the converter is used as a key, uniquely identifying cache entries.
814 GetConverterL()/Converter() return results should not be stored across the calls. The cache
815 has limited max size. It will remove the last entries if it reaches its max limit - that may
816 make stored GetConverterL()/Converter() return results invalid.
819 NONSHARABLE_CLASS(CCharsetCnvCache) : public CBase
824 /** Default cache size*/
825 KDefaultMaxCacheSize = 32
829 /** Min allowed cache size*/
834 static CCharsetCnvCache* NewL();
835 virtual ~CCharsetCnvCache();
837 CCharacterSetConverterPluginInterface* GetConverterL(TUid aImplUid);
838 CCharacterSetConverterPluginInterface* Converter(TUid aImplUid);
839 void SetMaxSize(TInt aSize);
843 The class represents an entry in CCharsetCnvCache cache.
846 NONSHARABLE_CLASS(TCharsetCnvEntry)
849 static TInt Offset();
852 CCharacterSetConverterPluginInterface* iCharsetCnv;
857 TSglQue<TCharsetCnvEntry> iCache;
861 TCharsetCnvEntry* Find(TUid aImplUid);
862 TCharsetCnvEntry* CreateNewL(TUid aImplUid);
868 @return The offset of iLink data member from the beginning of CCharsetCnvCache::TCharsetCnvEntry
869 object. The method is used internally - the character set converter cache implementation
873 TInt CCharsetCnvCache::TCharsetCnvEntry::Offset()
875 return (_FOFF(TCharsetCnvEntry, iLink));
879 Standard factory method for CCharsetCnvCache objects creation.
881 @return A pointer to the created CCharsetCnvCache instance.
884 CCharsetCnvCache* CCharsetCnvCache::NewL()
886 CCharsetCnvCache* self = new (ELeave) CCharsetCnvCache;
892 CCharsetCnvCache::~CCharsetCnvCache()
894 //Destroy all cache entries - destroy the implementation, delete the entry.
895 TSglQueIter<TCharsetCnvEntry> it(iCache);
897 TCharsetCnvEntry* entry;
898 while((entry = it++) != NULL)
900 delete entry->iCharsetCnv;
904 //If iCacheSize is not 0, then there is something wrong with adding/removing cache entry functionality
905 if ( iCacheSize != 0)
907 OstTrace0( TRACE_DUMP, CCHARSETCNVCACHE_CCHARSETCNVCACHE, "iCacheSize not zero in CCharsetCnvCache::~CCharsetCnvCache" );
909 __ASSERT_DEBUG(iCacheSize == 0, User::Invariant());
913 The method searches the cache for a character set converter, which implementation UID matches
914 aImplUid argument. If such converter does not exist in the cache - its implementaion will
915 be loaded and cached. If the cache has more than iMaxCacheSize entries, the last cache entry
916 will be removed. The found/loaded library will be moved to be the first entry in the cache.
917 The implementation UID of the converter is used as a key, uniquely identifying the cache entries.
918 @param aImplUid Implementation UID of the required character set converter.
919 @return A pointer to CCharacterSetConverterPluginInterface instance.
921 @leave System-wide error codes as well - loading converter implementation related problems.
922 @panic User::Invariant() The returned cache entry is NULL.
924 CCharacterSetConverterPluginInterface* CCharsetCnvCache::GetConverterL(TUid aImplUid)
926 TCharsetCnvEntry* entry = Find(aImplUid);
928 {//The requested entry exists in the cache.
929 //1) Remove the entry (iCache object maintains a list of pointers).
930 //2) Add it as a first entry in the cache. It guarantees that if a cache overflow
931 //happens, the last used/loaded cache entry won't be removed and destroyed.
932 iCache.Remove(*entry);
933 iCache.AddFirst(*entry);
936 {//The requested entry is not in the cache - load it.
937 //If the cache gets too big - remove and destroy the last cache entry.
938 TCharsetCnvEntry* newEntry = CreateNewL(aImplUid);
939 iCache.AddFirst(*newEntry);
940 entry = iCache.First();
941 if(++iCacheSize > iMaxCacheSize)
949 OstTrace0( TRACE_FATAL, CCHARSETCNVCACHE_GETCONVERTERL, "entry NULL in CCharsetCnvCache::GetConverterL" );
951 __ASSERT_ALWAYS(entry, User::Invariant());
952 return entry->iCharsetCnv;
956 The method searches the cache for a character set converter, which implementation UID matches
957 the supplied UID argument. If such converter does not exist in the cache - the method panics.
958 The implementation UID of the converter is used as a key, uniquely identifying the cache entries.
959 @param aImplUid Implementation UID of the required character set converter.
960 @return A pointer to CCharacterSetConverterPluginInterface instance.
961 @panic EPanicCharacterSetConverterNotLoaded There is no converter implementation in the cache, which
962 implementation UID is equal to aImplUid.
964 CCharacterSetConverterPluginInterface* CCharsetCnvCache::Converter(TUid aImplUid)
966 TCharsetCnvEntry* entry = Find(aImplUid);
967 if ( entry == NULL || entry->iCharsetCnv == NULL )
969 OstTrace0( TRACE_FATAL, CCHARSETCNVCACHE_CONVERTER, "entry or entry->iCharsetCnv NULL in CCharsetCnvCache::Converter" );
971 __ASSERT_ALWAYS(entry != NULL && entry->iCharsetCnv != NULL, Panic(EPanicCharacterSetConverterNotLoaded));
972 iCache.Remove(*entry);
973 iCache.AddFirst(*entry);
974 return entry->iCharsetCnv;
978 The method sets the max size of the character set converter cache.
979 By default (if SetMaxSize() is never called) the max cache size is limited to
980 KDefaultMaxCacheSize entries.
981 Note: Setting very small cache size will impact the overall performance of CHARCONV functions.
982 @param aSize The new max cache size. It must be bigger or equal to KMinCacheSize.
983 @panic User::Invariant() if the new max cache size is less than KMinCacheSize.
984 @see KDefaultMaxCacheSize
987 void CCharsetCnvCache::SetMaxSize(TInt aSize)
989 if ( aSize < KMinCacheSize )
991 OstTrace0( TRACE_FATAL, CCHARSETCNVCACHE_SETMAXSIZE, "aSize < KMinCacheSize in CCharsetCnvCache::SetMaxSize" );
993 __ASSERT_ALWAYS(aSize >= KMinCacheSize, User::Invariant());
994 //Remove and destroy the last cache entries, if iCacheSize > aSize.
995 for(;iCacheSize>aSize;--iCacheSize)
999 iMaxCacheSize = aSize;
1004 CCharsetCnvCache::CCharsetCnvCache() :
1005 iMaxCacheSize(KDefaultMaxCacheSize),
1007 iCache(TCharsetCnvEntry::Offset())
1012 The method searches the cache for a converter which implementation UID matches aImplUid argument.
1013 If such entry exists, a pointer to it will be returned.
1014 @param aImplUid Implementation UID of the searched character set converter.
1015 @return A pointer to the found cache entry or NULL if there is no such entry.
1017 CCharsetCnvCache::TCharsetCnvEntry* CCharsetCnvCache::Find(TUid aImplUid)
1019 TSglQueIter<TCharsetCnvEntry> it(iCache);
1021 TCharsetCnvEntry* entry = NULL;
1022 while((entry = it++) != NULL && entry->iImplUid != aImplUid)
1029 The method creates a new CCharsetCnvCache::TCharsetCnvEntry instance in the heap. It will load
1030 the required character set converter plugin.
1031 @param aImplUid Implementation UID of the character set converter to be loaded.
1032 @return A pointer to the created CCharsetCnvCache::TCharsetCnvEntry instance.
1034 @leave System-wide error codes as well - loading converter plugin related problems.
1035 @panic User::Invariant(), if the loaded library does not export all expected functions.
1037 CCharsetCnvCache::TCharsetCnvEntry* CCharsetCnvCache::CreateNewL(TUid aImplUid)
1039 CCharsetCnvCache::TCharsetCnvEntry* newEntry = new (ELeave) CCharsetCnvCache::TCharsetCnvEntry;
1040 CleanupStack::PushL(newEntry);
1042 newEntry->iCharsetCnv = CCharacterSetConverterPluginInterface::NewL(aImplUid);
1043 newEntry->iImplUid = aImplUid;
1045 CleanupStack::Pop(newEntry);
1050 The method removes and destroys the last cache entry.
1051 The related converter implementation will be destroyed, the entry - deleted.
1052 @panic User::Invariant() If the last cache entry is NULL.
1054 void CCharsetCnvCache::RemoveLast()
1056 TCharsetCnvEntry* lastEntry = iCache.Last();
1059 OstTrace0( TRACE_FATAL, CCHARSETCNVCACHE_REMOVELAST, "lastEntry NULL in CCharsetCnvCache::RemoveLast" );
1061 __ASSERT_ALWAYS(lastEntry, User::Invariant());
1062 iCache.Remove(*lastEntry);
1063 delete lastEntry->iCharsetCnv;
1067 // CCnvCharacterSetConverter
1069 /** Allocates and constructs a CCnvCharacterSetConverter object. If there is
1070 insufficient memory to create the object, the function leaves.
1072 Since the memory is allocated on the heap, objects of this type should be
1073 destroyed using the delete operator when the required conversions are complete.
1075 @return The newly created object. */
1076 EXPORT_C CCnvCharacterSetConverter* CCnvCharacterSetConverter::NewL()
1078 CCnvCharacterSetConverter* characterSetConverter=NewLC();
1079 CleanupStack::Pop(); // characterSetConverter
1080 return characterSetConverter;
1083 /** Allocates and constructs a CCnvCharacterSetConverter object, and leaves the
1084 object on the cleanup stack. If there is insufficient memory to create the
1085 object, the function leaves.
1087 Since the memory is allocated on the heap, objects of this type should be
1088 destroyed using either the CleanupStack::Pop() function and then the delete
1089 operator, or the CleanupStack::PopAndDestroy() function.
1091 @return The newly created object. */
1092 EXPORT_C CCnvCharacterSetConverter* CCnvCharacterSetConverter::NewLC()
1094 CCnvCharacterSetConverter* characterSetConverter=new(ELeave) CCnvCharacterSetConverter;
1095 characterSetConverter->iTlsDataConstructed=EFalse;
1096 CleanupStack::PushL(characterSetConverter);
1097 characterSetConverter->ConstructL();
1098 return characterSetConverter;
1102 /** The destructor frees all resources owned by the object, prior to its
1104 EXPORT_C CCnvCharacterSetConverter::~CCnvCharacterSetConverter()
1106 delete iStandardNamesAndMibEnums;
1107 if (iTlsDataConstructed)
1109 TTlsData::CharacterSetConverterIsBeingDestroyed();
1111 delete iCharsetCnvCache;
1112 REComSession::FinalClose();
1116 /** Creates an array identifying all the character sets for which conversion is
1117 available. These can be character sets for which conversion is built into
1118 Symbian OS, or they may be character sets for which conversion is implemented
1121 The array returned can be used by one of the PrepareToConvertToOrFromL()
1122 overloads to provide a list of all the character sets available for conversion.
1123 The caller of this function is responsible for deleting the array, and should
1126 Not all encoders returned will be suitable for conversion from Unicode.
1127 Such encoders have no name and no MIB enum and so will generally not be understood by
1128 a receiving process. The function ConvertCharacterSetIdentifierToMibEnumL can be used
1129 to determine whether this is the case or not.
1131 @param aFileServerSession A file server session. This is no longer used, but is kept for Binary Compatibility.
1132 @return An array identifying all supported character sets. */
1133 EXPORT_C CArrayFix<CCnvCharacterSetConverter::SCharacterSet>*
1134 CCnvCharacterSetConverter::CreateArrayOfCharacterSetsAvailableL(RFs& aFileServerSession)
1137 CArrayFix<SCharacterSet>* arrayOfCharacterSetsAvailable=CreateArrayOfCharacterSetsAvailableLC(aFileServerSession);
1138 CleanupStack::Pop(); // arrayOfCharacterSetsAvailable
1139 return arrayOfCharacterSetsAvailable;
1144 /** Creates an array identifying all the character sets for which conversion is
1145 available and pushes a pointer to it onto the cleanup stack. These can be
1146 character sets for which conversion is built into Symbian OS, or they may
1147 be character sets for which conversion is implemented by a plug-in DLL.
1149 The array returned can be used by one of the PrepareToConvertToOrFromL()
1150 overloads to provide a list of all the character sets available for conversion.
1151 The caller of this function is responsible for deleting the array, and should
1154 Not all encoders returned will be suitable for conversion from Unicode.
1155 Such encoders have no name and no MIB enum and so will generally not be understood by
1156 a receiving process. The function ConvertCharacterSetIdentifierToMibEnumL can be used
1157 to determine whether this is the case or not.
1159 This is a static function which uses ECOM functionality. It cleans up ECOM by calling FinalClose()
1161 @param aFileServerSession A file server session. This is no longer required, kept for Binary Compatibilty.
1162 @return An array of references to all supported character sets. */
1163 EXPORT_C CArrayFix<CCnvCharacterSetConverter::SCharacterSet>*
1164 CCnvCharacterSetConverter::CreateArrayOfCharacterSetsAvailableLC(RFs& aFileServerSession)
1167 CleanupStack::PushL(TCleanupItem(CloseECOMSession, NULL));
1169 CArrayFix<CCnvCharacterSetConverter::SCharacterSet>* result =
1170 DoCreateArrayOfCharacterSetsAvailableLC(aFileServerSession, 0);
1172 CleanupStack::Pop();//CArrayFix<CCnvCharacterSetConverter::SCharacterSet>* result
1173 CleanupStack::PopAndDestroy(); //CloseECOMSession
1174 CleanupStack::PushL(result);
1180 /** Gets the UID of a character set identified by its Internet-standard name
1181 (the matching is case-insensitive).
1183 If the character set specified is not one for which Symbian OS provides
1184 built-in conversion, the function searches the file system for plug-ins
1185 which implement the conversion and which provide the name-to-UID mapping
1188 @param aStandardNameOfCharacterSet Internet-standard name of a character set.
1189 @param aFileServerSession Connection to a file server session.
1190 @return The UID for the character set if the character set with a Internet-standard name
1191 has a known name and MIB enum.Otherwise zero is returned. */
1193 CCnvCharacterSetConverter::ConvertStandardNameOfCharacterSetToIdentifierL(
1194 const TDesC8& aStandardNameOfCharacterSet,
1195 RFs& aFileServerSession)
1197 if (iStandardNamesAndMibEnums==NULL)
1199 ScanForStandardNamesAndMibEnumsROMOnlyL(aFileServerSession);
1201 TUint result=iStandardNamesAndMibEnums->Identifier(aStandardNameOfCharacterSet);
1206 if(!iIsSystemStandardNamesAndMibEnumsScanned)
1208 //If SNM files in system haven't been scan yet, scan them
1209 ScanForStandardNamesAndMibEnumsL(aFileServerSession);
1210 iIsSystemStandardNamesAndMibEnumsScanned = ETrue;
1211 return iStandardNamesAndMibEnums->Identifier(aStandardNameOfCharacterSet);
1215 //iStandardNamesAndMibEnums has included those snm files in system
1221 /** Returns the Internet-standard name of a character set identified in Symbian
1224 If the character set specified is not one for which Symbian OS provides
1225 built-in conversion, the file system is searched for plug-ins which implement
1226 the conversion, hence the need for a file server session.
1228 @param aCharacterSetIdentifier The UID of the character set.
1229 @param aFileServerSession A file server session.
1230 @return The Internet-standard name for the character set if the character set with an identifier
1231 has a known name and MIB enum.Otherwise NULL is returned. */
1233 CCnvCharacterSetConverter::ConvertCharacterSetIdentifierToStandardNameL(
1234 TUint aCharacterSetIdentifier,
1235 RFs& aFileServerSession)
1237 if (iStandardNamesAndMibEnums==NULL)
1239 ScanForStandardNamesAndMibEnumsROMOnlyL(aFileServerSession);
1241 HBufC8* result = iStandardNamesAndMibEnums->StandardNameL(aCharacterSetIdentifier);
1246 if(!iIsSystemStandardNamesAndMibEnumsScanned)
1248 //If SNM files in system haven't been scan yet, scan them
1249 ScanForStandardNamesAndMibEnumsL(aFileServerSession);
1250 iIsSystemStandardNamesAndMibEnumsScanned = ETrue;
1251 return iStandardNamesAndMibEnums->StandardNameL(aCharacterSetIdentifier);
1255 //iStandardNamesAndMibEnums has included those snm files in system
1261 /** Converts a MIB enum value to the UID value of the character set.
1263 If the character set identified is not one for which Symbian OS provides
1264 built-in conversion, the function searches the file system for plug-ins
1265 which implement the conversion and which provide the MIB enum-to-UID mapping
1268 @param aMibEnumOfCharacterSet The MIB enum value of the character set.
1269 @param aFileServerSession Connection to a file server session.
1270 @return TThe UID of the character set if the character set with a Mib enum
1271 has a known name and MIB enum.Otherwise zero is returned. */
1273 CCnvCharacterSetConverter::ConvertMibEnumOfCharacterSetToIdentifierL(
1274 TInt aMibEnumOfCharacterSet,
1275 RFs& aFileServerSession)
1277 if (iStandardNamesAndMibEnums==NULL)
1279 ScanForStandardNamesAndMibEnumsROMOnlyL(aFileServerSession);
1281 TUint result = iStandardNamesAndMibEnums->Identifier(aMibEnumOfCharacterSet);
1286 if(!iIsSystemStandardNamesAndMibEnumsScanned)
1288 //If SNM files in system haven't been scan yet, scan them
1289 ScanForStandardNamesAndMibEnumsL(aFileServerSession);
1290 iIsSystemStandardNamesAndMibEnumsScanned = ETrue;
1291 return iStandardNamesAndMibEnums->Identifier(aMibEnumOfCharacterSet);
1295 //iStandardNamesAndMibEnums has included those snm files in system
1301 /** Converts the UID of a character set to its MIB enum value.
1303 If the character set identified is not one for which Symbian OS provides
1304 built-in conversion, the function searches the file system for plug-ins
1305 which implement the conversion and which provide the UID-to-MIB enum mapping
1308 @param aCharacterSetIdentifier The UID of the character set.
1309 @param aFileServerSession Connection to a file server session.
1310 @return The MIB enum value of the character set if the character set with Identifier
1311 has a known name and MIB enum.Otherwise zero is returned. */
1313 CCnvCharacterSetConverter::ConvertCharacterSetIdentifierToMibEnumL(
1314 TUint aCharacterSetIdentifier,
1315 RFs& aFileServerSession)
1317 if (iStandardNamesAndMibEnums==NULL)
1319 ScanForStandardNamesAndMibEnumsROMOnlyL(aFileServerSession);
1321 TInt result = iStandardNamesAndMibEnums->MibEnum(aCharacterSetIdentifier);
1326 if(!iIsSystemStandardNamesAndMibEnumsScanned)
1328 //If SNM files in system haven't been scan yet, scan them
1329 ScanForStandardNamesAndMibEnumsL(aFileServerSession);
1330 iIsSystemStandardNamesAndMibEnumsScanned = ETrue;
1331 return iStandardNamesAndMibEnums->MibEnum(aCharacterSetIdentifier);
1335 //iStandardNamesAndMibEnums has included those snm files in system
1340 /** Specifies the character set to convert to or from. aCharacterSetIdentifier
1341 is a UID which identifies a character set. It can be one of the character
1342 sets for which conversion is built into Symbian OS, or it may be a character
1343 set for which the conversion is implemented by a plug-in DLL.
1345 The function searches the character set array specified
1346 (aArrayOfCharacterSetsAvailable). This is an array containing all of the
1347 character sets for which conversion is available. It is created by calling
1348 CreateArrayOfCharacterSetsAvailableL() or
1349 CreateArrayOfCharacterSetsAvailableLC(). You should be sure that conversion
1350 is available for aCharacterSetIdentifier, because if not, a panic occurs.
1351 Otherwise, use the other overload of this function.
1353 Either this function or its overload, must be called before using the conversion
1354 functions ConvertFromUnicode() or ConvertToUnicode().
1356 Unlike the other overload, this function does not search the file system for
1357 plug-in conversion DLLs, (unless aArrayOfCharacterSetsAvailable is NULL).
1358 This function should be used if conversions are to be performed often, or
1359 if the conversion character set is to be selected by the user. Generating
1360 the array of all the available character sets once and searching though it
1361 is more efficient than the method used by the other overload, in which the
1362 file system may be searched every time it is invoked.
1366 The file server session argument is used to open the required character set
1367 conversion data file.
1369 The array passed to this function can also be used to provide a list from
1370 which a user can select the desired conversion character set.
1372 @param aCharacterSetIdentifier The UID of the non-Unicode character set from
1373 or to which to convert. Must not be zero, or a panic occurs.
1374 @param aArrayOfCharacterSetsAvailable Array of all character sets for which
1375 conversion is available, created by either
1376 CreateArrayOfCharacterSetsAvailableLC() or
1377 CreateArrayOfCharacterSetsAvailableL().
1378 @param aFileServerSession A file server session. No longer used, kept for Binary Compatibility */
1380 CCnvCharacterSetConverter::PrepareToConvertToOrFromL(
1381 TUint aCharacterSetIdentifier,
1382 const CArrayFix<SCharacterSet>& aArrayOfCharacterSetsAvailable,
1383 RFs& aFileServerSession)
1385 const TAvailability availability=DoPrepareToConvertToOrFromL(aCharacterSetIdentifier,
1386 &aArrayOfCharacterSetsAvailable,
1387 aFileServerSession);
1388 if (availability!=EAvailable)
1390 OstTrace0( TRACE_FATAL, CCNVCHARACTERSETCONVERTER_PREPARETOCONVERTTOORFROML, "Conversion Not found in CCnvCharacterSetConverter::PrepareToConvertToOrFromL" );
1391 User::Leave(KErrNotFound);
1395 /** Specifies the character set to convert to or from. aCharacterSetIdentifier
1396 is a UID which identifies a character set. It can be one of the character
1397 sets for which conversion is built into Symbian OS, or it may be a character
1398 set for which conversion is implemented by a plug-in DLL. In the latter case,
1399 the function searches through the file system for the DLL which implements
1400 the character conversion.
1402 Either this function or its overload must be called before using the conversion
1403 functions ConvertFromUnicode() or ConvertToUnicode().
1405 This overload of the function is simpler to use than the other and does not
1406 panic if the character set with the specified UID is not available at run
1407 timeÂ, it simply returns ENotAvailable. It should be used when the conversion
1408 character set is specified within the text object being converted, e.g. an
1409 email message, or an HTML document. If the character set is not specified,
1410 the user must be presented with a list of all available sets, so it makes
1411 sense to use the other overload.
1413 The function may need to search the file system each time it is called. If
1414 conversion takes place repeatedly over a short period, it may be more efficient
1415 to use the other overload.
1419 Although the other overload of this function is more efficient, if the
1420 character set is one for which conversion is built into Symbian OS, the
1421 difference in speed is negligible.
1423 @param aCharacterSetIdentifier The UID of the non-Unicode character set from
1424 or to which to convert. Must not be zero, or a panic occurs.
1425 @param aFileServerSession A file server session. No longer used, kept for Binary Compatibility
1426 @return The availability of the specified character set. If EAvailable is
1427 returned, then the conversion functions ConvertToUnicode() and
1428 ConvertFromUnicode() will use aCharacterSetIdentifier as the foreign character
1429 set. If ENotAvailable is returned, then the foreign character set will either
1430 be undefined (and trying to use the conversion functions will cause a panic),
1431 or if it has previously been set, it will remain unchanged. */
1432 EXPORT_C CCnvCharacterSetConverter::TAvailability
1433 CCnvCharacterSetConverter::PrepareToConvertToOrFromL(TUint aCharacterSetIdentifier,
1434 RFs& aFileServerSession)
1436 return DoPrepareToConvertToOrFromL(aCharacterSetIdentifier, NULL, aFileServerSession);
1440 /** Sets the default endian-ness used by the ConvertFromUnicode() and
1441 ConvertToUnicode() functions to convert between Unicode and non-Unicode
1444 The endian-ness of a multi-byte character set may be defined in the character
1445 set definition or, as in the case of UCS-2, be operating system dependent.
1446 If the endian-ness of the current character set is defined by the character
1447 set itself, then the default endian-ness specified by this function is ignored.
1451 The issue of endian-ness does not apply to single byte character sets
1452 as there is no byte order.
1454 This function should be called (if at all) after calling
1455 PrepareToConvertToOrFromL() and before calling ConvertFromUnicode() and/or
1458 @param aEndianness The default endian-ness of the current character set. */
1460 CCnvCharacterSetConverter::SetDefaultEndiannessOfForeignCharacters(
1461 TEndianness aDefaultEndiannessOfForeignCharacters)
1463 if ( (aDefaultEndiannessOfForeignCharacters!=ELittleEndian) && (aDefaultEndiannessOfForeignCharacters!=EBigEndian) )
1465 OstTrace0( TRACE_FATAL, CCNVCHARACTERSETCONVERTER_SETDEFAULTENDIANNESSOFFOREIGNCHARACTERS, "Bad Default Endianness Of Foreign Characters in CCnvCharacterSetConverter::SetDefaultEndiannessOfForeignCharacters" );
1467 __ASSERT_ALWAYS((aDefaultEndiannessOfForeignCharacters==ELittleEndian) || (aDefaultEndiannessOfForeignCharacters==EBigEndian), Panic(EPanicBadDefaultEndiannessOfForeignCharacters));
1468 iDefaultEndiannessOfForeignCharacters=aDefaultEndiannessOfForeignCharacters;
1472 /** Sets whether the Unicode 'line separator' and 'paragraph separator'
1473 characters (0x2028 and 0x2029 respectively) should be converted into a
1474 carriage return / line feed pair, or into a line feed only when converting
1475 from Unicode into a foreign character set. This applies to all foreign
1476 character sets that do not contain a direct equivalent of these Unicode
1479 By default, line and paragraph separators are converted into a CR/LF pair.
1480 This function should be called (if at all) after calling
1481 PrepareToConvertToOrFromL() and before calling ConvertFromUnicode() and/or
1484 @param aDowngradeForExoticLineTerminatingCharacters Specify
1485 EDowngradeExoticLineTerminatingCharactersToCarriageReturnLineFeed if
1486 line/paragraph separators should be converted into a carriage return and
1487 line feed combination and
1488 EDowngradeExoticLineTerminatingCharactersToJustLineFeed if they should be
1489 converted into line feeds only. Any other value causes the function to panic. */
1491 CCnvCharacterSetConverter::SetDowngradeForExoticLineTerminatingCharacters(
1492 TDowngradeForExoticLineTerminatingCharacters aDowngradeForExoticLineTerminatingCharacters)
1494 if ( (aDowngradeForExoticLineTerminatingCharacters!=EDowngradeExoticLineTerminatingCharactersToCarriageReturnLineFeed) && (aDowngradeForExoticLineTerminatingCharacters!=EDowngradeExoticLineTerminatingCharactersToJustLineFeed) )
1496 OstTrace0( TRACE_FATAL, CCNVCHARACTERSETCONVERTER_SETDOWNGRADEFOREXOTICLINETERMINATINGCHARACTERS, "Bad Downgrade For Exotic Line Terminating Characters1 in CCnvCharacterSetConverter::SetDowngradeForExoticLineTerminatingCharacters" );
1498 __ASSERT_ALWAYS((aDowngradeForExoticLineTerminatingCharacters==EDowngradeExoticLineTerminatingCharactersToCarriageReturnLineFeed) || (aDowngradeForExoticLineTerminatingCharacters==EDowngradeExoticLineTerminatingCharactersToJustLineFeed), Panic(EPanicBadDowngradeForExoticLineTerminatingCharacters1));
1499 iDowngradeForExoticLineTerminatingCharacters=aDowngradeForExoticLineTerminatingCharacters;
1502 /** Sets the character used to replace unconvertible characters in the output
1503 descriptor, when converting from Unicode into another character set.
1505 The default replacement for unconvertible Unicode characters is specified
1506 in the conversion data for the character set. The replacement text which is
1507 set using this function overrides the default value.
1511 If the replacement character is multi-byte, and its endian-ness is undefined
1512 in the character set, then its byte order is taken by default to be
1515 PrepareToConvertToOrFromL() undoes the effect of any previous calls to this
1516 function. So, to have any effect, this function should be called between the
1517 PrepareToConvertToOrFromL() call and the subsequent ConvertFromUnicode() call
1520 The value only applies when converting from Unicode to another character set.
1521 In Unicode, the code for 'unknown character'is always 0xFFFD.
1523 @param aReplacementForUnconvertibleUnicodeCharacters The single character
1524 which is to be used to replace unconvertible characters. */
1526 CCnvCharacterSetConverter::SetReplacementForUnconvertibleUnicodeCharactersL(
1527 const TDesC8& aReplacementForUnconvertibleUnicodeCharacters)
1529 iReplacementForUnconvertibleUnicodeCharacters=aReplacementForUnconvertibleUnicodeCharacters;
1532 /** Converts text encoded in the Unicode character set (UCS-2) into other
1535 The first overload of the function simply performs the conversion. The
1536 second overload converts the text and gets the number of characters
1537 that could not be converted. The third overload converts the text,
1538 gets the number of characters that could not be converted, and also
1539 gets the index of the first character that could not be converted. A
1540 fourth overload was introduced in v6.0 see below.All overloads cause a
1541 panic if no target character set has been selected to convert to (i.e.
1542 either overload of PrepareToConvertToOrFromL() must have
1543 been successfully called beforehand). You may also need to call
1544 SetDefaultEndiannessOfForeignCharacters() to define the
1545 endian-ness of the output descriptor.Notes:A sixteen-bit descriptor is
1546 used to hold the source Unicode encoded text, and an eight-bit
1547 descriptor is used to hold the converted non-Unicode text. Eight-bit
1548 descriptors are used because non-Unicode character sets may use a
1549 single byte per character (e.g. Code Page 1252) or more than one byte
1550 per character (e.g. GB 2312-80) or even a variable number of bytes per
1551 character (e.g. Shift-JIS).The function will fail to convert all the
1552 input descriptor if the output descriptor is not long enough to hold
1553 all the text.Unicode characters cannot be converted if there is no
1554 equivalent for them in the target character set. This does not stop
1555 the conversion, the missing character is simply replaced by the
1556 character in the target character set which represents unknown
1557 characters. This default unknown character can be changed using
1558 SetReplacementForUnconvertibleUnicodeCharactersL().
1560 @param aForeign On return, contains the converted text in a non-Unicode
1562 @param aUnicode The source Unicode text to be converted.
1563 @param aNumberOfUnconvertibleCharacters On return contains the number of
1564 characters which could not be converted.
1565 @param aIndexOfFirstUnconvertibleCharacter On return, contains the index
1566 of the first character in the input text that could not be converted. The
1567 value is negative if all characters were converted.
1568 @return The number of unconverted characters left at the end of the input
1569 descriptor (e.g. because the output descriptor is not long enough to hold
1570 all the text), or one of the error values defined in TError. */
1571 EXPORT_C TInt CCnvCharacterSetConverter::ConvertFromUnicode(TDes8& aForeign,
1572 const TDesC16& aUnicode) const
1574 TArrayOfAscendingIndices notUsed;
1575 return ConvertFromUnicode(aForeign, aUnicode, notUsed);
1578 EXPORT_C TInt CCnvCharacterSetConverter::ConvertFromUnicode(TDes8& aForeign, const TDesC16& aUnicode, TInt& aNumberOfUnconvertibleCharacters) const
1580 TArrayOfAscendingIndices indicesOfUnconvertibleCharacters;
1581 const TInt returnValue=ConvertFromUnicode(aForeign, aUnicode, indicesOfUnconvertibleCharacters);
1582 aNumberOfUnconvertibleCharacters=indicesOfUnconvertibleCharacters.NumberOfIndices();
1586 /** Converts text encoded in the Unicode character set (UCS-2) into other
1589 The first overload of the function simply performs the conversion. The second
1590 overload converts the text and gets the number of characters that could not
1591 be converted. The third overload converts the text, gets the number of
1592 characters that could not be converted, and also gets the index of the first
1593 character that could not be converted. A fourth overload was introduced in v6,
1596 All overloads cause a panic if no target character set has been selected to
1597 convert to (i.e. either overload of PrepareToConvertToOrFromL() must have
1598 been successfully called beforehand). You may also need to call
1599 SetDefaultEndiannessOfForeignCharacters() to define the endian-ness of the
1604 A sixteen-bit descriptor is used to hold the source Unicode encoded text,
1605 and an eight-bit descriptor is used to hold the converted non-Unicode text.
1606 Eight-bit descriptors are used because non-Unicode character sets may use
1607 a single byte per character (e.g. Code Page 1252) or more than one byte per
1608 character (e.g. GB 2312-80) or even a variable number of bytes per character
1611 The function will fail to convert all the input descriptor if the output
1612 descriptor is not long enough to hold all the text.
1614 Unicode characters cannot be converted if there is no equivalent for them
1615 in the target character set. This does not stop the conversion, the missing
1616 character is simply replaced by the character in the target character set
1617 which represents unknown characters. This default unknown character can be
1618 changed using SetReplacementForUnconvertibleUnicodeCharactersL().
1620 @param aForeign On return, contains the converted text in a non-Unicode
1622 @param aUnicode The source Unicode text to be converted.
1623 @param aNumberOfUnconvertibleCharacters On return contains the number of
1624 characters which could not be converted.
1625 @param aIndexOfFirstUnconvertibleCharacter On return, contains the index of
1626 the first character in the input text that could not be converted. The value
1627 is negative if all characters were converted.
1628 @return The number of unconverted characters left at the end of the input
1629 descriptor (e.g. because the output descriptor is not long enough to hold all
1630 the text), or one of the error values defined in TError. */
1631 EXPORT_C TInt CCnvCharacterSetConverter::ConvertFromUnicode(
1633 const TDesC16& aUnicode,
1634 TInt& aNumberOfUnconvertibleCharacters,
1635 TInt& aIndexOfFirstUnconvertibleCharacter) const
1637 TArrayOfAscendingIndices indicesOfUnconvertibleCharacters;
1638 const TInt returnValue=ConvertFromUnicode(aForeign, aUnicode, indicesOfUnconvertibleCharacters);
1639 aNumberOfUnconvertibleCharacters=indicesOfUnconvertibleCharacters.NumberOfIndices();
1640 aIndexOfFirstUnconvertibleCharacter=(aNumberOfUnconvertibleCharacters==0)? -1: indicesOfUnconvertibleCharacters[0];
1644 /** Converts Unicode text into another character set.
1646 Differs from the other overloads of this function by returning the indices
1647 of all of the characters in the source Unicode text which could not be converted.
1649 @param aForeign On return, contains the converted text in a non-Unicode
1651 @param aUnicode The source Unicode text to be converted.
1652 @param aIndicesOfUnconvertibleCharacters On return, holds the indices of each
1653 Unicode character in the source text which could not be converted.
1654 @return The number of unconverted characters left at the end of the input
1655 descriptor (e.g. because the output descriptor is not long enough to hold all
1656 the text), or one of the error values defined in TError. */
1657 EXPORT_C TInt CCnvCharacterSetConverter::ConvertFromUnicode(
1659 const TDesC16& aUnicode,
1660 TArrayOfAscendingIndices& aIndicesOfUnconvertibleCharacters) const
1662 if ( iCharacterSetIdentifierOfLoadedConversionData==0 )
1664 OstTrace0( TRACE_FATAL, CCNVCHARACTERSETCONVERTER_CONVERTFROMUNICODE, "NullCharacterSetIdentifier1 in CCnvCharacterSetConverter::ConvertFromUnicode" );
1666 __ASSERT_ALWAYS(iCharacterSetIdentifierOfLoadedConversionData!=0, Panic(EPanicNullCharacterSetIdentifier1));
1667 if (aUnicode.Length()==0)
1669 aForeign.SetLength(0);
1672 if (aForeign.MaxLength()==0)
1674 return aUnicode.Length();
1676 TTlsData::SetCurrentCharacterSetConverter(this);
1678 if (iStoredFlags&EStoredFlagConversionPlugInLibraryIsLoaded)
1682 implUid.iUid = iCharacterSetIdentifierOfLoadedConversionData;
1683 returnValue = (iCharsetCnvCache->Converter(implUid))->ConvertFromUnicode(
1684 iDefaultEndiannessOfForeignCharacters,
1685 iReplacementForUnconvertibleUnicodeCharacters,
1688 aIndicesOfUnconvertibleCharacters);
1692 switch (iCharacterSetIdentifierOfLoadedConversionData)
1694 case KCharacterSetIdentifierUtf7:
1695 returnValue=CnvUtfConverter::ConvertFromUnicodeToUtf7(aForeign, aUnicode, ETrue);
1697 case KCharacterSetIdentifierUtf8:
1698 returnValue=CnvUtfConverter::ConvertFromUnicodeToUtf8(aForeign, aUnicode);
1700 case KCharacterSetIdentifierImapUtf7:
1701 returnValue=CnvUtfConverter::ConvertFromUnicodeToUtf7(aForeign, aUnicode, ETrue, EFalse);
1703 case KCharacterSetIdentifierJavaConformantUtf8:
1704 returnValue=CnvUtfConverter::ConvertFromUnicodeToUtf8(aForeign, aUnicode, ETrue);
1707 __ASSERT_ALWAYS(iConversionData!=NULL, Panic(EPanicNoConversionData1));
1708 returnValue=DoConvertFromUnicode(*iConversionData, iDefaultEndiannessOfForeignCharacters, iReplacementForUnconvertibleUnicodeCharacters, aForeign, aUnicode, aIndicesOfUnconvertibleCharacters);
1712 TTlsData::SetCurrentCharacterSetConverter(NULL);
1718 /** Converts text encoded in a non-Unicode character set into the Unicode
1719 character set (UCS-2).
1721 The first overload of the function simply performs the conversion. The
1722 second overload converts the text and gets the number of bytes in the
1723 input string that could not be converted. The third overload converts
1724 the text, gets the number of bytes that could not be converted, and
1725 also gets the index of the first byte that could not be converted.All
1726 overloads cause a panic if no source character set has been selected
1727 to convert from (i.e. either overload of PrepareToConvertToOrFromL()
1728 must have been successfully called beforehand). You may also need to call
1729 SetDefaultEndiannessOfForeignCharacters() to define the
1730 endian-ness of the input descriptor.Notes: Since Unicode is intended to
1731 be the superset of all character sets, the function should usually
1732 report zero unconverted characters. Unconvertible characters will
1733 exist if the input descriptor contains illegal characters, i.e. values
1734 not in the selected non-Unicode character set.The presence of illegal
1735 characters does not stop the conversion. The missing character is
1736 simply replaced by the Unicode character which represents unknown
1737 characters (0xFFFD).If the source text consists solely of a
1738 character that is not complete, the function returns
1739 EErrorIllFormedInput. The reason for this is to prevent
1740 the possibility of the calling code getting into a infinite loop.
1742 @param aUnicode On return, contains the converted text in the Unicode
1743 character aForeign The non-Unicode source text to be converted.
1744 @param aState This is used to save state information across multiple
1745 calls to ConvertToUnicode(). You should initialise the value
1746 to KStateDefault, and then do not change it in a series of
1748 @param aNumberOfUnconvertibleCharacters On return, contains the number of
1749 bytes which were not converted.
1750 @param aIndexOfFirstByteOfFirstUnconvertibleCharacter On return, the index
1751 of the first byte of the first unconvertible character. For instance if
1752 the first character in the input descriptor (aForeign) could
1753 not be converted, then this parameter is set to the first byte of that
1754 character, i.e. zero. A negative value is returned if all the characters
1756 @return The number of unconverted bytes left at the end of the input
1757 descriptor (e.g. because the output descriptor is not long enough to hold
1758 all the text), or one of the error values defined in TError.*/
1759 EXPORT_C TInt CCnvCharacterSetConverter::ConvertToUnicode(TDes16& aUnicode,
1760 const TDesC8& aForeign,
1765 return ConvertToUnicode(aUnicode, aForeign, aState, notUsed1, notUsed2);
1768 EXPORT_C TInt CCnvCharacterSetConverter::ConvertToUnicode(TDes16& aUnicode, const TDesC8& aForeign, TInt& aState, TInt& aNumberOfUnconvertibleCharacters) const
1771 return ConvertToUnicode(aUnicode, aForeign, aState, aNumberOfUnconvertibleCharacters, notUsed);
1774 /** Converts text encoded in a non-Unicode character set into the Unicode
1775 character set (UCS-2).
1777 The first overload of the function simply performs the conversion. The second
1778 overload converts the text and gets the number of bytes in the input string
1779 that could not be converted. The third overload converts the text, gets the
1780 number of bytes that could not be converted, and also gets the index of the
1781 first byte that could not be converted.
1783 All overloads cause a panic if no source character set has been selected to
1784 convert from (i.e. either overload of PrepareToConvertToOrFromL() must have
1785 been successfully called beforehand). You may also need to call
1786 SetDefaultEndiannessOfForeignCharacters() to define the endian-ness of the
1791 Since Unicode is intended to be the superset of all character sets, the function
1792 should usually report zero unconverted characters. Unconvertible characters
1793 will exist if the input descriptor contains illegal characters, i.e. values
1794 not in the selected non-Unicode character set.
1796 The presence of illegal characters does not stop the conversion. The missing
1797 character is simply replaced by the Unicode character which represents unknown
1798 characters (0xFFFD).
1800 If the source text consists solely of a character that is not complete, the function
1801 returns EErrorIllFormedInput. The reason for this is to prevent the possibility
1802 of the calling code getting into a infinite loop.
1804 @param aUnicode On return, contains the converted text in the Unicode character
1806 @param aForeign The non-Unicode source text to be converted.
1807 @param aState This is used to save state information across multiple calls
1808 to ConvertToUnicode(). You should initialise the value to KStateDefault, and
1809 then do not change it in a series of related calls.
1810 @param aNumberOfUnconvertibleCharacters On return, contains the number of bytes
1811 which were not converted.
1812 @param aIndexOfFirstByteOfFirstUnconvertibleCharacter On return, the index
1813 of the first byte of the first unconvertible character. For instance if the
1814 first character in the input descriptor (aForeign) could not be converted,
1815 then this parameter is set to the first byte of that character, i.e. zero.
1816 A negative value is returned if all the characters were converted.
1817 @return The number of unconverted bytes left at the end of the input descriptor
1818 (e.g. because the output descriptor is not long enough to hold all the text),
1819 or one of the error values defined in TError. */
1820 EXPORT_C TInt CCnvCharacterSetConverter::ConvertToUnicode(
1822 const TDesC8& aForeign,
1824 TInt& aNumberOfUnconvertibleCharacters,
1825 TInt& aIndexOfFirstByteOfFirstUnconvertibleCharacter) const
1827 if ( iCharacterSetIdentifierOfLoadedConversionData==0 )
1829 OstTrace0( TRACE_FATAL, CCNVCHARACTERSETCONVERTER_CONVERTTOUNICODE, "Null CharacterSetIdentifier2 in CCnvCharacterSetConverter::ConvertToUnicode" );
1831 __ASSERT_ALWAYS(iCharacterSetIdentifierOfLoadedConversionData!=0, Panic(EPanicNullCharacterSetIdentifier2));
1832 aNumberOfUnconvertibleCharacters=0;
1833 aIndexOfFirstByteOfFirstUnconvertibleCharacter=-1;
1834 if (aForeign.Length()==0)
1836 aUnicode.SetLength(0);
1839 if (aUnicode.MaxLength()==0)
1841 return aForeign.Length();
1843 TTlsData::SetCurrentCharacterSetConverter(this);
1845 if (iStoredFlags&EStoredFlagConversionPlugInLibraryIsLoaded)
1848 implUid.iUid = iCharacterSetIdentifierOfLoadedConversionData;
1849 returnValue = (iCharsetCnvCache->Converter(implUid))->ConvertToUnicode(
1850 iDefaultEndiannessOfForeignCharacters,
1854 aNumberOfUnconvertibleCharacters,
1855 aIndexOfFirstByteOfFirstUnconvertibleCharacter);
1859 switch (iCharacterSetIdentifierOfLoadedConversionData)
1861 case KCharacterSetIdentifierUtf7:
1862 returnValue=CnvUtfConverter::ConvertToUnicodeFromUtf7(aUnicode, aForeign, aState);
1864 case KCharacterSetIdentifierUtf8:
1865 returnValue=CnvUtfConverter::ConvertToUnicodeFromUtf8(aUnicode, aForeign, EFalse, aNumberOfUnconvertibleCharacters, aIndexOfFirstByteOfFirstUnconvertibleCharacter);
1867 case KCharacterSetIdentifierJavaConformantUtf8:
1868 returnValue=CnvUtfConverter::ConvertToUnicodeFromUtf8(aUnicode, aForeign, ETrue, aNumberOfUnconvertibleCharacters, aIndexOfFirstByteOfFirstUnconvertibleCharacter);
1870 case KCharacterSetIdentifierImapUtf7:
1871 returnValue=CnvUtfConverter::ConvertToUnicodeFromUtf7(aUnicode, aForeign, ETrue, aState);
1874 if ( iConversionData==NULL )
1876 OstTrace0( TRACE_FATAL, DUP1_CCNVCHARACTERSETCONVERTER_CONVERTTOUNICODE, "No ConversionData2 in CCnvCharacterSetConverter::ConvertToUnicode" );
1878 __ASSERT_ALWAYS(iConversionData!=NULL, Panic(EPanicNoConversionData2));
1879 returnValue=DoConvertToUnicode(*iConversionData, iDefaultEndiannessOfForeignCharacters, aUnicode, aForeign, aNumberOfUnconvertibleCharacters, aIndexOfFirstByteOfFirstUnconvertibleCharacter);
1883 TTlsData::SetCurrentCharacterSetConverter(NULL);
1890 @see AutoDetectCharSetL
1895 EXPORT_C void CCnvCharacterSetConverter::AutoDetectCharacterSetL(
1896 TInt& aConfidenceLevel,
1897 TUint& aCharacterSetIdentifier,
1898 const CArrayFix<SCharacterSet>& aArrayOfCharacterSetsAvailable,
1899 const TDesC8& aSample)
1901 CCnvCharacterSetConverter* converter = CCnvCharacterSetConverter::NewLC();
1902 converter->AutoDetectCharSetL(aConfidenceLevel,
1903 aCharacterSetIdentifier,
1904 aArrayOfCharacterSetsAvailable,
1906 CleanupStack::Pop(converter);
1911 /** Attempts to determine the character set of the sample text from
1912 those supported on the phone.
1914 For each of the available character sets, its implementation of
1915 IsInThisCharacterSetL() is called. The character set which returns the highest
1916 confidence level (i.e. which generates the fewest 0xFFFD Unicode replacement
1917 characters) is returned in aCharacterSetIdentifier.
1919 This function merely determines if the sample text is convertible with this
1920 converter: it does no textual analysis on the result. Therefore, this function
1921 is not capable of differentiating between very similar encodings (for example
1922 the different ISO 8859 variants).
1924 Any code making use of this function should provide a way for the user to
1925 override the selection that this function makes.
1927 Please note that the operation of this function is slow.It takes no account of the usual
1928 ontext that would be used in guessing a character set (for example, the language that
1929 is expected to be encoded or the transport used). For situations where such context is known,
1930 a faster, more accurate solution is advisable.
1932 To improve a performance of autodetection, a size (default is one) of interface proxy cache
1933 should be increased (see SetCharacterSetCacheSize()).However a boost of performance
1934 will not be visible within a first funtion call because during this first call character sets
1935 are loaded to a cache. Once created it will be preserved until CCnvCharacterSetConverter
1936 object is destroyed.
1939 This is a static function which uses ECOM functionality.
1940 It cleans up ECOM by calling FinalClose()
1942 @param aConfidenceLevel Set by the function to a value between 0 and 100.
1943 0 indicates the function has no idea what character set aSample is encoded
1944 in. In this case, aCharacterSetIdentifier is undefined. 100 indicates total
1945 confidence that aCharacterSetIdentifier is the character set of aSample.
1946 @param aCharacterSetIdentifier On return, the UID of the best available
1947 character set for the sample text aSample. Character set UIDs are defined
1949 @param aArrayOfCharacterSetsAvailable The array of character sets available
1950 on the phone. If this is not already available, it can be created using
1951 CreateArrayOfCharacterSetsAvailableL() or
1952 CreateArrayOfCharacterSetsAvailableLC().
1953 @param aSample The non-Unicode sample text string. */
1954 EXPORT_C void CCnvCharacterSetConverter::AutoDetectCharSetL(
1955 TInt& aConfidenceLevel,
1956 TUint& aCharacterSetIdentifier,
1957 const CArrayFix<SCharacterSet>& aArrayOfCharacterSetsAvailable,
1958 const TDesC8& aSample)
1961 CleanupStack::PushL(TCleanupItem(CloseECOMSession, NULL));
1964 aCharacterSetIdentifier=0;
1965 // loop through the aArrayofCharacterSetAvailable
1966 TInt previousConfidenceLevel = 0;
1967 RArray<TUint> chid(25);
1968 CleanupClosePushL(chid);
1970 for (TInt i=aArrayOfCharacterSetsAvailable.Count()-1; i>=0; --i)
1972 const CCnvCharacterSetConverter::SCharacterSet& charactersSet=aArrayOfCharacterSetsAvailable[i];
1974 if (charactersSet.Identifier() == KCharacterSetIdentifierWin1252)
1975 continue; // Win1252 is same as CP1252, so just ignore it
1977 if (charactersSet.FileIsConversionPlugInLibrary())
1980 TBool plugInImplementsAutoDetect=EFalse;
1983 implUid.iUid = charactersSet.Identifier();
1984 TBool isInThisCharSet = (iCharsetCnvCache->GetConverterL(implUid))->IsInThisCharacterSetL(
1985 plugInImplementsAutoDetect,
1988 OstTraceExt3( TRACE_DUMP, CCNVCHARACTERSETCONVERTER_AUTODETECTCHARSETL, "detect identifier 0x%x, return isInThisCharSet=%d, aConfidenceLevel=%d", implUid.iUid, isInThisCharSet, aConfidenceLevel);
1989 if ((!plugInImplementsAutoDetect) || !isInThisCharSet)
1994 else if (charactersSet.NameIsFileName())
2000 TUint characterIdentifier = charactersSet.Identifier();
2001 ::IsBuiltInCharacterSet(characterIdentifier,aConfidenceLevel,aSample);
2003 if (aConfidenceLevel > previousConfidenceLevel)
2005 previousConfidenceLevel = aConfidenceLevel;
2007 User::LeaveIfError(chid.Append(charactersSet.Identifier()));
2009 else if ((aConfidenceLevel == previousConfidenceLevel) && (previousConfidenceLevel != 0))
2011 User::LeaveIfError(chid.Append(charactersSet.Identifier()));
2015 TInt min = KMaxTInt;;
2016 const TInt numberOfCandidateCharacterSets=chid.Count();
2017 if (numberOfCandidateCharacterSets ==0)
2019 OstTrace0( TRACE_DUMP, DUP2_CCNVCHARACTERSETCONVERTER_AUTODETECTCHARSETL, "We donot find any candidate in first run, so add all plugin as candidate." );
2020 // all the charcterset returned 0, so take all and find then one with least unconvertible
2022 for (TInt i=aArrayOfCharacterSetsAvailable.Count()-1; i>=0; --i)
2024 const CCnvCharacterSetConverter::SCharacterSet& charactersSettoAppend=aArrayOfCharacterSetsAvailable[i];
2025 User::LeaveIfError(chid.Append(charactersSettoAppend.Identifier()));
2028 if (numberOfCandidateCharacterSets>1)
2030 // convert and check for the number of unconvertible characters
2031 CCnvCharacterSetConverter* const charconverter=NewLC();
2032 TBuf<256>* const convertedToUnicode=new(ELeave) TBuf<256>;
2033 CleanupStack::PushL(convertedToUnicode);
2034 RFs dummyFileServerSession; // PrepareToConvertToOrFromL will not actually use this parameter
2035 for (TInt i=0; i<numberOfCandidateCharacterSets; ++i)
2037 charconverter->PrepareToConvertToOrFromL(chid[i], aArrayOfCharacterSetsAvailable, dummyFileServerSession);
2038 TInt state=KStateDefault;
2039 TInt unconvertibleChars;
2040 charconverter->ConvertToUnicode(*convertedToUnicode,aSample,state,unconvertibleChars);
2041 OstTraceExt2( TRACE_DUMP, DUP1_CCNVCHARACTERSETCONVERTER_AUTODETECTCHARSETL, "Plugin 0x%x has %d unconvertibleChars", chid[i], unconvertibleChars);
2043 if (unconvertibleChars < min)
2045 min = unconvertibleChars;
2049 CleanupStack::PopAndDestroy(2, charconverter);
2052 aConfidenceLevel=previousConfidenceLevel;
2054 //aConfidenceLevel=another;
2055 aCharacterSetIdentifier = chid[result];
2056 OstTrace1( TRACE_DUMP, DUP3_CCNVCHARACTERSETCONVERTER_AUTODETECTCHARSETL, "Use 0x%x as the auto detected plugin", aCharacterSetIdentifier);
2058 if (aConfidenceLevel <= ELowestThreshold)
2060 // go through all the charset available again and start converting the sample test
2061 // the one with the least 0xfffd is the winner !!
2063 CleanupStack::PopAndDestroy(&chid);
2064 CleanupStack::PopAndDestroy(); //CloseECOMSession
2070 @see ConvertibleToCharSetL
2075 EXPORT_C void CCnvCharacterSetConverter::ConvertibleToCharacterSetL(
2076 TInt& aConfidenceLevel,
2077 const TUint aCharacterSetIdentifier,
2078 const CArrayFix<SCharacterSet>& aArrayOfCharacterSetsAvailable,
2079 const TDesC8& aSample)
2081 CCnvCharacterSetConverter* converter = CCnvCharacterSetConverter::NewLC();
2082 converter->ConvertibleToCharSetL(aConfidenceLevel,
2083 aCharacterSetIdentifier,
2084 aArrayOfCharacterSetsAvailable,
2086 CleanupStack::Pop(converter);
2091 /** Given a character set UID aCharacterSetIdentifier,
2092 ConvertibleToCharacterSetL returns the likelihood that aSample
2093 is encoded in that character set. It goes through the array of character sets
2094 aArrayOfCharacterSetsAvailable and searches for the character set
2095 matching aCharacterSetIdentifier. The character sets
2096 IsInThisCharacterSetL function is called to determine the probability
2097 of it being encoded in that character set.
2099 This is a static function which uses ECOM functionality. It cleans up ECOM by calling FinalClose()
2102 @param aConfidenceLevel Set by the function to a value between 0 and 100. It
2103 indicates the likelihood that aSample is encoded in aCharacterSetIdentifier.
2104 @param aCharacterSetIdentifier the likelihood of aSample being
2105 encoded in that character set.
2106 @param aArrayOfCharacterSetsAvailable The array of character sets available on
2107 the device. If this is not already available, it can be created using
2108 CreateArrayOfCharacterSetsAvailableL() or
2109 CreateArrayOfCharacterSetsAvailableLC().
2110 @param aSample The non-Unicode sample text string. */
2111 EXPORT_C void CCnvCharacterSetConverter::ConvertibleToCharSetL(
2112 TInt& aConfidenceLevel,
2113 const TUint aCharacterSetIdentifier,
2114 const CArrayFix<SCharacterSet>& aArrayOfCharacterSetsAvailable,
2115 const TDesC8& aSample)
2117 CleanupStack::PushL(TCleanupItem(CloseECOMSession, NULL));
2119 aConfidenceLevel = 0;
2121 // for each charcater set in the array of character set see if it matches
2122 // aCharacterSetIdentifier
2124 TInt charsetsInArray = aArrayOfCharacterSetsAvailable.Count();
2125 for (TInt i=0; i<charsetsInArray; ++i)
2127 const CCnvCharacterSetConverter::SCharacterSet& charactersSet=aArrayOfCharacterSetsAvailable[i];
2128 if (charactersSet.Identifier()==aCharacterSetIdentifier)
2130 // found the Charset matching the UID, Use this to find the confidence Level
2131 if ((charactersSet.FileIsConversionPlugInLibrary()) && (charactersSet.NameIsFileName()))
2134 TBool plugInConvertibleTo=EFalse;
2136 implUid.iUid = charactersSet.Identifier();
2137 TBool isThisCharSet = (iCharsetCnvCache->GetConverterL(implUid))->IsInThisCharacterSetL(
2138 plugInConvertibleTo,
2141 if ((!plugInConvertibleTo) || !isThisCharSet)
2148 ::IsBuiltInCharacterSet(aCharacterSetIdentifier,aConfidenceLevel,aSample);
2152 CleanupStack::PopAndDestroy(); //CloseECOMSession
2155 LOCAL_C TUint OutputCharacterCode(TUint aInputCharacterCode,
2156 const SCnvConversionData::SOneDirectionData::SRange& aRange)
2158 if ( (aInputCharacterCode<aRange.iFirstInputCharacterCodeInRange) || (aInputCharacterCode>aRange.iLastInputCharacterCodeInRange) )
2160 OstTrace0( TRACE_FATAL, _OUTPUTCHARACTERCODE, "Input Character Code Not In Range in ::OutputCharacterCode" );
2162 __ASSERT_DEBUG((aInputCharacterCode>=aRange.iFirstInputCharacterCodeInRange) && (aInputCharacterCode<=aRange.iLastInputCharacterCodeInRange), Panic(EPanicInputCharacterCodeNotInRange));
2163 switch (aRange.iAlgorithm)
2165 case SCnvConversionData::SOneDirectionData::SRange::EDirect:
2166 return aInputCharacterCode;
2167 case SCnvConversionData::SOneDirectionData::SRange::EOffset:
2168 #if defined(CONST_STATIC_UNIONS_ARE_POSSIBLE)
2169 if (aRange.iData.iOffset==0)
2171 OstTrace0( TRACE_DUMP, DUP1__OUTPUTCHARACTERCODE, "EPanicZeroOffset1" );
2173 __ASSERT_DEBUG(aRange.iData.iOffset!=0, Panic(EPanicZeroOffset1));
2174 return aInputCharacterCode+aRange.iData.iOffset;
2176 if (STATIC_CAST(TInt, aRange.iData.iWord1)==0)
2178 OstTrace0( TRACE_DUMP, DUP2__OUTPUTCHARACTERCODE, "EPanicZeroOffset2" );
2180 __ASSERT_DEBUG(STATIC_CAST(TInt, aRange.iData.iWord1)!=0, Panic(EPanicZeroOffset2));
2181 return aInputCharacterCode+STATIC_CAST(TInt, aRange.iData.iWord1);
2183 case SCnvConversionData::SOneDirectionData::SRange::EIndexedTable16:
2184 #if defined(CONST_STATIC_UNIONS_ARE_POSSIBLE)
2185 return aRange.iData.iIndexedTable16.iEntryArray
2187 return REINTERPRET_CAST(SCnvConversionData::SOneDirectionData::SRange::UData::SIndexedTable16::SEntry*, aRange.iData.iWord1)
2189 [aInputCharacterCode-aRange.iFirstInputCharacterCodeInRange].iOutputCharacterCode;
2190 case SCnvConversionData::SOneDirectionData::SRange::EKeyedTable1616:
2193 #if defined(CONST_STATIC_UNIONS_ARE_POSSIBLE)
2194 TInt rightIndex=aRange.iData.iKeyedTable1616.iNumberOfEntries;
2195 const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable1616::SEntry* const entryArray=aRange.iData.iKeyedTable1616.iEntryArray;
2197 TInt rightIndex=STATIC_CAST(TInt, aRange.iData.iWord1);
2198 const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable1616::SEntry* const entryArray=REINTERPRET_CAST(SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable1616::SEntry*, aRange.iData.iWord2);
2202 OstTrace0( TRACE_DUMP, DUP3__OUTPUTCHARACTERCODE, "EPanicEmptyKeyedTable1616" );
2204 __ASSERT_DEBUG(rightIndex>0, Panic(EPanicEmptyKeyedTable1616));
2207 if (leftIndex>rightIndex)
2209 OstTrace0( TRACE_DUMP, DUP4__OUTPUTCHARACTERCODE, "EPanicBadIndices1" );
2211 __ASSERT_DEBUG(leftIndex<=rightIndex, Panic(EPanicBadIndices1));
2212 if (leftIndex==rightIndex)
2214 return KNoConversionAvailable;
2216 const TInt middleIndex=(leftIndex+rightIndex)>>1;
2217 const TUint key=entryArray[middleIndex].iKey;
2218 if (aInputCharacterCode<key)
2220 rightIndex=middleIndex;
2222 else if (aInputCharacterCode>key)
2224 leftIndex=middleIndex+1;
2228 return entryArray[middleIndex].iOutputCharacterCode;
2232 case SCnvConversionData::SOneDirectionData::SRange::EKeyedTable16OfIndexedTables16:
2235 #if defined(CONST_STATIC_UNIONS_ARE_POSSIBLE)
2236 TInt rightIndex=aRange.iData.iKeyedTable16OfIndexedTables16.iNumberOfKeyedEntries;
2237 const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable16OfIndexedTables16::SKeyedEntry* const keyedEntryArray=aRange.iData.iKeyedTable16OfIndexedTables16.iKeyedEntryArray;
2239 TInt rightIndex=STATIC_CAST(TInt, aRange.iData.iWord1);
2240 const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable16OfIndexedTables16::SKeyedEntry* const keyedEntryArray=REINTERPRET_CAST(SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable16OfIndexedTables16::SKeyedEntry*, aRange.iData.iWord2);
2244 OstTrace0( TRACE_DUMP, DUP5__OUTPUTCHARACTERCODE, "EPanicEmptyKeyedTable16OfIndexedTables16" );
2246 __ASSERT_DEBUG(rightIndex>0, Panic(EPanicEmptyKeyedTable16OfIndexedTables16));
2249 if (leftIndex>rightIndex)
2251 OstTrace0( TRACE_DUMP, DUP6__OUTPUTCHARACTERCODE, "EPanicBadIndices2" );
2253 __ASSERT_DEBUG(leftIndex<=rightIndex, Panic(EPanicBadIndices2));
2254 if (leftIndex==rightIndex)
2256 return KNoConversionAvailable;
2258 const TInt middleIndex=(leftIndex+rightIndex)>>1;
2259 const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable16OfIndexedTables16::SKeyedEntry& keyedEntry=keyedEntryArray[middleIndex];
2260 if (aInputCharacterCode<keyedEntry.iFirstInputCharacterCodeInIndexedTable)
2262 rightIndex=middleIndex;
2264 else if (aInputCharacterCode>keyedEntry.iLastInputCharacterCodeInIndexedTable)
2266 leftIndex=middleIndex+1;
2270 return keyedEntry.iIndexedEntryArray[aInputCharacterCode-keyedEntry.iFirstInputCharacterCodeInIndexedTable];
2275 //new 32 bit algorithms start
2276 case SCnvConversionData::SOneDirectionData::SRange::EIndexedTable32:
2277 #if defined(CONST_STATIC_UNIONS_ARE_POSSIBLE)
2278 return aRange.iData.iIndexedTable32.iEntryArray
2280 return REINTERPRET_CAST(SCnvConversionData::SOneDirectionData::SRange::UData::SIndexedTable32::SEntry*, aRange.iData.iWord1)
2282 [aInputCharacterCode-aRange.iFirstInputCharacterCodeInRange].iOutputCharacterCode;
2283 case SCnvConversionData::SOneDirectionData::SRange::EKeyedTable3232:
2286 #if defined(CONST_STATIC_UNIONS_ARE_POSSIBLE)
2287 TInt rightIndex=aRange.iData.iKeyedTable3232.iNumberOfEntries;
2288 const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable3232::SEntry* const entryArray=aRange.iData.iKeyedTable3232.iEntryArray;
2290 TInt rightIndex=STATIC_CAST(TInt, aRange.iData.iWord1);
2291 const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable3232::SEntry* const entryArray=REINTERPRET_CAST(SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable3232::SEntry*, aRange.iData.iWord2);
2295 OstTrace0( TRACE_DUMP, DUP7__OUTPUTCHARACTERCODE, "EPanicEmptyKeyedTable3232" );
2297 __ASSERT_DEBUG(rightIndex>0, Panic(EPanicEmptyKeyedTable3232));
2300 if (leftIndex>rightIndex)
2302 OstTrace0( TRACE_DUMP, DUP8__OUTPUTCHARACTERCODE, "EPanicBadIndices1" );
2304 __ASSERT_DEBUG(leftIndex<=rightIndex, Panic(EPanicBadIndices1));
2305 if (leftIndex==rightIndex)
2307 return KNoConversionAvailable;
2309 const TInt middleIndex=(leftIndex+rightIndex)>>1;
2310 const TUint key=entryArray[middleIndex].iKey;
2311 if (aInputCharacterCode<key)
2313 rightIndex=middleIndex;
2315 else if (aInputCharacterCode>key)
2317 leftIndex=middleIndex+1;
2321 return entryArray[middleIndex].iOutputCharacterCode;
2325 case SCnvConversionData::SOneDirectionData::SRange::EKeyedTable32OfIndexedTables32:
2328 #if defined(CONST_STATIC_UNIONS_ARE_POSSIBLE)
2329 TInt rightIndex=aRange.iData.iKeyedTable32OfIndexedTables32.iNumberOfKeyedEntries;
2330 const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable32OfIndexedTables32::SKeyedEntry* const keyedEntryArray=aRange.iData.iKeyedTable32OfIndexedTables32.iKeyedEntryArray;
2332 TInt rightIndex=STATIC_CAST(TInt, aRange.iData.iWord1);
2333 const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable32OfIndexedTables32::SKeyedEntry* const keyedEntryArray=REINTERPRET_CAST(SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable32OfIndexedTables32::SKeyedEntry*, aRange.iData.iWord2);
2337 OstTrace0( TRACE_DUMP, DUP9__OUTPUTCHARACTERCODE, "EPanicEmptyKeyedTable32OfIndexedTables32" );
2339 __ASSERT_DEBUG(rightIndex>0, Panic(EPanicEmptyKeyedTable32OfIndexedTables32));
2342 if (leftIndex>rightIndex)
2344 OstTrace0( TRACE_DUMP, DUP10__OUTPUTCHARACTERCODE, "EPanicBadIndices2" );
2346 __ASSERT_DEBUG(leftIndex<=rightIndex, Panic(EPanicBadIndices2));
2347 if (leftIndex==rightIndex)
2349 return KNoConversionAvailable;
2351 const TInt middleIndex=(leftIndex+rightIndex)>>1;
2352 const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable32OfIndexedTables32::SKeyedEntry& keyedEntry=keyedEntryArray[middleIndex];
2353 if (aInputCharacterCode<keyedEntry.iFirstInputCharacterCodeInIndexedTable)
2355 rightIndex=middleIndex;
2357 else if (aInputCharacterCode>keyedEntry.iLastInputCharacterCodeInIndexedTable)
2359 leftIndex=middleIndex+1;
2363 return keyedEntry.iIndexedEntryArray[aInputCharacterCode-keyedEntry.iFirstInputCharacterCodeInIndexedTable];
2367 //new 32 bit algorithms end
2371 OstTrace0( TRACE_DUMP, DUP11__OUTPUTCHARACTERCODE, "EPanicBadAlgorithm1" );
2372 Panic(EPanicBadAlgorithm1);
2375 return 0; // dummy return to prevent compiler error
2379 ConvertsToForeignCharacterSet(
2380 TInt& aSizeOfOutputForeignCharacterCodeInBytes,
2381 TUint aInputUnicodeCharacterCode,
2382 const SCnvConversionData::SOneDirectionData::SRange* aFirstUnicodeToForeignRange,
2383 const SCnvConversionData::SOneDirectionData::SRange* aLastUnicodeToForeignRange)
2385 if (aFirstUnicodeToForeignRange==NULL)
2387 OstTrace0( TRACE_DUMP, _CONVERTSTOFOREIGNCHARACTERSET, "EPanicNullPointer1" );
2389 __ASSERT_DEBUG(aFirstUnicodeToForeignRange!=NULL, Panic(EPanicNullPointer1));
2390 if (aLastUnicodeToForeignRange==NULL)
2392 OstTrace0( TRACE_DUMP, DUP1__CONVERTSTOFOREIGNCHARACTERSET, "EPanicNullPointer2" );
2394 __ASSERT_DEBUG(aLastUnicodeToForeignRange!=NULL, Panic(EPanicNullPointer2));
2395 if (aFirstUnicodeToForeignRange>aLastUnicodeToForeignRange)
2397 OstTrace0( TRACE_DUMP, DUP2__CONVERTSTOFOREIGNCHARACTERSET, "EPanicCrossedPointers" );
2399 __ASSERT_DEBUG(aFirstUnicodeToForeignRange<=aLastUnicodeToForeignRange, Panic(EPanicCrossedPointers));
2400 for (const SCnvConversionData::SOneDirectionData::SRange* currentUnicodeToForeignRange=aFirstUnicodeToForeignRange; ; ++currentUnicodeToForeignRange)
2402 if ((aInputUnicodeCharacterCode>=currentUnicodeToForeignRange->iFirstInputCharacterCodeInRange) &&
2403 (aInputUnicodeCharacterCode<=currentUnicodeToForeignRange->iLastInputCharacterCodeInRange))
2405 if (OutputCharacterCode(aInputUnicodeCharacterCode, *currentUnicodeToForeignRange)!=KNoConversionAvailable)
2407 aSizeOfOutputForeignCharacterCodeInBytes=currentUnicodeToForeignRange->iSizeOfOutputCharacterCodeInBytesIfForeign;
2411 if (currentUnicodeToForeignRange>aLastUnicodeToForeignRange)
2413 OstTrace0( TRACE_DUMP, DUP3__CONVERTSTOFOREIGNCHARACTERSET, "EPanicPointerPastUpperLimit21" );
2415 __ASSERT_DEBUG(currentUnicodeToForeignRange<=aLastUnicodeToForeignRange, Panic(EPanicPointerPastUpperLimit21));
2416 if (currentUnicodeToForeignRange>=aLastUnicodeToForeignRange)
2424 /** Converts Unicode text into another character set. The Unicode text specified
2425 in aUnicode is converted using the conversion data object (aConversionData)
2426 provided by the plug-in for the foreign character set, and the converted text
2427 is returned in aForeign.
2431 This is a utility function that should only be called from a plug-in conversion
2432 library's implementation of ConvertFromUnicode(). Users of the Character
2433 Conversion API should use one of the overloads of ConvertFromUnicode() instead.
2435 @param aConversionData The conversion data object. Typically, you should specify
2436 conversionData, as declared in convgeneratedcpp.h. This is the
2437 SCnvConversionData object which is created in the cnvtool-generated .cpp file
2438 (although for some complex character sets you may want to pass other
2439 SCnvConversionData objects into this parameter).
2440 @param aDefaultEndiannessOfForeignCharacters The default endian-ness to use
2441 when writing the characters in the foreign character set. If an endian-ness
2442 for foreign characters is specified in aConversionData (i.e. not
2443 SCnvConversionData::EUnspecified), then that value is used and the value of
2444 aDefaultEndiannessOfForeignCharacters is ignored.
2445 @param aReplacementForUnconvertibleUnicodeCharacters The single character which
2446 is to be used to replace unconvertible characters.
2447 @param aForeign On return, contains the converted text in a non-Unicode
2449 @param aUnicode The source Unicode text to be converted.
2450 @param aIndicesOfUnconvertibleCharacters On return holds the indices of each
2451 Unicode character in the source text which could not be converted (because
2452 the target character set does not have an equivalent character).
2453 @return The number of unconverted characters left at the end of the input
2454 descriptor (e.g. because aForeign was not long enough to hold all the text),
2455 or a negative error value, as defined in TError. */
2456 EXPORT_C TInt CCnvCharacterSetConverter::DoConvertFromUnicode(
2457 const SCnvConversionData& aConversionData,
2458 TEndianness aDefaultEndiannessOfForeignCharacters,
2459 const TDesC8& aReplacementForUnconvertibleUnicodeCharacters,
2461 const TDesC16& aUnicode,
2462 TArrayOfAscendingIndices& aIndicesOfUnconvertibleCharacters)
2465 return DoConvertFromUnicode(aConversionData, aDefaultEndiannessOfForeignCharacters, aReplacementForUnconvertibleUnicodeCharacters, aForeign, aUnicode, aIndicesOfUnconvertibleCharacters, notUsed, 0);
2468 /** Converts Unicode text into another character set. The Unicode text specified
2469 in aUnicode is converted using the conversion data object (aConversionData)
2470 provided by the plug-in for the foreign character set, and the converted text
2471 is returned in aForeign.
2473 This overload differs from the previous one in that it allows the caller to
2474 specify flags which give more control over the conversion.
2478 This is a utility function that should only be called from a plug-in conversion
2479 library's implementation of ConvertFromUnicode(). Users of the Character
2480 Conversion API should use one of the overloads of ConvertFromUnicode() instead.
2482 @param aConversionData The conversion data object. Typically, you should specify
2483 conversionData, as declared in convgeneratedcpp.h. This is the
2484 SCnvConversionData object which is created in the cnvtool-generated .cpp file
2485 (although for some complex character sets you may want to pass other
2486 SCnvConversionData objects into this parameter).
2487 @param aDefaultEndiannessOfForeignCharacters The default endian-ness to use
2488 when writing the characters in the foreign character set. If an endian-ness
2489 for foreign characters is specified in aConversionData (i.e. not
2490 SCnvConversionData::EUnspecified), then that value is used and the value of
2491 aDefaultEndiannessOfForeignCharacters is ignored.
2492 @param aReplacementForUnconvertibleUnicodeCharacters The single character which
2493 is to be used to replace unconvertible characters. If aInputConversionFlags
2494 is set to EInputConversionFlagStopAtFirstUnconvertibleCharacter, this
2495 replacement character is used to replace the first unconvertible character,
2496 then the conversion will stop.
2497 @param aForeign On return, contains the converted text in a non-Unicode
2498 character set. This may already contain some text. If it does, and if
2499 aInputConversionFlags specifies EInputConversionFlagAppend, then the converted
2500 text is appended to this descriptor.
2501 @param aUnicode The source Unicode text to be converted.
2502 @param aIndicesOfUnconvertibleCharacters On return holds the indices of each
2503 Unicode character in the source descriptor aUnicode which could not be converted.
2504 The maximum size of this array is KMaximumNumberOfIndices whose value is 25 now.
2505 so only the first 25 unconvertible characters will be recorded.
2506 (because the target character set does not have an equivalent character).
2507 @param aOutputConversionFlags If the input descriptor ended in a truncated
2508 sequence, e.g. the first half of a Unicode surrogate pair,
2509 aOutputConversionFlags returns with the EOutputConversionFlagInputIsTruncated
2511 @param aInputConversionFlags Specify EInputConversionFlagAppend to append the
2512 text in aUnicode to aForeign. Specify
2513 EInputConversionFlagStopAtFirstUnconvertibleCharacter to stop converting when
2514 the first unconvertible character is reached. Specify
2515 EInputConversionFlagAllowTruncatedInputNotEvenPartlyConsumable to prevent
2516 the function from returning the error-code EErrorIllFormedInput when the input
2517 descriptor consists of nothing but a truncated sequence.
2518 @return The number of unconverted characters left at the end of the input
2519 descriptor (e.g. because aForeign was not long enough to hold all the text),
2520 or a negative error value, as defined in TError. */
2521 EXPORT_C TInt CCnvCharacterSetConverter::DoConvertFromUnicode(
2522 const SCnvConversionData& aConversionData,
2523 TEndianness aDefaultEndiannessOfForeignCharacters,
2524 const TDesC8& aReplacementForUnconvertibleUnicodeCharacters,
2526 const TDesC16& aUnicode,
2527 TArrayOfAscendingIndices& aIndicesOfUnconvertibleCharacters,
2528 TUint& aOutputConversionFlags,
2529 TUint aInputConversionFlags)
2531 aOutputConversionFlags=0;
2532 if (aUnicode.Length()==0)
2534 if (~aInputConversionFlags&EInputConversionFlagAppend)
2536 aForeign.SetLength(0);
2540 if (aForeign.MaxLength()==((aInputConversionFlags&EInputConversionFlagAppend)? aForeign.Length(): 0))
2542 return aUnicode.Length();
2544 TUint8* pointerToPreviousForeignByte=CONST_CAST(TUint8*, aForeign.Ptr()-1);
2545 const TUint8* const pointerToLastForeignByte=pointerToPreviousForeignByte+aForeign.MaxLength();
2546 if (aInputConversionFlags&EInputConversionFlagAppend)
2548 pointerToPreviousForeignByte+=aForeign.Length();
2550 const TUint16* pointerToCurrentUnicodeCharacter=aUnicode.Ptr();
2551 const TUint16* const pointerToLastUnicodeCharacter=pointerToCurrentUnicodeCharacter+(aUnicode.Length()-1);
2552 if (aConversionData.iUnicodeToForeignData.iNumberOfRanges<=0)
2554 OstTrace0( TRACE_DUMP, CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicBadNumberOfRanges1" );
2556 __ASSERT_DEBUG(aConversionData.iUnicodeToForeignData.iNumberOfRanges>0, Panic(EPanicBadNumberOfRanges1));
2557 const SCnvConversionData::SOneDirectionData::SRange* const firstRange=aConversionData.iUnicodeToForeignData.iRangeArray;
2558 const SCnvConversionData::SOneDirectionData::SRange* const lastRange=firstRange+(aConversionData.iUnicodeToForeignData.iNumberOfRanges-1);
2559 const TEndianness endiannessToWriteForeignCharactersIn=EndiannessOfForeignCharacters(aConversionData, aDefaultEndiannessOfForeignCharacters);
2560 const TEndianness endiannessOfReplacementForUnconvertibleUnicodeCharacters=EndiannessOfForeignCharacters(aConversionData, ELittleEndian); // this has a hard-coded default
2561 const CCnvCharacterSetConverter* const currentCharacterSetConverter=TTlsData::CurrentCharacterSetConverter();
2562 const TBool downgradingPermitted=(currentCharacterSetConverter!=NULL); // downgrading is only permitted if we're not doing VFAT short-name generation
2563 const TDowngradeForExoticLineTerminatingCharacters downgradeForExoticLineTerminatingCharacters=(currentCharacterSetConverter!=NULL)? currentCharacterSetConverter->iDowngradeForExoticLineTerminatingCharacters: EDowngradeExoticLineTerminatingCharactersToCarriageReturnLineFeed;
2564 TUint nextInputCharacterCode=KNoConversionAvailable;
2567 if (pointerToPreviousForeignByte>pointerToLastForeignByte)
2569 OstTrace0( TRACE_DUMP, DUP1_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicPointerPastUpperLimit6" );
2571 __ASSERT_DEBUG(pointerToPreviousForeignByte<=pointerToLastForeignByte, Panic(EPanicPointerPastUpperLimit6));
2572 if (pointerToCurrentUnicodeCharacter>pointerToLastUnicodeCharacter)
2574 OstTrace0( TRACE_DUMP, DUP2_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicPointerPastUpperLimit7" );
2576 __ASSERT_DEBUG(pointerToCurrentUnicodeCharacter<=pointerToLastUnicodeCharacter, Panic(EPanicPointerPastUpperLimit7));
2578 TUint inputCharacterCode;
2579 if (nextInputCharacterCode==KNoConversionAvailable)
2581 inputCharacterCode=*pointerToCurrentUnicodeCharacter;
2585 inputCharacterCode=nextInputCharacterCode;
2586 nextInputCharacterCode=KNoConversionAvailable;
2588 if ((inputCharacterCode>=0xd800) && (inputCharacterCode<0xdc00))
2590 if (pointerToCurrentUnicodeCharacter>pointerToLastUnicodeCharacter)
2592 OstTrace0( TRACE_DUMP, DUP3_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicPointerPastUpperLimit8" );
2594 __ASSERT_DEBUG(pointerToCurrentUnicodeCharacter<=pointerToLastUnicodeCharacter, Panic(EPanicPointerPastUpperLimit8));
2595 if (pointerToCurrentUnicodeCharacter>=pointerToLastUnicodeCharacter)
2597 aOutputConversionFlags|=EOutputConversionFlagInputIsTruncated;
2600 TUint secondHalfOfSurrogatePair=*(pointerToCurrentUnicodeCharacter+1);
2601 if ((secondHalfOfSurrogatePair<0xdc00) || (secondHalfOfSurrogatePair>=0xe000))
2603 return EErrorIllFormedInput;
2605 inputCharacterCode&=~0xd800;
2606 inputCharacterCode<<=10;
2607 secondHalfOfSurrogatePair&=~0xdc00;
2608 inputCharacterCode|=secondHalfOfSurrogatePair;
2609 inputCharacterCode+=0x00010000; // this must be added - it cannot be bitwise-"or"-ed
2610 if (!(inputCharacterCode&0xffff0000) || !(inputCharacterCode<0x00110000))
2612 OstTrace0( TRACE_DUMP, DUP4_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicBadNon16BitCharacterCode1" );
2614 __ASSERT_DEBUG((inputCharacterCode&0xffff0000) && (inputCharacterCode<0x00110000), Panic(EPanicBadNon16BitCharacterCode1));
2616 convertInputCharacterCode:
2617 const SCnvConversionData::SOneDirectionData::SRange* currentRange=firstRange;
2620 if ((inputCharacterCode>=currentRange->iFirstInputCharacterCodeInRange) &&
2621 (inputCharacterCode<=currentRange->iLastInputCharacterCodeInRange))
2623 TUint outputCharacterCode=OutputCharacterCode(inputCharacterCode, *currentRange);
2624 if (outputCharacterCode!=KNoConversionAvailable)
2626 TInt temp=currentRange->iSizeOfOutputCharacterCodeInBytesIfForeign; // the meaning of temp changes during it's lifetime (hence the bland variable name)
2627 if ( (temp<=0) || ((temp>STATIC_CAST(TInt, sizeof(TUint)))) || !((temp==sizeof(TUint)) || (outputCharacterCode<STATIC_CAST(TUint, 1<<(temp*8)))) )
2629 OstTrace0( TRACE_DUMP, DUP5_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicBadSizeOfForeignOutputCharacterCode" );
2631 __ASSERT_DEBUG((temp>0) && (temp<=STATIC_CAST(TInt, sizeof(TUint))) && ((temp==sizeof(TUint)) || (outputCharacterCode<STATIC_CAST(TUint, 1<<(temp*8)))), Panic(EPanicBadSizeOfForeignOutputCharacterCode)); // ?? this second half of this assert needs a corresponding "KErrCorrupt"-check when loading the file
2632 if (pointerToLastForeignByte-pointerToPreviousForeignByte<temp)
2638 switch (endiannessToWriteForeignCharactersIn)
2643 if (pointerToPreviousForeignByte>=pointerToLastForeignByte)
2645 OstTrace0( TRACE_DUMP, DUP6_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicPointerPastUpperLimit9" );
2647 __ASSERT_DEBUG(pointerToPreviousForeignByte<pointerToLastForeignByte, Panic(EPanicPointerPastUpperLimit9));
2648 ++pointerToPreviousForeignByte;
2649 *pointerToPreviousForeignByte=STATIC_CAST(TUint8, outputCharacterCode);
2652 OstTrace0( TRACE_DUMP, DUP7_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicBadNumberOfRemainingForeignBytes1" );
2654 __ASSERT_DEBUG(temp>=0, Panic(EPanicBadNumberOfRemainingForeignBytes1));
2660 outputCharacterCode>>=8;
2666 if (pointerToPreviousForeignByte>=pointerToLastForeignByte)
2668 OstTrace0( TRACE_DUMP, DUP8_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicPointerPastUpperLimit10" );
2670 __ASSERT_DEBUG(pointerToPreviousForeignByte<pointerToLastForeignByte, Panic(EPanicPointerPastUpperLimit10));
2671 ++pointerToPreviousForeignByte;
2672 *pointerToPreviousForeignByte=STATIC_CAST(TUint8, outputCharacterCode>>temp);
2675 OstTrace0( TRACE_DUMP, DUP9_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicBadNumberOfRemainingForeignBytes2" );
2677 __ASSERT_DEBUG(temp>=0, Panic(EPanicBadNumberOfRemainingForeignBytes2));
2687 OstTrace0( TRACE_DUMP, DUP10_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicBadEndianness1" );
2688 Panic(EPanicBadEndianness1);
2695 if (currentRange>lastRange)
2697 OstTrace0( TRACE_DUMP, DUP11_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicPointerPastUpperLimit11" );
2699 __ASSERT_DEBUG(currentRange<=lastRange, Panic(EPanicPointerPastUpperLimit11));
2700 if (currentRange>=lastRange)
2702 if (downgradingPermitted)
2704 if ((inputCharacterCode==0x2029) || (inputCharacterCode==0x2028))
2706 switch (downgradeForExoticLineTerminatingCharacters)
2708 case EDowngradeExoticLineTerminatingCharactersToCarriageReturnLineFeed:
2710 // check that there's enough room for the subsequent line-feed character, and check that both the carriage-return and the line-feed convert into the foreign character set
2711 TInt sizeOfForeignCarriageReturnInBytes;
2712 TInt sizeOfForeignLineFeedInBytes;
2713 if (ConvertsToForeignCharacterSet(sizeOfForeignCarriageReturnInBytes, 0x000d, firstRange, lastRange) &&
2714 ConvertsToForeignCharacterSet(sizeOfForeignLineFeedInBytes, 0x000a, firstRange, lastRange) &&
2715 (pointerToLastForeignByte-pointerToPreviousForeignByte>=sizeOfForeignCarriageReturnInBytes+sizeOfForeignLineFeedInBytes))
2717 inputCharacterCode=0x000d;
2718 nextInputCharacterCode=0x000a;
2719 goto convertInputCharacterCode;
2723 case EDowngradeExoticLineTerminatingCharactersToJustLineFeed:
2724 inputCharacterCode=0x000a;
2725 goto convertInputCharacterCode;
2728 OstTrace0( TRACE_DUMP, DUP12_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicBadDowngradeForExoticLineTerminatingCharacters2" );
2729 Panic(EPanicBadDowngradeForExoticLineTerminatingCharacters2);
2735 const TInt lengthOfReplacementForUnconvertibleUnicodeCharacters=aReplacementForUnconvertibleUnicodeCharacters.Length();
2736 if (lengthOfReplacementForUnconvertibleUnicodeCharacters>0)
2738 if (pointerToLastForeignByte-pointerToPreviousForeignByte<lengthOfReplacementForUnconvertibleUnicodeCharacters)
2742 const TUint8* pointerToReadFrom=aReplacementForUnconvertibleUnicodeCharacters.Ptr();
2743 const TUint8* lastByteToReadFrom=pointerToReadFrom+(lengthOfReplacementForUnconvertibleUnicodeCharacters-1);
2745 if (endiannessOfReplacementForUnconvertibleUnicodeCharacters!=endiannessToWriteForeignCharactersIn)
2747 const TUint8* temp=pointerToReadFrom;
2748 pointerToReadFrom=lastByteToReadFrom;
2749 lastByteToReadFrom=temp;
2754 if (pointerToPreviousForeignByte>=pointerToLastForeignByte)
2756 OstTrace0( TRACE_DUMP, DUP13_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicPointerPastUpperLimit12" );
2758 __ASSERT_DEBUG(pointerToPreviousForeignByte<pointerToLastForeignByte, Panic(EPanicPointerPastUpperLimit12));
2759 ++pointerToPreviousForeignByte;
2760 *pointerToPreviousForeignByte=*pointerToReadFrom;
2761 if (pointerToReadFrom==lastByteToReadFrom)
2765 pointerToReadFrom+=increment;
2768 if (aInputConversionFlags&EInputConversionFlagStopAtFirstUnconvertibleCharacter)
2772 aIndicesOfUnconvertibleCharacters.AppendIndex(pointerToCurrentUnicodeCharacter-aUnicode.Ptr());
2777 if (inputCharacterCode>=0x00010000)
2779 if (pointerToCurrentUnicodeCharacter>=pointerToLastUnicodeCharacter)
2781 OstTrace0( TRACE_DUMP, DUP14_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicPointerPastUpperLimit13" );
2783 __ASSERT_DEBUG(pointerToCurrentUnicodeCharacter<pointerToLastUnicodeCharacter, Panic(EPanicPointerPastUpperLimit13));
2784 if (nextInputCharacterCode==KNoConversionAvailable)
2786 ++pointerToCurrentUnicodeCharacter;
2789 if (pointerToCurrentUnicodeCharacter>pointerToLastUnicodeCharacter)
2791 OstTrace0( TRACE_DUMP, DUP15_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicPointerPastUpperLimit14" );
2793 __ASSERT_DEBUG(pointerToCurrentUnicodeCharacter<=pointerToLastUnicodeCharacter, Panic(EPanicPointerPastUpperLimit14));
2794 if (nextInputCharacterCode==KNoConversionAvailable)
2796 if (pointerToCurrentUnicodeCharacter>=pointerToLastUnicodeCharacter)
2798 ++pointerToCurrentUnicodeCharacter; // this increment is done regardless of the test just above, but it's not done before the test as it may make pointerToCurrentUnicodeCharacter greater than pointerToLastUnicodeCharacter, and if pointerToLastUnicodeCharacter just happens to be pointing at 0xffffffff, pointerToCurrentUnicodeCharacter will be pointing at 0x00000000, thus the test (which would now be "if (pointerToCurrentUnicodeCharacter>pointerToLastUnicodeCharacter)") would fail
2801 ++pointerToCurrentUnicodeCharacter;
2809 if (pointerToCurrentUnicodeCharacter<aUnicode.Ptr())
2811 OstTrace0( TRACE_DUMP, DUP16_CCNVCHARACTERSETCONVERTER_DOCONVERTFROMUNICODE, "EPanicPointerPastLowerLimit1" );
2813 __ASSERT_DEBUG(pointerToCurrentUnicodeCharacter>=aUnicode.Ptr(), Panic(EPanicPointerPastLowerLimit1));
2814 if ((pointerToCurrentUnicodeCharacter<=aUnicode.Ptr()) && (aOutputConversionFlags&EOutputConversionFlagInputIsTruncated) && (~aInputConversionFlags&EInputConversionFlagAllowTruncatedInputNotEvenPartlyConsumable))
2816 return EErrorIllFormedInput;
2818 aForeign.SetLength((pointerToPreviousForeignByte+1)-aForeign.Ptr());
2819 return pointerToLastUnicodeCharacter-(pointerToCurrentUnicodeCharacter-1);
2822 /** Converts non-Unicode text into Unicode. The non-Unicode text specified in
2823 aForeign is converted using the conversion data object (aConversionData)
2824 provided by the plug-in for the foreign character set, and the converted text
2825 is returned in aUnicode.
2829 This is a utility function that should only be called from a plug-in conversion
2830 library's implementation of ConvertToUnicode(). Ordinary users of the Character
2831 Conversion API should use one of the overloads of ConvertToUnicode() instead.
2833 The last two arguments return information about unconverted characters. Because
2834 Unicode is intended to cover all possible characters, these rarely report
2835 anything other than zero characters. However they report the existence of
2836 unconvertible characters if the input descriptor aForeign contains illegal
2837 characters, i.e. values not in the foreign character set.
2839 @param aConversionData The conversion data object. Typically, you should specify
2840 conversionData, as declared in convgeneratedcpp.h. This is the
2841 SCnvConversionData object which is created in the cnvtool-generated .cpp file
2842 (although for some complex character sets you may want to pass other
2843 SCnvConversionData objects into this parameter).
2844 @param aDefaultEndiannessOfForeignCharacters The default endian-ness of the
2845 foreign characters. If an endian-ness for foreign characters is specified
2846 in aConversionData, then that is used instead and the value of
2847 aDefaultEndiannessOfForeignCharacters is ignored.
2848 @param aUnicode On return, contains the text converted into Unicode.
2849 @param aForeign The non-Unicode source text to be converted.
2850 @param aNumberOfUnconvertibleCharacters On return, contains the number of
2851 characters in aForeign which were not converted. Characters which cannot be
2852 converted are output as Unicode replacement characters (0xFFFD).
2853 @param aIndexOfFirstByteOfFirstUnconvertibleCharacter On return, the index
2854 of the first byte of the first unconvertible character. For instance if the
2855 first character in the input descriptor (aForeign) could not be converted,
2856 then this parameter is set to the first byte of that character, i.e. zero.
2857 A negative value is returned if all the characters were converted.
2858 @return The number of unconverted bytes left at the end of the input descriptor,
2859 or a negative error value, as defined in TError. */
2860 EXPORT_C TInt CCnvCharacterSetConverter::DoConvertToUnicode(
2861 const SCnvConversionData& aConversionData,
2862 TEndianness aDefaultEndiannessOfForeignCharacters,
2864 const TDesC8& aForeign,
2865 TInt& aNumberOfUnconvertibleCharacters,
2866 TInt& aIndexOfFirstByteOfFirstUnconvertibleCharacter)
2869 return DoConvertToUnicode(aConversionData, aDefaultEndiannessOfForeignCharacters, aUnicode, aForeign, aNumberOfUnconvertibleCharacters, aIndexOfFirstByteOfFirstUnconvertibleCharacter, notUsed, 0);
2872 /** Converts non-Unicode text into Unicode. The non-Unicode text specified in
2873 aForeign is converted using the conversion data object (aConversionData)
2874 provided by the plug-in for the foreign character set, and the converted text
2875 is returned in aUnicode.
2877 This overload differs from the previous one in that it allows the caller to
2878 specify flags which give more control over the conversion.
2882 This is a utility function that should only be called from a plug-in conversion
2883 library's implementation of ConvertToUnicode(). Ordinary users of the Character
2884 Conversion API should use one of the overloads of ConvertToUnicode() instead.
2886 The aNumberOfUnconvertibleCharacters and
2887 aIndexOfFirstByteOfFirstUnconvertibleCharacter arguments return information
2888 about unconverted characters. Because Unicode is intended to cover all
2889 possible characters, these rarely report anything other than zero characters.
2890 However they report the existence of unconvertible characters if the input
2891 descriptor aForeign contains illegal characters, i.e. values not in the
2892 foreign character set.
2894 @param aConversionData The conversion data object. Typically, you should specify
2895 conversionData, as declared in convgeneratedcpp.h. This is the
2896 SCnvConversionData object which is created in the cnvtool-generated .cpp file
2897 (although for some complex character sets you may want to pass other
2898 SCnvConversionData objects into this parameter).
2899 @param aDefaultEndiannessOfForeignCharacters The default endian-ness of the
2900 foreign characters. If an endian-ness for foreign characters is specified
2901 in aConversionData, then that is used instead and the value of
2902 aDefaultEndiannessOfForeignCharacters is ignored.
2903 @param aUnicode On return, contains the text converted into Unicode.
2904 @param aForeign The non-Unicode source text to be converted.
2905 @param aNumberOfUnconvertibleCharacters On return, contains the number of
2906 characters in aForeign which were not converted. Characters which cannot be
2907 converted are output as Unicode replacement characters (0xFFFD).
2908 @param aIndexOfFirstByteOfFirstUnconvertibleCharacter On return, the index
2909 of the first byte of the first unconvertible character. For instance if the
2910 first character in the input descriptor (aForeign) could not be converted,
2911 then this parameter is set to the first byte of that character, i.e. zero.
2912 A negative value is returned if all the characters were converted.
2913 @param aOutputConversionFlags If the input descriptor ended in a truncated
2914 sequence, e.g. a multi-byte character that is not complete, aOutputConversionFlags
2915 returns with the EOutputConversionFlagInputIsTruncated flag set.
2916 @param aInputConversionFlags Specify EInputConversionFlagAppend to append the
2917 converted text to aUnicode, otherwise the contents of aUnicode are overwritten.
2918 Specify EInputConversionFlagStopAtFirstUnconvertibleCharacter to stop converting
2919 when the first unconvertible character is reached. Specify
2920 EInputConversionFlagAllowTruncatedInputNotEvenPartlyConsumable to prevent the
2921 function from returning the error-code EErrorIllFormedInput when the input
2922 descriptor consists of nothing but a truncated sequence.
2923 @return The number of unconverted bytes left at the end of the input descriptor,
2924 or a negative error value defined in TError. */
2925 EXPORT_C TInt CCnvCharacterSetConverter::DoConvertToUnicode(
2926 const SCnvConversionData& aConversionData,
2927 TEndianness aDefaultEndiannessOfForeignCharacters,
2929 const TDesC8& aForeign,
2930 TInt& aNumberOfUnconvertibleCharacters,
2931 TInt& aIndexOfFirstByteOfFirstUnconvertibleCharacter,
2932 TUint& aOutputConversionFlags,
2933 TUint aInputConversionFlags)
2935 aNumberOfUnconvertibleCharacters=0;
2936 aIndexOfFirstByteOfFirstUnconvertibleCharacter=-1;
2937 aOutputConversionFlags=0;
2938 if (aForeign.Length()==0)
2940 if (~aInputConversionFlags&EInputConversionFlagAppend)
2942 aUnicode.SetLength(0);
2946 if (aUnicode.MaxLength()==((aInputConversionFlags&EInputConversionFlagAppend)? aUnicode.Length(): 0))
2948 return aForeign.Length();
2950 TUint16* pointerToPreviousUnicodeCharacter=CONST_CAST(TUint16*, aUnicode.Ptr()-1);
2951 const TUint16* const pointerToLastUnicodeCharacter=pointerToPreviousUnicodeCharacter+aUnicode.MaxLength();
2952 if (aInputConversionFlags&EInputConversionFlagAppend)
2954 pointerToPreviousUnicodeCharacter+=aUnicode.Length();
2956 const TUint8* pointerToCurrentForeignByte=aForeign.Ptr();
2957 const TUint8* const pointerToLastForeignByte=pointerToCurrentForeignByte+(aForeign.Length()-1);
2958 if (aConversionData.iForeignVariableByteData.iNumberOfRanges<=0)
2960 OstTrace0( TRACE_DUMP, CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicBadNumberOfRanges2" );
2962 __ASSERT_DEBUG(aConversionData.iForeignVariableByteData.iNumberOfRanges>0, Panic(EPanicBadNumberOfRanges2));
2963 const SCnvConversionData::SVariableByteData::SRange* const foreignVariableByteData_firstRange=aConversionData.iForeignVariableByteData.iRangeArray;
2964 const SCnvConversionData::SVariableByteData::SRange* const foreignVariableByteData_lastRange=foreignVariableByteData_firstRange+(aConversionData.iForeignVariableByteData.iNumberOfRanges-1);
2965 if (aConversionData.iForeignToUnicodeData.iNumberOfRanges<=0)
2967 OstTrace0( TRACE_DUMP, DUP1_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicBadNumberOfRanges3" );
2969 __ASSERT_DEBUG(aConversionData.iForeignToUnicodeData.iNumberOfRanges>0, Panic(EPanicBadNumberOfRanges3));
2970 const SCnvConversionData::SOneDirectionData::SRange* const oneDirectionData_firstRange=aConversionData.iForeignToUnicodeData.iRangeArray;
2971 const SCnvConversionData::SOneDirectionData::SRange* const oneDirectionData_lastRange=oneDirectionData_firstRange+(aConversionData.iForeignToUnicodeData.iNumberOfRanges-1);
2974 if (pointerToPreviousUnicodeCharacter>pointerToLastUnicodeCharacter)
2976 OstTrace0( TRACE_DUMP, DUP2_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicPointerPastUpperLimit15" );
2978 __ASSERT_DEBUG(pointerToPreviousUnicodeCharacter<=pointerToLastUnicodeCharacter, Panic(EPanicPointerPastUpperLimit15));
2979 if (pointerToCurrentForeignByte>pointerToLastForeignByte)
2981 OstTrace0( TRACE_DUMP, DUP3_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicPointerPastUpperLimit16" );
2983 __ASSERT_DEBUG(pointerToCurrentForeignByte<=pointerToLastForeignByte, Panic(EPanicPointerPastUpperLimit16));
2985 TUint inputCharacterCode=*pointerToCurrentForeignByte;
2986 const SCnvConversionData::SVariableByteData::SRange* foreignVariableByteData_currentRange=foreignVariableByteData_firstRange;
2989 if (foreignVariableByteData_currentRange->iNumberOfSubsequentBytes>=sizeof(TUint))
2991 OstTrace0( TRACE_DUMP, DUP4_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicBadNumberOfSubsequentBytes" );
2993 __ASSERT_DEBUG(foreignVariableByteData_currentRange->iNumberOfSubsequentBytes<sizeof(TUint), Panic(EPanicBadNumberOfSubsequentBytes));
2994 if ((inputCharacterCode>=foreignVariableByteData_currentRange->iFirstInitialByteValueInRange) && (inputCharacterCode<=foreignVariableByteData_currentRange->iLastInitialByteValueInRange))
2996 const TInt numberOfSubsequentBytes=foreignVariableByteData_currentRange->iNumberOfSubsequentBytes;
2997 if (pointerToCurrentForeignByte>pointerToLastForeignByte)
2999 OstTrace0( TRACE_DUMP, DUP5_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicPointerPastUpperLimit17" );
3001 __ASSERT_DEBUG(pointerToCurrentForeignByte<=pointerToLastForeignByte, Panic(EPanicPointerPastUpperLimit17));
3002 if (pointerToLastForeignByte-pointerToCurrentForeignByte<numberOfSubsequentBytes)
3004 aOutputConversionFlags|=EOutputConversionFlagInputIsTruncated;
3007 switch (EndiannessOfForeignCharacters(aConversionData, aDefaultEndiannessOfForeignCharacters))
3011 for (TInt i=1; i<=numberOfSubsequentBytes; ++i)
3013 if (pointerToCurrentForeignByte>=pointerToLastForeignByte)
3015 OstTrace0( TRACE_DUMP, DUP6_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicPointerPastUpperLimit18" );
3017 __ASSERT_DEBUG(pointerToCurrentForeignByte<pointerToLastForeignByte, Panic(EPanicPointerPastUpperLimit18));
3018 ++pointerToCurrentForeignByte;
3019 TUint currentForeignByte=*pointerToCurrentForeignByte;
3020 currentForeignByte<<=(i*8);
3021 inputCharacterCode|=currentForeignByte;
3027 for (TInt i=numberOfSubsequentBytes; i>0; --i)
3029 if (pointerToCurrentForeignByte>=pointerToLastForeignByte)
3031 OstTrace0( TRACE_DUMP, DUP7_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicPointerPastUpperLimit19" );
3033 __ASSERT_DEBUG(pointerToCurrentForeignByte<pointerToLastForeignByte, Panic(EPanicPointerPastUpperLimit19));
3034 ++pointerToCurrentForeignByte;
3035 inputCharacterCode<<=8;
3036 inputCharacterCode|=*pointerToCurrentForeignByte;
3042 OstTrace0( TRACE_DUMP, DUP8_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicBadEndianness2" );
3043 Panic(EPanicBadEndianness2);
3047 pointerToCurrentForeignByte-=numberOfSubsequentBytes; // resets pointerToCurrentForeignByte to its value before the loop above
3050 if (foreignVariableByteData_currentRange>foreignVariableByteData_lastRange)
3052 OstTrace0( TRACE_DUMP, DUP9_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicPointerPastUpperLimit20" );
3054 __ASSERT_DEBUG(foreignVariableByteData_currentRange<=foreignVariableByteData_lastRange, Panic(EPanicPointerPastUpperLimit20));
3055 if (foreignVariableByteData_currentRange>=foreignVariableByteData_lastRange)
3057 return EErrorIllFormedInput;
3059 ++foreignVariableByteData_currentRange;
3061 const SCnvConversionData::SOneDirectionData::SRange* oneDirectionData_currentRange=oneDirectionData_firstRange;
3062 TUint outputCharacterCode=KNoConversionAvailable;
3065 if ((inputCharacterCode>=oneDirectionData_currentRange->iFirstInputCharacterCodeInRange) &&
3066 (inputCharacterCode<=oneDirectionData_currentRange->iLastInputCharacterCodeInRange))
3068 outputCharacterCode=OutputCharacterCode(inputCharacterCode, *oneDirectionData_currentRange);
3069 if (outputCharacterCode!=KNoConversionAvailable)
3074 if (oneDirectionData_currentRange>oneDirectionData_lastRange)
3076 OstTrace0( TRACE_DUMP, DUP10_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicPointerPastUpperLimit21" );
3078 __ASSERT_DEBUG(oneDirectionData_currentRange<=oneDirectionData_lastRange, Panic(EPanicPointerPastUpperLimit21));
3079 if (oneDirectionData_currentRange>=oneDirectionData_lastRange)
3083 ++oneDirectionData_currentRange;
3085 if (pointerToPreviousUnicodeCharacter>pointerToLastUnicodeCharacter)
3087 OstTrace0( TRACE_DUMP, DUP11_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicPointerPastUpperLimit22" );
3089 __ASSERT_DEBUG(pointerToPreviousUnicodeCharacter<=pointerToLastUnicodeCharacter, Panic(EPanicPointerPastUpperLimit22));
3090 if (pointerToPreviousUnicodeCharacter==pointerToLastUnicodeCharacter)
3094 if (outputCharacterCode==KNoConversionAvailable)
3096 outputCharacterCode=0xfffd; // Unicode's "REPLACEMENT CHARACTER"
3097 if (aNumberOfUnconvertibleCharacters<0)
3099 OstTrace0( TRACE_FATAL, DUP13_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicBadNumberOfUnconvertibleCharacters" );
3101 __ASSERT_ALWAYS(aNumberOfUnconvertibleCharacters>=0, Panic(EPanicBadNumberOfUnconvertibleCharacters));
3102 if (aNumberOfUnconvertibleCharacters<=0)
3104 aIndexOfFirstByteOfFirstUnconvertibleCharacter=pointerToCurrentForeignByte-aForeign.Ptr();
3106 ++aNumberOfUnconvertibleCharacters;
3107 if (aInputConversionFlags&EInputConversionFlagStopAtFirstUnconvertibleCharacter)
3112 if (outputCharacterCode<0x00010000)
3114 ++pointerToPreviousUnicodeCharacter;
3115 *pointerToPreviousUnicodeCharacter=STATIC_CAST(TUint16, outputCharacterCode);
3119 if (outputCharacterCode>=0x00110000)
3121 OstTrace0( TRACE_DUMP, DUP12_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicBadNon16BitCharacterCode2" );
3123 __ASSERT_DEBUG(outputCharacterCode<0x00110000, Panic(EPanicBadNon16BitCharacterCode2));
3124 if (pointerToPreviousUnicodeCharacter>pointerToLastUnicodeCharacter)
3126 OstTrace0( TRACE_DUMP, DUP14_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicPointerPastUpperLimit23" );
3128 __ASSERT_DEBUG(pointerToPreviousUnicodeCharacter<=pointerToLastUnicodeCharacter, Panic(EPanicPointerPastUpperLimit23));
3129 if (pointerToLastUnicodeCharacter-pointerToPreviousUnicodeCharacter<2)
3133 outputCharacterCode-=0x00010000;
3134 ++pointerToPreviousUnicodeCharacter;
3135 *pointerToPreviousUnicodeCharacter=STATIC_CAST(TUint16, (outputCharacterCode>>10)|0xd800);
3136 ++pointerToPreviousUnicodeCharacter;
3137 *pointerToPreviousUnicodeCharacter=STATIC_CAST(TUint16, (outputCharacterCode&0x000003ff)|0xdc00);
3139 if (pointerToLastForeignByte-pointerToCurrentForeignByte<foreignVariableByteData_currentRange->iNumberOfSubsequentBytes)
3141 OstTrace0( TRACE_DUMP, DUP15_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicPointerPastUpperLimit24" );
3143 __ASSERT_DEBUG(pointerToLastForeignByte-pointerToCurrentForeignByte>=foreignVariableByteData_currentRange->iNumberOfSubsequentBytes, Panic(EPanicPointerPastUpperLimit24));
3144 pointerToCurrentForeignByte+=foreignVariableByteData_currentRange->iNumberOfSubsequentBytes;
3145 if (pointerToCurrentForeignByte==pointerToLastForeignByte)
3147 ++pointerToCurrentForeignByte; // this increment is done regardless of the test just above, but it's not done before the test as it may make pointerToCurrentForeignByte greater than pointerToLastForeignByte, and if pointerToLastForeignByte just happens to be pointing at 0xffffffff, will pointerToCurrentForeignByte will be pointing at 0x00000000, thus the test (which would now be "if (pointerToCurrentForeignByte>pointerToLastForeignByte)") would fail
3150 ++pointerToCurrentForeignByte;
3157 if (pointerToCurrentForeignByte<aForeign.Ptr())
3159 OstTrace0( TRACE_DUMP, DUP16_CCNVCHARACTERSETCONVERTER_DOCONVERTTOUNICODE, "EPanicPointerPastLowerLimit2" );
3161 __ASSERT_DEBUG(pointerToCurrentForeignByte>=aForeign.Ptr(), Panic(EPanicPointerPastLowerLimit2));
3162 if ((pointerToCurrentForeignByte<=aForeign.Ptr()) && (aOutputConversionFlags&EOutputConversionFlagInputIsTruncated) && (~aInputConversionFlags&EInputConversionFlagAllowTruncatedInputNotEvenPartlyConsumable))
3164 return EErrorIllFormedInput;
3166 aUnicode.SetLength((pointerToPreviousUnicodeCharacter+1)-aUnicode.Ptr());
3167 return pointerToLastForeignByte-(pointerToCurrentForeignByte-1);
3171 /** Returns a ready-made SCnvConversionData object for converting between
3172 Unicode and ASCII. This can be passed into the aConversionData parameter to
3173 DoConvertFromUnicode() or DoConvertToUnicode().
3175 Note: This utility function should only be called by a plug-in conversion
3178 @return ASCII conversion data object. */
3179 EXPORT_C const SCnvConversionData& CCnvCharacterSetConverter::AsciiConversionData()
3181 return asciiConversionData;
3184 CCnvCharacterSetConverter::CCnvCharacterSetConverter()
3186 iCharacterSetIdentifierOfLoadedConversionData(0),
3187 iConversionData(NULL),
3188 iDefaultEndiannessOfForeignCharacters(ELittleEndian),
3189 iDowngradeForExoticLineTerminatingCharacters(EDowngradeExoticLineTerminatingCharactersToCarriageReturnLineFeed),
3190 iReplacementForUnconvertibleUnicodeCharacters(KNullDesC8),
3191 iStandardNamesAndMibEnums(NULL),
3192 iIsSystemStandardNamesAndMibEnumsScanned(EFalse)
3196 void CCnvCharacterSetConverter::ConstructL()
3198 iCharsetCnvCache = CCharsetCnvCache::NewL();
3199 TTlsData::CharacterSetConverterIsBeingCreatedL();
3200 iTlsDataConstructed = ETrue;
3203 // set aIdentifierOfOnlyCharacterSetOfInterest to 0 if all character sets are of interest
3204 //RFs& aFileServerSession function parameter is not used anymore.ECom plugin framework used.
3205 CArrayFix<CCnvCharacterSetConverter::SCharacterSet>*
3206 CCnvCharacterSetConverter::DoCreateArrayOfCharacterSetsAvailableLC(
3207 RFs& /*aFileServerSession*/,
3208 TUint aIdentifierOfOnlyCharacterSetOfInterest)
3210 CArrayFix<SCharacterSet>* arrayOfCharacterSetsAvailable=CDeepDestructingArrayOfCharactersSets::NewLC(12);
3211 if ((AppendHardCodedCharacterSetIfRequiredL(*arrayOfCharacterSetsAvailable, aIdentifierOfOnlyCharacterSetOfInterest, KCharacterSetIdentifierUtf7, KLitCharacterSetNameUtf7 )==EStopCharacterSetSearch) ||
3212 (AppendHardCodedCharacterSetIfRequiredL(*arrayOfCharacterSetsAvailable, aIdentifierOfOnlyCharacterSetOfInterest, KCharacterSetIdentifierUtf8, KLitCharacterSetNameUtf8 )==EStopCharacterSetSearch) ||
3213 (AppendHardCodedCharacterSetIfRequiredL(*arrayOfCharacterSetsAvailable, aIdentifierOfOnlyCharacterSetOfInterest, KCharacterSetIdentifierImapUtf7, KLitCharacterSetNameImapUtf7 )==EStopCharacterSetSearch) ||
3214 (AppendHardCodedCharacterSetIfRequiredL(*arrayOfCharacterSetsAvailable, aIdentifierOfOnlyCharacterSetOfInterest, KCharacterSetIdentifierJavaConformantUtf8, KLitCharacterSetNameJavaConformantUtf8 )==EStopCharacterSetSearch) ||
3215 (AppendHardCodedCharacterSetIfRequiredL(*arrayOfCharacterSetsAvailable, aIdentifierOfOnlyCharacterSetOfInterest, KCharacterSetIdentifierCodePage1252, KLitCharacterSetNameCodePage1252 )==EStopCharacterSetSearch) ||
3216 (AppendHardCodedCharacterSetIfRequiredL(*arrayOfCharacterSetsAvailable, aIdentifierOfOnlyCharacterSetOfInterest, KCharacterSetIdentifierWin1252, KLitCharacterSetNameCodePage1252 )==EStopCharacterSetSearch) ||
3217 (AppendHardCodedCharacterSetIfRequiredL(*arrayOfCharacterSetsAvailable, aIdentifierOfOnlyCharacterSetOfInterest, KCharacterSetIdentifierIso88591, KLitCharacterSetNameIso88591 )==EStopCharacterSetSearch) ||
3218 (AppendHardCodedCharacterSetIfRequiredL(*arrayOfCharacterSetsAvailable, aIdentifierOfOnlyCharacterSetOfInterest, KCharacterSetIdentifierAscii, KLitCharacterSetNameAscii )==EStopCharacterSetSearch) ||
3219 (AppendHardCodedCharacterSetIfRequiredL(*arrayOfCharacterSetsAvailable, aIdentifierOfOnlyCharacterSetOfInterest, KCharacterSetIdentifierUnicodeLittle, KLitCharacterSetNameUnicodeLittle )==EStopCharacterSetSearch) ||
3220 (AppendHardCodedCharacterSetIfRequiredL(*arrayOfCharacterSetsAvailable, aIdentifierOfOnlyCharacterSetOfInterest, KCharacterSetIdentifierUnicodeBig, KLitCharacterSetNameUnicodeBig )==EStopCharacterSetSearch) ||
3221 (AppendHardCodedCharacterSetIfRequiredL(*arrayOfCharacterSetsAvailable, aIdentifierOfOnlyCharacterSetOfInterest, KCharacterSetIdentifierSms7Bit, KLitCharacterSetNameSms7Bit )==EStopCharacterSetSearch))
3223 return arrayOfCharacterSetsAvailable;
3226 //Look for ECOM Character Set Convertors...
3227 RImplInfoPtrArray convertorsImplArray;
3228 REComSession::ListImplementationsL(KCharacterSetConvertorInterfaceUid, convertorsImplArray);
3229 CleanupStack::PushL(TCleanupItem(ResetAndDestroyRImplInfoPtrArray, &convertorsImplArray));
3230 TBool fileIsDll = ETrue;
3232 for(TInt i = 0; i < convertorsImplArray.Count(); i++)
3234 CImplementationInformation* implInfo = convertorsImplArray[i];
3235 const TUint characterSetIdentifier = (implInfo->ImplementationUid()).iUid;
3237 if(aIdentifierOfOnlyCharacterSetOfInterest == 0)
3238 // only if we're interested in all character sets do we need to make sure we've not already added this one to the array
3240 for(TInt j = arrayOfCharacterSetsAvailable->Count() - 1; j >= 0; --j)
3242 if((*arrayOfCharacterSetsAvailable)[j].Identifier() == characterSetIdentifier)
3244 goto afterAddingNewCharacterSet;
3251 for(TInt j = arrayOfCharacterSetsAvailable->Count() - 1; j >= 0; --j)
3253 if ((*arrayOfCharacterSetsAvailable)[j].Identifier() == characterSetIdentifier)
3255 OstTrace0( TRACE_DUMP, DUP1_CCNVCHARACTERSETCONVERTER_DOCREATEARRAYOFCHARACTERSETSAVAILABLELC, "EPanicCharacterSetAlreadyAdded" );
3257 __ASSERT_DEBUG((*arrayOfCharacterSetsAvailable)[j].Identifier() != characterSetIdentifier, Panic(EPanicCharacterSetAlreadyAdded));
3262 if((aIdentifierOfOnlyCharacterSetOfInterest == 0) || (aIdentifierOfOnlyCharacterSetOfInterest == characterSetIdentifier))
3264 SCharacterSet characterSet;
3265 characterSet.iIdentifier = characterSetIdentifier;
3266 characterSet.iFlags = SCharacterSet::EFlagNameIsFileName;
3270 characterSet.iFlags |= SCharacterSet::EFlagFileIsConversionPlugInLibrary;
3273 characterSet.iName = implInfo->DisplayName().AllocLC();
3275 arrayOfCharacterSetsAvailable->AppendL(characterSet);
3277 OstTraceDefExt1( OST_TRACE_CATEGORY_PRODUCTION | OST_TRACE_CATEGORY_RND, TRACE_INTERNALS,
3278 CCNVCHARACTERSETCONVERTER_DOCREATEARRAYOFCHARACTERSETSAVAILABLELC,
3279 "%S Appended to Character Set Array", *(characterSet.iName) );
3281 CleanupStack::Pop(characterSet.iName); //characterSet.iName
3284 if(aIdentifierOfOnlyCharacterSetOfInterest == characterSetIdentifier)
3286 CleanupStack::PopAndDestroy(&convertorsImplArray); //convertorsImplArray
3287 return arrayOfCharacterSetsAvailable;
3290 afterAddingNewCharacterSet:
3291 ; //dummy statement after label to prevent compiler warning
3293 }//end of for(TInt i = 0; i < convertorsImplArray.Count(); i++)
3295 CleanupStack::PopAndDestroy(&convertorsImplArray); //convertorsImplArray
3297 return arrayOfCharacterSetsAvailable;
3300 CCnvCharacterSetConverter::TCharacterSetSearch
3301 CCnvCharacterSetConverter::AppendHardCodedCharacterSetIfRequiredL(
3302 CArrayFix<SCharacterSet>& aArrayOfCharacterSets,
3303 TUint aIdentifierOfOnlyCharacterSetOfInterest,
3304 TUint aIdentifierOfHardCodedCharacterSet,
3305 const TDesC& aNameOfHardCodedCharacterSet)
3307 if ((aIdentifierOfOnlyCharacterSetOfInterest==0) || (aIdentifierOfOnlyCharacterSetOfInterest==aIdentifierOfHardCodedCharacterSet))
3309 SCharacterSet characterSet;
3310 characterSet.iIdentifier=aIdentifierOfHardCodedCharacterSet;
3311 characterSet.iFlags=0;
3312 characterSet.iName=aNameOfHardCodedCharacterSet.AllocLC();
3313 aArrayOfCharacterSets.AppendL(characterSet);
3314 CleanupStack::Pop(); // characterSet.iName
3315 if (aIdentifierOfOnlyCharacterSetOfInterest==aIdentifierOfHardCodedCharacterSet)
3317 return EStopCharacterSetSearch;
3320 return EContinueCharacterSetSearch;
3324 CCnvCharacterSetConverter::ScanForStandardNamesAndMibEnumsROMOnlyL(RFs& aFileServerSession)
3326 CStandardNamesAndMibEnums* standardNamesAndMibEnums=CStandardNamesAndMibEnums::NewLC();
3327 TFindFile* findFile=new(ELeave) TFindFile(aFileServerSession);
3328 CleanupStack::PushL(findFile);
3329 TParse* fileNameParser=new(ELeave) TParse;
3330 CleanupStack::PushL(fileNameParser);
3331 CDir* directory=NULL;
3332 TInt findResult=findFile->FindWildByDir(KLitWildCard, KLitROMSystemCharconvDirectory, directory);
3333 if (findResult==KErrNone)
3335 CleanupStack::PushL(directory);
3336 for (TInt i=directory->Count()-1; i>=0; --i)
3338 const TEntry& entry=(*directory)[i];
3339 if (entry.iType[0].iUid==0x1000589b)
3341 fileNameParser->SetNoWild(entry.iName, &findFile->File(), NULL);
3342 standardNamesAndMibEnums->AddFromFileL(aFileServerSession, fileNameParser->FullName());
3345 CleanupStack::PopAndDestroy(); // directory
3349 CleanupStack::PopAndDestroy(2); // fileNameParser and findFile
3350 delete iStandardNamesAndMibEnums;
3351 iStandardNamesAndMibEnums=standardNamesAndMibEnums;
3352 CleanupStack::Pop(); // standardNamesAndMibEnums
3356 void CCnvCharacterSetConverter::ScanForStandardNamesAndMibEnumsL(RFs& aFileServerSession)
3358 CStandardNamesAndMibEnums* standardNamesAndMibEnums=CStandardNamesAndMibEnums::NewLC();
3359 TFindFile* findFile=new(ELeave) TFindFile(aFileServerSession);
3360 CleanupStack::PushL(findFile);
3361 TParse* fileNameParser=new(ELeave) TParse;
3362 CleanupStack::PushL(fileNameParser);
3363 CDir* directory=NULL;
3364 for (TInt findResult=findFile->FindWildByDir(KLitWildCard, KLitSystemCharconvDirectory, directory); findResult!=KErrNotFound; findResult=findFile->FindWild(directory))
3366 CleanupStack::PushL(directory);
3367 User::LeaveIfError(findResult);
3368 for (TInt i=directory->Count()-1; i>=0; --i)
3370 const TEntry& entry=(*directory)[i];
3371 if (entry.iType[0].iUid==0x1000589b)
3373 fileNameParser->SetNoWild(entry.iName, &findFile->File(), NULL);
3374 standardNamesAndMibEnums->AddFromFileL(aFileServerSession, fileNameParser->FullName());
3377 CleanupStack::PopAndDestroy(); // directory
3381 CleanupStack::PopAndDestroy(2); // fileNameParser and findFile
3382 delete iStandardNamesAndMibEnums;
3383 iStandardNamesAndMibEnums=standardNamesAndMibEnums;
3384 CleanupStack::Pop(); // standardNamesAndMibEnums
3388 CCnvCharacterSetConverter::TAvailability
3389 CCnvCharacterSetConverter::DoPrepareToConvertToOrFromL(
3390 TUint aCharacterSetIdentifier,
3391 const CArrayFix<SCharacterSet>* aArrayOfCharacterSetsAvailable,
3392 RFs& aFileServerSession)
3394 OstTraceExt2( TRACE_DUMP, DUP3_CCNVCHARACTERSETCONVERTER_DOPREPARETOCONVERTTOORFROML, "Prepare to convert aCharacterSetIdentifier(0x%x) in aArrayOfCharacterSetsAvailable(0x%x)", aCharacterSetIdentifier, (unsigned int)aArrayOfCharacterSetsAvailable);
3396 //AutoDetectCharacterSetL relies on the fact that this function does not use
3397 //aFileServerSession if aArrayOfCharacterSetsAvailable is *not* NULL and
3398 //if aCharacterSetIdentifier is *not* a data file
3399 // aFileServerSession is no longer used load Plugin libraries. ECom framework used instead
3400 if (aCharacterSetIdentifier==0)
3402 OstTrace0( TRACE_FATAL, CCNVCHARACTERSETCONVERTER_DOPREPARETOCONVERTTOORFROML, "EPanicNullCharacterSetIdentifier3" );
3404 __ASSERT_ALWAYS(aCharacterSetIdentifier!=0, Panic(EPanicNullCharacterSetIdentifier3));
3405 if (iCharacterSetIdentifierOfLoadedConversionData!=aCharacterSetIdentifier)
3408 TUint newStoredFlags=0;
3409 const SCnvConversionData* newConversionData=NULL;
3410 TBuf8<KMaximumLengthOfReplacementForUnconvertibleUnicodeCharacters> replacementForUnconvertibleUnicodeCharacters(KNullDesC8);
3411 switch (aCharacterSetIdentifier)
3413 case KCharacterSetIdentifierUtf7:
3414 case KCharacterSetIdentifierUtf8:
3415 case KCharacterSetIdentifierImapUtf7:
3416 case KCharacterSetIdentifierJavaConformantUtf8:
3418 case KCharacterSetIdentifierCodePage1252:
3419 case KCharacterSetIdentifierWin1252:
3421 newConversionData=&codePage1252ConversionData;
3422 replacementForUnconvertibleUnicodeCharacters=KLit8AsciiSubstituteCharacter;
3425 case KCharacterSetIdentifierIso88591:
3427 newConversionData=&iso88591ConversionData;
3428 replacementForUnconvertibleUnicodeCharacters=KLit8AsciiSubstituteCharacter;
3431 case KCharacterSetIdentifierAscii:
3433 newConversionData=&asciiConversionData;
3434 replacementForUnconvertibleUnicodeCharacters=KLit8AsciiSubstituteCharacter;
3437 case KCharacterSetIdentifierSms7Bit:
3439 newConversionData=&sms7BitConversionData;
3440 replacementForUnconvertibleUnicodeCharacters=KLit8Sms7BitSubstituteCharacter;
3443 case KCharacterSetIdentifierUnicodeLittle:
3445 newConversionData=&unicodeConversionDataLittle;
3448 case KCharacterSetIdentifierUnicodeBig:
3450 newConversionData=&unicodeConversionDataBig;
3454 if (aArrayOfCharacterSetsAvailable==NULL)
3456 aArrayOfCharacterSetsAvailable=DoCreateArrayOfCharacterSetsAvailableLC(aFileServerSession, aCharacterSetIdentifier);
3460 CleanupStack::PushL(STATIC_CAST(TAny*, NULL)); // dummy item on the cleanup-stack so that we can simply CleanupStack::PopAndDestroy() on ending the loop below
3463 for (TInt i=aArrayOfCharacterSetsAvailable->Count()-1; ; --i)
3467 CleanupStack::PopAndDestroy(); // aArrayOfCharacterSetsAvailable or dummy NULL pointer
3468 return ENotAvailable;
3470 const SCharacterSet& characterSet=(*aArrayOfCharacterSetsAvailable)[i];
3471 if (characterSet.Identifier()==aCharacterSetIdentifier)
3473 if (!characterSet.NameIsFileName())
3475 OstTrace0( TRACE_DUMP, DUP1_CCNVCHARACTERSETCONVERTER_DOPREPARETOCONVERTTOORFROML, "EPanicNameIsNotFileName" );
3477 __ASSERT_DEBUG(characterSet.NameIsFileName(), Panic(EPanicNameIsNotFileName));
3478 if (characterSet.FileIsConversionPlugInLibrary())
3480 newStoredFlags|=EStoredFlagConversionPlugInLibraryIsLoaded;
3483 implUid.iUid = aCharacterSetIdentifier;
3484 replacementForUnconvertibleUnicodeCharacters = (iCharsetCnvCache->GetConverterL(implUid))->ReplacementForUnconvertibleUnicodeCharacters();
3488 //You are here?! This should never happen! Source code here was related to
3489 //old type character set converter data!
3490 OstTrace0( TRACE_FATAL, DUP2_CCNVCHARACTERSETCONVERTER_DOPREPARETOCONVERTTOORFROML, "EPanicCharacterSetNotPresent" );
3491 __ASSERT_ALWAYS(EFalse, Panic(EPanicCharacterSetNotPresent));
3496 CleanupStack::PopAndDestroy(); // aArrayOfCharacterSetsAvailable or dummy NULL pointer
3499 iStoredFlags&=~EStoredFlagConversionPlugInLibraryIsLoaded;
3500 iCharacterSetIdentifierOfLoadedConversionData=aCharacterSetIdentifier;
3501 iStoredFlags|=newStoredFlags;
3502 iConversionData=newConversionData;
3503 iDefaultEndiannessOfForeignCharacters=ELittleEndian;
3504 iDowngradeForExoticLineTerminatingCharacters=EDowngradeExoticLineTerminatingCharactersToCarriageReturnLineFeed;
3505 iReplacementForUnconvertibleUnicodeCharacters=replacementForUnconvertibleUnicodeCharacters;
3510 LOCAL_C void DeleteOneDirectionData(
3511 TInt aNumberOfRanges,
3512 const SCnvConversionData::SOneDirectionData::SRange* aRange)
3514 if ( !((aRange!=NULL) || (aNumberOfRanges==0)) )
3516 OstTrace0( TRACE_DUMP, _DELETEONEDIRECTIONDATA, "EPanicBadNumberOfRanges4" );
3518 __ASSERT_DEBUG((aRange!=NULL) || (aNumberOfRanges==0), Panic(EPanicBadNumberOfRanges4));
3521 if (aNumberOfRanges<=0)
3523 OstTrace0( TRACE_DUMP, DUP1__DELETEONEDIRECTIONDATA, "EPanicBadNumberOfRanges5" );
3525 __ASSERT_DEBUG(aNumberOfRanges>0, Panic(EPanicBadNumberOfRanges5));
3526 SCnvConversionData::SOneDirectionData::SRange* currentRange=CONST_CAST(SCnvConversionData::SOneDirectionData::SRange*, aRange);
3527 const SCnvConversionData::SOneDirectionData::SRange* const lastRange=currentRange+(aNumberOfRanges-1);
3530 switch (currentRange->iAlgorithm)
3532 case SCnvConversionData::SOneDirectionData::SRange::EDirect:
3533 case SCnvConversionData::SOneDirectionData::SRange::EOffset:
3535 case SCnvConversionData::SOneDirectionData::SRange::EIndexedTable16:
3536 #if defined(CONST_STATIC_UNIONS_ARE_POSSIBLE)
3537 delete [] CONST_CAST(SCnvConversionData::SOneDirectionData::SRange::UData::SIndexedTable16*, currentRange->iData.iIndexedTable16.iEntryArray);
3539 delete [] REINTERPRET_CAST(SCnvConversionData::SOneDirectionData::SRange::UData::SIndexedTable16*, currentRange->iData.iWord1);
3542 case SCnvConversionData::SOneDirectionData::SRange::EKeyedTable1616:
3543 #if defined(CONST_STATIC_UNIONS_ARE_POSSIBLE)
3544 delete [] CONST_CAST(SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable1616*, currentRange->iData.iKeyedTable1616.iEntryArray);
3546 delete [] REINTERPRET_CAST(SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable1616*, currentRange->iData.iWord2);
3549 case SCnvConversionData::SOneDirectionData::SRange::EKeyedTable16OfIndexedTables16:
3553 OstTrace0( TRACE_FATAL, DUP2__DELETEONEDIRECTIONDATA, "EPanicBadAlgorithm2" );
3554 Panic(EPanicBadAlgorithm2);
3558 if (currentRange>lastRange)
3560 OstTrace0( TRACE_DUMP, DUP3__DELETEONEDIRECTIONDATA, "EPanicPointerPastUpperLimit25" );
3562 __ASSERT_DEBUG(currentRange<=lastRange, Panic(EPanicPointerPastUpperLimit25));
3563 if (currentRange==lastRange)
3569 delete [] CONST_CAST(SCnvConversionData::SOneDirectionData::SRange*, aRange);
3573 void CCnvCharacterSetConverter::DeleteConversionData(const SCnvConversionData* aConversionData)
3575 if (aConversionData!=NULL)
3577 delete [] CONST_CAST(SCnvConversionData::SVariableByteData::SRange*, aConversionData->iForeignVariableByteData.iRangeArray);
3578 DeleteOneDirectionData(aConversionData->iForeignToUnicodeData.iNumberOfRanges, aConversionData->iForeignToUnicodeData.iRangeArray);
3579 DeleteOneDirectionData(aConversionData->iUnicodeToForeignData.iNumberOfRanges, aConversionData->iUnicodeToForeignData.iRangeArray);
3580 delete CONST_CAST(SCnvConversionData*, aConversionData);
3584 void CCnvCharacterSetConverter::DeleteConversionData(TAny* aConversionData)
3586 DeleteConversionData(STATIC_CAST(SCnvConversionData*, aConversionData));
3589 CCnvCharacterSetConverter::TEndianness
3590 CCnvCharacterSetConverter::EndiannessOfForeignCharacters(
3591 const SCnvConversionData& aConversionData,
3592 TEndianness aDefaultEndiannessOfForeignCharacters)
3594 switch (aConversionData.iEndiannessOfForeignCharacters)
3596 case SCnvConversionData::EUnspecified:
3597 return aDefaultEndiannessOfForeignCharacters;
3598 case SCnvConversionData::EFixedLittleEndian:
3599 return ELittleEndian;
3600 case SCnvConversionData::EFixedBigEndian:
3604 OstTrace0( TRACE_DUMP, CCNVCHARACTERSETCONVERTER_ENDIANNESSOFFOREIGNCHARACTERS, "EPanicBadEndianness3" );
3605 Panic(EPanicBadEndianness3);
3607 return ELittleEndian; // dummy return to prevent compiler error
3610 // CCnvCharacterSetConverter::TArrayOfAscendingIndices
3612 /** Appends an index to the array of indices.
3614 The value of aIndex should be greater than that of the
3615 last index in the array, to maintain an ascending array. The return
3616 value should be tested to see whether the function succeeded or not.
3618 @param aIndex The index to append to the array.
3619 @return EAppendFailed if the append failed, or
3620 EAppendSuccessful if it succeeded. */
3621 EXPORT_C CCnvCharacterSetConverter::TArrayOfAscendingIndices::TAppendResult
3622 CCnvCharacterSetConverter::TArrayOfAscendingIndices::AppendIndex(TInt aIndex)
3626 OstTrace1( TRACE_DUMP, DUP2_TARRAYOFASCENDINGINDICES_APPENDINDEX, "Bad index in TArrayOfAscendingIndices::AppendIndex;aIndex=%d", aIndex );
3628 __ASSERT_DEBUG(aIndex>=0, Panic(EPanicBadIndex));
3629 const TInt lengthOfArrayOfIndices=iArrayOfIndices.Length();
3630 if ((aIndex>STATIC_CAST(TInt, KMaxTUint16)) || (lengthOfArrayOfIndices==iArrayOfIndices.MaxLength()))
3632 return EAppendFailed;
3634 if ( (lengthOfArrayOfIndices!=0) && (iArrayOfIndices[lengthOfArrayOfIndices-1]>=aIndex))
3636 OstTrace1( TRACE_DUMP, DUP1_TARRAYOFASCENDINGINDICES_APPENDINDEX, "Duplicate Index Or Not Ascending in TArrayOfAscendingIndices::AppendIndex;aIndex=%d", aIndex );
3638 __ASSERT_DEBUG((lengthOfArrayOfIndices==0) || (iArrayOfIndices[lengthOfArrayOfIndices-1]<aIndex), Panic(EPanicDuplicateIndexOrNotAscending));
3639 iArrayOfIndices.Append(aIndex);
3640 return EAppendSuccessful;
3644 The method sets the max size of the internal character set converter cache.
3645 The cache is used mainly to improve the performance of AutoDetectCharSetL() calls.
3646 It caches loaded converter implementations. The next time when a specific implementation is needed,
3647 a search will be done in the cache if this implementation is already loaded and if it is there,
3648 the cached implementation will be used. SetMaxCacheSize() call
3649 is used to limit the max cache size, because the loaded implementatiions may consume a lot of the
3650 system resources (memory for example).
3651 By default (if SetMaxCacheSize() is never called) the max cache size is limited to 32 entries.
3652 Note: Setting very small cache size will impact the overall performance of CHARCONV functions.
3653 If the choosen cache size is less than the number of existing character set converter
3654 implementations, there will be no performance gain or it will be far beyond client's
3655 expectations. For best performance the choosen cache size should be bigger or equal to
3656 the number of the existing character set converter implementations.
3657 @param aSize The new max cache size. It must be bigger or equal to 4.
3658 @panic User::Invariant() if the new max cache size is less than 4.
3659 @see CCnvCharacterSetConverter::AutoDetectCharSetL
3661 EXPORT_C void CCnvCharacterSetConverter::SetMaxCacheSize(TInt aSize)
3663 if ( aSize < CCharsetCnvCache::KMinCacheSize )
3665 OstTrace1( TRACE_FATAL, CCNVCHARACTERSETCONVERTER_SETMAXCACHESIZE, "Parameter aSize < KMinCacheSize in CCnvCharacterSetConverter::SetMaxCacheSize;aSize=%d", aSize );
3667 __ASSERT_ALWAYS(aSize >= CCharsetCnvCache::KMinCacheSize, User::Invariant());
3668 iCharsetCnvCache->SetMaxSize(aSize);