Update contrib.
2 * Copyright (c) 2002 Nokia Corporation and/or its subsidiary(-ies).
4 * This component and the accompanying materials are made available
5 * under the terms of "Eclipse Public License v1.0"
6 * which accompanies this distribution, and is available
7 * at the URL "http://www.eclipse.org/legal/epl-v10.html".
9 * Initial Contributors:
10 * Nokia Corporation - initial contribution.
14 * Description: Implements the characterconversion plug-in
15 * for ISCII characterset.
25 #include <convgeneratedcpp.h>
26 #include <convutils.h>
28 //The maximum length of any intermediate buffer allocated for conversion.
29 const TInt KMaximumLengthOfIntermediateBuffer=5;
30 //The ISCII ATR code point, used for ISCII script switching mechanism.
31 const TUint KControlCharacterEscape=0xef;
32 //The number of Indic scripts supported by the plug-in.
33 //ISCII in general addresses all the Indic character sets.
34 const TUint KNumberOfIndicCharactersetsSupported = 1;
35 //The common reason for panic for all panics raised by the iscii plug-in
36 _LIT16(KPanicReason,"ISCII Plug-in Panic");
37 //The escape sequence for ISCII (ATR) is 0xEF and immidiate byte following
38 //that is the script selection code for Devanagari.
39 _LIT8(KEscapeSequenceDevanagari,"\xef\x42");
40 //The sequence for Explicit Halant, in unicode it gets converted to VIRAMA+ZWNJ
41 _LIT8(KExplicitHalant,"\xe8\xe8");
42 //For supportiing ISCII to Unicode conversion of multi byte ISCII sequences, the
43 //sequence is converted to intermediate unused iscii code point.
44 _LIT8(KReplacementForExplicitHalant,"\xe8\xfc");
45 //The sequence for Soft Halant, in unicode it gets converted to VIRAMA+ZWJ
46 _LIT8(KSoftHalant,"\xe8\xe9");
47 //For supportiing ISCII to Unicode conversion of multi byte ISCII sequences, the
48 //sequence is converted to intermediate unused iscii code point.
49 _LIT8(KReplacementForSoftHalant,"\xe8\xfd");
50 //Devanagari character Om
51 _LIT8(KOm,"\xa1\xe9");
52 ////For supportiing ISCII to Unicode conversion of multi byte ISCII sequences, the
53 //sequence is converted to intermediate unused iscii code point.
54 _LIT8(KReplacementForOm,"\xfe");
55 //Devanagari character Avagraha
56 _LIT8(KAvagraha,"\xea\xe9");
57 //For supportiing ISCII to Unicode conversion of multi byte ISCII sequences, the
58 //sequence is converted to intermediate unused iscii code point.
59 _LIT8(KReplacementForAvagraha,"\xff");
61 //Devanagari character VOCALIC RR
62 _LIT8(KVocalicRr,"\xaa\xe9");
63 //For supportiing ISCII to Unicode conversion of multi byte ISCII sequences, the
64 //sequence is converted to intermediate unused iscii code point.
65 _LIT8(KReplacementForVocalicRr,"\x80");
66 //Devanagari character VOCALIC LL
67 _LIT8(KVocalicLl,"\xa7\xe9");
68 //For supportiing ISCII to Unicode conversion of multi byte ISCII sequences, the
69 //sequence is converted to intermediate unused iscii code point.
70 _LIT8(KReplacementForVocalicLl,"\x81");
71 //Devanagari character VOCALIC L SIGN
72 _LIT8(KVocalicLSign,"\xdb\xe9");
73 //For supportiing ISCII to Unicode conversion of multi byte ISCII sequences, the
74 //sequence is converted to intermediate unused iscii code point.
75 _LIT8(KReplacementForVocalicLSign,"\x82");
76 //Devanagari character VOCALIC LL SIGN
77 _LIT8(KVocalicLlSign,"\xdc\xe9");
78 //For supportiing ISCII to Unicode conversion of multi byte ISCII sequences, the
79 //sequence is converted to intermediate unused iscii code point.
80 _LIT8(KReplacementForVocalicLlSign,"\x83");
81 //Devanagari character VOCALIC L
82 _LIT8(KVocalicL,"\xa6\xe9");
83 //For supportiing ISCII to Unicode conversion of multi byte ISCII sequences, the
84 //sequence is converted to intermediate unused iscii code point.
85 _LIT8(KReplacementForVocalicL,"\x84");
86 //Devanagari character VOCALIC RR SIGN
87 _LIT8(KVocalicRrSign,"\xdf\xe9");
88 //For supportiing ISCII to Unicode conversion of multi byte ISCII sequences, the
89 //sequence is converted to intermediate unused iscii code point.
90 _LIT8(KReplacementForVocalicRrSign,"\x85");
92 //Unconvertible ISCII character
93 _LIT8(KIsciiUnconvertibleCharacter,"\xeb");
97 //The panic raised by ConvertToUnicodeFromModalForeign_Internal() if the input
98 //conversion flag is CCnvCharacterSetConverter::EInputConversionFlagStopAtFirstUnconvertibleCharacter
99 EPanicBadInputConversionFlags=1,
100 //Panic raised if the buffer does not start with the escape sequence 0xEF
101 EPanicBadRemainderOfForeign,
102 //Panic is raised if the length of the search buffer is greater than the length of the
104 EPanicBadReplacementBuffer,
105 //If the offset of start of the escape sequence is not an unsigned number.
106 EPanicBadStartOfNextEscapeSequence
109 //The dummy datastructure for the dummy conversion data i.e. used for conversion if the
110 //script selection code is not supported.
111 #define ARRAY_LENGTH(aArray) (sizeof(aArray)/sizeof((aArray)[0]))
113 LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable1616::SEntry keyedTable1616_foreignToUnicode_1[]=
121 LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable1616::SEntry keyedTable1616_unicodeToForeign_1[]=
129 LOCAL_D const SCnvConversionData::SVariableByteData::SRange foreignVariableByteDataRanges[]=
139 LOCAL_D const SCnvConversionData::SOneDirectionData::SRange foreignToUnicodeDataRanges[]=
144 SCnvConversionData::SOneDirectionData::SRange::EDirect,
154 SCnvConversionData::SOneDirectionData::SRange::EKeyedTable1616,
158 UData_SKeyedTable1616(keyedTable1616_foreignToUnicode_1)
163 LOCAL_D const SCnvConversionData::SOneDirectionData::SRange unicodeToForeignDataRanges[]=
168 SCnvConversionData::SOneDirectionData::SRange::EDirect,
178 SCnvConversionData::SOneDirectionData::SRange::EKeyedTable1616,
182 UData_SKeyedTable1616(keyedTable1616_unicodeToForeign_1)
187 //The dummy conversion data to be used for conversion if the iscii code sequence is not
188 //Devanagari (i.e. the script selection code is not 0x42 and something else.
189 //In this case the ISCII characters are converted to unconvertible characters.
191 LOCAL_D const SCnvConversionData conversionDataDummy=
193 SCnvConversionData::EFixedBigEndian,
195 ARRAY_LENGTH(foreignVariableByteDataRanges),
196 foreignVariableByteDataRanges
199 ARRAY_LENGTH(foreignToUnicodeDataRanges),
200 foreignToUnicodeDataRanges
203 ARRAY_LENGTH(unicodeToForeignDataRanges),
204 unicodeToForeignDataRanges
214 ///////////////////////////////////////////////////////////////
218 #include <ecom/implementationproxy.h>
219 #include <charactersetconverter.h>
223 * The character conversion plug-in implementation for Iscii.
226 * @since Series 60 3.1
229 class CIsciiImplementation : public CCharacterSetConverterPluginInterface
232 //From CCharacterSetConverterPluginInterface
233 virtual const TDesC8& ReplacementForUnconvertibleUnicodeCharacters();
235 //From CCharacterSetConverterPluginInterface
236 virtual TInt ConvertFromUnicode(
237 CCnvCharacterSetConverter::TEndianness aDefaultEndiannessOfForeignCharacters,
238 const TDesC8& aReplacementForUnconvertibleUnicodeCharacters,
240 const TDesC16& aUnicode,
241 CCnvCharacterSetConverter::TArrayOfAscendingIndices& aIndicesOfUnconvertibleCharacters );
243 //From CCharacterSetConverterPluginInterface
244 virtual TInt ConvertToUnicode(
245 CCnvCharacterSetConverter::TEndianness aDefaultEndiannessOfForeignCharacters,
247 const TDesC8& aForeign,
249 TInt& aNumberOfUnconvertibleCharacters,
250 TInt& aIndexOfFirstByteOfFirstUnconvertibleCharacter );
252 //From CCharacterSetConverterPluginInterface
253 virtual TBool IsInThisCharacterSetL(
255 TInt& aConfidenceLevel,
258 static CIsciiImplementation* NewL();
260 virtual ~CIsciiImplementation();
262 CIsciiImplementation();
265 //Checks if a descriptor starts with another descriptor at the begining.
266 LOCAL_C TBool IsStartOf(const TDesC8& aEscapeSequence, const TDesC8& aBuffer)
268 const TInt lengthOfStart=aEscapeSequence.Length();
269 return (aBuffer.Length()>=lengthOfStart) && (aBuffer.Left(lengthOfStart)==aEscapeSequence);
271 // -----------------------------------------------------------------------------
272 // MatchesEscapeSequence()
273 //If the remainder of the foreign text starts with the passed escapesequence, modifies the remainder of the foreign text
274 //and sets the homogeneous run buffer that uses the same conversion data.
275 //The homogeneous run buffer is the buffer that will use a single conversion data, it doesn't contain the attribute code
276 // neither it contains the script switching code.
277 //The aRemainderOfForeign buffer
279 // Returns: ETrue: If the sequence contains the escape sequence
280 // EFalse: If the sequence does not contain the escape sequence
282 // -----------------------------------------------------------------------------
284 LOCAL_C TBool MatchesEscapeSequence(TInt& aNumberOfForeignBytesConsumed, TPtrC8& aHomogeneousRun,
285 TPtrC8& aRemainderOfForeign, const TDesC8& aEscapeSequence)
287 const TInt lengthOfEscapeSequence=aEscapeSequence.Length();
288 if (IsStartOf(aEscapeSequence, aRemainderOfForeign))
290 aRemainderOfForeign.Set(aRemainderOfForeign.Mid(lengthOfEscapeSequence));
291 const TInt startOfNextEscapeSequence=aRemainderOfForeign.Locate(KControlCharacterEscape);
292 if (startOfNextEscapeSequence==KErrNotFound)
294 aHomogeneousRun.Set(aRemainderOfForeign);
295 aRemainderOfForeign.Set(NULL, 0);
299 aHomogeneousRun.Set(aRemainderOfForeign.Left(startOfNextEscapeSequence));
300 aRemainderOfForeign.Set(aRemainderOfForeign.Mid(startOfNextEscapeSequence));
302 aNumberOfForeignBytesConsumed+=lengthOfEscapeSequence;
308 // -----------------------------------------------------------------------------
309 // NextHomogeneousForeignRun()
310 //Matches the escape sequence of each of the elements of the SState array with the remainder of
311 //foreign text and if the escape sequence matches with the start of remainder of the foreign text,
312 //then the conversion data is set to the conversion data corresponding to the escape sequence
313 //Also the homogeneous foreign text for conversion with the same escape sequence is set.
315 // Returns: ETrue: If length of the remainder of foreign buffer is nonzero.
316 // EFalse: If length of the remainder of foreign buffer is zero.
318 // -----------------------------------------------------------------------------
322 LOCAL_C TBool NextHomogeneousForeignRun(const SCnvConversionData*& aConversionData, TInt& aNumberOfForeignBytesConsumed, TPtrC8& aHomogeneousRun, TPtrC8& aRemainderOfForeign, const TArray<CnvUtilities::SState>& aArrayOfStates, TUint& aOutputConversionFlags)
324 TBool returnValue = EFalse;
325 TBool foundState = EFalse;
326 __ASSERT_DEBUG((aRemainderOfForeign.Length()==0) || (aRemainderOfForeign[0]==KControlCharacterEscape), User::Panic(KPanicReason,EPanicBadRemainderOfForeign));
327 if (aRemainderOfForeign.Length()==0)
331 const TInt numberOfStates=aArrayOfStates.Count();
333 for (i=0; i<numberOfStates; ++i)
335 const CnvUtilities::SState& state=aArrayOfStates[i];
336 if (MatchesEscapeSequence(aNumberOfForeignBytesConsumed, aHomogeneousRun, aRemainderOfForeign, *state.iEscapeSequence))
338 aConversionData=state.iConversionData;
344 for (i=0; i<numberOfStates; ++i)
346 if (IsStartOf(aRemainderOfForeign, *aArrayOfStates[i].iEscapeSequence))
348 // aRemainderOfForeign ends with a truncated escape sequence, so ConvertToUnicode cannot convert any more
349 aOutputConversionFlags|=CCnvCharacterSetConverter::EOutputConversionFlagInputIsTruncated;
354 MatchesEscapeSequence(aNumberOfForeignBytesConsumed,aHomogeneousRun,aRemainderOfForeign,aRemainderOfForeign.Left(2));
355 aConversionData = &conversionDataDummy;
358 if (aHomogeneousRun.Length()>0)
364 // -----------------------------------------------------------------------------
365 // ConvertFromUnicodeIntermediateBufferInPlace()
366 //Default implementation for conversion to the intermediate buffer
367 //It modifies the unicode buffer before it is converted back to iscii.
368 //The current implementation of iscii plug-in doesn't require any
369 //modification to the default implementation
372 // -----------------------------------------------------------------------------
376 LOCAL_C void ConvertFromUnicodeIntermediateBufferInPlace(TInt aStartPositionInDescriptor, TDes8& aDescriptor, TInt& aNumberOfCharactersThatDroppedOut)
378 CnvUtilities::ConvertFromIntermediateBufferInPlace(aStartPositionInDescriptor, aDescriptor, aNumberOfCharactersThatDroppedOut, KEscapeSequenceDevanagari, 1);
381 // -----------------------------------------------------------------------------
382 // DoFindAndModifyBuffer()
383 //Modifies the iscii buffer by replacing the search buffer with the replacement buffer.
384 //Introduced for handling multibyte iscii sequence.
385 //Takes the search buffer array and the replacement buffer arrays as input to it and replaces all
386 //the occurances of the search buffer with the corresponding replace buffer.
389 // -----------------------------------------------------------------------------
392 LOCAL_C void DoFindAndModifyBuffer(TDes8& aModifyBuffer,const TDesC8& aSearchBuffer,const TDesC8& aReplaceBuffer)
397 __ASSERT_ALWAYS((aSearchBuffer.Length()>= aReplaceBuffer.Length()),User::Panic(KPanicReason,EPanicBadReplacementBuffer));
398 if((offset = aModifyBuffer.Find(aSearchBuffer)) != KErrNotFound)
400 TUint8 *pointerToBuffer = const_cast<TUint8*> (aModifyBuffer.Ptr());
401 Mem::Copy(pointerToBuffer+offset,aReplaceBuffer.Ptr(),aReplaceBuffer.Length());
402 Mem::Copy(pointerToBuffer+offset+aReplaceBuffer.Length(),pointerToBuffer+offset+aSearchBuffer.Length(),aModifyBuffer.Length()-aSearchBuffer.Length()-offset);
403 aModifyBuffer.SetLength(aModifyBuffer.Length() - aSearchBuffer.Length() + aReplaceBuffer.Length());
411 // -----------------------------------------------------------------------------
412 // FindAndModifyBuffer()
413 //Modifies the iscii buffer by replacing the search buffer with the replacement buffer.
414 //Calls DoFindAndModifyBuffer() and supplies the search buffer and replacement buffer.
415 //Introduced for handling multibyte iscii sequence.
418 // -----------------------------------------------------------------------------
421 LOCAL_C void FindAndModifyBuffer(TDes8& aModifyBuffer)
424 RArray<TPtrC8> searchBuffer;
425 RArray<TPtrC8> replaceBuffer;
427 //If the passed buffer contains the replacement buffer,
428 //Then it should not get converted to respective Unicode
429 //buffer rather it should get converted to replacement for
430 //unconvertible character.
432 ret |= searchBuffer.Append(KReplacementForExplicitHalant().Right(1));
433 ret |= searchBuffer.Append(KReplacementForSoftHalant().Right(1));
434 ret |= searchBuffer.Append(KReplacementForOm().Right(1));
435 ret |= searchBuffer.Append(KReplacementForAvagraha().Right(1));
437 ret |= searchBuffer.Append(KReplacementForVocalicRr().Right(1));
438 ret |= searchBuffer.Append(KReplacementForVocalicLl().Right(1));
439 ret |= searchBuffer.Append(KReplacementForVocalicLSign().Right(1));
440 ret |= searchBuffer.Append(KReplacementForVocalicLlSign().Right(1));
441 ret |= searchBuffer.Append(KReplacementForVocalicL().Right(1));
442 ret |= searchBuffer.Append(KReplacementForVocalicRrSign().Right(1));
444 //All normal search buffers
445 ret |= searchBuffer.Append(KExplicitHalant().Mid(0));
446 ret |= searchBuffer.Append(KSoftHalant().Mid(0));
447 ret |= searchBuffer.Append(KOm().Mid(0));
448 ret |= searchBuffer.Append(KAvagraha().Mid(0));
450 ret |= searchBuffer.Append(KVocalicRr().Mid(0));
451 ret |= searchBuffer.Append(KVocalicLl().Mid(0));
452 ret |= searchBuffer.Append(KVocalicLSign().Mid(0));
453 ret |= searchBuffer.Append(KVocalicLlSign().Mid(0));
454 ret |= searchBuffer.Append(KVocalicL().Mid(0));
455 ret |= searchBuffer.Append(KVocalicRrSign().Mid(0));
457 //The replacement buffer for the odd cases to restrict the
458 //replacement buffers not to get converted to the corresponding
461 ret |= replaceBuffer.Append(KIsciiUnconvertibleCharacter().Mid(0));
462 ret |= replaceBuffer.Append(KIsciiUnconvertibleCharacter().Mid(0));
463 ret |= replaceBuffer.Append(KIsciiUnconvertibleCharacter().Mid(0));
464 ret |= replaceBuffer.Append(KIsciiUnconvertibleCharacter().Mid(0));
466 ret |= replaceBuffer.Append(KIsciiUnconvertibleCharacter().Mid(0));
467 ret |= replaceBuffer.Append(KIsciiUnconvertibleCharacter().Mid(0));
468 ret |= replaceBuffer.Append(KIsciiUnconvertibleCharacter().Mid(0));
469 ret |= replaceBuffer.Append(KIsciiUnconvertibleCharacter().Mid(0));
470 ret |= replaceBuffer.Append(KIsciiUnconvertibleCharacter().Mid(0));
471 ret |= replaceBuffer.Append(KIsciiUnconvertibleCharacter().Mid(0));
473 //All normal replace buffers
474 ret |= replaceBuffer.Append(KReplacementForExplicitHalant().Mid(0));
475 ret |= replaceBuffer.Append(KReplacementForSoftHalant().Mid(0));
476 ret |= replaceBuffer.Append(KReplacementForOm().Mid(0));
477 ret |= replaceBuffer.Append(KReplacementForAvagraha().Mid(0));
480 ret |= replaceBuffer.Append(KReplacementForVocalicRr().Mid(0));
481 ret |= replaceBuffer.Append(KReplacementForVocalicLl().Mid(0));
482 ret |= replaceBuffer.Append(KReplacementForVocalicLSign().Mid(0));
483 ret |= replaceBuffer.Append(KReplacementForVocalicLlSign().Mid(0));
484 ret |= replaceBuffer.Append(KReplacementForVocalicL().Mid(0));
485 ret |= replaceBuffer.Append(KReplacementForVocalicRrSign().Mid(0));
487 __ASSERT_DEBUG(!ret, User::Panic(_L("RArray append failure"), ret));
489 for(TInt counter=0;counter<searchBuffer.Count();counter++)
491 DoFindAndModifyBuffer(aModifyBuffer,searchBuffer[counter],replaceBuffer[counter]);
493 searchBuffer.Reset();
494 replaceBuffer.Reset();
498 // -----------------------------------------------------------------------------
499 // DoNormalizeReturnValue()
500 //Modifies the return value(Number of bytes did not get converted) according to the modified
501 //intermediate buffer. Takes the modified intermediate buffer, return value, search and replace
502 //buffers. Searches for the replace buffer in the intermediate buffer and if found, it looks for
503 //the actual buffer corresponding to the replace buffer and adds the difference of the lengths
504 //of the actual to replace buffer to the return value.
507 // -----------------------------------------------------------------------------
510 LOCAL_C void DoNormalizeReturnValue(TUint& aReturnValue,const TDesC8& aBuffer,RArray<TPtrC8>& anArrayOfSearches,RArray<TPtrC8>& anArrayOfReplaces)
512 TPtr8 buffer(const_cast<TUint8*>(aBuffer.Ptr()),aBuffer.Length(),aBuffer.Length());
513 TUint count = anArrayOfSearches.Count();
517 for(TUint i=0;i<count;i++)
519 TPtrC8 searchBufferForComparison(buffer.Right(anArrayOfReplaces[i].Length()));
520 TInt returnCompare = searchBufferForComparison.Compare(anArrayOfReplaces[i]);
521 if(returnCompare == 0)
524 aReturnValue += (anArrayOfSearches[i].Length() - anArrayOfReplaces[i].Length());
525 buffer=buffer.MidTPtr(0,buffer.Length()-anArrayOfReplaces[i].Length());
530 if(buffer.Length() == 0)
537 buffer=buffer.MidTPtr(0,buffer.Length()-1);
543 // -----------------------------------------------------------------------------
544 // NormalizeReturnValue()
545 //Modifies the return value(Number of bytes did not get converted) according to the
546 //replacements done to the iscii buffer before conversion.
547 //Internally calls DoNormalizeReturnValue() by suppling the search and replacement
552 // -----------------------------------------------------------------------------
555 LOCAL_C void NormalizeReturnValue(TUint& aReturnValue,const TDesC8& aBuffer)
558 RArray<TPtrC8> searchBuffer;
559 RArray<TPtrC8> replaceBuffer;
561 ret |= searchBuffer.Append(KExplicitHalant().Mid(0));
562 ret |= searchBuffer.Append(KSoftHalant().Mid(0));
563 ret |= searchBuffer.Append(KOm().Mid(0));
564 ret |= searchBuffer.Append(KAvagraha().Mid(0));
566 ret |= searchBuffer.Append(KVocalicRr().Mid(0));
567 ret |= searchBuffer.Append(KVocalicLl().Mid(0));
568 ret |= searchBuffer.Append(KVocalicLSign().Mid(0));
569 ret |= searchBuffer.Append(KVocalicLlSign().Mid(0));
570 ret |= searchBuffer.Append(KVocalicL().Mid(0));
571 ret |= searchBuffer.Append(KVocalicRrSign().Mid(0));
573 ret |= replaceBuffer.Append(KReplacementForExplicitHalant().Mid(0));
574 ret |= replaceBuffer.Append(KReplacementForSoftHalant().Mid(0));
575 ret |= replaceBuffer.Append(KReplacementForOm().Mid(0));
576 ret |= replaceBuffer.Append(KReplacementForAvagraha().Mid(0));
578 ret |= replaceBuffer.Append(KReplacementForVocalicRr().Mid(0));
579 ret |= replaceBuffer.Append(KReplacementForVocalicLl().Mid(0));
580 ret |= replaceBuffer.Append(KReplacementForVocalicLSign().Mid(0));
581 ret |= replaceBuffer.Append(KReplacementForVocalicLlSign().Mid(0));
582 ret |= replaceBuffer.Append(KReplacementForVocalicL().Mid(0));
583 ret |= replaceBuffer.Append(KReplacementForVocalicRrSign().Mid(0));
585 __ASSERT_DEBUG(!ret, User::Panic(_L("RArray append failure"), ret));
587 DoNormalizeReturnValue(aReturnValue,aBuffer,searchBuffer,replaceBuffer);
588 searchBuffer.Reset();
589 replaceBuffer.Reset();
592 // -----------------------------------------------------------------------------
593 // HandleHomogeneousRun()
594 //Handles a homogeneous foreign buffer and converts the foreign buffer to unicode
595 //On return the aUnicode argument contains the converted unicode data.
596 //Also it sets the return value, returned from the conversion. The return value also
597 //takes into account if there is any buffer modification done before passing it to
598 //CCnvCharacterSetConverter::DoConvertToUnicode()
603 // -----------------------------------------------------------------------------
606 LOCAL_C void HandleHomogeneousRun(const SCnvConversionData*& aConversionData,
607 CCnvCharacterSetConverter::TEndianness aDefaultEndiannessOfForeignCharacters,
609 const TDesC8& aHomogeneousForeign,
610 TInt& aNumberOfUnconvertibleCharacters,
611 TInt& aIndexOfFirstByteOfFirstUnconvertibleCharacter,
612 TUint& aOutputConversionFlags,
613 TUint aInputConversionFlags,TInt& aNumberOfForeignBytesConsumed,
616 TInt numberOfUnconvertibleCharacters;
617 TInt indexOfFirstByteOfFirstUnconvertibleCharacter;
618 TUint noOfConsumedBytes = 0;
619 if(aConversionData == NULL)
621 aReturnValue = CCnvCharacterSetConverter::EErrorIllFormedInput;
624 aReturnValue = CCnvCharacterSetConverter::DoConvertToUnicode(*aConversionData,aDefaultEndiannessOfForeignCharacters,
625 aUnicode,aHomogeneousForeign,numberOfUnconvertibleCharacters,
626 indexOfFirstByteOfFirstUnconvertibleCharacter,aOutputConversionFlags,
628 //The numberOfUnconvertibleCharacters and indexOfFirstByteOfFirstUnconvertibleCharacter are the values with
629 //respect to the intermediate iscii buffer and original values aIndexOfFirstByteOfFirstUnconvertibleCharacter and
630 //aNumberOfUnconvertibleCharacters need to be adjusted accordingly.
632 aInputConversionFlags);
633 if(numberOfUnconvertibleCharacters>0)
635 if(aNumberOfUnconvertibleCharacters == 0)
637 aIndexOfFirstByteOfFirstUnconvertibleCharacter = aNumberOfForeignBytesConsumed + indexOfFirstByteOfFirstUnconvertibleCharacter;
639 aNumberOfUnconvertibleCharacters+=numberOfUnconvertibleCharacters;
641 noOfConsumedBytes = aHomogeneousForeign.Length();
642 //To Check whether it is really required.
643 NormalizeReturnValue(noOfConsumedBytes,aHomogeneousForeign);
644 aNumberOfForeignBytesConsumed+=noOfConsumedBytes;
647 TUint normalizedReturnValue = aReturnValue;
649 //There original iscii buffer copied to an intermediate iscii buffer and then modified
650 //and is then passed for conversion. Now, after conversion, the return value needs to
651 //be adjusted according to the original buffer. NormalizeReturnValue() does the
654 NormalizeReturnValue(normalizedReturnValue,aHomogeneousForeign);
655 aNumberOfForeignBytesConsumed-=normalizedReturnValue;
656 aReturnValue=normalizedReturnValue;
659 //The HandleHomogeneousRun() method is called in a loop and once there is some
660 //iscii codes converted to unicode, the ConvertToUnicode() should not return
661 //CCnvCharacterSetConverter::EErrorIllFormedInput even though the conversion
662 //method does not convert any of the iscii codes ppassed. To ensure that once the
663 //first non-zero number of iscii codes are converted, the internal input conversion
664 //flag is set to EInputConversionFlagAllowTruncatedInputNotEvenPartlyConsumable.
666 if(aNumberOfForeignBytesConsumed>0)
668 aInputConversionFlags|=CCnvCharacterSetConverter::EInputConversionFlagAllowTruncatedInputNotEvenPartlyConsumable;
673 // -----------------------------------------------------------------------------
674 // IsTruncatedDoubleByteIsciiSequence()
675 //Checks if anIsciiBuffer is a part of multi byte iscii sequence truncated in the middle.
676 //If it is a truncated sequence, then returns ETrue else returns EFalse.
678 // Returns: ETrue: If the intermediate input iscii buffer is truncated
679 // EFalse: If the intermediate input iscii buffer is not truncated
681 // -----------------------------------------------------------------------------
684 LOCAL_C TBool IsTruncatedDoubleByteIsciiSequence(const TDesC8& anIsciiBuffer)
686 RArray<TPtrC8> searchBuffer;
687 if(anIsciiBuffer.Length () == 0)
689 if(anIsciiBuffer[anIsciiBuffer.Length()-1] == 0xEF)
692 TInt appendret = KErrNone;
693 appendret |= searchBuffer.Append(KSoftHalant().Mid(0));
694 appendret |= searchBuffer.Append(KOm().Mid(0));
695 appendret |= searchBuffer.Append(KAvagraha().Mid(0));
696 appendret |= searchBuffer.Append(KExplicitHalant().Mid(0));
697 __ASSERT_DEBUG(!appendret, User::Panic(_L("RArray append failure"), appendret));
700 TBool isNotTruncated =EFalse;
702 //First check if the intermediate iscii buffer is ending with a complete multi byte sequence.
703 //If it ends with a complete multi byte sequence, no need to check if the last character of
704 //intermediate iscii is same as first character of multi byte iscii sequence. And return EFalse.
705 for(TUint counter = 0;counter<searchBuffer.Count();counter++)
707 if(searchBuffer[counter].Compare(anIsciiBuffer.Right(searchBuffer[counter].Length())) == 0)
709 isNotTruncated = ETrue;
713 //If the intermediate iscii buffer is not ending with a complete multi byte sequence, and the
714 //last code of the iscii buffer is a part of the multibyte sequence, then the iscii buffer is a
715 //truncated sequence and in that case return ETrue.
717 for(TUint counter = 0;counter<searchBuffer.Count();counter++)
721 else if( (anIsciiBuffer[anIsciiBuffer.Length()-1] == searchBuffer[counter][0]))
727 searchBuffer.Reset();
731 // -----------------------------------------------------------------------------
732 // ReplacementForUnconvertibleUnicodeCharacters()
733 //Returns the replacement character for unconvertible unicode character.
734 //In the current implementation it is 0x1a (ASCII Substitute character)
735 //The default implementation calls ReplacementForUnconvertibleUnicodeCharacters_internal()
736 //in turn which is generated by cnvtool.
738 // Returns: Replacemt for unconvertible unicode characters (0x1a)
740 // -----------------------------------------------------------------------------
743 const TDesC8& CIsciiImplementation::ReplacementForUnconvertibleUnicodeCharacters()
745 return ReplacementForUnconvertibleUnicodeCharacters_internal();
748 // -----------------------------------------------------------------------------
749 // ConvertFromUnicode()
750 //The main conversion function for converting from unicode to iscii
751 //Loaded and called by the character conversion framework.
752 //In turn calls CnvUtilities::ConvertFromUnicode() which is Symbian provide
753 //utility method for converting unicode to modal character codes.
755 // Returns: The numbet of unicode codes it could not convert.
757 // -----------------------------------------------------------------------------
760 TInt CIsciiImplementation::ConvertFromUnicode(
761 CCnvCharacterSetConverter::TEndianness
762 aDefaultEndiannessOfForeignCharacters,
763 const TDesC8& aReplacementForUnconvertibleUnicodeCharacters,
765 const TDesC16& aUnicode,
766 CCnvCharacterSetConverter::TArrayOfAscendingIndices& aIndicesOfUnconvertibleCharacters )
768 TFixedArray<CnvUtilities::SCharacterSet,KNumberOfIndicCharactersetsSupported> aArrayOfCharacterSets;
769 aArrayOfCharacterSets[0].iConversionData = &conversionData;
770 aArrayOfCharacterSets[0].iConvertFromIntermediateBufferInPlace = ConvertFromUnicodeIntermediateBufferInPlace;
771 aArrayOfCharacterSets[0].iEscapeSequence = &KEscapeSequenceDevanagari();
773 return CnvUtilities::ConvertFromUnicode(
774 aDefaultEndiannessOfForeignCharacters,
775 aReplacementForUnconvertibleUnicodeCharacters,
778 aIndicesOfUnconvertibleCharacters,
779 aArrayOfCharacterSets.Array());
782 // -----------------------------------------------------------------------------
783 // ConvertToUnicode()
784 //The main conversion function for converting from iscii to unicode
785 //Loaded and called by the character conversion framework.
786 //To support some of the iscii characters, the input forign buffer is
787 //copied to an intermediate buffer and then is then modified and
788 //CCnvCharactersetConverter::DoConvertToUnicode() is called with
789 //the modified buffer. For extensibility of iscii to other Indic languages
790 //it uses CnvUtilities::SState datastructure. CnvUtilities::SState is a
791 //Symbian defined class for modal charactersets. The escape sequence
792 //is specified to ATR followed by the script selection code and the conversion
793 //data is specified to be the conversion for the particular script. For the time
794 //being only Devanagari with script selection code 0x42 is supported. If
795 //any of the other script codes are used the conversion leads to unconvertible
796 //character i.e. 0xFFFD.
797 // Returns: The numbet of iscii codes it could not convert.
799 // -----------------------------------------------------------------------------
802 TInt CIsciiImplementation::ConvertToUnicode(
803 CCnvCharacterSetConverter::TEndianness aDefaultEndiannessOfForeignCharacters,
805 const TDesC8& aForeign,
807 TInt& aNumberOfUnconvertibleCharacters,
808 TInt& aIndexOfFirstByteOfFirstUnconvertibleCharacter )
810 aNumberOfUnconvertibleCharacters = 0;
811 TUint aOutputConversionFlags = CCnvCharacterSetConverter::KStateDefault;
812 aIndexOfFirstByteOfFirstUnconvertibleCharacter=-1;
813 TUint internalInputConversionFlags = 0;
814 TInt numberOfForeignBytesConsumed=0;
815 TPtrC8 remainderOfForeign(aForeign);
818 TBool isSkipMatchSequence = EFalse;
819 const SCnvConversionData* convData;
820 //Set the iscii conversion data and escape sequence for Devanagari.
821 TFixedArray<CnvUtilities::SState,KNumberOfIndicCharactersetsSupported> modals;
822 modals[0].iConversionData = &conversionData;
823 modals[0].iEscapeSequence = &KEscapeSequenceDevanagari();
825 aUnicode.SetLength(0);
827 //The internal input conversion flag for conversion is set to CCnvCharacterSetConverter::EInputConversionFlagAppend
828 //so that for each conversion in the conversion loop, the generated conversion buffer is appened to the aUnicode buffer.
829 internalInputConversionFlags |= CCnvCharacterSetConverter::EInputConversionFlagAppend;
830 if (aForeign.Length()==0)
834 //Get the conversion data from the previous call else the conversion data is set to the default
835 //conversion data, i.e. Devanagari.
836 convData=(aState!=CCnvCharacterSetConverter::KStateDefault)? REINTERPRET_CAST(const SCnvConversionData*, aState): modals[0].iConversionData;
839 TBuf8<KMaximumLengthOfIntermediateBuffer> intermediateBuffer;
840 TUint numberOfForeignBytesConsumedThisTime = 0;
841 if((remainderOfForeign.Length() >=KMaximumLengthOfIntermediateBuffer) && (aUnicode.MaxLength()-aUnicode.Length() >=KMaximumLengthOfIntermediateBuffer))
843 numberOfForeignBytesConsumedThisTime = KMaximumLengthOfIntermediateBuffer;
844 intermediateBuffer = remainderOfForeign.Left(numberOfForeignBytesConsumedThisTime);
845 //If the intermediate buffer is a part of truncated buffer sequence but the
846 //actual input buffer is not truncated then truncated sequence is not converted.
847 //The intermediate buffer is modified so as not to contain the truncated sequence.
849 flag = IsTruncatedDoubleByteIsciiSequence(intermediateBuffer);
852 numberOfForeignBytesConsumedThisTime --;
853 intermediateBuffer = remainderOfForeign.Left(numberOfForeignBytesConsumedThisTime);
859 flag = IsTruncatedDoubleByteIsciiSequence(remainderOfForeign.Left(aUnicode.MaxLength()-aUnicode.Length()));
862 numberOfForeignBytesConsumedThisTime = aUnicode.MaxLength()-aUnicode.Length();
863 intermediateBuffer = remainderOfForeign.Left(numberOfForeignBytesConsumedThisTime);
867 if(aForeign.Length()>(numberOfForeignBytesConsumed+aUnicode.Length()))
869 numberOfForeignBytesConsumedThisTime = aUnicode.MaxLength()-aUnicode.Length()-1;
870 intermediateBuffer = remainderOfForeign.Left(numberOfForeignBytesConsumedThisTime);
875 numberOfForeignBytesConsumedThisTime = aUnicode.MaxLength()-aUnicode.Length();
876 intermediateBuffer = remainderOfForeign.Left(numberOfForeignBytesConsumedThisTime);
881 //The input intermediate iscii buffer is modified with the search and replace
882 //buffers. It is required for supporting multibyte iscii sequences.
883 FindAndModifyBuffer(intermediateBuffer);
884 TPtrC8 remainderOfForeignInternal(intermediateBuffer);
885 TPtrC8 homogeneousRun;
886 const TInt startOfNextEscapeSequence=intermediateBuffer.Locate(KControlCharacterEscape);
887 if (startOfNextEscapeSequence!=0)
889 if (startOfNextEscapeSequence==KErrNotFound)
891 homogeneousRun.Set(remainderOfForeignInternal);
892 remainderOfForeignInternal.Set(NULL, 0);
896 __ASSERT_DEBUG(startOfNextEscapeSequence>0, User::Panic(KPanicReason,EPanicBadStartOfNextEscapeSequence));
897 homogeneousRun.Set(remainderOfForeignInternal.Left(startOfNextEscapeSequence));
898 remainderOfForeignInternal.Set(remainderOfForeignInternal.Mid(startOfNextEscapeSequence));
900 isSkipMatchSequence = ETrue;
904 if(!isSkipMatchSequence)
906 if (!NextHomogeneousForeignRun(convData, numberOfForeignBytesConsumed, homogeneousRun,
907 remainderOfForeignInternal, modals.Array(), aOutputConversionFlags))
912 HandleHomogeneousRun( convData, aDefaultEndiannessOfForeignCharacters, aUnicode, homogeneousRun, aNumberOfUnconvertibleCharacters,
913 aIndexOfFirstByteOfFirstUnconvertibleCharacter,aOutputConversionFlags,internalInputConversionFlags,
914 numberOfForeignBytesConsumed,returnValue);
919 isSkipMatchSequence = EFalse;
923 if ((!flag && (numberOfForeignBytesConsumedThisTime != KMaximumLengthOfIntermediateBuffer)) || (flag && (numberOfForeignBytesConsumedThisTime != (KMaximumLengthOfIntermediateBuffer-1) )))
925 remainderOfForeign.Set(aForeign.Mid(numberOfForeignBytesConsumed));
927 //If the number of iscii bytes consumed by the conversion is zero also the output conversion
928 //flag is not set to EOutputConversionFlagInputIsTruncated, then return EErrorIllFormedInput.
929 if ((numberOfForeignBytesConsumed==0) && (aOutputConversionFlags&CCnvCharacterSetConverter::EOutputConversionFlagInputIsTruncated))
931 return CCnvCharacterSetConverter::EErrorIllFormedInput;
933 //Set the conversion data sothat next time when ConvertToUnicode() is called,
934 //will use the previous conversion data.
935 aState=REINTERPRET_CAST(TInt, convData);
936 return aForeign.Length()-numberOfForeignBytesConsumed;
939 // -----------------------------------------------------------------------------
940 // IsInThisCharacterSetL()
941 //The method tells how probable it is that a sample piece of text is encoded in this character set.
942 //On return aConfidenceLevel, indicates how confident the function is about its return value. For
943 //iscii it is the default implementation and it does not implement the autodetect functionality.
944 //Loaded and called by the character conversion framework.
946 // Returns: EFalse: To tell CCnvCharacterSetConverter::AutoDetectCharacterSetL() that the plug-in DLL
947 // is not implementing a function of this signature and is therefore empty.
949 // -----------------------------------------------------------------------------
953 //Default implementation for IsInThisCharacterSetL()
955 TBool CIsciiImplementation::IsInThisCharacterSetL(
957 TInt& aConfidenceLevel,
961 aConfidenceLevel = 0;
965 // -----------------------------------------------------------------------------
967 //Factory function for CIsciiImplementation(). Instantiates a CIsciiImplementation object on heap
968 //and returns the pointer to it.
970 // Returns: CIsciiImplementation*
972 // -----------------------------------------------------------------------------
975 CIsciiImplementation* CIsciiImplementation::NewL()
977 CIsciiImplementation* self = new(ELeave) CIsciiImplementation;
981 // -----------------------------------------------------------------------------
982 // CIsciiImplementation()
983 //default constructor, does nothing
987 // -----------------------------------------------------------------------------
989 CIsciiImplementation::CIsciiImplementation()
993 // -----------------------------------------------------------------------------
994 // ~CIsciiImplementation()
995 //default desstructor, does nothing
999 // -----------------------------------------------------------------------------
1002 CIsciiImplementation::~CIsciiImplementation()
1006 // ECOM CREATION FUNCTION
1007 const TImplementationProxy ImplementationTable[] =
1009 // Used also in 0x1027508E.rss ( implementation_uid )
1010 IMPLEMENTATION_PROXY_ENTRY( 0x1027508E, CIsciiImplementation::NewL )
1013 // -----------------------------------------------------------------------------
1014 // ImplementationGroupProxy()
1015 //Returns a pointer to TImplementationProxy object which contains the implementation uid vs factory
1016 //function table. Also on return sets the aTableCount to the number of entries in the table.
1018 // Returns: TImplementationProxy*
1020 // -----------------------------------------------------------------------------
1022 EXPORT_C const TImplementationProxy* ImplementationGroupProxy( TInt& aTableCount )
1024 aTableCount = sizeof( ImplementationTable ) / sizeof(TImplementationProxy);
1025 return ImplementationTable;
1029 #include <convplug.h>
1032 // -----------------------------------------------------------------------------
1034 //For EKA1 this is the entry point for the DLL.
1036 // Returns: KErrNone
1038 // -----------------------------------------------------------------------------
1040 GLDEF_C TInt E32Dll(TDllReason)
1046 //Checks if a descriptor starts with another descriptor at the begining.
1047 LOCAL_C TBool IsStartOf(const TDesC8& aEscapeSequence, const TDesC8& aBuffer)
1049 const TInt lengthOfStart=aEscapeSequence.Length();
1050 return (aBuffer.Length()>=lengthOfStart) && (aBuffer.Left(lengthOfStart)==aEscapeSequence);
1052 // -----------------------------------------------------------------------------
1053 // MatchesEscapeSequence()
1054 //If the remainder of the foreign text starts with the passed escapesequence, modifies the remainder of the foreign text
1055 //and sets the homogeneous run buffer that uses the same conversion data.
1056 //The homogeneous run buffer is the buffer that will use a single conversion data, it doesn't contain the attribute code
1057 // neither it contains the script switching code.
1058 //The aRemainderOfForeign buffer
1060 // Returns: ETrue: If the sequence contains the escape sequence
1061 // EFalse: If the sequence does not contain the escape sequence
1063 // -----------------------------------------------------------------------------
1065 LOCAL_C TBool MatchesEscapeSequence(TInt& aNumberOfForeignBytesConsumed, TPtrC8& aHomogeneousRun,
1066 TPtrC8& aRemainderOfForeign, const TDesC8& aEscapeSequence)
1068 const TInt lengthOfEscapeSequence=aEscapeSequence.Length();
1069 if (IsStartOf(aEscapeSequence, aRemainderOfForeign))
1071 aRemainderOfForeign.Set(aRemainderOfForeign.Mid(lengthOfEscapeSequence));
1072 const TInt startOfNextEscapeSequence=aRemainderOfForeign.Locate(KControlCharacterEscape);
1073 if (startOfNextEscapeSequence==KErrNotFound)
1075 aHomogeneousRun.Set(aRemainderOfForeign);
1076 aRemainderOfForeign.Set(NULL, 0);
1080 aHomogeneousRun.Set(aRemainderOfForeign.Left(startOfNextEscapeSequence));
1081 aRemainderOfForeign.Set(aRemainderOfForeign.Mid(startOfNextEscapeSequence));
1083 aNumberOfForeignBytesConsumed+=lengthOfEscapeSequence;
1089 // -----------------------------------------------------------------------------
1090 // NextHomogeneousForeignRun()
1091 //Matches the escape sequence of each of the elements of the SState array with the remainder of
1092 //foreign text and if the escape sequence matches with the start of remainder of the foreign text,
1093 //then the conversion data is set to the conversion data corresponding to the escape sequence
1094 //Also the homogeneous foreign text for conversion with the same escape sequence is set.
1096 // Returns: ETrue: If length of the remainder of foreign buffer is nonzero.
1097 // EFalse: If length of the remainder of foreign buffer is zero.
1099 // -----------------------------------------------------------------------------
1103 LOCAL_C TBool NextHomogeneousForeignRun(const SCnvConversionData*& aConversionData, TInt& aNumberOfForeignBytesConsumed, TPtrC8& aHomogeneousRun, TPtrC8& aRemainderOfForeign, const TArray<CnvUtilities::SState>& aArrayOfStates, TUint& aOutputConversionFlags)
1105 TBool returnValue = EFalse;
1106 TBool foundState = EFalse;
1107 __ASSERT_DEBUG((aRemainderOfForeign.Length()==0) || (aRemainderOfForeign[0]==KControlCharacterEscape), User::Panic(KPanicReason,EPanicBadRemainderOfForeign));
1108 if (aRemainderOfForeign.Length()==0)
1112 const TInt numberOfStates=aArrayOfStates.Count();
1114 for (i=0; i<numberOfStates; ++i)
1116 const CnvUtilities::SState& state=aArrayOfStates[i];
1117 if (MatchesEscapeSequence(aNumberOfForeignBytesConsumed, aHomogeneousRun, aRemainderOfForeign, *state.iEscapeSequence))
1119 aConversionData=state.iConversionData;
1125 for (i=0; i<numberOfStates; ++i)
1127 if (IsStartOf(aRemainderOfForeign, *aArrayOfStates[i].iEscapeSequence))
1129 // aRemainderOfForeign ends with a truncated escape sequence, so ConvertToUnicode cannot convert any more
1130 aOutputConversionFlags|=CCnvCharacterSetConverter::EOutputConversionFlagInputIsTruncated;
1135 MatchesEscapeSequence(aNumberOfForeignBytesConsumed,aHomogeneousRun,aRemainderOfForeign,aRemainderOfForeign.Left(2));
1136 aConversionData = &conversionDataDummy;
1137 returnValue = ETrue;
1139 if (aHomogeneousRun.Length()>0)
1141 returnValue = ETrue;
1145 // -----------------------------------------------------------------------------
1146 // ConvertFromUnicodeIntermediateBufferInPlace()
1147 //Default implementation for conversion to the intermediate buffer
1148 //It modifies the unicode buffer before it is converted back to iscii.
1149 //The current implementation of iscii plug-in doesn't require any
1150 //modification to the default implementation
1153 // -----------------------------------------------------------------------------
1157 LOCAL_C void ConvertFromUnicodeIntermediateBufferInPlace(TInt aStartPositionInDescriptor, TDes8& aDescriptor, TInt& aNumberOfCharactersThatDroppedOut)
1159 CnvUtilities::ConvertFromIntermediateBufferInPlace(aStartPositionInDescriptor, aDescriptor, aNumberOfCharactersThatDroppedOut, KEscapeSequenceDevanagari, 1);
1162 // -----------------------------------------------------------------------------
1163 // DoFindAndModifyBuffer()
1164 //Modifies the iscii buffer by replacing the search buffer with the replacement buffer.
1165 //Introduced for handling multibyte iscii sequence.
1166 //Takes the search buffer array and the replacement buffer arrays as input to it and replaces all
1167 //the occurances of the search buffer with the corresponding replace buffer.
1170 // -----------------------------------------------------------------------------
1173 LOCAL_C void DoFindAndModifyBuffer(TDes8& aModifyBuffer,const TDesC8& aSearchBuffer,const TDesC8& aReplaceBuffer)
1178 __ASSERT_ALWAYS((aSearchBuffer.Length()>= aReplaceBuffer.Length()),User::Panic(KPanicReason,EPanicBadReplacementBuffer));
1179 if((offset = aModifyBuffer.Find(aSearchBuffer)) != KErrNotFound)
1181 TUint8 *pointerToBuffer = const_cast<TUint8*> (aModifyBuffer.Ptr());
1182 Mem::Copy(pointerToBuffer+offset,aReplaceBuffer.Ptr(),aReplaceBuffer.Length());
1183 Mem::Copy(pointerToBuffer+offset+aReplaceBuffer.Length(),pointerToBuffer+offset+aSearchBuffer.Length(),aModifyBuffer.Length()-aSearchBuffer.Length()-offset);
1184 aModifyBuffer.SetLength(aModifyBuffer.Length() - aSearchBuffer.Length() + aReplaceBuffer.Length());
1192 // -----------------------------------------------------------------------------
1193 // FindAndModifyBuffer()
1194 //Modifies the iscii buffer by replacing the search buffer with the replacement buffer.
1195 //Calls DoFindAndModifyBuffer() and supplies the search buffer and replacement buffer.
1196 //Introduced for handling multibyte iscii sequence.
1199 // -----------------------------------------------------------------------------
1202 LOCAL_C void FindAndModifyBuffer(TDes8& aModifyBuffer)
1204 RArray<TPtrC8> searchBuffer;
1205 RArray<TPtrC8> replaceBuffer;
1207 TInt ret = KErrNone;
1208 ret |= searchBuffer.Append(KExplicitHalant().Mid(0));
1209 ret |= searchBuffer.Append(KSoftHalant().Mid(0));
1210 ret |= searchBuffer.Append(KOm().Mid(0));
1211 ret |= searchBuffer.Append(KAvagraha().Mid(0));
1213 ret |= replaceBuffer.Append(KReplacementForExplicitHalant().Mid(0));
1214 ret |= replaceBuffer.Append(KReplacementForSoftHalant().Mid(0));
1215 ret |= replaceBuffer.Append(KReplacementForOm().Mid(0));
1216 ret |= replaceBuffer.Append(KReplacementForAvagraha().Mid(0));
1218 __ASSERT_DEBUG(!ret, User::Panic(_L("RArray append failure"), ret));
1220 for(TInt counter=0;counter<searchBuffer.Count();counter++)
1222 DoFindAndModifyBuffer(aModifyBuffer,searchBuffer[counter],replaceBuffer[counter]);
1224 searchBuffer.Reset();
1225 replaceBuffer.Reset();
1229 // -----------------------------------------------------------------------------
1230 // DoNormalizeReturnValue()
1231 //Modifies the return value(Number of bytes did not get converted) according to the modified
1232 //intermediate buffer. Takes the modified intermediate buffer, return value, search and replace
1233 //buffers. Searches for the replace buffer in the intermediate buffer and if found, it looks for
1234 //the actual buffer corresponding to the replace buffer and adds the difference of the lengths
1235 //of the actual to replace buffer to the return value.
1238 // -----------------------------------------------------------------------------
1241 LOCAL_C void DoNormalizeReturnValue(TUint& aReturnValue,const TDesC8& aBuffer,RArray<TPtrC8>& anArrayOfSearches,RArray<TPtrC8>& anArrayOfReplaces)
1243 TPtr8 buffer(const_cast<TUint8*>(aBuffer.Ptr()),aBuffer.Length(),aBuffer.Length());
1244 TUint count = anArrayOfSearches.Count();
1247 TBool flag = EFalse;
1248 for(TUint i=0;i<count;i++)
1250 TPtrC8 searchBufferForComparison(buffer.Right(anArrayOfReplaces[i].Length()));
1251 TInt returnCompare = searchBufferForComparison.Compare(anArrayOfReplaces[i]);
1252 if(returnCompare == 0)
1255 aReturnValue += (anArrayOfSearches[i].Length() - anArrayOfReplaces[i].Length());
1256 buffer=buffer.MidTPtr(0,buffer.Length()-anArrayOfReplaces[i].Length());
1261 if(buffer.Length() == 0)
1268 buffer=buffer.MidTPtr(0,buffer.Length()-1);
1274 // -----------------------------------------------------------------------------
1275 // NormalizeReturnValue()
1276 //Modifies the return value(Number of bytes did not get converted) according to the
1277 //replacements done to the iscii buffer before conversion.
1278 //Internally calls DoNormalizeReturnValue() by suppling the search and replacement
1283 // -----------------------------------------------------------------------------
1286 LOCAL_C void NormalizeReturnValue(TUint& aReturnValue,const TDesC8& aBuffer)
1288 RArray<TPtrC8> searchBuffer;
1289 RArray<TPtrC8> replaceBuffer;
1291 ret |= searchBuffer.Append(KExplicitHalant().Mid(0));
1292 ret |= searchBuffer.Append(KSoftHalant().Mid(0));
1293 ret |= searchBuffer.Append(KOm().Mid(0));
1294 ret |= searchBuffer.Append(KAvagraha().Mid(0));
1296 ret |= replaceBuffer.Append(KReplacementForExplicitHalant().Mid(0));
1297 ret |= replaceBuffer.Append(KReplacementForSoftHalant().Mid(0));
1298 ret |= replaceBuffer.Append(KReplacementForOm().Mid(0));
1299 ret |= replaceBuffer.Append(KReplacementForAvagraha().Mid(0));
1301 __ASSERT_DEBUG(!ret, User::Panic(_L("RArray append failure"), ret));
1303 DoNormalizeReturnValue(aReturnValue,aBuffer,searchBuffer,replaceBuffer);
1304 searchBuffer.Reset();
1305 replaceBuffer.Reset();
1308 // -----------------------------------------------------------------------------
1309 // HandleHomogeneousRun()
1310 //Handles a homogeneous foreign buffer and converts the foreign buffer to unicode
1311 //On return the aUnicode argument contains the converted unicode data.
1312 //Also it sets the return value, returned from the conversion. The return value also
1313 //takes into account if there is any buffer modification done before passing it to
1314 //CCnvCharacterSetConverter::DoConvertToUnicode()
1319 // -----------------------------------------------------------------------------
1322 LOCAL_C void HandleHomogeneousRun(const SCnvConversionData*& aConversionData,
1323 CCnvCharacterSetConverter::TEndianness aDefaultEndiannessOfForeignCharacters,
1325 const TDesC8& aHomogeneousForeign,
1326 TInt& aNumberOfUnconvertibleCharacters,
1327 TInt& aIndexOfFirstByteOfFirstUnconvertibleCharacter,
1328 TUint& aOutputConversionFlags,
1329 TUint aInputConversionFlags,TInt& aNumberOfForeignBytesConsumed,
1332 TInt numberOfUnconvertibleCharacters;
1333 TInt indexOfFirstByteOfFirstUnconvertibleCharacter;
1334 TUint noOfConsumedBytes = 0;
1335 if(aConversionData == NULL)
1337 aReturnValue = CCnvCharacterSetConverter::EErrorIllFormedInput;
1340 aReturnValue = CCnvCharacterSetConverter::DoConvertToUnicode(*aConversionData,aDefaultEndiannessOfForeignCharacters,
1341 aUnicode,aHomogeneousForeign,numberOfUnconvertibleCharacters,
1342 indexOfFirstByteOfFirstUnconvertibleCharacter,aOutputConversionFlags,
1344 //The numberOfUnconvertibleCharacters and indexOfFirstByteOfFirstUnconvertibleCharacter are the values with
1345 //respect to the intermediate iscii buffer and original values aIndexOfFirstByteOfFirstUnconvertibleCharacter and
1346 //aNumberOfUnconvertibleCharacters need to be adjusted accordingly.
1348 aInputConversionFlags);
1349 if(numberOfUnconvertibleCharacters>0)
1351 if(aNumberOfUnconvertibleCharacters == 0)
1353 aIndexOfFirstByteOfFirstUnconvertibleCharacter = aNumberOfForeignBytesConsumed + indexOfFirstByteOfFirstUnconvertibleCharacter;
1355 aNumberOfUnconvertibleCharacters+=numberOfUnconvertibleCharacters;
1357 noOfConsumedBytes = aHomogeneousForeign.Length();
1358 //To Check whether it is really required.
1359 NormalizeReturnValue(noOfConsumedBytes,aHomogeneousForeign);
1360 aNumberOfForeignBytesConsumed+=noOfConsumedBytes;
1363 TUint normalizedReturnValue = aReturnValue;
1365 //There original iscii buffer copied to an intermediate iscii buffer and then modified
1366 //and is then passed for conversion. Now, after conversion, the return value needs to
1367 //be adjusted according to the original buffer. NormalizeReturnValue() does the
1370 NormalizeReturnValue(normalizedReturnValue,aHomogeneousForeign);
1371 aNumberOfForeignBytesConsumed-=normalizedReturnValue;
1372 aReturnValue=normalizedReturnValue;
1375 //The HandleHomogeneousRun() method is called in a loop and once there is some
1376 //iscii codes converted to unicode, the ConvertToUnicode() should not return
1377 //CCnvCharacterSetConverter::EErrorIllFormedInput even though the conversion
1378 //method does not convert any of the iscii codes ppassed. To ensure that once the
1379 //first non-zero number of iscii codes are converted, the internal input conversion
1380 //flag is set to EInputConversionFlagAllowTruncatedInputNotEvenPartlyConsumable.
1382 if(aNumberOfForeignBytesConsumed>0)
1384 aInputConversionFlags|=CCnvCharacterSetConverter::EInputConversionFlagAllowTruncatedInputNotEvenPartlyConsumable;
1389 // -----------------------------------------------------------------------------
1390 // IsTruncatedDoubleByteIsciiSequence()
1391 //Checks if anIsciiBuffer is a part of multi byte iscii sequence truncated in the middle.
1392 //If it is a truncated sequence, then returns ETrue else returns EFalse.
1394 // Returns: ETrue: If the intermediate input iscii buffer is truncated
1395 // EFalse: If the intermediate input iscii buffer is not truncated
1397 // -----------------------------------------------------------------------------
1400 LOCAL_C TBool IsTruncatedDoubleByteIsciiSequence(const TDesC8& anIsciiBuffer)
1402 RArray<TPtrC8> searchBuffer;
1403 if(anIsciiBuffer.Length () == 0)
1405 if(anIsciiBuffer[anIsciiBuffer.Length()-1] == 0xEF)
1408 TInt appendret = KErrNone;
1409 appendret |= searchBuffer.Append(KSoftHalant().Mid(0));
1410 appendret |= searchBuffer.Append(KOm().Mid(0));
1411 appendret |= searchBuffer.Append(KAvagraha().Mid(0));
1412 appendret |= searchBuffer.Append(KExplicitHalant().Mid(0));
1413 __ASSERT_DEBUG(!ret, User::Panic(_L("RArray append failure"), ret));
1416 TBool isNotTruncated =EFalse;
1418 //First check if the intermediate iscii buffer is ending with a complete multi byte sequence.
1419 //If it ends with a complete multi byte sequence, no need to check if the last character of
1420 //intermediate iscii is same as first character of multi byte iscii sequence. And return EFalse.
1421 for(TUint counter = 0;counter<searchBuffer.Count();counter++)
1423 if(searchBuffer[counter].Compare(anIsciiBuffer.Right(searchBuffer[counter].Length())) == 0)
1425 isNotTruncated = ETrue;
1429 //If the intermediate iscii buffer is not ending with a complete multi byte sequence, and the
1430 //last code of the iscii buffer is a part of the multibyte sequence, then the iscii buffer is a
1431 //truncated sequence and in that case return ETrue.
1433 for(TUint counter = 0;counter<searchBuffer.Count();counter++)
1437 else if( (anIsciiBuffer[anIsciiBuffer.Length()-1] == searchBuffer[counter][0]))
1443 searchBuffer.Reset();
1447 // -----------------------------------------------------------------------------
1448 // ReplacementForUnconvertibleUnicodeCharacters()
1449 //Returns the replacement character for unconvertible unicode character.
1450 //In the current implementation it is 0x1a (ASCII Substitute character)
1451 //The default implementation calls ReplacementForUnconvertibleUnicodeCharacters_internal()
1452 //in turn which is generated by cnvtool.
1454 // Returns: Replacemt for unconvertible unicode characters (0x1a)
1456 // -----------------------------------------------------------------------------
1459 EXPORT_C const TDesC8& ReplacementForUnconvertibleUnicodeCharacters()
1461 return ReplacementForUnconvertibleUnicodeCharacters_internal();
1464 // -----------------------------------------------------------------------------
1465 // ConvertFromUnicode()
1466 //The main conversion function for converting from unicode to iscii
1467 //Loaded and called by the character conversion framework.
1468 //In turn calls CnvUtilities::ConvertFromUnicode() which is Symbian provide
1469 //utility method for converting unicode to modal character codes.
1471 // Returns: The numbet of unicode codes it could not convert.
1473 // -----------------------------------------------------------------------------
1476 EXPORT_C TInt ConvertFromUnicode(
1477 CCnvCharacterSetConverter::TEndianness
1478 aDefaultEndiannessOfForeignCharacters,
1479 const TDesC8& aReplacementForUnconvertibleUnicodeCharacters,
1481 const TDesC16& aUnicode,
1482 CCnvCharacterSetConverter::TArrayOfAscendingIndices& aIndicesOfUnconvertibleCharacters )
1484 TFixedArray<CnvUtilities::SCharacterSet,KNumberOfIndicCharactersetsSupported> aArrayOfCharacterSets;
1485 aArrayOfCharacterSets[0].iConversionData = &conversionData;
1486 aArrayOfCharacterSets[0].iConvertFromIntermediateBufferInPlace = ConvertFromUnicodeIntermediateBufferInPlace;
1487 aArrayOfCharacterSets[0].iEscapeSequence = &KEscapeSequenceDevanagari();
1489 return CnvUtilities::ConvertFromUnicode(
1490 aDefaultEndiannessOfForeignCharacters,
1491 aReplacementForUnconvertibleUnicodeCharacters,
1494 aIndicesOfUnconvertibleCharacters,
1495 aArrayOfCharacterSets.Array());
1498 // -----------------------------------------------------------------------------
1499 // ConvertToUnicode()
1500 //The main conversion function for converting from iscii to unicode
1501 //Loaded and called by the character conversion framework.
1502 //To support some of the iscii characters, the input forign buffer is
1503 //copied to an intermediate buffer and then is then modified and
1504 //CCnvCharactersetConverter::DoConvertToUnicode() is called with
1505 //the modified buffer. For extensibility of iscii to other Indic languages
1506 //it uses CnvUtilities::SState datastructure. CnvUtilities::SState is a
1507 //Symbian defined class for modal charactersets. The escape sequence
1508 //is specified to ATR followed by the script selection code and the conversion
1509 //data is specified to be the conversion for the particular script. For the time
1510 //being only Devanagari with script selection code 0x42 is supported. If
1511 //any of the other script codes are used the conversion leads to unconvertible
1512 //character i.e. 0xFFFD.
1513 // Returns: The numbet of iscii codes it could not convert.
1515 // -----------------------------------------------------------------------------
1518 EXPORT_C TInt ConvertToUnicode(
1519 CCnvCharacterSetConverter::TEndianness aDefaultEndiannessOfForeignCharacters,
1521 const TDesC8& aForeign,
1523 TInt& aNumberOfUnconvertibleCharacters,
1524 TInt& aIndexOfFirstByteOfFirstUnconvertibleCharacter )
1526 aNumberOfUnconvertibleCharacters = 0;
1527 TUint aOutputConversionFlags = CCnvCharacterSetConverter::KStateDefault;
1528 aIndexOfFirstByteOfFirstUnconvertibleCharacter=-1;
1529 TUint internalInputConversionFlags = 0;
1530 TInt numberOfForeignBytesConsumed=0;
1531 TPtrC8 remainderOfForeign(aForeign);
1533 TBool flag = EFalse;
1534 TBool isSkipMatchSequence = EFalse;
1535 const SCnvConversionData* convData;
1536 //Set the iscii conversion data and escape sequence for Devanagari.
1537 TFixedArray<CnvUtilities::SState,KNumberOfIndicCharactersetsSupported> modals;
1538 modals[0].iConversionData = &conversionData;
1539 modals[0].iEscapeSequence = &KEscapeSequenceDevanagari();
1541 aUnicode.SetLength(0);
1543 //The internal input conversion flag for conversion is set to CCnvCharacterSetConverter::EInputConversionFlagAppend
1544 //so that for each conversion in the conversion loop, the generated conversion buffer is appened to the aUnicode buffer.
1545 internalInputConversionFlags |= CCnvCharacterSetConverter::EInputConversionFlagAppend;
1546 if (aForeign.Length()==0)
1550 //Get the conversion data from the previous call else the conversion data is set to the default
1551 //conversion data, i.e. Devanagari.
1552 convData=(aState!=CCnvCharacterSetConverter::KStateDefault)? REINTERPRET_CAST(const SCnvConversionData*, aState): modals[0].iConversionData;
1555 TBuf8<KMaximumLengthOfIntermediateBuffer> intermediateBuffer;
1556 TUint numberOfForeignBytesConsumedThisTime = 0;
1557 if((remainderOfForeign.Length() >=KMaximumLengthOfIntermediateBuffer) && (aUnicode.MaxLength()-aUnicode.Length() >=KMaximumLengthOfIntermediateBuffer))
1559 numberOfForeignBytesConsumedThisTime = KMaximumLengthOfIntermediateBuffer;
1560 intermediateBuffer = remainderOfForeign.Left(numberOfForeignBytesConsumedThisTime);
1561 //If the intermediate buffer is a part of truncated buffer sequence but the
1562 //actual input buffer is not truncated then truncated sequence is not converted.
1563 //The intermediate buffer is modified so as not to contain the truncated sequence.
1565 flag = IsTruncatedDoubleByteIsciiSequence(intermediateBuffer);
1568 numberOfForeignBytesConsumedThisTime --;
1569 intermediateBuffer = remainderOfForeign.Left(numberOfForeignBytesConsumedThisTime);
1575 flag = IsTruncatedDoubleByteIsciiSequence(remainderOfForeign.Left(aUnicode.MaxLength()-aUnicode.Length()));
1578 numberOfForeignBytesConsumedThisTime = aUnicode.MaxLength()-aUnicode.Length();
1579 intermediateBuffer = remainderOfForeign.Left(numberOfForeignBytesConsumedThisTime);
1583 if(aForeign.Length()>(numberOfForeignBytesConsumed+aUnicode.Length()))
1585 numberOfForeignBytesConsumedThisTime = aUnicode.MaxLength()-aUnicode.Length()-1;
1586 intermediateBuffer = remainderOfForeign.Left(numberOfForeignBytesConsumedThisTime);
1591 numberOfForeignBytesConsumedThisTime = aUnicode.MaxLength()-aUnicode.Length();
1592 intermediateBuffer = remainderOfForeign.Left(numberOfForeignBytesConsumedThisTime);
1597 //The input intermediate iscii buffer is modified with the search and replace
1598 //buffers. It is required for supporting multibyte iscii sequences.
1599 FindAndModifyBuffer(intermediateBuffer);
1600 TPtrC8 remainderOfForeignInternal(intermediateBuffer);
1601 TPtrC8 homogeneousRun;
1602 const TInt startOfNextEscapeSequence=intermediateBuffer.Locate(KControlCharacterEscape);
1603 if (startOfNextEscapeSequence!=0)
1605 if (startOfNextEscapeSequence==KErrNotFound)
1607 homogeneousRun.Set(remainderOfForeignInternal);
1608 remainderOfForeignInternal.Set(NULL, 0);
1612 __ASSERT_DEBUG(startOfNextEscapeSequence>0, User::Panic(KPanicReason,EPanicBadStartOfNextEscapeSequence));
1613 homogeneousRun.Set(remainderOfForeignInternal.Left(startOfNextEscapeSequence));
1614 remainderOfForeignInternal.Set(remainderOfForeignInternal.Mid(startOfNextEscapeSequence));
1616 isSkipMatchSequence = ETrue;
1620 if(!isSkipMatchSequence)
1622 if (!NextHomogeneousForeignRun(convData, numberOfForeignBytesConsumed, homogeneousRun,
1623 remainderOfForeignInternal, modals.Array(), aOutputConversionFlags))
1628 HandleHomogeneousRun( convData, aDefaultEndiannessOfForeignCharacters, aUnicode, homogeneousRun, aNumberOfUnconvertibleCharacters,
1629 aIndexOfFirstByteOfFirstUnconvertibleCharacter,aOutputConversionFlags,internalInputConversionFlags,
1630 numberOfForeignBytesConsumed,returnValue);
1635 isSkipMatchSequence = EFalse;
1639 if ((!flag && (numberOfForeignBytesConsumedThisTime != KMaximumLengthOfIntermediateBuffer)) || (flag && (numberOfForeignBytesConsumedThisTime != (KMaximumLengthOfIntermediateBuffer-1) )))
1641 remainderOfForeign.Set(aForeign.Mid(numberOfForeignBytesConsumed));
1643 //If the number of iscii bytes consumed by the conversion is zero also the output conversion
1644 //flag is not set to EOutputConversionFlagInputIsTruncated, then return EErrorIllFormedInput.
1645 if ((numberOfForeignBytesConsumed==0) && (aOutputConversionFlags&CCnvCharacterSetConverter::EOutputConversionFlagInputIsTruncated))
1647 return CCnvCharacterSetConverter::EErrorIllFormedInput;
1649 //Set the conversion data sothat next time when ConvertToUnicode() is called,
1650 //will use the previous conversion data.
1651 aState=REINTERPRET_CAST(TInt, convData);
1652 return aForeign.Length()-numberOfForeignBytesConsumed;
1655 // -----------------------------------------------------------------------------
1656 // IsInThisCharacterSetL()
1657 //The method tells how probable it is that a sample piece of text is encoded in this character set.
1658 //On return aConfidenceLevel, indicates how confident the function is about its return value. For
1659 //iscii it is the default implementation and it does not implement the autodetect functionality.
1660 //Loaded and called by the character conversion framework.
1662 // Returns: EFalse: To tell CCnvCharacterSetConverter::AutoDetectCharacterSetL() that the plug-in DLL
1663 // is not implementing a function of this signature and is therefore empty.
1665 // -----------------------------------------------------------------------------
1669 //Default implementation for IsInThisCharacterSetL()
1671 EXPORT_C TBool IsInThisCharacterSetL(
1673 TInt& aConfidenceLevel,
1676 aSetToTrue = EFalse;
1677 aConfidenceLevel = 0;
1681 EXPORT_C void Reserved_2()
1685 EXPORT_C void Reserved_3()
1689 EXPORT_C void Reserved_4()
1693 EXPORT_C void Reserved_5()
1697 EXPORT_C void Reserved_6()
1701 EXPORT_C void Reserved_7()
1705 EXPORT_C void Reserved_8()