Update contrib.
2 * Copyright (c) 1998-2009 Nokia Corporation and/or its subsidiary(-ies).
4 * This component and the accompanying materials are made available
5 * under the terms of "Eclipse Public License v1.0"
6 * which accompanies this distribution, and is available
7 * at the URL "http://www.eclipse.org/legal/epl-v10.html".
9 * Initial Contributors:
10 * Nokia Corporation - initial contribution.
15 * Implementation of the classes that import and export plain text.
24 TPlainTextIOState:: TPlainTextIOState(const CPlainText::TImportExportParam& aParam,
25 CPlainText::TImportExportResult& aResult,
26 RWriteStream& aOutput,RReadStream& aInput):
33 iCheckByteOrder(FALSE)
35 aResult = CPlainText::TImportExportResult(); // zero output counters; aResult may be re-used.
38 TText TPlainTextIOState::ReadRawCharL()
41 if (iParam.iInputInternal)
42 iInput.ReadL((TUint8*)&c,sizeof(TText));
44 c = iInput.ReadUint16L();
46 c = (TText)(((c << 8) & 0xFF00) | ((c >> 8) & 0xFF));
49 if (c == CEditableText::EReversedByteOrderMark)
51 c = CEditableText::EByteOrderMark;
52 iSwapInput = !iSwapInput;
54 iCheckByteOrder = FALSE;
56 iResult.iInputChars++;
60 void TPlainTextIOState::WriteRawCharL(TText aChar)
62 if (iResult.iOutputChars < iParam.iMaxOutputChars)
64 if (iParam.iOutputInternal)
65 iOutput.WriteL((TUint8*)&aChar,sizeof(TText));
67 iOutput.WriteUint16L(aChar);
68 iResult.iOutputChars++;
72 CPlainTextConverter* CPlainTextConverter::NewLC()
74 CPlainTextConverter* c = new(ELeave) CPlainTextConverter;
75 CleanupStack::PushL(c);
76 c->iConversionBuffer = new(ELeave) TUint8[EConversionBufferSize];
80 CPlainTextConverter::~CPlainTextConverter()
83 delete [] iConversionBuffer;
87 Prepare to convert between Unicode and a foreign encoding.
88 If aSample is non-null it can be used to guess the foreign encoding, but only if iParam.iGuessForeignEncoding is true.
90 void CPlainTextConverter::PrepareToConvertL(TPlainTextIOState& aState,const TDesC8* aSample)
94 iConverter = CCnvCharacterSetConverter::NewL();
95 if (aState.iParam.iFileSession == NULL)
97 TInt error = rfs.Connect();
98 User::LeaveIfError(error);
100 CleanupClosePushL(rfs);
103 rfs = *aState.iParam.iFileSession;
105 TUint foreign_encoding = aState.iParam.iForeignEncoding;
107 // Try to guess the foreign encoding.
108 if (aSample && aState.iParam.iGuessForeignEncoding)
110 CArrayFix<CCnvCharacterSetConverter::SCharacterSet>* charsets =
111 CCnvCharacterSetConverter::CreateArrayOfCharacterSetsAvailableLC(rfs);
113 CCnvCharacterSetConverter::AutoDetectCharacterSetL(confidence,foreign_encoding,*charsets,*aSample);
114 CleanupStack::PopAndDestroy(charsets);
116 User::Leave(KErrNotSupported);
119 if (iConverter->PrepareToConvertToOrFromL(foreign_encoding,rfs) != CCnvCharacterSetConverter::EAvailable)
120 User::Leave(KErrNotSupported);
121 aState.iResult.iForeignEncoding = foreign_encoding;
122 if (aState.iParam.iFileSession == NULL)
124 CleanupStack::Pop(); // rfs
129 void TPlainTextWriter::TranslateL(const CPlainText::TImportExportParam& aParam,CPlainText::TImportExportResult& aResult,
130 RWriteStream& aOutput,RReadStream& aInput)
132 TPlainTextWriter writer(aParam,aResult,aOutput,aInput);
133 writer.TranslateHelperL();
136 TPlainTextWriter::TPlainTextWriter(const CPlainText::TImportExportParam& aParam,CPlainText::TImportExportResult& aResult,
137 RWriteStream& aOutput,RReadStream& aInput):
138 TPlainTextIOState(aParam,aResult,aOutput,aInput),
141 iMaxLineBufferLength(0)
145 void TPlainTextWriter::TranslateHelperL()
147 if (iParam.iForeignEncoding)
149 iConverter = CPlainTextConverter::NewLC();
150 iConverter->PrepareToConvertL(*this,NULL);
153 if (iParam.iOrganisation == CPlainText::EOrganiseByLine)
154 iMaxLineLength = iParam.iMaxLineLength;
156 iMaxLineLength = KMaxTInt; // when exporting by paragraph, the wrapping width has no effect
157 if (iMaxLineLength <= 0)
158 iMaxLineLength = KMaxTInt;
160 if (iMaxLineLength < KMaxTInt)
161 iMaxLineBufferLength = iMaxLineLength;
162 else if (iParam.iForeignEncoding)
163 iMaxLineBufferLength = EDefaultLineBufferSize;
164 if (iMaxLineBufferLength)
165 iLineBuffer = new(ELeave) TText[iMaxLineBufferLength];
168 CleanupStack::PushL(iLineBuffer);
169 TRAPD(error,TranslateToEofL());
170 if (error == KErrEof)
172 if (error == KErrNone)
177 CleanupStack::Pop(iLineBuffer);
178 delete [] iLineBuffer;
180 CleanupStack::PopAndDestroy(iConverter);
181 User::LeaveIfError(error);
184 void TPlainTextWriter::TranslateToEofL()
188 TText c = ReadRawCharL();
191 // Write a CR-LF at a forced line break if organising by line.
192 case CEditableText::ELineBreak:
193 if (iParam.iOrganisation == CPlainText::EOrganiseByLine)
202 // Write a CR-LF at the end of the paragraph, then an extra one if lines are split by CR-LFs.
203 case CEditableText::EParagraphDelimiter:
206 if (iParam.iOrganisation == CPlainText::EOrganiseByLine)
216 void TPlainTextWriter::FlushL()
219 WriteAndConvertL(iLineBuffer,iLineLength);
223 void TPlainTextWriter::WriteCharL(TText aChar)
227 if (iLineLength >= iMaxLineBufferLength)
229 int linebreak = iMaxLineBufferLength;
230 int stripped_linebreak = iMaxLineBufferLength;
232 if (iLineLength >= iMaxLineLength)
234 for (linebreak = iMaxLineLength; linebreak > 0; linebreak--)
235 if (iLineBuffer[linebreak - 1] == ' ')
238 linebreak = iMaxLineLength;
240 // Strip a single trailing space if any; it is added when text is imported.
241 stripped_linebreak = linebreak;
242 if (iLineBuffer[linebreak - 1] == ' ')
243 stripped_linebreak = linebreak - 1;
246 WriteAndConvertL(iLineBuffer,stripped_linebreak);
247 if (iLineLength >= iMaxLineLength)
251 while (i < iMaxLineBufferLength)
252 iLineBuffer[j++] = iLineBuffer[i++];
255 iLineBuffer[iLineLength++] = aChar;
258 WriteRawCharL(aChar);
261 void TPlainTextWriter::WriteNewLineL()
263 WriteAndConvertL(_S("\x0d\x0a"),2);
266 void TPlainTextWriter::WriteAndConvertL(const TText* aText,TInt aLength)
272 TPtrC source(aText,aLength);
273 TPtr8 dest(iConverter->iConversionBuffer,CPlainTextConverter::EConversionBufferSize);
274 int remainder = iConverter->iConverter->ConvertFromUnicode(dest,source);
276 User::Leave(KErrCorrupt);
277 int available = iParam.iMaxOutputChars - iResult.iOutputChars;
278 if (available < dest.Length())
279 dest.SetLength(available);
280 if (dest.Length() > 0)
282 iOutput.WriteL(dest);
283 iResult.iOutputChars += dest.Length();
285 int converted = aLength - remainder;
287 aLength -= converted;
292 while (aLength-- > 0)
293 WriteRawCharL(*aText++);
297 TPlainTextReader::TPlainTextReader(const CPlainText::TImportExportParam& aParam,CPlainText::TImportExportResult& aResult,
298 RWriteStream& aOutput,RReadStream& aInput):
299 TPlainTextIOState(aParam,aResult,aOutput,aInput),
303 iConversionState(CCnvCharacterSetConverter::KStateDefault)
305 iCheckByteOrder = TRUE;
308 void TPlainTextReader::TranslateL(const CPlainText::TImportExportParam& aParam,CPlainText::TImportExportResult& aResult,
309 RWriteStream& aOutput,RReadStream& aInput)
311 TPlainTextReader reader(aParam,aResult,aOutput,aInput);
312 if(reader.iParam.iOrganisation == CPlainText::EOrganiseByLine)
314 TLineTextWriter txtWriter(reader);
315 TSLBTransaltor slbTranslator(txtWriter);
316 reader.TranslateHelperL(slbTranslator);
320 TParagraphTextWriter txtWriter(reader);
321 TSLBTransaltor slbTranslator(txtWriter);
322 reader.TranslateHelperL(slbTranslator);
326 void TPlainTextReader::TranslateHelperL(TSLBTransaltor& aSLBTranslator)
328 if (iParam.iForeignEncoding || iParam.iGuessForeignEncoding)
330 iConverter = CPlainTextConverter::NewLC();
331 iInputBuffer = new(ELeave) TText[EInputBufferSize];
332 CleanupStack::PushL(iInputBuffer);
336 TRAPD(error,TranslateToEofL(aSLBTranslator));
337 if (error == KErrEof)
339 if (error == KErrNone)
343 CleanupStack::Pop(iInputBuffer);
344 delete [] iInputBuffer;
345 CleanupStack::PopAndDestroy(iConverter);
347 User::LeaveIfError(error);
350 void TPlainTextReader::TranslateToEofL(TSLBTransaltor& aSLBTranslator)
354 TText c = ReadAndConvertL();
355 aSLBTranslator.ProcessL(c);
357 aSLBTranslator.FlushL();
360 TText TPlainTextReader::ReadAndConvertL()
362 // Read EConversionBufferSize bytes into a conversion buffer (iConversionBuffer).
363 // Using CharConv convert this into unicode and place in a destination buffer (dest).
364 // This may result in some bytes that cannot be converted (remainder) as that
365 // character encoding is truncated.
366 // This remainder is then moved to the begining of the conversion buffer and more
367 // data read in after it, in effect untruncating that last character.
368 // Before this next read takes place the next converted unicode character is returned
369 // until the destination buffer positional pointers reach the end where more data is
370 // required for processing.
372 if (iConverter && iInputBuffer)
374 if (iInputPos >= iInputLength)
377 Attempt to read more foreign characters if there are less than 20,
378 which is the current maximum length of a multibyte character sequence for CHARCONV.
379 Use MStreamBuf::ReadL, which doesn't leave on EOF, rather than RReadStream::ReadL,
380 which does, and doesn't tell you how much was actually read.
382 if (iConverter->iConversionBufferLength < 20)
383 iConverter->iConversionBufferLength +=
384 iInput.Source()->ReadL(iConverter->iConversionBuffer + iConverter->iConversionBufferLength,
385 CPlainTextConverter::EConversionBufferSize - iConverter->iConversionBufferLength);
387 // Create the converter late so we have a sample of foreign text for auto-detection of the encoding.
388 if (!iConverter->iConverter)
390 TPtrC8 sample(iConverter->iConversionBuffer,iConverter->iConversionBufferLength);
391 iConverter->PrepareToConvertL(*this,&sample);
394 // Translate from the foreign encoding to Unicode.
395 TPtr dest(iInputBuffer,0,EInputBufferSize);
396 TPtrC8 source(iConverter->iConversionBuffer,iConverter->iConversionBufferLength);
397 int remainder = iConverter->iConverter->ConvertToUnicode(dest,source,iConversionState);
399 User::Leave(KErrCorrupt);
401 // Move the remaining foreign characters if any to the start of the buffer
402 // so that on the next read it can be joined with its truncated part.
403 for (int i = 0, j = iConverter->iConversionBufferLength - remainder; i < remainder; ++i, ++j)
404 iConverter->iConversionBuffer[i] = iConverter->iConversionBuffer[j];
405 iConverter->iConversionBufferLength = remainder;
408 iInputLength = dest.Length();
409 if (iInputLength == 0)
410 User::Leave(KErrEof);
412 iResult.iInputChars++;
413 return iInputBuffer[iInputPos++];
416 return ReadRawCharL();
420 The method processes the imput characters, writing them to the output, but skipping
421 the picture characters (CEditableText::EPictureCharacter).
422 The method is not called directly and should not be called. It implements
423 MOutputChar::OutputCharL(TChar aChar) and is called from TParagraphTextWriter and
424 TLineTextWriter implementations.
425 @param aChar Character to be processed.
427 void TPlainTextReader::OutputCharL(TText aChar)
431 case CEditableText::EByteOrderMark :
432 // leading byte order marks are ignored
433 if(iResult.iInputChars > 1)
435 WriteRawCharL(aChar);
438 case CEditableText::EPictureCharacter:
439 //Picture characters are ignored because they would cause ETEXT to panic when it attempted to find
440 //the picture corresponding to the character.
443 WriteRawCharL(aChar);