os/security/securityanddataprivacytools/securitytools/certapp/store--/us_ucmp.cpp
Update contrib.
2 * Copyright (c) 1998-2009 Nokia Corporation and/or its subsidiary(-ies).
4 * This component and the accompanying materials are made available
5 * under the terms of the License "Eclipse Public License v1.0"
6 * which accompanies this distribution, and is available
7 * at the URL "http://www.eclipse.org/legal/epl-v10.html".
9 * Initial Contributors:
10 * Nokia Corporation - initial contribution.
15 * Implementation of the Standard Compression Scheme for Unicode.
16 * This code is compiled only in the Unicode build.
26 const TUint32 TUnicodeCompressionState::iStaticWindow[EStaticWindows] =
29 0x0080, // Latin-1 supplement
30 0x0100, // Latin Extended-A
31 0x0300, // Combining Diacritics
32 0x2000, // General Punctuation
33 0x2080, // Currency Symbols
34 0x2100, // Letterlike Symbols and Number Forms
35 0x3000 // CJK Symbols and Punctuation
38 const TUint32 TUnicodeCompressionState::iDynamicWindowDefault[EDynamicWindows] =
40 0x0080, // Latin-1 supplement
41 0x00C0, // parts of Latin-1 supplement and Latin Extended-A
47 0xFF00 // Fullwidth ASCII
50 const TUint16 TUnicodeCompressionState::iSpecialBase[ESpecialBases] =
52 0x00C0, // Latin 1 letters (not symbols) and some of Extended-A
53 0x0250, // IPA extensions
58 0xFF60 // Halfwidth katakana
61 // Single-byte mode tag values
62 const TUint8 SQ0 = 0x01; // <byte> quote from window 0
63 const TUint8 SDX = 0x0B; // <hbyte> <lbyte> define window in expansion area
64 const TUint8 SQU = 0x0E; // <hbyte> <lbyte> quote Unicode value
65 const TUint8 SCU = 0x0F; // switch to Unicode mode
66 const TUint8 SC0 = 0x10; // select dynamic window 0
67 const TUint8 SD0 = 0x18; // <byte> set dynamic window 0 index to <byte> and select it
69 // Unicode mode tag values
70 const TUint8 UC0 = 0xE0; // select dynamic window 0 and switch to single-byte mode
71 const TUint8 UD0 = 0xE8; // <byte> set dynamic window 0 index to <byte>, select it and switch to
73 const TUint8 UQU = 0xF0; // <hbyte>, <lbyte> quote Unicode value
74 const TUint8 UDX = 0xF1; // <hbyte>, <lbyte> define window in expansion area and switch to single-byte mode
76 TUnicodeCompressionState::TUnicodeCompressionState():
80 iMaxCompressedBytes(0)
85 void TUnicodeCompressionState::Reset()
88 iActiveWindowBase = 0x0080;
89 for (int i = 0; i < EDynamicWindows; i++)
90 iDynamicWindow[i] = iDynamicWindowDefault[i];
94 // Return the index of the static window that contains this code, if any, or -1 if there is none.
95 TInt TUnicodeCompressionState::StaticWindowIndex(TUint16 aCode)
97 for (TInt i = 0; i < EStaticWindows; i++)
98 if (aCode >= iStaticWindow[i] && aCode < iStaticWindow[i] + 128)
104 If aCode can be accommodated in one of the legal dynamic windows, return the index of that window
105 in the offset table. If not return KErrNotFound.
107 TInt TUnicodeCompressionState::DynamicWindowOffsetIndex(TUint16 aCode)
111 if (aCode >= 0x3400 && aCode <= 0xDFFF)
115 Prefer sections that cross half-block boundaries. These are better adapted to actual text.
116 They are represented by offset indices 0xf9..0xff.
118 for (int i = 0; i < ESpecialBases; i++)
119 if (aCode >= iSpecialBase[i] && aCode < iSpecialBase[i] + 128)
123 Offset indices 0x01..0x67 represent half blocks from 0x0080 to 0x3380 and
124 0x68..0xA7 represent half blocks from 0xE000 to 0xFF80.
131 // Return the base of the window represented by offset index <n>. Return 0 if the offset index is illegal.
132 TUint32 TUnicodeCompressionState::DynamicWindowBase(TInt aOffsetIndex)
134 if (aOffsetIndex >= 0xF9 && aOffsetIndex <= 0xFF)
137 WARNING: don't optimise the following two lines by replacing them with
138 'return iSpecialBase[aOffsetIndex - 0xF9];'. To do so would re-introduce an error
139 in ARM builds caused by optimisation and consequent erroneous fixing up
140 of the array base: see defect EDNGASR-4AGJQX in ER5U defects.
142 int special_base_index = aOffsetIndex - 0xF9;
143 return iSpecialBase[special_base_index];
145 if (aOffsetIndex >= 0x01 && aOffsetIndex <= 0x67)
146 return aOffsetIndex * 0x80;
147 if (aOffsetIndex >= 0x68 && aOffsetIndex <= 0xA7)
148 return aOffsetIndex * 0x80 + 0xAC00;
152 TBool TUnicodeCompressionState::EncodeAsIs(TUint16 aCode)
154 return aCode == 0x0000 || aCode == 0x0009 || aCode == 0x000A || aCode == 0x000D ||
155 (aCode >= 0x0020 && aCode <= 0x007F);
158 void TUnicodeCompressionState::Panic(TPanic aPanic)
160 User::Panic(_L16("ucmp"),(TInt)aPanic);
163 EXPORT_C TUnicodeCompressor::TUnicodeCompressor():
164 iInputBufferStart(0),
166 iOutputBufferStart(0),
167 iOutputBufferSize(0),
168 iDynamicWindowIndex(0),
170 iOutputPointer(NULL),
173 // Clear coverity warning
174 memset(iOutputBuffer, 0, sizeof(iOutputBuffer));
177 EXPORT_C void TUnicodeCompressor::CompressL(RWriteStream& aOutput,MUnicodeSource& aInput,
178 TInt aMaxOutputBytes,TInt aMaxInputWords,
179 TInt* aOutputBytes,TInt* aInputWords)
181 DoCompressL(&aOutput,NULL,&aInput,aMaxOutputBytes,aMaxInputWords,aOutputBytes,aInputWords);
184 EXPORT_C void TUnicodeCompressor::CompressL(TUint8* aOutput,MUnicodeSource& aInput,
185 TInt aMaxOutputBytes,TInt aMaxInputWords,
186 TInt* aOutputBytes,TInt* aInputWords)
188 DoCompressL(NULL,aOutput,&aInput,aMaxOutputBytes,aMaxInputWords,aOutputBytes,aInputWords);
191 EXPORT_C TInt TUnicodeCompressor::FlushL(RWriteStream& aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes)
193 DoCompressL(&aOutput,NULL,NULL,aMaxOutputBytes,0,&aOutputBytes,NULL);
194 return iOutputBufferSize;
197 EXPORT_C TInt TUnicodeCompressor::FlushL(TUint8* aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes)
199 DoCompressL(NULL,aOutput,NULL,aMaxOutputBytes,0,&aOutputBytes,NULL);
200 return iOutputBufferSize;
203 EXPORT_C TInt TUnicodeCompressor::CompressedSizeL(MUnicodeSource& aInput,TInt aInputWords)
206 TUnicodeCompressor c;
207 c.DoCompressL(NULL,NULL,&aInput,KMaxTInt,aInputWords,&bytes,NULL);
211 // Compress until input or output is exhausted or an exception occurs.
212 void TUnicodeCompressor::DoCompressL(RWriteStream* aOutputStream,TUint8* aOutputPointer,MUnicodeSource* aInput,
213 TInt aMaxOutputBytes,TInt aMaxInputWords,
214 TInt* aOutputBytes,TInt* aInputWords)
216 iOutputStream = aOutputStream;
217 iOutputPointer = aOutputPointer;
219 iMaxCompressedBytes = aMaxOutputBytes;
220 iMaxUnicodeWords = aMaxInputWords;
221 iCompressedBytes = iUnicodeWords = 0;
222 FlushOutputBufferL();
225 while (iUnicodeWords < iMaxUnicodeWords && iCompressedBytes < iMaxCompressedBytes)
227 TUint16 x = iInput->ReadUnicodeValueL();
229 iInputBuffer[(iInputBufferStart + iInputBufferSize) % EMaxInputBufferSize] = action;
232 if (iInputBufferSize == EMaxInputBufferSize)
238 *aOutputBytes = iCompressedBytes;
240 *aInputWords = iUnicodeWords;
243 TUnicodeCompressor::TAction::TAction(TUint16 aCode):
246 if (TUnicodeCompressionState::EncodeAsIs(aCode))
247 iTreatment = EPlainASCII;
250 iTreatment = TUnicodeCompressionState::DynamicWindowOffsetIndex(aCode);
251 if (iTreatment == -1)
253 iTreatment = TUnicodeCompressionState::StaticWindowIndex(aCode);
254 if (iTreatment == -1)
255 iTreatment = EPlainUnicode;
257 iTreatment += EFirstStatic;
262 void TUnicodeCompressor::WriteCharacterFromBuffer()
264 const TAction& action = iInputBuffer[iInputBufferStart];
266 iInputBufferStart = (iInputBufferStart + 1) % EMaxInputBufferSize;
267 WriteCharacter(action);
270 void TUnicodeCompressor::FlushInputBufferL()
272 while (iInputBufferSize > 0 && iCompressedBytes < iMaxCompressedBytes)
276 void TUnicodeCompressor::WriteRunL()
278 // Write out any leading characters that can be passed through.
280 while (iInputBufferSize > 0)
282 const TAction& action = iInputBuffer[iInputBufferStart];
283 if (action.iTreatment == TAction::EPlainASCII ||
284 (action.iCode >= iActiveWindowBase && action.iCode < iActiveWindowBase + 128))
285 WriteCharacterFromBuffer();
290 // Write a run of characters that cannot be passed through.
292 if (iInputBufferSize > 0)
295 Find a run of characters with the same treatment and select that treatment
296 if the run has more than one character.
298 int treatment = iInputBuffer[iInputBufferStart].iTreatment;
299 int next_treatment = treatment;
301 for (i = 1; i < iInputBufferSize; i++)
303 int index = (iInputBufferStart + i) % EMaxInputBufferSize;
304 next_treatment = iInputBuffer[index].iTreatment;
305 if (next_treatment != treatment)
310 SelectTreatment(treatment);
311 for (i = 0; i < run_size; i++)
312 WriteCharacterFromBuffer();
315 FlushOutputBufferL();
318 void TUnicodeCompressor::FlushOutputBufferL()
320 while (iOutputBufferSize > 0 && iCompressedBytes < iMaxCompressedBytes)
322 TUint8 byte = iOutputBuffer[iOutputBufferStart];
324 *iOutputPointer++ = byte;
325 else if (iOutputStream)
326 iOutputStream->WriteUint8L(byte);
329 iOutputBufferStart = (iOutputBufferStart + 1) % EMaxOutputBufferSize;
333 void TUnicodeCompressor::SelectTreatment(TInt aTreatment)
335 if (aTreatment == TAction::EPlainUnicode)
337 // Switch to Unicode mode if not there already.
346 if (aTreatment == TAction::EPlainASCII)
348 // Switch to single-byte mode, using the current dynamic window, if not there already.
351 WriteByte(UC0 + iDynamicWindowIndex);
352 iUnicodeMode = FALSE;
357 if (aTreatment >= TAction::EFirstDynamic && aTreatment <= TAction::ELastDynamic)
359 TUint32 base = DynamicWindowBase(aTreatment);
361 // Switch to the appropriate dynamic window if it is available; if not, redefine and select dynamic window 4.
362 for (int i = 0; i < EDynamicWindows; i++)
363 if (base == iDynamicWindow[i])
367 else if (i != iDynamicWindowIndex)
369 iUnicodeMode = FALSE;
370 iDynamicWindowIndex = i;
371 iActiveWindowBase = base;
378 iDynamicWindowIndex = 4;
379 iUnicodeMode = FALSE;
380 WriteByte(aTreatment);
381 iDynamicWindow[4] = base;
382 iActiveWindowBase = base;
387 // Write a character without changing mode or window.
388 void TUnicodeCompressor::WriteCharacter(const TAction& aAction)
391 WriteUCharacter(aAction.iCode);
393 WriteSCharacter(aAction);
396 void TUnicodeCompressor::WriteUCharacter(TUint16 aCode)
398 // Emit the 'quote Unicode' tag if the character would conflict with a tag.
399 if (aCode >= 0xE000 && aCode <= 0xF2FF)
402 // Write the Unicode value big-end first.
403 WriteByte((aCode >> 8) & 0xFF);
404 WriteByte(aCode & 0xFF);
407 void TUnicodeCompressor::WriteByte(TUint aByte)
409 if (iOutputBufferSize >= EMaxOutputBufferSize)
410 Panic(EOutputBufferOverflow); //Panic here is ok as this is a programming error
411 iOutputBuffer[(iOutputBufferStart + iOutputBufferSize) % EMaxOutputBufferSize] = (TUint8)aByte;
415 void TUnicodeCompressor::WriteSCharacter(const TAction& aAction)
417 // Characters in the range 0x0020..0x007F, plus nul, tab, cr, and lf, can be emitted as their low bytes.
418 if (aAction.iTreatment == TAction::EPlainASCII)
420 WriteByte(aAction.iCode);
424 // Characters in a static window can be written using SQ<n> plus a byte in the range 0x00-0x7F
425 if (aAction.iTreatment >= TAction::EFirstStatic && aAction.iTreatment <= TAction::ELastStatic)
427 int window = aAction.iTreatment - TAction::EFirstStatic;
428 WriteByte(SQ0 + window);
429 WriteByte(aAction.iCode);
433 // Characters in the current dynamic window can be written as a byte in the range 0x80-0xFF.
434 if (aAction.iCode >= iActiveWindowBase && aAction.iCode < iActiveWindowBase + 128)
436 WriteByte(aAction.iCode - iActiveWindowBase + 0x80);
440 // Characters in another dynamic window can be written using SQ<n> plus a byte in the range 0x80-0xFF
442 for (i = 0; i < EDynamicWindows; i++)
443 if (aAction.iCode >= iDynamicWindow[i] && aAction.iCode < iDynamicWindow[i] + 128)
446 WriteByte(aAction.iCode - iDynamicWindow[i] + 0x80);
450 // Other characters can be quoted.
452 WriteByte((aAction.iCode >> 8) & 0xFF);
453 WriteByte(aAction.iCode & 0xFF);
457 EXPORT_C TUnicodeExpander::TUnicodeExpander():
458 iInputBufferStart(0),
460 iOutputBufferStart(0),
461 iOutputBufferSize(0),
466 // Clear coverity warnings
467 memset(iInputBuffer, 0, sizeof(iInputBuffer));
468 memset(iOutputBuffer, 0, sizeof(iOutputBuffer));
471 EXPORT_C void TUnicodeExpander::ExpandL(MUnicodeSink& aOutput,RReadStream& aInput,
472 TInt aMaxOutputWords,TInt aMaxInputBytes,
473 TInt* aOutputWords,TInt* aInputBytes)
475 DoExpandL(&aOutput,&aInput,NULL,aMaxOutputWords,aMaxInputBytes,aOutputWords,aInputBytes);
478 EXPORT_C void TUnicodeExpander::ExpandL(MUnicodeSink& aOutput,const TUint8* aInput,
479 TInt aMaxOutputWords,TInt aMaxInputBytes,
480 TInt* aOutputWords,TInt* aInputBytes)
482 DoExpandL(&aOutput,NULL,aInput,aMaxOutputWords,aMaxInputBytes,aOutputWords,aInputBytes);
485 EXPORT_C TInt TUnicodeExpander::FlushL(MUnicodeSink& aOutput,TInt aMaxOutputWords,TInt& aOutputWords)
487 DoExpandL(&aOutput,NULL,NULL,aMaxOutputWords,0,&aOutputWords,NULL);
488 return iOutputBufferSize;
491 EXPORT_C TInt TUnicodeExpander::ExpandedSizeL(RReadStream& aInput,TInt aInputBytes)
495 e.DoExpandL(NULL,&aInput,NULL,KMaxTInt,aInputBytes,&words,NULL);
499 EXPORT_C TInt TUnicodeExpander::ExpandedSizeL(const TUint8* aInput,TInt aInputBytes)
503 e.DoExpandL(NULL,NULL,aInput,KMaxTInt,aInputBytes,&words,NULL);
507 // Expand until input or output is exhausted or an exception occurs.
508 void TUnicodeExpander::DoExpandL(MUnicodeSink* aOutput,RReadStream* aInputStream,const TUint8* aInputPointer,
509 TInt aMaxOutputWords,TInt aMaxInputBytes,
510 TInt* aOutputWords,TInt* aInputBytes)
513 iInputStream = aInputStream;
514 iInputPointer = aInputPointer;
515 iMaxUnicodeWords = aMaxOutputWords;
516 iMaxCompressedBytes = aMaxInputBytes;
517 iUnicodeWords = iCompressedBytes = 0;
518 iInputBufferStart = 0;
519 FlushOutputBufferL();
520 if (iInputPointer || iInputStream)
522 while (iUnicodeWords + iOutputBufferSize < iMaxUnicodeWords && iCompressedBytes < iMaxCompressedBytes)
526 *aOutputWords = iUnicodeWords;
528 *aInputBytes = iCompressedBytes;
531 void TUnicodeExpander::HandleByteL()
534 TBool handled = FALSE;
538 handled = HandleUByteL(byte);
540 handled = HandleSByteL(byte);
542 iInputBufferStart = 0;
544 iInputBufferSize = 0;
545 FlushOutputBufferL();
548 void TUnicodeExpander::FlushOutputBufferL()
550 while (iOutputBufferSize > 0 && iUnicodeWords < iMaxUnicodeWords)
553 iOutput->WriteUnicodeValueL(iOutputBuffer[iOutputBufferStart]);
556 iOutputBufferStart = (iOutputBufferStart + 1) % EMaxOutputBufferSize;
560 TBool TUnicodeExpander::HandleSByteL(TUint8 aByte)
562 // 'Pass-through' codes.
563 if (TUnicodeCompressionState::EncodeAsIs(aByte))
569 // Codes 0x80-0xFF select a character from the active window.
572 WriteChar32(iActiveWindowBase + aByte - 0x80);
576 // SQU: quote a Unicode character.
578 return QuoteUnicodeL();
580 // SCU: switch to Unicode mode.
587 // SQn: quote from window n.
588 if (aByte >= SQ0 && aByte <= SQ0 + 7)
590 int window = aByte - SQ0;
596 c += iStaticWindow[window];
598 c += iDynamicWindow[window] - 0x80;
606 // SCn: switch to dynamic window n.
607 if (aByte >= SC0 && aByte <= SC0 + 7)
609 iActiveWindowBase = iDynamicWindow[aByte - SC0];
613 // SDn: define dynamic window n and switch to it.
614 if (aByte >= SD0 && aByte <= SD0 + 7)
615 return DefineWindowL(aByte - SD0);
617 // SDX: define window in the expansion space.
619 return DefineExpansionWindowL();
621 User::Leave(KErrCorrupt);
625 TBool TUnicodeExpander::HandleUByteL(TUint8 aByte)
627 // Plain Unicode; get the low byte and emit the Unicode value.
628 if (aByte <= 0xDF || aByte >= 0xF3)
633 TUint16 c = (TUint16)((aByte << 8) | lo);
641 // Quote a Unicode character that would otherwise conflict with a tag.
643 return QuoteUnicodeL();
645 // UCn: change to single byte mode and select window n.
646 if (aByte >= UC0 && aByte <= UC0 + 7)
648 iUnicodeMode = FALSE;
649 iActiveWindowBase = iDynamicWindow[aByte - UC0];
653 // UDn: define dynamic window n and switch to it.
654 if (aByte >= UD0 && aByte <= UD0 + 7)
655 return DefineWindowL(aByte - UD0);
657 // UDX: define window in the expansion space.
659 return DefineExpansionWindowL();
661 User::Leave(KErrCorrupt);
665 TBool TUnicodeExpander::QuoteUnicodeL()
668 if (ReadByteL(hi) && ReadByteL(lo))
670 TUint16 c = (TUint16)((hi << 8) | lo);
678 TBool TUnicodeExpander::DefineWindowL(TInt aIndex)
681 if (ReadByteL(window))
683 iUnicodeMode = FALSE;
684 iActiveWindowBase = DynamicWindowBase(window);
685 iDynamicWindow[aIndex] = iActiveWindowBase;
692 TBool TUnicodeExpander::DefineExpansionWindowL()
695 if (ReadByteL(hi) && ReadByteL(lo))
697 iUnicodeMode = FALSE;
698 iActiveWindowBase = 0x10000 + (0x80 * ((hi & 0x1F) * 0x100 + lo));
699 iDynamicWindow[hi >> 5] = iActiveWindowBase;
706 // Read either from the buffer (in the case of restarting after source finished in mid-operation) or from the source.
707 TBool TUnicodeExpander::ReadByteL(TUint8& aByte)
709 if (iInputBufferStart < iInputBufferSize)
711 aByte = iInputBuffer[iInputBufferStart++];
714 else if (iCompressedBytes < iMaxCompressedBytes)
717 aByte = *iInputPointer++;
719 aByte = iInputStream->ReadUint8L();
720 iInputBuffer[iInputBufferStart++] = aByte;
721 iInputBufferSize = iInputBufferStart;
729 void TUnicodeExpander::WriteChar(TUint16 aChar)
731 if (iOutputBufferSize >= EMaxOutputBufferSize)
732 Panic(EOutputBufferOverflow); //Panic here is ok since this is a programming error
733 iOutputBuffer[(iOutputBufferStart + iOutputBufferSize) % EMaxOutputBufferSize] = aChar;
737 // Write a Unicode character; write using surrogates if in the range 0x10000..0x10FFFF.
738 void TUnicodeExpander::WriteChar32(TUint aChar)
741 WriteChar((TUint16)aChar);
742 else if (aChar <= 0x10FFFF)
744 aChar -= 0x10000; // reduce to 20-bit value in the range 0x0..0xFFFFF
745 WriteChar((TUint16)(0xD800 + (aChar >> 10))); // first high surrogate + high 10 bits
746 WriteChar((TUint16)(0xDC00 + (aChar & 0x03FF))); // first low surrogate + low 10 bits
749 //Panic to be kept here as impossible to test this case (nor the one before). Biggest value that can be passed is 0xFFFFF