os/persistentdata/persistentstorage/store/pcstore/src/unicodecompression.cpp
author sl
Tue, 10 Jun 2014 14:32:02 +0200
changeset 1 260cb5ec6c19
permissions -rw-r--r--
Update contrib.
     1 // Copyright (c) 2006-2009 Nokia Corporation and/or its subsidiary(-ies).
     2 // All rights reserved.
     3 // This component and the accompanying materials are made available
     4 // under the terms of "Eclipse Public License v1.0"
     5 // which accompanies this distribution, and is available
     6 // at the URL "http://www.eclipse.org/legal/epl-v10.html".
     7 //
     8 // Initial Contributors:
     9 // Nokia Corporation - initial contribution.
    10 //
    11 // Contributors:
    12 //
    13 // Description:
// Classes implemented in this file are used for Unicode compression and decompression.
// The code is borrowed from Symbian with only minor changes; for example, the "Panic" function
// now exits the program. The Symbian coding standard is retained in the code.
    17 // 
    18 //
    19 
    20 #include <stdlib.h>
    21 #include "unicodecompression.h"
    22 
    23 namespace PCStore
    24 {
// Base code of each static (fixed) window, indexed by static window number.
// A code belongs to window i when it lies in the 128 codes starting at iStaticWindow[i]
// (see StaticWindowIndex).
const TUint32 TUnicodeCompressionState::iStaticWindow[EStaticWindows] =
	{
	0x0000,		// tags
	0x0080,		// Latin-1 supplement
	0x0100,		// Latin Extended-A
	0x0300,		// Combining Diacritics
	0x2000,		// General Punctuation
	0x2080,		// Currency Symbols
	0x2100,		// Letterlike Symbols and Number Forms
	0x3000		// CJK Symbols and Punctuation
	};
    36 
// Initial base code of each dynamic window, indexed by dynamic window number.
// Reset() copies this table into iDynamicWindow.
const TUint32 TUnicodeCompressionState::iDynamicWindowDefault[EDynamicWindows] =
	{
	0x0080,		// Latin-1 supplement
	0x00C0,		// parts of Latin-1 supplement and Latin Extended-A
	0x0400,		// Cyrillic
	0x0600,		// Arabic
	0x0900,		// Devanagari
	0x3040,		// Hiragana
	0x30A0,		// Katakana
	0xFF00		// Fullwidth ASCII
	};
    48 
// Window bases that do not start on a multiple of 0x80. Entry i is selected by
// offset index 0xF9 + i (see DynamicWindowOffsetIndex and DynamicWindowBase).
const TUint16 TUnicodeCompressionState::iSpecialBase[ESpecialBases] =
	{
	0x00C0,		// Latin 1 letters (not symbols) and some of Extended-A
	0x0250,		// IPA extensions
	0x0370,		// Greek
	0x0530,		// Armenian
	0x3040,		// Hiragana
	0x30A0,		// Katakana
	0xFF60		// Halfwidth katakana
	};
    59 
// Single-byte mode tag values.
// Tags whose name ends in 0 are the first of eight consecutive values, one per window:
// the code in this file uses SQ0..SQ0+7, SC0..SC0+7 and SD0..SD0+7.
const TUint8 SQ0 = 0x01;	// <byte>				quote from window 0
const TUint8 SDX = 0x0B;	// <hbyte> <lbyte>		define window in expansion area
const TUint8 SQU = 0x0E;	// <hbyte> <lbyte>		quote Unicode value
const TUint8 SCU = 0x0F;	//						switch to Unicode mode
const TUint8 SC0 = 0x10;	//						select dynamic window 0
const TUint8 SD0 = 0x18;	// <byte>				set dynamic window 0 index to <byte> and select it

// Unicode mode tag values.
// As above, UC0 and UD0 are each the first of eight consecutive values (UC0..UC0+7, UD0..UD0+7).
const TUint8 UC0 = 0xE0;	//						select dynamic window 0 and switch to single-byte mode
const TUint8 UD0 = 0xE8;	// <byte>				set dynamic window 0 index to <byte>, select it and switch to
							//						single-byte mode
const TUint8 UQU = 0xF0;	// <hbyte>, <lbyte>		quote Unicode value
const TUint8 UDX = 0xF1;	// <hbyte>, <lbyte>		define window in expansion area and switch to single-byte mode
    74 	
// Construct the shared compression state: zero the word/byte counters and their limits,
// then call Reset() to set the initial mode and window settings.
TUnicodeCompressionState::TUnicodeCompressionState():
	iUnicodeWords(0),
	iMaxUnicodeWords(0),
	iCompressedBytes(0),
	iMaxCompressedBytes(0)
	{
	Reset();
	}
    83 
    84 void TUnicodeCompressionState::Reset()
    85 	{
    86 	iUnicodeMode = false;
    87 	iActiveWindowBase = 0x0080;
    88 	for (int i = 0; i < EDynamicWindows; i++)
    89 		iDynamicWindow[i] = iDynamicWindowDefault[i];
    90 	}
    91 
    92 
    93 // Return the index of the static window that contains this code, if any, or -1 if there is none.
    94 TInt TUnicodeCompressionState::StaticWindowIndex(TUint16 aCode)
    95 	{
    96 	for (TInt i = 0; i < EStaticWindows; i++)
    97 		if (aCode >= iStaticWindow[i] && aCode < iStaticWindow[i] + 128)
    98 			return i;
    99 	return -1;
   100 	}
   101 
   102 /*
   103 If aCode can be accommodated in one of the legal dynamic windows, return the index of that window
   104 in the offset table. If not return KErrNotFound.
   105 */
   106 TInt TUnicodeCompressionState::DynamicWindowOffsetIndex(TUint16 aCode)
   107 	{
   108 	if (aCode < 0x0080)
   109 		return KErrNotFound;
   110 	if (aCode >= 0x3400 && aCode <= 0xDFFF)
   111 		return KErrNotFound;
   112 
   113 	/*
   114 	Prefer sections that cross half-block boundaries. These are better adapted to actual text.
   115 	They are represented by offset indices 0xf9..0xff.
   116 	*/
   117 	for (int i = 0; i < ESpecialBases; i++)
   118 		if (aCode >= iSpecialBase[i] && aCode < iSpecialBase[i] + 128)
   119 			return 0xF9 + i;
   120 
   121 	/*
   122 	Offset indices 0x01..0x67 represent half blocks from 0x0080 to 0x3380 and
   123 	0x68..0xA7 represent half blocks from 0xE000 to 0xFF80.
   124 	*/
   125 	if (aCode >= 0xE000)
   126 		aCode -= 0xAC00;
   127 	return aCode / 0x80;
   128 	}
   129 
   130 // Return the base of the window represented by offset index <n>. Return 0 if the offset index is illegal.
   131 TUint32 TUnicodeCompressionState::DynamicWindowBase(TInt aOffsetIndex)
   132 	{
   133 	if (aOffsetIndex >= 0xF9 && aOffsetIndex <= 0xFF)
   134 		{
   135 		/*
   136 		WARNING: don't optimise the following two lines by replacing them with
   137 		'return iSpecialBase[aOffsetIndex - 0xF9];'. To do so would re-introduce an error
   138 		in ARM builds caused by optimisation and consequent erroneous fixing up
   139 		of the array base: see defect EDNGASR-4AGJQX in ER5U defects.
   140 		*/
   141 		int special_base_index = aOffsetIndex - 0xF9;
   142 		return iSpecialBase[special_base_index];
   143 		}
   144 	if (aOffsetIndex >= 0x01 && aOffsetIndex <= 0x67)
   145 		return aOffsetIndex * 0x80;
   146 	if (aOffsetIndex >= 0x68 && aOffsetIndex <= 0xA7)
   147 		return aOffsetIndex * 0x80 + 0xAC00;
   148 	return 0;
   149 	}
   150 
   151 TBool TUnicodeCompressionState::EncodeAsIs(TUint16 aCode)
   152 	{
   153 	return aCode == 0x0000 || aCode == 0x0009 || aCode == 0x000A || aCode == 0x000D ||
   154 		   (aCode >= 0x0020 && aCode <= 0x007F);
   155 	}
   156 
   157 void TUnicodeCompressionState::Panic(TPanic aPanic)
   158 	{
   159 		exit(aPanic);
   160 	}
   161 
// Construct a compressor with empty input and output buffers, dynamic window index 0,
// and no output stream, output pointer or input source attached.
TUnicodeCompressor::TUnicodeCompressor():
	iInputBufferStart(0),
	iInputBufferSize(0),
	iOutputBufferStart(0),
	iOutputBufferSize(0),
	iDynamicWindowIndex(0),
	iOutputStream(NULL),
	iOutputPointer(NULL),
	iInput(NULL)
	{
	}
   173 
   174 void TUnicodeCompressor::CompressL(CStoreWriteStream& aOutput,MUnicodeSource& aInput,
   175 											TInt aMaxOutputBytes,TInt aMaxInputWords,
   176 											TInt* aOutputBytes,TInt* aInputWords)
   177 	{
   178 	DoCompressL(&aOutput,NULL,&aInput,aMaxOutputBytes,aMaxInputWords,aOutputBytes,aInputWords);
   179 	}
   180 
   181 void TUnicodeCompressor::CompressL(TUint8* aOutput,MUnicodeSource& aInput,
   182 											TInt aMaxOutputBytes,TInt aMaxInputWords,
   183 											TInt* aOutputBytes,TInt* aInputWords)
   184 	{
   185 	DoCompressL(NULL,aOutput,&aInput,aMaxOutputBytes,aMaxInputWords,aOutputBytes,aInputWords);
   186 	}
   187 
   188 TInt TUnicodeCompressor::FlushL(CStoreWriteStream& aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes)
   189 	{
   190 	DoCompressL(&aOutput,NULL,NULL,aMaxOutputBytes,0,&aOutputBytes,NULL);
   191 	return iOutputBufferSize;
   192 	}
   193 
   194 TInt TUnicodeCompressor::FlushL(TUint8* aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes)
   195 	{
   196 	DoCompressL(NULL,aOutput,NULL,aMaxOutputBytes,0,&aOutputBytes,NULL);
   197 	return iOutputBufferSize;
   198 	}
   199 
   200 TInt TUnicodeCompressor::CompressedSizeL(MUnicodeSource& aInput,TInt aInputWords)
   201 	{
   202 	TInt bytes;
   203 	TUnicodeCompressor c;
   204 	c.DoCompressL(NULL,NULL,&aInput,KMaxTInt,aInputWords,&bytes,NULL);
   205 	return bytes;
   206 	}
   207 
   208 // Compress until input or output is exhausted or an exception occurs.
   209 void TUnicodeCompressor::DoCompressL(CStoreWriteStream* aOutputStream,TUint8* aOutputPointer,MUnicodeSource* aInput,
   210 									 TInt aMaxOutputBytes,TInt aMaxInputWords,
   211 									 TInt* aOutputBytes,TInt* aInputWords)
   212 	{
   213 	iOutputStream = aOutputStream;
   214 	iOutputPointer = aOutputPointer;
   215 	iInput = aInput;
   216 	iMaxCompressedBytes = aMaxOutputBytes;
   217 	iMaxUnicodeWords = aMaxInputWords;
   218 	iCompressedBytes = iUnicodeWords = 0;
   219 	FlushOutputBufferL();
   220 	if (iInput)
   221 		{
   222 		while (iUnicodeWords < iMaxUnicodeWords && iCompressedBytes < iMaxCompressedBytes)
   223 			{
   224 			TUint16 x = iInput->ReadUnicodeValueL();
   225 			TAction action(x);
   226 			iInputBuffer[(iInputBufferStart + iInputBufferSize) % EMaxInputBufferSize] = action;
   227 			iInputBufferSize++;
   228 			iUnicodeWords++;
   229 			if (iInputBufferSize == EMaxInputBufferSize)
   230 				WriteRunL();
   231 			}
   232 		}
   233 	FlushInputBufferL();
   234 	if (aOutputBytes)
   235 		*aOutputBytes = iCompressedBytes;
   236 	if (aInputWords)
   237 		*aInputWords = iUnicodeWords;
   238 	}
   239 
   240 TUnicodeCompressor::TAction::TAction(TUint16 aCode):
   241 	iCode(aCode)
   242 	{
   243 	if (TUnicodeCompressionState::EncodeAsIs(aCode))
   244 		iTreatment = EPlainASCII;
   245 	else
   246 		{
   247 		iTreatment = TUnicodeCompressionState::DynamicWindowOffsetIndex(aCode);
   248 		if (iTreatment == -1)
   249 			{
   250 			iTreatment = TUnicodeCompressionState::StaticWindowIndex(aCode);
   251 			if (iTreatment == -1)
   252 				iTreatment = EPlainUnicode;
   253 			else
   254 				iTreatment += EFirstStatic;
   255 			}
   256 		}
   257 	}
   258 
   259 void TUnicodeCompressor::WriteCharacterFromBuffer()
   260 	{
   261 	const TAction& action = iInputBuffer[iInputBufferStart];
   262 	iInputBufferSize--;
   263 	iInputBufferStart = (iInputBufferStart + 1) % EMaxInputBufferSize;
   264 	WriteCharacter(action);
   265 	}
   266 
   267 void TUnicodeCompressor::FlushInputBufferL()
   268 	{
   269 	while (iInputBufferSize > 0 && iCompressedBytes < iMaxCompressedBytes)
   270 		WriteRunL();
   271 	}
   272 
   273 void TUnicodeCompressor::WriteRunL()
   274 	{
   275 	// Write out any leading characters that can be passed through.
   276 	if (!iUnicodeMode)
   277 		while (iInputBufferSize > 0)
   278 			{
   279 			const TAction& action = iInputBuffer[iInputBufferStart];
   280 			if (action.iTreatment == TAction::EPlainASCII ||
   281 				(action.iCode >= iActiveWindowBase && action.iCode < iActiveWindowBase + 128))
   282 				WriteCharacterFromBuffer();
   283 			else
   284 				break;
   285 			}
   286 
   287 	// Write a run of characters that cannot be passed through.
   288 	int i;
   289 	if (iInputBufferSize > 0)
   290 		{
   291 		/*
   292 		Find a run of characters with the same treatment and select that treatment
   293 		if the run has more than one character.
   294 		*/
   295 		int treatment = iInputBuffer[iInputBufferStart].iTreatment;
   296 		int next_treatment = treatment;
   297 		int run_size = 1;
   298 		for (i = 1; i < iInputBufferSize; i++)
   299 			{
   300 			int index = (iInputBufferStart + i) % EMaxInputBufferSize;
   301 			next_treatment = iInputBuffer[index].iTreatment;
   302 			if (next_treatment != treatment)
   303 				break;
   304 			run_size++;
   305 			}
   306 		if (run_size > 1)
   307 			SelectTreatment(treatment);
   308 		for (i = 0; i < run_size; i++)
   309 			WriteCharacterFromBuffer();
   310 		}
   311 
   312 	FlushOutputBufferL();
   313 	}
   314 
   315 void TUnicodeCompressor::FlushOutputBufferL()
   316 	{
   317 	while (iOutputBufferSize > 0 &&	iCompressedBytes < iMaxCompressedBytes)
   318 		{
   319 		TUint8 byte = iOutputBuffer[iOutputBufferStart];
   320 		if (iOutputPointer)
   321 			*iOutputPointer++ = byte;
   322 		else if (iOutputStream)
   323 			iOutputStream->WriteUint8(byte);
   324 		iCompressedBytes++;
   325 		iOutputBufferSize--;
   326 		iOutputBufferStart = (iOutputBufferStart + 1) % EMaxOutputBufferSize;
   327 		}
   328 	}
   329 
   330 void TUnicodeCompressor::SelectTreatment(TInt aTreatment)
   331 	{
   332 	if (aTreatment == TAction::EPlainUnicode)
   333 		{
   334 		// Switch to Unicode mode if not there already.
   335 		if (!iUnicodeMode)
   336 			{
   337 			WriteByte(SCU);
   338 			iUnicodeMode = true;
   339 			}
   340 		return;
   341 		}
   342 
   343 	if (aTreatment == TAction::EPlainASCII)
   344 		{
   345 		// Switch to single-byte mode, using the current dynamic window, if not there already.
   346 		if (iUnicodeMode)
   347 			{
   348 			WriteByte(UC0 + iDynamicWindowIndex);
   349 			iUnicodeMode = false;
   350 			}
   351 		return;
   352 		}
   353 
   354 	if (aTreatment >= TAction::EFirstDynamic && aTreatment <= TAction::ELastDynamic)
   355 		{
   356 		TUint32 base = DynamicWindowBase(aTreatment);
   357 
   358 		// Switch to the appropriate dynamic window if it is available; if not, redefine and select dynamic window 4.
   359 		for (int i = 0; i < EDynamicWindows; i++)
   360 			if (base == iDynamicWindow[i])
   361 				{
   362 				if (iUnicodeMode)
   363 					WriteByte(UC0 + i);
   364 				else if (i != iDynamicWindowIndex)
   365 					WriteByte(SC0 + i);
   366 				iUnicodeMode = false;
   367 				iDynamicWindowIndex = i;
   368 				iActiveWindowBase = base;
   369 				return;
   370 				}
   371 		if (iUnicodeMode)
   372 			WriteByte(UD0 + 4);
   373 		else
   374 			WriteByte(SD0 + 4);
   375 		iDynamicWindowIndex = 4;
   376 		iUnicodeMode = false;
   377 		WriteByte(aTreatment);
   378 		iDynamicWindow[4] = base;
   379 		iActiveWindowBase = base;
   380 		return;
   381 		}
   382 	}
   383 
   384 // Write a character without changing mode or window.
   385 void TUnicodeCompressor::WriteCharacter(const TAction& aAction)
   386 	{
   387 	if (iUnicodeMode)
   388 		WriteUCharacter(aAction.iCode);
   389 	else
   390 		WriteSCharacter(aAction);
   391 	}
   392 
   393 void TUnicodeCompressor::WriteUCharacter(TUint16 aCode)
   394 	{
   395 	// Emit the 'quote Unicode' tag if the character would conflict with a tag.
   396 	if (aCode >= 0xE000 && aCode <= 0xF2FF)
   397 		WriteByte(UQU);
   398 
   399 	// Write the Unicode value big-end first.
   400 	WriteByte((aCode >> 8) & 0xFF);
   401 	WriteByte(aCode & 0xFF);
   402 	}
   403 
   404 void TUnicodeCompressor::WriteByte(TUint aByte)
   405 	{
   406 	if (iOutputBufferSize >= EMaxOutputBufferSize)
   407 		Panic(EOutputBufferOverflow);
   408 	iOutputBuffer[(iOutputBufferStart + iOutputBufferSize) % EMaxOutputBufferSize] = (TUint8)aByte;
   409 	iOutputBufferSize++;
   410 	}
   411 
   412 void TUnicodeCompressor::WriteSCharacter(const TAction& aAction)
   413 	{
   414 	// Characters in the range 0x0020..0x007F, plus nul, tab, cr, and lf, can be emitted as their low bytes.
   415 	if (aAction.iTreatment == TAction::EPlainASCII)
   416 		{
   417 		WriteByte(aAction.iCode);
   418 		return;
   419 		}
   420 
   421 	// Characters in a static window can be written using SQ<n> plus a byte in the range 0x00-0x7F
   422 	if (aAction.iTreatment >= TAction::EFirstStatic && aAction.iTreatment <= TAction::ELastStatic)
   423 		{
   424 		int window = aAction.iTreatment - TAction::EFirstStatic;
   425 		WriteByte(SQ0 + window);
   426 		WriteByte(aAction.iCode);
   427 		return;
   428 		}
   429 
   430 	// Characters in the current dynamic window can be written as a byte in the range 0x80-0xFF.
   431 	if (aAction.iCode >= iActiveWindowBase && aAction.iCode < iActiveWindowBase + 128)
   432 		{
   433 		WriteByte(aAction.iCode - iActiveWindowBase + 0x80);
   434 		return;
   435 		}
   436 
   437 	// Characters in another dynamic window can be written using SQ<n> plus a byte in the range 0x80-0xFF
   438 	int i;
   439 	for (i = 0; i < EDynamicWindows; i++)
   440 		if (aAction.iCode >= iDynamicWindow[i] && aAction.iCode < iDynamicWindow[i] + 128)
   441 			{
   442 			WriteByte(SQ0 + i);
   443 			WriteByte(aAction.iCode - iDynamicWindow[i] + 0x80);
   444 			return;
   445 			}
   446 
   447 	// Other characters can be quoted.
   448 	WriteByte(SQU);
   449 	WriteByte((aAction.iCode >> 8) & 0xFF);
   450 	WriteByte(aAction.iCode & 0xFF);
   451 	return;
   452 	}
   453 
   454 
// Construct an expander with empty input and output buffers and no output sink,
// input stream or input pointer attached.
TUnicodeExpander::TUnicodeExpander():
	iInputBufferStart(0),
	iInputBufferSize(0),
	iOutputBufferStart(0),
	iOutputBufferSize(0),
	iOutput(NULL),
	iInputStream(NULL),
	iInputPointer(NULL)
	{
	}
   465 
   466 void TUnicodeExpander::ExpandL(MUnicodeSink& aOutput,CStoreReadStream& aInput,
   467 										TInt aMaxOutputWords,TInt aMaxInputBytes,
   468 										TInt* aOutputWords,TInt* aInputBytes)
   469 	{
   470 	DoExpandL(&aOutput,&aInput,NULL,aMaxOutputWords,aMaxInputBytes,aOutputWords,aInputBytes);
   471 	}
   472 
   473 void TUnicodeExpander::ExpandL(MUnicodeSink& aOutput,const TUint8* aInput,
   474 										TInt aMaxOutputWords,TInt aMaxInputBytes,
   475 										TInt* aOutputWords,TInt* aInputBytes)
   476 	{
   477 	DoExpandL(&aOutput,NULL,aInput,aMaxOutputWords,aMaxInputBytes,aOutputWords,aInputBytes);
   478 	}
   479 
   480 TInt TUnicodeExpander::FlushL(MUnicodeSink& aOutput,TInt aMaxOutputWords,TInt& aOutputWords)
   481 	{
   482 	DoExpandL(&aOutput,NULL,NULL,aMaxOutputWords,0,&aOutputWords,NULL);
   483 	return iOutputBufferSize;
   484 	}
   485 
   486 TInt TUnicodeExpander::ExpandedSizeL(CStoreReadStream& aInput,TInt aInputBytes)
   487 	{
   488 	TInt words;
   489 	TUnicodeExpander e;
   490 	e.DoExpandL(NULL,&aInput,NULL,KMaxTInt,aInputBytes,&words,NULL);
   491 	return words;
   492 	}
   493 
   494 TInt TUnicodeExpander::ExpandedSizeL(const TUint8* aInput,TInt aInputBytes)
   495 	{
   496 	TInt words;
   497 	TUnicodeExpander e;
   498 	e.DoExpandL(NULL,NULL,aInput,KMaxTInt,aInputBytes,&words,NULL);
   499 	return words;
   500 	}
   501 
   502 // Expand until input or output is exhausted or an exception occurs.
   503 void TUnicodeExpander::DoExpandL(MUnicodeSink* aOutput,CStoreReadStream* aInputStream,const TUint8* aInputPointer,
   504 								 TInt aMaxOutputWords,TInt aMaxInputBytes,
   505 								 TInt* aOutputWords,TInt* aInputBytes)
   506 	{
   507 	iOutput = aOutput;
   508 	iInputStream = aInputStream;
   509 	iInputPointer = aInputPointer;
   510 	iMaxUnicodeWords = aMaxOutputWords;
   511 	iMaxCompressedBytes = aMaxInputBytes;
   512 	iUnicodeWords = iCompressedBytes = 0;
   513 	iInputBufferStart = 0;
   514 	FlushOutputBufferL();
   515 	if (iInputPointer || iInputStream)
   516 		{
   517 		while (iUnicodeWords + iOutputBufferSize < iMaxUnicodeWords && iCompressedBytes < iMaxCompressedBytes)
   518 			HandleByteL();
   519 		}
   520 	if (aOutputWords)
   521 		*aOutputWords = iUnicodeWords;
   522 	if (aInputBytes)
   523 		*aInputBytes = iCompressedBytes;
   524 	}
   525 
   526 void TUnicodeExpander::HandleByteL()
   527 	{
   528 	TUint8 byte;
   529 	TBool handled = false;
   530 	if (ReadByteL(byte))
   531 		{
   532 		if (iUnicodeMode)
   533 			handled = HandleUByteL(byte);
   534 		else
   535 			handled = HandleSByteL(byte);
   536 		}
   537 	iInputBufferStart = 0;
   538 	if (handled)
   539 		iInputBufferSize = 0;
   540 	FlushOutputBufferL();
   541 	}
   542 
   543 void TUnicodeExpander::FlushOutputBufferL()
   544 	{
   545 	while (iOutputBufferSize > 0 &&	iUnicodeWords < iMaxUnicodeWords)
   546 		{
   547 		if (iOutput)
   548 			iOutput->WriteUnicodeValueL(iOutputBuffer[iOutputBufferStart]);
   549 		iUnicodeWords++;
   550 		iOutputBufferSize--;
   551 		iOutputBufferStart = (iOutputBufferStart + 1) % EMaxOutputBufferSize;
   552 		}
   553 	}
   554 
   555 TBool TUnicodeExpander::HandleSByteL(TUint8 aByte)
   556 	{
   557 	// 'Pass-through' codes.
   558 	if (TUnicodeCompressionState::EncodeAsIs(aByte))
   559 		{
   560 		WriteChar(aByte);
   561 		return true;
   562 		}
   563 
   564 	// Codes 0x80-0xFF select a character from the active window.
   565 	if (aByte >= 0x80)
   566 		{
   567 		WriteChar32(iActiveWindowBase + aByte - 0x80);
   568 		return true;
   569 		}
   570 
   571 	// SQU: quote a Unicode character.
   572 	if (aByte == SQU)
   573 		return QuoteUnicodeL();
   574 
   575 	// SCU: switch to Unicode mode.
   576 	if (aByte == SCU)
   577 		{
   578 		iUnicodeMode = true;
   579 		return true;
   580 		}
   581 
   582 	// SQn: quote from window n.
   583 	if (aByte >= SQ0 && aByte <= SQ0 + 7)
   584 		{
   585 		int window = aByte - SQ0;
   586 		TUint8 byte;
   587 		if (ReadByteL(byte))
   588 			{
   589 			TUint32 c = byte;
   590 			if (c <= 0x7F)
   591 				c += iStaticWindow[window];
   592 			else
   593 				c += iDynamicWindow[window] - 0x80;
   594 			WriteChar32(c);
   595 			return true;
   596 			}
   597 		else
   598 			return false;
   599 		}
   600 
   601 	// SCn: switch to dynamic window n.
   602 	if (aByte >= SC0 && aByte <= SC0 + 7)
   603 		{
   604 		iActiveWindowBase = iDynamicWindow[aByte - SC0];
   605 		return true;
   606 		}
   607 
   608 	// SDn: define dynamic window n and switch to it.
   609 	if (aByte >= SD0 && aByte <= SD0 + 7)
   610 		return DefineWindowL(aByte - SD0);
   611 
   612 	// SDX: define window in the expansion space.
   613 	if (aByte == SDX)
   614 		return DefineExpansionWindowL();
   615 
   616 	Panic(EUnhandledByte);
   617 	return false;
   618 	}
   619 
   620 TBool TUnicodeExpander::HandleUByteL(TUint8 aByte)
   621 	{
   622 	// Plain Unicode; get the low byte and emit the Unicode value.
   623 	if (aByte <= 0xDF || aByte >= 0xF3)
   624 		{
   625 		TUint8 lo;
   626 		if (ReadByteL(lo))
   627 			{
   628 			TUint16 c = (TUint16)((aByte << 8) | lo);
   629 			WriteChar(c);
   630 			return true;
   631 			}
   632 		else
   633 			return false;
   634 		}
   635 
   636 	// Quote a Unicode character that would otherwise conflict with a tag.
   637 	if (aByte == UQU)
   638 		return QuoteUnicodeL();
   639 
   640 	// UCn: change to single byte mode and select window n.
   641 	if (aByte >= UC0 && aByte <= UC0 + 7)
   642 		{
   643 		iUnicodeMode = false;
   644 		iActiveWindowBase = iDynamicWindow[aByte - UC0];
   645 		return true;
   646 		}
   647 
   648 	// UDn: define dynamic window n and switch to it.
   649 	if (aByte >= UD0 && aByte <= UD0 + 7)
   650 		return DefineWindowL(aByte - UD0);
   651 
   652 	// UDX: define window in the expansion space.
   653 	if (aByte == UDX)
   654 		return DefineExpansionWindowL();
   655 
   656 	Panic(EUnhandledByte);
   657 	return false;
   658 	}
   659 
   660 TBool TUnicodeExpander::QuoteUnicodeL()
   661 	{
   662 	TUint8 hi, lo;
   663 	if (ReadByteL(hi) && ReadByteL(lo))
   664 		{
   665 		TUint16 c = (TUint16)((hi << 8) | lo);
   666 		WriteChar(c);
   667 		return true;
   668 		}
   669 	else
   670 		return false;
   671 	}
   672 
   673 TBool TUnicodeExpander::DefineWindowL(TInt aIndex)
   674 	{
   675 	TUint8 window;
   676 	if (ReadByteL(window))
   677 		{
   678 		iUnicodeMode = false;
   679 		iActiveWindowBase = DynamicWindowBase(window);
   680 		iDynamicWindow[aIndex] = iActiveWindowBase;
   681 		return true;
   682 		}
   683 	else
   684 		return false;
   685 	}
   686 
   687 TBool TUnicodeExpander::DefineExpansionWindowL()
   688 	{
   689 	TUint8 hi, lo;
   690 	if (ReadByteL(hi) && ReadByteL(lo))
   691 		{
   692 		iUnicodeMode = false;
   693 		iActiveWindowBase = 0x10000 + (0x80 * ((hi & 0x1F) * 0x100 + lo));
   694 		iDynamicWindow[hi >> 5] = iActiveWindowBase;
   695 		return true;
   696 		}
   697 	else
   698 		return false;
   699 	}
   700 
   701 // Read either from the buffer (in the case of restarting after source finished in mid-operation) or from the source.
   702 TBool TUnicodeExpander::ReadByteL(TUint8& aByte)
   703 	{
   704 	if (iInputBufferStart < iInputBufferSize)
   705 		{
   706 		aByte = iInputBuffer[iInputBufferStart++];
   707 		return true;
   708 		}
   709 	else if (iCompressedBytes < iMaxCompressedBytes)
   710 		{
   711 		if (iInputPointer)
   712 			aByte = *iInputPointer++;
   713 		else
   714 			aByte = iInputStream->ReadUint8();
   715 		iInputBuffer[iInputBufferStart++] = aByte;
   716 		iInputBufferSize = iInputBufferStart;
   717 		iCompressedBytes++;
   718 		return true;
   719 		}
   720 	else
   721 		return false;
   722 	}
   723 
   724 void TUnicodeExpander::WriteChar(TUint16 aChar)
   725 	{
   726 	if (iOutputBufferSize >= EMaxOutputBufferSize)
   727 		Panic(EOutputBufferOverflow);
   728 	iOutputBuffer[(iOutputBufferStart + iOutputBufferSize) % EMaxOutputBufferSize] = aChar;
   729 	iOutputBufferSize++;
   730 	}
   731 
   732 // Write a Unicode character; write using surrogates if in the range 0x10000..0x10FFFF.
   733 void TUnicodeExpander::WriteChar32(TUint aChar)
   734 	{
   735 	if (aChar <= 0xFFFF)
   736 		WriteChar((TUint16)aChar);
   737 	else if (aChar <= 0x10FFFF)
   738 		{
   739 		aChar -= 0x10000;									// reduce to 20-bit value in the range 0x0..0xFFFFF
   740 		WriteChar((TUint16)(0xD800 + (aChar >> 10)));		// first high surrogate + high 10 bits
   741 		WriteChar((TUint16)(0xDC00 + (aChar & 0x03FF)));	// first low surrogate + low 10 bits
   742 		}
   743 	else
   744 		Panic(ENotUnicode);
   745 	}
   746 }