os/persistentdata/persistentstorage/store/pcstore/src/unicodecompression.cpp
author sl
Tue, 10 Jun 2014 14:32:02 +0200
changeset 1 260cb5ec6c19
permissions -rw-r--r--
Update contrib.
sl@0
     1
// Copyright (c) 2006-2009 Nokia Corporation and/or its subsidiary(-ies).
sl@0
     2
// All rights reserved.
sl@0
     3
// This component and the accompanying materials are made available
sl@0
     4
// under the terms of "Eclipse Public License v1.0"
sl@0
     5
// which accompanies this distribution, and is available
sl@0
     6
// at the URL "http://www.eclipse.org/legal/epl-v10.html".
sl@0
     7
//
sl@0
     8
// Initial Contributors:
sl@0
     9
// Nokia Corporation - initial contribution.
sl@0
    10
//
sl@0
    11
// Contributors:
sl@0
    12
//
sl@0
    13
// Description:
sl@0
    14
// Classes implemented in this file are used for Unicode compression and decompression.
sl@0
    15
// Their code is borrowed from Symbian with only a few changes; for example, the "Panic" function
// has been changed to exit the program. The Symbian coding standard is kept in the code.
sl@0
    17
// 
sl@0
    18
//
sl@0
    19
sl@0
    20
#include <stdlib.h>
sl@0
    21
#include "unicodecompression.h"
sl@0
    22
sl@0
    23
namespace PCStore
sl@0
    24
{
sl@0
    25
// Base code of each static window, indexed by static window number.
const TUint32 TUnicodeCompressionState::iStaticWindow[EStaticWindows] =
	{
	0x0000,		// window 0: tags
	0x0080,		// window 1: Latin-1 supplement
	0x0100,		// window 2: Latin Extended-A
	0x0300,		// window 3: Combining Diacritics
	0x2000,		// window 4: General Punctuation
	0x2080,		// window 5: Currency Symbols
	0x2100,		// window 6: Letterlike Symbols and Number Forms
	0x3000		// window 7: CJK Symbols and Punctuation
	};
sl@0
    36
sl@0
    37
// Base code that each dynamic window is given by Reset(), indexed by dynamic window number.
const TUint32 TUnicodeCompressionState::iDynamicWindowDefault[EDynamicWindows] =
	{
	0x0080,		// window 0: Latin-1 supplement
	0x00C0,		// window 1: parts of Latin-1 supplement and Latin Extended-A
	0x0400,		// window 2: Cyrillic
	0x0600,		// window 3: Arabic
	0x0900,		// window 4: Devanagari
	0x3040,		// window 5: Hiragana
	0x30A0,		// window 6: Katakana
	0xFF00		// window 7: Fullwidth ASCII
	};
sl@0
    48
sl@0
    49
// Window bases selected by the offset indices 0xF9 onwards (entry n belongs to offset index 0xF9 + n).
const TUint16 TUnicodeCompressionState::iSpecialBase[ESpecialBases] =
	{
	0x00C0,		// 0xF9: Latin 1 letters (not symbols) and some of Extended-A
	0x0250,		// 0xFA: IPA extensions
	0x0370,		// 0xFB: Greek
	0x0530,		// 0xFC: Armenian
	0x3040,		// 0xFD: Hiragana
	0x30A0,		// 0xFE: Katakana
	0xFF60		// 0xFF: Halfwidth katakana
	};
sl@0
    59
sl@0
    60
// Single-byte mode tag values
sl@0
    61
const TUint8 SQ0 = 0x01;	// <byte>				quote from window 0
sl@0
    62
const TUint8 SDX = 0x0B;	// <hbyte> <lbyte>		define window in expansion area
sl@0
    63
const TUint8 SQU = 0x0E;	// <hbyte> <lbyte>		quote Unicode value
sl@0
    64
const TUint8 SCU = 0x0F;	//						switch to Unicode mode
sl@0
    65
const TUint8 SC0 = 0x10;	//						select dynamic window 0
sl@0
    66
const TUint8 SD0 = 0x18;	// <byte>				set dynamic window 0 index to <byte> and select it
sl@0
    67
sl@0
    68
// Unicode mode tag values
sl@0
    69
const TUint8 UC0 = 0xE0;	//						select dynamic window 0 and switch to single-byte mode
sl@0
    70
const TUint8 UD0 = 0xE8;	// <byte>				set dynamic window 0 index to <byte>, select it and switch to
sl@0
    71
							//						single-byte mode
sl@0
    72
const TUint8 UQU = 0xF0;	// <hbyte>, <lbyte>		quote Unicode value
sl@0
    73
const TUint8 UDX = 0xF1;	// <hbyte>, <lbyte>		define window in expansion area and switch to single-byte mode
sl@0
    74
	
sl@0
    75
// Zero the word/byte counters and their limits, then put the mode and windows into their default state.
TUnicodeCompressionState::TUnicodeCompressionState()
	: iUnicodeWords(0),
	  iMaxUnicodeWords(0),
	  iCompressedBytes(0),
	  iMaxCompressedBytes(0)
	{
	Reset();
	}
sl@0
    83
sl@0
    84
void TUnicodeCompressionState::Reset()
sl@0
    85
	{
sl@0
    86
	iUnicodeMode = false;
sl@0
    87
	iActiveWindowBase = 0x0080;
sl@0
    88
	for (int i = 0; i < EDynamicWindows; i++)
sl@0
    89
		iDynamicWindow[i] = iDynamicWindowDefault[i];
sl@0
    90
	}
sl@0
    91
sl@0
    92
sl@0
    93
// Return the index of the static window that contains this code, if any, or -1 if there is none.
sl@0
    94
TInt TUnicodeCompressionState::StaticWindowIndex(TUint16 aCode)
sl@0
    95
	{
sl@0
    96
	for (TInt i = 0; i < EStaticWindows; i++)
sl@0
    97
		if (aCode >= iStaticWindow[i] && aCode < iStaticWindow[i] + 128)
sl@0
    98
			return i;
sl@0
    99
	return -1;
sl@0
   100
	}
sl@0
   101
sl@0
   102
/*
sl@0
   103
If aCode can be accommodated in one of the legal dynamic windows, return the index of that window
sl@0
   104
in the offset table. If not return KErrNotFound.
sl@0
   105
*/
sl@0
   106
TInt TUnicodeCompressionState::DynamicWindowOffsetIndex(TUint16 aCode)
sl@0
   107
	{
sl@0
   108
	if (aCode < 0x0080)
sl@0
   109
		return KErrNotFound;
sl@0
   110
	if (aCode >= 0x3400 && aCode <= 0xDFFF)
sl@0
   111
		return KErrNotFound;
sl@0
   112
sl@0
   113
	/*
sl@0
   114
	Prefer sections that cross half-block boundaries. These are better adapted to actual text.
sl@0
   115
	They are represented by offset indices 0xf9..0xff.
sl@0
   116
	*/
sl@0
   117
	for (int i = 0; i < ESpecialBases; i++)
sl@0
   118
		if (aCode >= iSpecialBase[i] && aCode < iSpecialBase[i] + 128)
sl@0
   119
			return 0xF9 + i;
sl@0
   120
sl@0
   121
	/*
sl@0
   122
	Offset indices 0x01..0x67 represent half blocks from 0x0080 to 0x3380 and
sl@0
   123
	0x68..0xA7 represent half blocks from 0xE000 to 0xFF80.
sl@0
   124
	*/
sl@0
   125
	if (aCode >= 0xE000)
sl@0
   126
		aCode -= 0xAC00;
sl@0
   127
	return aCode / 0x80;
sl@0
   128
	}
sl@0
   129
sl@0
   130
// Return the base of the window represented by offset index <n>. Return 0 if the offset index is illegal.
sl@0
   131
TUint32 TUnicodeCompressionState::DynamicWindowBase(TInt aOffsetIndex)
sl@0
   132
	{
sl@0
   133
	if (aOffsetIndex >= 0xF9 && aOffsetIndex <= 0xFF)
sl@0
   134
		{
sl@0
   135
		/*
sl@0
   136
		WARNING: don't optimise the following two lines by replacing them with
sl@0
   137
		'return iSpecialBase[aOffsetIndex - 0xF9];'. To do so would re-introduce an error
sl@0
   138
		in ARM builds caused by optimisation and consequent erroneous fixing up
sl@0
   139
		of the array base: see defect EDNGASR-4AGJQX in ER5U defects.
sl@0
   140
		*/
sl@0
   141
		int special_base_index = aOffsetIndex - 0xF9;
sl@0
   142
		return iSpecialBase[special_base_index];
sl@0
   143
		}
sl@0
   144
	if (aOffsetIndex >= 0x01 && aOffsetIndex <= 0x67)
sl@0
   145
		return aOffsetIndex * 0x80;
sl@0
   146
	if (aOffsetIndex >= 0x68 && aOffsetIndex <= 0xA7)
sl@0
   147
		return aOffsetIndex * 0x80 + 0xAC00;
sl@0
   148
	return 0;
sl@0
   149
	}
sl@0
   150
sl@0
   151
// Tell whether aCode is one of the pass-through codes: 0x0000, 0x0009, 0x000A, 0x000D,
// or anything in the range 0x0020..0x007F.
TBool TUnicodeCompressionState::EncodeAsIs(TUint16 aCode)
	{
	switch (aCode)
		{
		case 0x0000:
		case 0x0009:
		case 0x000A:
		case 0x000D:
			return true;
		default:
			return aCode >= 0x0020 && aCode <= 0x007F;
		}
	}
sl@0
   156
sl@0
   157
// Terminate the program, passing the panic code to exit() as the exit status.
void TUnicodeCompressionState::Panic(TPanic aPanic)
	{
	const int exitStatus = aPanic;
	exit(exitStatus);
	}
sl@0
   161
sl@0
   162
// Create a compressor with empty input and output buffers, dynamic window 0 selected,
// and no input source or output target attached.
TUnicodeCompressor::TUnicodeCompressor()
	: iInputBufferStart(0),
	  iInputBufferSize(0),
	  iOutputBufferStart(0),
	  iOutputBufferSize(0),
	  iDynamicWindowIndex(0),
	  iOutputStream(NULL),
	  iOutputPointer(NULL),
	  iInput(NULL)
	{
	}
sl@0
   173
sl@0
   174
void TUnicodeCompressor::CompressL(CStoreWriteStream& aOutput,MUnicodeSource& aInput,
sl@0
   175
											TInt aMaxOutputBytes,TInt aMaxInputWords,
sl@0
   176
											TInt* aOutputBytes,TInt* aInputWords)
sl@0
   177
	{
sl@0
   178
	DoCompressL(&aOutput,NULL,&aInput,aMaxOutputBytes,aMaxInputWords,aOutputBytes,aInputWords);
sl@0
   179
	}
sl@0
   180
sl@0
   181
void TUnicodeCompressor::CompressL(TUint8* aOutput,MUnicodeSource& aInput,
sl@0
   182
											TInt aMaxOutputBytes,TInt aMaxInputWords,
sl@0
   183
											TInt* aOutputBytes,TInt* aInputWords)
sl@0
   184
	{
sl@0
   185
	DoCompressL(NULL,aOutput,&aInput,aMaxOutputBytes,aMaxInputWords,aOutputBytes,aInputWords);
sl@0
   186
	}
sl@0
   187
sl@0
   188
// Write buffered data to the stream aOutput without reading any new input, emitting at most
// aMaxOutputBytes bytes. aOutputBytes receives the number of bytes written.
// Returns the number of bytes still held in the output buffer.
TInt TUnicodeCompressor::FlushL(CStoreWriteStream& aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes)
	{
	TInt* const written = &aOutputBytes;
	DoCompressL(&aOutput,NULL,NULL,aMaxOutputBytes,0,written,NULL);
	return iOutputBufferSize;
	}
sl@0
   193
sl@0
   194
// Write buffered data to the memory at aOutput without reading any new input, emitting at most
// aMaxOutputBytes bytes. aOutputBytes receives the number of bytes written.
// Returns the number of bytes still held in the output buffer.
TInt TUnicodeCompressor::FlushL(TUint8* aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes)
	{
	TInt* const written = &aOutputBytes;
	DoCompressL(NULL,aOutput,NULL,aMaxOutputBytes,0,written,NULL);
	return iOutputBufferSize;
	}
sl@0
   199
sl@0
   200
// Work out how many bytes aInputWords words from aInput compress to. A temporary compressor
// is run with neither an output stream nor an output pointer, so bytes are counted only.
TInt TUnicodeCompressor::CompressedSizeL(MUnicodeSource& aInput,TInt aInputWords)
	{
	TUnicodeCompressor counter;
	TInt compressedBytes;
	counter.DoCompressL(NULL,NULL,&aInput,KMaxTInt,aInputWords,&compressedBytes,NULL);
	return compressedBytes;
	}
sl@0
   207
sl@0
   208
// Compress until input or output is exhausted or an exception occurs.
sl@0
   209
void TUnicodeCompressor::DoCompressL(CStoreWriteStream* aOutputStream,TUint8* aOutputPointer,MUnicodeSource* aInput,
sl@0
   210
									 TInt aMaxOutputBytes,TInt aMaxInputWords,
sl@0
   211
									 TInt* aOutputBytes,TInt* aInputWords)
sl@0
   212
	{
sl@0
   213
	iOutputStream = aOutputStream;
sl@0
   214
	iOutputPointer = aOutputPointer;
sl@0
   215
	iInput = aInput;
sl@0
   216
	iMaxCompressedBytes = aMaxOutputBytes;
sl@0
   217
	iMaxUnicodeWords = aMaxInputWords;
sl@0
   218
	iCompressedBytes = iUnicodeWords = 0;
sl@0
   219
	FlushOutputBufferL();
sl@0
   220
	if (iInput)
sl@0
   221
		{
sl@0
   222
		while (iUnicodeWords < iMaxUnicodeWords && iCompressedBytes < iMaxCompressedBytes)
sl@0
   223
			{
sl@0
   224
			TUint16 x = iInput->ReadUnicodeValueL();
sl@0
   225
			TAction action(x);
sl@0
   226
			iInputBuffer[(iInputBufferStart + iInputBufferSize) % EMaxInputBufferSize] = action;
sl@0
   227
			iInputBufferSize++;
sl@0
   228
			iUnicodeWords++;
sl@0
   229
			if (iInputBufferSize == EMaxInputBufferSize)
sl@0
   230
				WriteRunL();
sl@0
   231
			}
sl@0
   232
		}
sl@0
   233
	FlushInputBufferL();
sl@0
   234
	if (aOutputBytes)
sl@0
   235
		*aOutputBytes = iCompressedBytes;
sl@0
   236
	if (aInputWords)
sl@0
   237
		*aInputWords = iUnicodeWords;
sl@0
   238
	}
sl@0
   239
sl@0
   240
// Store aCode and decide how it is to be treated: as plain ASCII, via a dynamic window
// (the treatment is then the window's offset index), via a static window
// (EFirstStatic + window index), or as plain Unicode.
TUnicodeCompressor::TAction::TAction(TUint16 aCode):
	iCode(aCode)
	{
	if (TUnicodeCompressionState::EncodeAsIs(aCode))
		{
		iTreatment = EPlainASCII;
		return;
		}

	// A dynamic window is preferred when one can hold the code.
	iTreatment = TUnicodeCompressionState::DynamicWindowOffsetIndex(aCode);
	if (iTreatment != -1)
		return;

	// Otherwise try the static windows, and fall back to plain Unicode.
	iTreatment = TUnicodeCompressionState::StaticWindowIndex(aCode);
	if (iTreatment != -1)
		iTreatment += EFirstStatic;
	else
		iTreatment = EPlainUnicode;
	}
sl@0
   258
sl@0
   259
void TUnicodeCompressor::WriteCharacterFromBuffer()
sl@0
   260
	{
sl@0
   261
	const TAction& action = iInputBuffer[iInputBufferStart];
sl@0
   262
	iInputBufferSize--;
sl@0
   263
	iInputBufferStart = (iInputBufferStart + 1) % EMaxInputBufferSize;
sl@0
   264
	WriteCharacter(action);
sl@0
   265
	}
sl@0
   266
sl@0
   267
void TUnicodeCompressor::FlushInputBufferL()
sl@0
   268
	{
sl@0
   269
	while (iInputBufferSize > 0 && iCompressedBytes < iMaxCompressedBytes)
sl@0
   270
		WriteRunL();
sl@0
   271
	}
sl@0
   272
sl@0
   273
void TUnicodeCompressor::WriteRunL()
sl@0
   274
	{
sl@0
   275
	// Write out any leading characters that can be passed through.
sl@0
   276
	if (!iUnicodeMode)
sl@0
   277
		while (iInputBufferSize > 0)
sl@0
   278
			{
sl@0
   279
			const TAction& action = iInputBuffer[iInputBufferStart];
sl@0
   280
			if (action.iTreatment == TAction::EPlainASCII ||
sl@0
   281
				(action.iCode >= iActiveWindowBase && action.iCode < iActiveWindowBase + 128))
sl@0
   282
				WriteCharacterFromBuffer();
sl@0
   283
			else
sl@0
   284
				break;
sl@0
   285
			}
sl@0
   286
sl@0
   287
	// Write a run of characters that cannot be passed through.
sl@0
   288
	int i;
sl@0
   289
	if (iInputBufferSize > 0)
sl@0
   290
		{
sl@0
   291
		/*
sl@0
   292
		Find a run of characters with the same treatment and select that treatment
sl@0
   293
		if the run has more than one character.
sl@0
   294
		*/
sl@0
   295
		int treatment = iInputBuffer[iInputBufferStart].iTreatment;
sl@0
   296
		int next_treatment = treatment;
sl@0
   297
		int run_size = 1;
sl@0
   298
		for (i = 1; i < iInputBufferSize; i++)
sl@0
   299
			{
sl@0
   300
			int index = (iInputBufferStart + i) % EMaxInputBufferSize;
sl@0
   301
			next_treatment = iInputBuffer[index].iTreatment;
sl@0
   302
			if (next_treatment != treatment)
sl@0
   303
				break;
sl@0
   304
			run_size++;
sl@0
   305
			}
sl@0
   306
		if (run_size > 1)
sl@0
   307
			SelectTreatment(treatment);
sl@0
   308
		for (i = 0; i < run_size; i++)
sl@0
   309
			WriteCharacterFromBuffer();
sl@0
   310
		}
sl@0
   311
sl@0
   312
	FlushOutputBufferL();
sl@0
   313
	}
sl@0
   314
sl@0
   315
void TUnicodeCompressor::FlushOutputBufferL()
sl@0
   316
	{
sl@0
   317
	while (iOutputBufferSize > 0 &&	iCompressedBytes < iMaxCompressedBytes)
sl@0
   318
		{
sl@0
   319
		TUint8 byte = iOutputBuffer[iOutputBufferStart];
sl@0
   320
		if (iOutputPointer)
sl@0
   321
			*iOutputPointer++ = byte;
sl@0
   322
		else if (iOutputStream)
sl@0
   323
			iOutputStream->WriteUint8(byte);
sl@0
   324
		iCompressedBytes++;
sl@0
   325
		iOutputBufferSize--;
sl@0
   326
		iOutputBufferStart = (iOutputBufferStart + 1) % EMaxOutputBufferSize;
sl@0
   327
		}
sl@0
   328
	}
sl@0
   329
sl@0
   330
// Emit whatever tag bytes are needed to make aTreatment the current way of writing characters,
// and update the mode and window state to match. Treatments that are neither plain Unicode,
// plain ASCII nor a dynamic window offset index are ignored.
void TUnicodeCompressor::SelectTreatment(TInt aTreatment)
	{
	if (aTreatment == TAction::EPlainUnicode)
		{
		// Enter Unicode mode unless already in it.
		if (iUnicodeMode)
			return;
		WriteByte(SCU);
		iUnicodeMode = true;
		return;
		}

	if (aTreatment == TAction::EPlainASCII)
		{
		// Return to single-byte mode, re-selecting the current dynamic window, unless already there.
		if (!iUnicodeMode)
			return;
		WriteByte(UC0 + iDynamicWindowIndex);
		iUnicodeMode = false;
		return;
		}

	if (aTreatment < TAction::EFirstDynamic || aTreatment > TAction::ELastDynamic)
		return;

	// Look for a dynamic window that already has the required base.
	const TUint32 base = DynamicWindowBase(aTreatment);
	int window = 0;
	while (window < EDynamicWindows && iDynamicWindow[window] != base)
		++window;

	if (window < EDynamicWindows)
		{
		// Found: select it. In single-byte mode no tag is needed if it is already selected.
		if (iUnicodeMode)
			WriteByte(UC0 + window);
		else if (window != iDynamicWindowIndex)
			WriteByte(SC0 + window);
		}
	else
		{
		// Not found: redefine dynamic window 4 with the required base and select it.
		window = 4;
		if (iUnicodeMode)
			WriteByte(UD0 + 4);
		else
			WriteByte(SD0 + 4);
		WriteByte(aTreatment);
		iDynamicWindow[4] = base;
		}

	iUnicodeMode = false;
	iDynamicWindowIndex = window;
	iActiveWindowBase = base;
	}
sl@0
   383
sl@0
   384
// Write a character without changing mode or window.
sl@0
   385
void TUnicodeCompressor::WriteCharacter(const TAction& aAction)
sl@0
   386
	{
sl@0
   387
	if (iUnicodeMode)
sl@0
   388
		WriteUCharacter(aAction.iCode);
sl@0
   389
	else
sl@0
   390
		WriteSCharacter(aAction);
sl@0
   391
	}
sl@0
   392
sl@0
   393
// Write aCode in Unicode mode: two bytes, high byte first, preceded by the UQU tag when the
// high byte would otherwise be taken for a tag (codes 0xE000..0xF2FF).
void TUnicodeCompressor::WriteUCharacter(TUint16 aCode)
	{
	const bool clashesWithTag = aCode >= 0xE000 && aCode <= 0xF2FF;
	if (clashesWithTag)
		WriteByte(UQU);

	const TUint highByte = (aCode >> 8) & 0xFF;
	const TUint lowByte = aCode & 0xFF;
	WriteByte(highByte);
	WriteByte(lowByte);
	}
sl@0
   403
sl@0
   404
// Append the low eight bits of aByte to the circular output buffer.
// Panics with EOutputBufferOverflow if the buffer is already full.
void TUnicodeCompressor::WriteByte(TUint aByte)
	{
	if (iOutputBufferSize >= EMaxOutputBufferSize)
		Panic(EOutputBufferOverflow);

	const TInt slot = (iOutputBufferStart + iOutputBufferSize) % EMaxOutputBufferSize;
	iOutputBuffer[slot] = (TUint8)aByte;
	++iOutputBufferSize;
	}
sl@0
   411
sl@0
   412
void TUnicodeCompressor::WriteSCharacter(const TAction& aAction)
sl@0
   413
	{
sl@0
   414
	// Characters in the range 0x0020..0x007F, plus nul, tab, cr, and lf, can be emitted as their low bytes.
sl@0
   415
	if (aAction.iTreatment == TAction::EPlainASCII)
sl@0
   416
		{
sl@0
   417
		WriteByte(aAction.iCode);
sl@0
   418
		return;
sl@0
   419
		}
sl@0
   420
sl@0
   421
	// Characters in a static window can be written using SQ<n> plus a byte in the range 0x00-0x7F
sl@0
   422
	if (aAction.iTreatment >= TAction::EFirstStatic && aAction.iTreatment <= TAction::ELastStatic)
sl@0
   423
		{
sl@0
   424
		int window = aAction.iTreatment - TAction::EFirstStatic;
sl@0
   425
		WriteByte(SQ0 + window);
sl@0
   426
		WriteByte(aAction.iCode);
sl@0
   427
		return;
sl@0
   428
		}
sl@0
   429
sl@0
   430
	// Characters in the current dynamic window can be written as a byte in the range 0x80-0xFF.
sl@0
   431
	if (aAction.iCode >= iActiveWindowBase && aAction.iCode < iActiveWindowBase + 128)
sl@0
   432
		{
sl@0
   433
		WriteByte(aAction.iCode - iActiveWindowBase + 0x80);
sl@0
   434
		return;
sl@0
   435
		}
sl@0
   436
sl@0
   437
	// Characters in another dynamic window can be written using SQ<n> plus a byte in the range 0x80-0xFF
sl@0
   438
	int i;
sl@0
   439
	for (i = 0; i < EDynamicWindows; i++)
sl@0
   440
		if (aAction.iCode >= iDynamicWindow[i] && aAction.iCode < iDynamicWindow[i] + 128)
sl@0
   441
			{
sl@0
   442
			WriteByte(SQ0 + i);
sl@0
   443
			WriteByte(aAction.iCode - iDynamicWindow[i] + 0x80);
sl@0
   444
			return;
sl@0
   445
			}
sl@0
   446
sl@0
   447
	// Other characters can be quoted.
sl@0
   448
	WriteByte(SQU);
sl@0
   449
	WriteByte((aAction.iCode >> 8) & 0xFF);
sl@0
   450
	WriteByte(aAction.iCode & 0xFF);
sl@0
   451
	return;
sl@0
   452
	}
sl@0
   453
sl@0
   454
sl@0
   455
// Create an expander with empty input and output buffers and no sink or input attached.
TUnicodeExpander::TUnicodeExpander()
	: iInputBufferStart(0),
	  iInputBufferSize(0),
	  iOutputBufferStart(0),
	  iOutputBufferSize(0),
	  iOutput(NULL),
	  iInputStream(NULL),
	  iInputPointer(NULL)
	{
	}
sl@0
   465
sl@0
   466
void TUnicodeExpander::ExpandL(MUnicodeSink& aOutput,CStoreReadStream& aInput,
sl@0
   467
										TInt aMaxOutputWords,TInt aMaxInputBytes,
sl@0
   468
										TInt* aOutputWords,TInt* aInputBytes)
sl@0
   469
	{
sl@0
   470
	DoExpandL(&aOutput,&aInput,NULL,aMaxOutputWords,aMaxInputBytes,aOutputWords,aInputBytes);
sl@0
   471
	}
sl@0
   472
sl@0
   473
void TUnicodeExpander::ExpandL(MUnicodeSink& aOutput,const TUint8* aInput,
sl@0
   474
										TInt aMaxOutputWords,TInt aMaxInputBytes,
sl@0
   475
										TInt* aOutputWords,TInt* aInputBytes)
sl@0
   476
	{
sl@0
   477
	DoExpandL(&aOutput,NULL,aInput,aMaxOutputWords,aMaxInputBytes,aOutputWords,aInputBytes);
sl@0
   478
	}
sl@0
   479
sl@0
   480
// Write buffered Unicode values to aOutput without reading any new input, emitting at most
// aMaxOutputWords words. aOutputWords receives the number of words written.
// Returns the number of words still held in the output buffer.
TInt TUnicodeExpander::FlushL(MUnicodeSink& aOutput,TInt aMaxOutputWords,TInt& aOutputWords)
	{
	TInt* const written = &aOutputWords;
	DoExpandL(&aOutput,NULL,NULL,aMaxOutputWords,0,written,NULL);
	return iOutputBufferSize;
	}
sl@0
   485
sl@0
   486
// Work out how many Unicode words aInputBytes bytes from the stream aInput expand to.
// A temporary expander is run with no sink, so words are counted only.
TInt TUnicodeExpander::ExpandedSizeL(CStoreReadStream& aInput,TInt aInputBytes)
	{
	TUnicodeExpander counter;
	TInt expandedWords;
	counter.DoExpandL(NULL,&aInput,NULL,KMaxTInt,aInputBytes,&expandedWords,NULL);
	return expandedWords;
	}
sl@0
   493
sl@0
   494
// Work out how many Unicode words aInputBytes bytes from the memory at aInput expand to.
// A temporary expander is run with no sink, so words are counted only.
TInt TUnicodeExpander::ExpandedSizeL(const TUint8* aInput,TInt aInputBytes)
	{
	TUnicodeExpander counter;
	TInt expandedWords;
	counter.DoExpandL(NULL,NULL,aInput,KMaxTInt,aInputBytes,&expandedWords,NULL);
	return expandedWords;
	}
sl@0
   501
sl@0
   502
// Expand until input or output is exhausted or an exception occurs.
sl@0
   503
void TUnicodeExpander::DoExpandL(MUnicodeSink* aOutput,CStoreReadStream* aInputStream,const TUint8* aInputPointer,
sl@0
   504
								 TInt aMaxOutputWords,TInt aMaxInputBytes,
sl@0
   505
								 TInt* aOutputWords,TInt* aInputBytes)
sl@0
   506
	{
sl@0
   507
	iOutput = aOutput;
sl@0
   508
	iInputStream = aInputStream;
sl@0
   509
	iInputPointer = aInputPointer;
sl@0
   510
	iMaxUnicodeWords = aMaxOutputWords;
sl@0
   511
	iMaxCompressedBytes = aMaxInputBytes;
sl@0
   512
	iUnicodeWords = iCompressedBytes = 0;
sl@0
   513
	iInputBufferStart = 0;
sl@0
   514
	FlushOutputBufferL();
sl@0
   515
	if (iInputPointer || iInputStream)
sl@0
   516
		{
sl@0
   517
		while (iUnicodeWords + iOutputBufferSize < iMaxUnicodeWords && iCompressedBytes < iMaxCompressedBytes)
sl@0
   518
			HandleByteL();
sl@0
   519
		}
sl@0
   520
	if (aOutputWords)
sl@0
   521
		*aOutputWords = iUnicodeWords;
sl@0
   522
	if (aInputBytes)
sl@0
   523
		*aInputBytes = iCompressedBytes;
sl@0
   524
	}
sl@0
   525
sl@0
   526
void TUnicodeExpander::HandleByteL()
sl@0
   527
	{
sl@0
   528
	TUint8 byte;
sl@0
   529
	TBool handled = false;
sl@0
   530
	if (ReadByteL(byte))
sl@0
   531
		{
sl@0
   532
		if (iUnicodeMode)
sl@0
   533
			handled = HandleUByteL(byte);
sl@0
   534
		else
sl@0
   535
			handled = HandleSByteL(byte);
sl@0
   536
		}
sl@0
   537
	iInputBufferStart = 0;
sl@0
   538
	if (handled)
sl@0
   539
		iInputBufferSize = 0;
sl@0
   540
	FlushOutputBufferL();
sl@0
   541
	}
sl@0
   542
sl@0
   543
void TUnicodeExpander::FlushOutputBufferL()
sl@0
   544
	{
sl@0
   545
	while (iOutputBufferSize > 0 &&	iUnicodeWords < iMaxUnicodeWords)
sl@0
   546
		{
sl@0
   547
		if (iOutput)
sl@0
   548
			iOutput->WriteUnicodeValueL(iOutputBuffer[iOutputBufferStart]);
sl@0
   549
		iUnicodeWords++;
sl@0
   550
		iOutputBufferSize--;
sl@0
   551
		iOutputBufferStart = (iOutputBufferStart + 1) % EMaxOutputBufferSize;
sl@0
   552
		}
sl@0
   553
	}
sl@0
   554
sl@0
   555
// Process a byte read in single-byte mode, reading any argument bytes it requires.
// Returns true when the byte (and its arguments) were fully handled, false when an argument
// byte could not be read. Panics with EUnhandledByte for a byte that has no meaning.
TBool TUnicodeExpander::HandleSByteL(TUint8 aByte)
	{
	// 'Pass-through' codes stand for themselves.
	if (TUnicodeCompressionState::EncodeAsIs(aByte))
		{
		WriteChar(aByte);
		return true;
		}

	// Codes 0x80-0xFF select a character from the active window.
	if (aByte >= 0x80)
		{
		WriteChar32(iActiveWindowBase + aByte - 0x80);
		return true;
		}

	// Tags that are a single fixed value.
	switch (aByte)
		{
		case SQU:	// quote a Unicode character
			return QuoteUnicodeL();
		case SCU:	// switch to Unicode mode
			iUnicodeMode = true;
			return true;
		case SDX:	// define window in the expansion space
			return DefineExpansionWindowL();
		default:
			break;
		}

	// SQn: quote from window n. An argument of 0x00-0x7F refers to static window n,
	// an argument of 0x80-0xFF to dynamic window n.
	if (aByte >= SQ0 && aByte <= SQ0 + 7)
		{
		TUint8 argument;
		if (!ReadByteL(argument))
			return false;
		const int window = aByte - SQ0;
		TUint32 quoted = argument;
		if (quoted <= 0x7F)
			quoted += iStaticWindow[window];
		else
			quoted += iDynamicWindow[window] - 0x80;
		WriteChar32(quoted);
		return true;
		}

	// SCn: switch to dynamic window n.
	if (aByte >= SC0 && aByte <= SC0 + 7)
		{
		iActiveWindowBase = iDynamicWindow[aByte - SC0];
		return true;
		}

	// SDn: define dynamic window n and switch to it.
	if (aByte >= SD0 && aByte <= SD0 + 7)
		return DefineWindowL(aByte - SD0);

	Panic(EUnhandledByte);
	return false;
	}
sl@0
   619
sl@0
   620
// Process a byte read in Unicode mode, reading any further bytes it requires.
// Returns true when the byte (and what follows it) were fully handled, false when a following
// byte could not be read. Panics with EUnhandledByte for a byte that has no meaning.
TBool TUnicodeExpander::HandleUByteL(TUint8 aByte)
	{
	// Bytes outside 0xE0..0xF2 are the high byte of a plain Unicode value; fetch the low byte.
	const bool isTag = aByte > 0xDF && aByte < 0xF3;
	if (!isTag)
		{
		TUint8 lowByte;
		if (!ReadByteL(lowByte))
			return false;
		WriteChar((TUint16)((aByte << 8) | lowByte));
		return true;
		}

	// UQU: quote a Unicode character that would otherwise conflict with a tag.
	if (aByte == UQU)
		return QuoteUnicodeL();

	// UDX: define window in the expansion space.
	if (aByte == UDX)
		return DefineExpansionWindowL();

	// UCn: change to single byte mode and select window n.
	if (aByte >= UC0 && aByte <= UC0 + 7)
		{
		iActiveWindowBase = iDynamicWindow[aByte - UC0];
		iUnicodeMode = false;
		return true;
		}

	// UDn: define dynamic window n and switch to it.
	if (aByte >= UD0 && aByte <= UD0 + 7)
		return DefineWindowL(aByte - UD0);

	Panic(EUnhandledByte);
	return false;
	}
sl@0
   659
sl@0
   660
// Read a quoted 16-bit Unicode value (high byte, then low byte) and write it out.
// Returns false if either byte could not be read, true otherwise.
TBool TUnicodeExpander::QuoteUnicodeL()
	{
	TUint8 highByte;
	if (!ReadByteL(highByte))
		return false;

	TUint8 lowByte;
	if (!ReadByteL(lowByte))
		return false;

	const TUint16 quoted = (TUint16)((highByte << 8) | lowByte);
	WriteChar(quoted);
	return true;
	}
sl@0
   672
sl@0
   673
// Read an offset index byte, set dynamic window aIndex to the base it denotes, make that
// window the active one and switch to single-byte mode.
// Returns false if the offset index byte could not be read, true otherwise.
TBool TUnicodeExpander::DefineWindowL(TInt aIndex)
	{
	TUint8 offsetIndex;
	if (!ReadByteL(offsetIndex))
		return false;

	iUnicodeMode = false;
	iActiveWindowBase = DynamicWindowBase(offsetIndex);
	iDynamicWindow[aIndex] = iActiveWindowBase;
	return true;
	}
sl@0
   686
sl@0
   687
// Read the two argument bytes of a 'define expansion window' tag. The top three bits of the
// first byte give the dynamic window number; the remaining thirteen bits give the window's
// position, in units of 0x80, above 0x10000. The window becomes active and the mode becomes
// single-byte. Returns false if either byte could not be read, true otherwise.
TBool TUnicodeExpander::DefineExpansionWindowL()
	{
	TUint8 highByte;
	if (!ReadByteL(highByte))
		return false;

	TUint8 lowByte;
	if (!ReadByteL(lowByte))
		return false;

	iUnicodeMode = false;
	iActiveWindowBase = 0x10000 + (0x80 * ((highByte & 0x1F) * 0x100 + lowByte));
	iDynamicWindow[highByte >> 5] = iActiveWindowBase;
	return true;
	}
sl@0
   700
sl@0
   701
// Read either from the buffer (in the case of restarting after source finished in mid-operation) or from the source.
sl@0
   702
TBool TUnicodeExpander::ReadByteL(TUint8& aByte)
sl@0
   703
	{
sl@0
   704
	if (iInputBufferStart < iInputBufferSize)
sl@0
   705
		{
sl@0
   706
		aByte = iInputBuffer[iInputBufferStart++];
sl@0
   707
		return true;
sl@0
   708
		}
sl@0
   709
	else if (iCompressedBytes < iMaxCompressedBytes)
sl@0
   710
		{
sl@0
   711
		if (iInputPointer)
sl@0
   712
			aByte = *iInputPointer++;
sl@0
   713
		else
sl@0
   714
			aByte = iInputStream->ReadUint8();
sl@0
   715
		iInputBuffer[iInputBufferStart++] = aByte;
sl@0
   716
		iInputBufferSize = iInputBufferStart;
sl@0
   717
		iCompressedBytes++;
sl@0
   718
		return true;
sl@0
   719
		}
sl@0
   720
	else
sl@0
   721
		return false;
sl@0
   722
	}
sl@0
   723
sl@0
   724
// Append one 16-bit value to the circular output buffer.
// Panics with EOutputBufferOverflow if the buffer is already full.
void TUnicodeExpander::WriteChar(TUint16 aChar)
	{
	if (iOutputBufferSize >= EMaxOutputBufferSize)
		Panic(EOutputBufferOverflow);

	const TInt slot = (iOutputBufferStart + iOutputBufferSize) % EMaxOutputBufferSize;
	iOutputBuffer[slot] = aChar;
	++iOutputBufferSize;
	}
sl@0
   731
sl@0
   732
// Write a Unicode character; write using surrogates if in the range 0x10000..0x10FFFF.
sl@0
   733
void TUnicodeExpander::WriteChar32(TUint aChar)
sl@0
   734
	{
sl@0
   735
	if (aChar <= 0xFFFF)
sl@0
   736
		WriteChar((TUint16)aChar);
sl@0
   737
	else if (aChar <= 0x10FFFF)
sl@0
   738
		{
sl@0
   739
		aChar -= 0x10000;									// reduce to 20-bit value in the range 0x0..0xFFFFF
sl@0
   740
		WriteChar((TUint16)(0xD800 + (aChar >> 10)));		// first high surrogate + high 10 bits
sl@0
   741
		WriteChar((TUint16)(0xDC00 + (aChar & 0x03FF)));	// first low surrogate + low 10 bits
sl@0
   742
		}
sl@0
   743
	else
sl@0
   744
		Panic(ENotUnicode);
sl@0
   745
	}
sl@0
   746
}