epoc32/include/s32ucmp.h
author William Roberts <williamr@symbian.org>
Wed, 31 Mar 2010 12:33:34 +0100
branchSymbian3
changeset 4 837f303aceeb
parent 2 2fe1408b6811
permissions -rw-r--r--
Current Symbian^3 public API header files (from PDK 3.0.h)
This is the epoc32/include tree with the "platform" subtrees removed, and
all but a selected few mbg and rsg files removed.
williamr@2
     1
// Copyright (c) 1998-2009 Nokia Corporation and/or its subsidiary(-ies).
williamr@2
     2
// All rights reserved.
williamr@2
     3
// This component and the accompanying materials are made available
williamr@4
     4
// under the terms of "Eclipse Public License v1.0"
williamr@2
     5
// which accompanies this distribution, and is available
williamr@4
     6
// at the URL "http://www.eclipse.org/legal/epl-v10.html".
williamr@2
     7
//
williamr@2
     8
// Initial Contributors:
williamr@2
     9
// Nokia Corporation - initial contribution.
williamr@2
    10
//
williamr@2
    11
// Contributors:
williamr@2
    12
//
williamr@2
    13
// Description:
williamr@2
    14
// Header for the Standard Compression Scheme for Unicode.
williamr@2
    15
// This code is compiled only in the Unicode build.
williamr@2
    16
// 
williamr@2
    17
//
williamr@2
    18
williamr@2
    19
#ifndef __S32UCMP_H__
williamr@2
    20
#define __S32UCMP_H__ 1
williamr@2
    21
williamr@2
    22
#ifdef _UNICODE
williamr@2
    23
williamr@2
    24
#include <e32std.h>
williamr@2
    25
#include <s32mem.h>
williamr@2
    26
williamr@2
    27
/**
williamr@2
    28
 * @publishedAll 
williamr@2
    29
 * @released
williamr@2
    30
 */
williamr@2
    31
// State shared by the compressor and the expander: TUnicodeCompressor and
// TUnicodeExpander both derive from this class. It holds the current mode, the
// window bases, and the counts and limits of Unicode words and compressed bytes.
class TUnicodeCompressionState
williamr@2
    32
	{
williamr@2
    33
	public:
williamr@2
    34
	TUnicodeCompressionState();
williamr@2
    35
	void Reset();
williamr@2
    36
	// Static helpers taking a 16-bit code or an offset index. They are only declared
	// in this header, so their exact results cannot be read from here.
	static TInt StaticWindowIndex(TUint16 aCode);
williamr@2
    37
	static TInt DynamicWindowOffsetIndex(TUint16 aCode);
williamr@2
    38
	static TUint32 DynamicWindowBase(TInt aOffsetIndex);
williamr@2
    39
	static TBool EncodeAsIs(TUint16 aCode);
williamr@2
    40
williamr@2
    41
	// Reasons that can be passed to Panic().
	enum TPanic
williamr@2
    42
		{
williamr@2
    43
		EUnhandledByte,			// expander code fails to handle all possible byte codes
williamr@2
    44
		ENotUnicode,			// expander can't handle Unicode values outside range 0x0..0x10FFFF;
williamr@2
    45
								// that is, 16-bit codes plus 32-bit codes that can be expressed using
williamr@2
    46
								// 16-bit surrogates
williamr@2
    47
		EOutputBufferOverflow	// output buffer is not big enough
williamr@2
    48
		};
williamr@2
    49
williamr@2
    50
	static void Panic(TPanic aPanic);
williamr@2
    51
williamr@2
    52
	protected:
williamr@2
    53
williamr@2
    54
	// Element counts of the window tables declared below.
	// ESpecialBases is 7 because iSpecialBase covers the seven offsets F9..FF.
	enum
williamr@2
    55
		{
williamr@2
    56
		EStaticWindows = 8,
williamr@2
    57
		EDynamicWindows = 8,
williamr@2
    58
		ESpecialBases = 7
williamr@2
    59
		};
williamr@2
    60
williamr@2
    61
	TBool iUnicodeMode;									// TRUE if in Unicode mode as opposed to single-byte mode
williamr@2
    62
	TUint32 iActiveWindowBase;							// base of the active window - bases are 32-bit because they
williamr@2
    63
														// can be set to the surrogate area, which represents codes
williamr@2
    64
														// from 0x00010000 to 0x0010FFFF - planes 1-16 of ISO-10646.
williamr@2
    65
	// The three tables below are static const class data; they are only declared here.
	static const TUint32 iStaticWindow[EStaticWindows];	// bases of the static windows
williamr@2
    66
	static const TUint32 iDynamicWindowDefault[EDynamicWindows];	// default bases of the dynamic windows
williamr@2
    67
	static const TUint16 iSpecialBase[ESpecialBases];	// bases for window offsets F9..FF
williamr@2
    68
williamr@2
    69
	// Per-object state: unlike the tables above, each object has its own copy of these.
	TUint32 iDynamicWindow[EDynamicWindows];			// bases of the dynamic windows
williamr@2
    70
	TInt iUnicodeWords;									// Unicode words processed; read by compressor, written by expander
williamr@2
    71
	TInt iMaxUnicodeWords;								// maximum number of Unicode words to read or write
williamr@2
    72
	TInt iCompressedBytes;								// compressed bytes processed: read by expander, written by compressor
williamr@2
    73
	TInt iMaxCompressedBytes;							// maximum number of compressed bytes to read or write
williamr@2
    74
	};
williamr@2
    75
williamr@2
    76
/**
williamr@2
    77
 * @publishedAll 
williamr@2
    78
 * @released
williamr@2
    79
 */
williamr@2
    80
// Abstract interface for an object that supplies 16-bit Unicode values one at a time.
// TMemoryUnicodeSource and TMemoryStreamUnicodeSource implement it, and
// TUnicodeCompressor takes its input through it.
class MUnicodeSource
williamr@2
    81
	{
williamr@2
    82
	public:
williamr@2
    83
	// Returns one 16-bit value per call; implementations decide where it comes from.
	// NOTE(review): the L suffix suggests implementations may leave - confirm per implementation.
	virtual TUint16 ReadUnicodeValueL() = 0;
williamr@2
    84
	};
williamr@2
    85
williamr@2
    86
/**
williamr@2
    87
 * @publishedAll 
williamr@2
    88
 * @released
williamr@2
    89
 A class to read Unicode values directly from memory.
williamr@2
    90
 */
williamr@2
    91
// MUnicodeSource implementation that reads through a pointer to const 16-bit values.
class TMemoryUnicodeSource: public MUnicodeSource
williamr@2
    92
	{
williamr@2
    93
	public:
williamr@2
    94
	// aPtr is where reading starts; only the pointer is stored.
	inline TMemoryUnicodeSource(const TUint16* aPtr);
williamr@2
    95
	// Returns the value at the current position and advances by one value.
	inline TUint16 ReadUnicodeValueL();
williamr@2
    96
williamr@2
    97
	private:
williamr@2
    98
	const TUint16* iPtr;	// current read position; no end or length is stored
williamr@2
    99
	};
williamr@2
   100
williamr@2
   101
/**
williamr@2
   102
 * @publishedAll 
williamr@2
   103
 * @released
williamr@2
   104
 A class to read Unicode values from a stream built on a memory object.
williamr@2
   105
 */
williamr@2
   106
// MUnicodeSource implementation that reads each value from an RReadStream.
class TMemoryStreamUnicodeSource: public MUnicodeSource
williamr@2
   107
	{
williamr@2
   108
	public:
williamr@2
   109
	// Binds to aStream by reference; the stream is not copied.
	inline TMemoryStreamUnicodeSource(RReadStream& aStream);
williamr@2
   110
	// Reads sizeof(TUint16) bytes from the stream and returns them as one value.
	inline TUint16 ReadUnicodeValueL();
williamr@2
   111
williamr@2
   112
	private:
williamr@2
   113
	RReadStream& iStream;	// stream supplied to the constructor; held by reference
williamr@2
   114
	};
williamr@2
   115
williamr@2
   116
/**
williamr@2
   117
 * @publishedAll 
williamr@2
   118
 * @released
williamr@2
   119
 */
williamr@2
   120
// Abstract interface for an object that accepts 16-bit Unicode values one at a time.
// TMemoryUnicodeSink and TMemoryStreamUnicodeSink implement it, and
// TUnicodeExpander writes its output through it.
class MUnicodeSink
williamr@2
   121
	{
williamr@2
   122
	public:
williamr@2
   123
	// Accepts one 16-bit value per call; implementations decide where it goes.
	// NOTE(review): the L suffix suggests implementations may leave - confirm per implementation.
	virtual void WriteUnicodeValueL(TUint16 aValue) = 0;
williamr@2
   124
	};
williamr@2
   125
williamr@2
   126
/**
williamr@2
   127
 * @publishedAll 
williamr@2
   128
 * @released
williamr@2
   129
 A class to write Unicode values directly to memory.
williamr@2
   130
 */
williamr@2
   131
// MUnicodeSink implementation that writes through a pointer to 16-bit values.
class TMemoryUnicodeSink: public MUnicodeSink
williamr@2
   132
	{
williamr@2
   133
	public:
williamr@2
   134
	// aPtr is where writing starts; only the pointer is stored.
	inline TMemoryUnicodeSink(TUint16* aPtr);
williamr@2
   135
	// Stores aValue at the current position and advances by one value.
	inline void WriteUnicodeValueL(TUint16 aValue);
williamr@2
   136
williamr@2
   137
	private:
williamr@2
   138
	TUint16* iPtr;	// current write position; no end or capacity is stored
williamr@2
   139
	};
williamr@2
   140
williamr@2
   141
/**
williamr@2
   142
 * @publishedAll 
williamr@2
   143
 * @released
williamr@2
   144
 A class to write Unicode values to a stream built on a memory object.
williamr@2
   145
 */
williamr@2
   146
// MUnicodeSink implementation that writes each value to an RWriteStream.
class TMemoryStreamUnicodeSink: public MUnicodeSink
williamr@2
   147
	{
williamr@2
   148
	public:
williamr@2
   149
	// Binds to aStream by reference; the stream is not copied.
	inline TMemoryStreamUnicodeSink(RWriteStream& aStream);
williamr@2
   150
	// Writes the sizeof(TUint16) bytes of aValue to the stream.
	inline void WriteUnicodeValueL(TUint16 aValue);
williamr@2
   151
williamr@2
   152
	private:
williamr@2
   153
	RWriteStream& iStream;	// stream supplied to the constructor; held by reference
williamr@2
   154
	};
williamr@2
   155
williamr@2
   156
/**
williamr@2
   157
 * @publishedAll 
williamr@2
   158
 * @released
williamr@2
   159
 
williamr@2
   160
A class to hold functions to compress text using the Standard Compression Scheme for Unicode.
williamr@2
   161
williamr@2
   162
A note on error handling and leaving.
williamr@2
   163
williamr@2
   164
Although all the public functions except the constructor can leave, it is possible to guarantee success: that is,
williamr@2
   165
guarantee that a call will not leave, and that compression will be completed. To do this, (i) supply a MUnicodeSource
williamr@2
   166
object with a non-leaving ReadUnicodeValueL function, such as a TMemoryUnicodeSource; (ii) write output to a
williamr@2
   167
RWriteStream with a non-leaving WriteL function, or to a buffer that you already know to be big enough, which can be
williamr@2
   168
found out using CompressedSizeL.
williamr@2
   169
williamr@2
   170
This guarantee of success is particularly useful when compressing from one memory buffer to another.
williamr@2
   171
*/
williamr@2
   172
// Compressor built on TUnicodeCompressionState. Input comes from an MUnicodeSource;
// output goes either to an RWriteStream or to a raw byte pointer.
class TUnicodeCompressor: public TUnicodeCompressionState
williamr@2
   173
	{
williamr@2
   174
	public:
williamr@2
   175
	IMPORT_C TUnicodeCompressor();
williamr@2
   176
	// Two CompressL overloads: the first writes to a stream, the second to memory at aOutput.
	// Both limits default to KMaxTInt and both out-pointers default to NULL.
	// NOTE(review): aOutputBytes/aInputWords presumably receive the counts processed - confirm in the implementation.
	IMPORT_C void CompressL(RWriteStream& aOutput,MUnicodeSource& aInput,
williamr@2
   177
							TInt aMaxOutputBytes = KMaxTInt,TInt aMaxInputWords = KMaxTInt,
williamr@2
   178
							TInt* aOutputBytes = NULL,TInt* aInputWords = NULL);
williamr@2
   179
	IMPORT_C void CompressL(TUint8* aOutput,MUnicodeSource& aInput,
williamr@2
   180
							TInt aMaxOutputBytes = KMaxTInt,TInt aMaxInputWords = KMaxTInt,
williamr@2
   181
							TInt* aOutputBytes = NULL,TInt* aInputWords = NULL);
williamr@2
   182
	// Two FlushL overloads, again stream and memory.
	// NOTE(review): the meaning of the TInt return value is not visible in this header.
	IMPORT_C TInt FlushL(RWriteStream& aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes);
williamr@2
   183
	IMPORT_C TInt FlushL(TUint8* aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes);
williamr@2
   184
	// Static: needs no compressor object, only the input and a word count.
	IMPORT_C static TInt CompressedSizeL(MUnicodeSource& aInput,TInt aInputWords);
williamr@2
   185
williamr@2
   186
	private:
williamr@2
   187
williamr@2
   188
	 // A structure to store a character and its treatment code
williamr@2
   189
	struct TAction
williamr@2
   190
		{
williamr@2
   191
		// Treatment codes: static and dynamic window numbers, plain ASCII or plain Unicode
williamr@2
   192
		enum
williamr@2
   193
			{
williamr@2
   194
			EPlainUnicode = -2,	// character cannot be expressed as ASCII or using static or dynamic windows
williamr@2
   195
			EPlainASCII = -1,	// character can be emitted as an ASCII code
williamr@2
   196
			EFirstDynamic = 0,	// values 0..255 are for dynamic windows with offsets at these places in the offset table
williamr@2
   197
			ELastDynamic = 255,
williamr@2
   198
			EFirstStatic = 256,	// values 256..263 are for static windows 0..7
williamr@2
   199
			ELastStatic = 263
williamr@2
   200
			};
williamr@2
   201
williamr@2
   202
		// The default constructor is defined inline in this header: code 0, EPlainUnicode.
		inline TAction();
williamr@2
   203
		// Declared only; how the treatment is chosen for aCode is not visible here.
		TAction(TUint16 aCode);
williamr@2
   204
williamr@2
   205
		TUint16 iCode;		// Unicode value of the character
williamr@2
   206
		TInt iTreatment;	// treatment code: see above
williamr@2
   207
		};
williamr@2
   208
williamr@2
   209
	// Takes both a stream and a memory destination as pointers, plus the limits and
	// out-pointers of the public overloads. Per the member comments below, whichever of
	// the stream/pointer pair is non-null is the destination.
	void DoCompressL(RWriteStream* aOutputStream,TUint8* aOutputPointer,MUnicodeSource* aInput,
williamr@2
   210
					 TInt aMaxCompressedBytes,TInt aMaxUnicodeWords,
williamr@2
   211
					 TInt* aCompressedBytes,TInt* aUnicodeWords);
williamr@2
   212
	// Private helpers; declared only, so their behavior is not documented here.
	void FlushInputBufferL();
williamr@2
   213
	void FlushOutputBufferL();
williamr@2
   214
	void WriteRunL();
williamr@2
   215
	void WriteCharacter(const TAction& aAction);
williamr@2
   216
	void WriteSCharacter(const TAction& aAction);
williamr@2
   217
	void WriteUCharacter(TUint16 aCode);
williamr@2
   218
	void WriteByte(TUint aByte);
williamr@2
   219
	void WriteCharacterFromBuffer();
williamr@2
   220
	void SelectTreatment(TInt aTreatment);
williamr@2
   221
williamr@2
   222
	// Buffer capacities: the output buffer is sized at three bytes per buffered input character.
	enum
williamr@2
   223
		{
williamr@2
   224
		EMaxInputBufferSize = 4,
williamr@2
   225
		EMaxOutputBufferSize = EMaxInputBufferSize * 3	// no Unicode character can be encoded as more than three bytes
williamr@2
   226
		};
williamr@2
   227
	TAction iInputBuffer[EMaxInputBufferSize];			// circular buffer; queue of Unicode characters to be processed
williamr@2
   228
	TInt iInputBufferStart;								// position of first Unicode character to be processed
williamr@2
   229
	TInt iInputBufferSize;								// characters in the input buffer
williamr@2
   230
	TUint8 iOutputBuffer[EMaxOutputBufferSize];			// circular buffer; queue of compressed bytes to be output
williamr@2
   231
	TInt iOutputBufferStart;							// position of first compressed byte to be output
williamr@2
   232
	TInt iOutputBufferSize;								// bytes in the output buffer
williamr@2
   233
	TInt iDynamicWindowIndex;							// index of the current dynamic window
williamr@2
   234
	RWriteStream* iOutputStream;						// if non-null, output is to this stream
williamr@2
   235
	TUint8* iOutputPointer;								// if non-null, output is to memory
williamr@2
   236
	MUnicodeSource* iInput;								// input object
williamr@2
   237
	};
williamr@2
   238
williamr@2
   239
/**
williamr@2
   240
 * @publishedAll 
williamr@2
   241
 * @released
williamr@2
   242
williamr@2
   243
A class to hold functions to expand text using the Standard Compression Scheme for Unicode.
williamr@2
   244
williamr@2
   245
A note on error handling and leaving.
williamr@2
   246
williamr@2
   247
Although all the public functions except the constructor can leave, it is possible to guarantee success: that is,
williamr@2
   248
guarantee that a call will not leave, and that expansion will be completed. To do this, (i) supply a MUnicodeSink
williamr@2
   249
object with a non-leaving WriteUnicodeValueL function, such as a TMemoryUnicodeSink; (ii) read input from a RReadStream
williamr@2
   250
with a non-leaving ReadL function; (iii) supply a big enough buffer to write the output; you can find out how big by
williamr@2
   251
calling ExpandedSizeL, using methods (i) and (ii) to guarantee success.
williamr@2
   252
williamr@2
   253
This guarantee of success is particularly useful when expanding from one memory buffer to another.
williamr@2
   254
*/
williamr@2
   255
// Expander built on TUnicodeCompressionState. Input comes either from an RReadStream
// or from a raw byte pointer; output goes to an MUnicodeSink.
class TUnicodeExpander: public TUnicodeCompressionState
williamr@2
   256
	{
williamr@2
   257
	public:
williamr@2
   258
	IMPORT_C TUnicodeExpander();
williamr@2
   259
	// Two ExpandL overloads: the first reads from a stream, the second from memory at aInput.
	// Both limits default to KMaxTInt and both out-pointers default to NULL.
	// NOTE(review): aOutputWords/aInputBytes presumably receive the counts processed - confirm in the implementation.
	IMPORT_C void ExpandL(MUnicodeSink& aOutput,RReadStream& aInput,
williamr@2
   260
						  TInt aMaxOutputWords = KMaxTInt,TInt aMaxInputBytes = KMaxTInt,
williamr@2
   261
						  TInt* aOutputWords = NULL,TInt* aInputBytes = NULL);
williamr@2
   262
	IMPORT_C void ExpandL(MUnicodeSink& aOutput,const TUint8* aInput,
williamr@2
   263
						  TInt aMaxOutputWords = KMaxTInt,TInt aMaxInputBytes = KMaxTInt,
williamr@2
   264
						  TInt* aOutputWords = NULL,TInt* aInputBytes = NULL);
williamr@2
   265
	// NOTE(review): the meaning of the TInt return value is not visible in this header.
	IMPORT_C TInt FlushL(MUnicodeSink& aOutput,TInt aMaxOutputWords,TInt& aOutputWords);
williamr@2
   266
	// Static: need no expander object; one overload per input kind (stream, memory).
	IMPORT_C static TInt ExpandedSizeL(RReadStream& aInput,TInt aInputBytes);
williamr@2
   267
	IMPORT_C static TInt ExpandedSizeL(const TUint8* aInput,TInt aInputBytes);
williamr@2
   268
williamr@2
   269
	private:
williamr@2
   270
	// Takes both a stream and a memory source as pointers, plus the limits and
	// out-pointers of the public overloads. Per the member comments below, whichever of
	// the stream/pointer pair is non-null is the source.
	void DoExpandL(MUnicodeSink* aOutput,RReadStream* aInputStream,const TUint8* aInputPointer,
williamr@2
   271
				   TInt aMaxOutputWords,TInt aMaxInputBytes,
williamr@2
   272
				   TInt* aOutputWords,TInt* aInputBytes);
williamr@2
   273
	// Private helpers; declared only, so their behavior and the meaning of the
	// TBool results are not documented here.
	void HandleByteL();
williamr@2
   274
	void FlushOutputBufferL();
williamr@2
   275
	TBool HandleSByteL(TUint8 aByte);
williamr@2
   276
	TBool HandleUByteL(TUint8 aByte);
williamr@2
   277
	TBool ReadByteL(TUint8& aByte);
williamr@2
   278
	TBool QuoteUnicodeL();
williamr@2
   279
	TBool DefineWindowL(TInt aIndex);
williamr@2
   280
	TBool DefineExpansionWindowL();
williamr@2
   281
	void WriteChar(TText aChar);
williamr@2
   282
	void WriteChar32(TUint aChar);
williamr@2
   283
williamr@2
   284
	// Buffer capacities for the two arrays declared below.
	enum
williamr@2
   285
		{
williamr@2
   286
		EMaxInputBufferSize = 3,						// no Unicode character can be encoded as more than 3 bytes
williamr@2
   287
		EMaxOutputBufferSize = 2						// no byte can be expanded into more than 2 Unicode characters
williamr@2
   288
		};
williamr@2
   289
	TUint8 iInputBuffer[EMaxInputBufferSize];			// buffer containing a group of compressed bytes representing
williamr@2
   290
														// a single operation; when an input source ends in the
williamr@2
   291
														// middle of an operation, this buffer enables the next
williamr@2
   292
														// expansion to start in the correct state
williamr@2
   293
	TInt iInputBufferStart;								// next read position in the input buffer
williamr@2
   294
	TInt iInputBufferSize;								// bytes in the input buffer
williamr@2
   295
	TUint16 iOutputBuffer[EMaxOutputBufferSize];		// circular buffer; queue of Unicode characters to be output
williamr@2
   296
	TInt iOutputBufferStart;							// position of first Unicode character to be output
williamr@2
   297
	TInt iOutputBufferSize;								// characters in the output buffer
williamr@2
   298
	MUnicodeSink* iOutput;								// output object
williamr@2
   299
	RReadStream* iInputStream;							// if non-null, input is from this stream
williamr@2
   300
	const TUint8* iInputPointer;						// if non-null, input is from memory
williamr@2
   301
	};
williamr@2
   302
williamr@2
   303
// inline functions start here
williamr@2
   304
williamr@2
   305
// Construct a source whose first read comes from aPtr.
// Only the pointer is stored; the data it points at is not copied.
inline TMemoryUnicodeSource::TMemoryUnicodeSource(const TUint16* aPtr)
	: iPtr(aPtr)
	{
	}
williamr@2
   309
williamr@2
   310
// Return the 16-bit value at the current read position, then step the
// position forward by one value. No bounds check is made here.
inline TUint16 TMemoryUnicodeSource::ReadUnicodeValueL()
	{
	const TUint16 value = *iPtr;
	++iPtr;
	return value;
	}
williamr@2
   314
williamr@2
   315
// Construct a source that reads from aStream.
// The stream is bound by reference, not copied.
inline TMemoryStreamUnicodeSource::TMemoryStreamUnicodeSource(RReadStream& aStream)
	: iStream(aStream)
	{
	}
williamr@2
   319
williamr@2
   320
// Read one 16-bit value from the stream.
// The bytes are copied straight into the value's storage; this function does
// no byte-order conversion. Any leave comes from the stream's ReadL.
inline TUint16 TMemoryStreamUnicodeSource::ReadUnicodeValueL()
	{
	TUint16 value;
	TUint8* const rawBytes = reinterpret_cast<TUint8*>(&value);
	iStream.ReadL(rawBytes,sizeof(value));
	return value;
	}
williamr@2
   326
williamr@2
   327
// Construct a sink whose first write goes to aPtr.
// Only the pointer is stored; no capacity is recorded.
inline TMemoryUnicodeSink::TMemoryUnicodeSink(TUint16* aPtr)
	: iPtr(aPtr)
	{
	}
williamr@2
   331
williamr@2
   332
// Store aValue at the current write position, then step the position
// forward by one value. No bounds check is made here.
inline void TMemoryUnicodeSink::WriteUnicodeValueL(TUint16 aValue)
	{
	*iPtr = aValue;
	++iPtr;
	}
williamr@2
   336
williamr@2
   337
// Construct a sink that writes to aStream.
// The stream is bound by reference, not copied.
inline TMemoryStreamUnicodeSink::TMemoryStreamUnicodeSink(RWriteStream& aStream)
	: iStream(aStream)
	{
	}
williamr@2
   341
williamr@2
   342
// Write one 16-bit value to the stream.
// The value's bytes are passed to WriteL exactly as they sit in memory; this
// function does no byte-order conversion. Any leave comes from the stream's WriteL.
inline void TMemoryStreamUnicodeSink::WriteUnicodeValueL(TUint16 aValue)
	{
	TUint8* const rawBytes = reinterpret_cast<TUint8*>(&aValue);
	iStream.WriteL(rawBytes,sizeof(aValue));
	}
williamr@2
   346
williamr@2
   347
// Default action: character code 0 with the EPlainUnicode treatment.
inline TUnicodeCompressor::TAction::TAction()
	: iCode(0), iTreatment(EPlainUnicode)
	{
	}
williamr@2
   352
williamr@2
   353
#endif // _UNICODE
williamr@2
   354
williamr@2
   355
#endif // __S32UCMP_H__