Update contrib.
2 * Copyright (c) 1998-2009 Nokia Corporation and/or its subsidiary(-ies).
4 * This component and the accompanying materials are made available
5 * under the terms of the License "Eclipse Public License v1.0"
6 * which accompanies this distribution, and is available
7 * at the URL "http://www.eclipse.org/legal/epl-v10.html".
9 * Initial Contributors:
10 * Nokia Corporation - initial contribution.
15 * Header for the Standard Compression Scheme for Unicode.
16 * This code is compiled only in the Unicode build.
22 #define __S32UCMP_H__ 1
34 class TUnicodeCompressionState
37 TUnicodeCompressionState();
39 static TInt StaticWindowIndex(TUint16 aCode);
40 static TInt DynamicWindowOffsetIndex(TUint16 aCode);
41 static TUint32 DynamicWindowBase(TInt aOffsetIndex);
42 static TBool EncodeAsIs(TUint16 aCode);
46 EUnhandledByte, // expander code fails to handle all possible byte codes
47 ENotUnicode, // expander can't handle Unicode values outside range 0x0..0x10FFFF;
48 // that is, 16-bit codes plus 32-bit codes that can be expressed using
50 EOutputBufferOverflow // output buffer is not big enough
53 static void Panic(TPanic aPanic);
64 TBool iUnicodeMode; // TRUE if in Unicode mode as opposed to single-byte mode
65 TUint32 iActiveWindowBase; // base of the active window - bases are 32-bit because they
66 // can be set to the surrogate area, which represents codes
67 // from 0x00010000 to 0x0010FFFF - planes 1-16 of ISO-10646.
68 static const TUint32 iStaticWindow[EStaticWindows]; // bases of the static windows
69 static const TUint32 iDynamicWindowDefault[EDynamicWindows]; // default bases of the dynamic windows
70 static const TUint16 iSpecialBase[ESpecialBases]; // bases for window offsets F9..FF
72 TUint32 iDynamicWindow[EDynamicWindows]; // bases of the dynamic windows
73 TInt iUnicodeWords; // Unicode words processed; read by compressor, written by expander
74 TInt iMaxUnicodeWords; // maximum number of Unicode words to read or write
75 TInt iCompressedBytes; // compressed bytes processed: read by expander, written by compressor
76 TInt iMaxCompressedBytes; // maximum number of compressed bytes to read or write
82 virtual TUint16 ReadUnicodeValueL() = 0;
86 A class to read Unicode values directly from memory.
88 class TMemoryUnicodeSource: public MUnicodeSource
91 inline TMemoryUnicodeSource(const TUint16* aPtr);
92 inline TUint16 ReadUnicodeValueL();
99 A class to read Unicode values from a stream built on a memory object.
101 class TMemoryStreamUnicodeSource: public MUnicodeSource
104 inline TMemoryStreamUnicodeSource(RReadStream& aStream);
105 inline TUint16 ReadUnicodeValueL();
108 RReadStream& iStream;
114 virtual void WriteUnicodeValueL(TUint16 aValue) = 0;
118 A class to write Unicode values directly to memory.
120 class TMemoryUnicodeSink: public MUnicodeSink
123 inline TMemoryUnicodeSink(TUint16* aPtr);
124 inline void WriteUnicodeValueL(TUint16 aValue);
131 A class to write Unicode values to a stream built on a memory object.
133 class TMemoryStreamUnicodeSink: public MUnicodeSink
136 inline TMemoryStreamUnicodeSink(RWriteStream& aStream);
137 inline void WriteUnicodeValueL(TUint16 aValue);
140 RWriteStream& iStream;
145 A class to hold functions to compress text using the Standard Compression Scheme for Unicode.
147 A note on error handling and leaving.
149 Although all the public functions except the constructor can leave, it is possible to guarantee success: that is,
150 guarantee that a call will not leave, and that compression will be completed. To do this, (i) supply a MUnicodeSource
151 object with a non-leaving ReadUnicodeValueL function, such as a TMemoryUnicodeSource; (ii) write output to a
152 RWriteStream with a non-leaving WriteL function, or to a buffer that you already know to be big enough, which can be
153 found out using CompressedSizeL.
155 This guarantee of success is particularly useful when compressing from one memory buffer to another.
157 class TUnicodeCompressor: public TUnicodeCompressionState
160 IMPORT_C TUnicodeCompressor();
161 IMPORT_C void CompressL(RWriteStream& aOutput,MUnicodeSource& aInput,
162 TInt aMaxOutputBytes = KMaxTInt,TInt aMaxInputWords = KMaxTInt,
163 TInt* aOutputBytes = NULL,TInt* aInputWords = NULL);
164 IMPORT_C void CompressL(TUint8* aOutput,MUnicodeSource& aInput,
165 TInt aMaxOutputBytes = KMaxTInt,TInt aMaxInputWords = KMaxTInt,
166 TInt* aOutputBytes = NULL,TInt* aInputWords = NULL);
167 IMPORT_C TInt FlushL(RWriteStream& aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes);
168 IMPORT_C TInt FlushL(TUint8* aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes);
169 IMPORT_C static TInt CompressedSizeL(MUnicodeSource& aInput,TInt aInputWords);
173 // A structure to store a character and its treatment code
176 // Treatment codes: static and dynamic window numbers, plain ASCII or plain Unicode
179 EPlainUnicode = -2, // character cannot be expressed as ASCII or using static or dynamic windows
180 EPlainASCII = -1, // character can be emitted as an ASCII code
181 EFirstDynamic = 0, // values 0..255 are for dynamic windows with offsets at these places in the offset table
183 EFirstStatic = 256, // values 256..263 are for static windows 0..7
188 TAction(TUint16 aCode);
190 TUint16 iCode; // Unicode value of the character
191 TInt iTreatment; // treatment code: see above
194 void DoCompressL(RWriteStream* aOutputStream,TUint8* aOutputPointer,MUnicodeSource* aInput,
195 TInt aMaxCompressedBytes,TInt aMaxUnicodeWords,
196 TInt* aCompressedBytes,TInt* aUnicodeWords);
197 void FlushInputBufferL();
198 void FlushOutputBufferL();
200 void WriteCharacter(const TAction& aAction);
201 void WriteSCharacter(const TAction& aAction);
202 void WriteUCharacter(TUint16 aCode);
203 void WriteByte(TUint aByte);
204 void WriteCharacterFromBuffer();
205 void SelectTreatment(TInt aTreatment);
209 EMaxInputBufferSize = 4,
210 EMaxOutputBufferSize = EMaxInputBufferSize * 3 // no Unicode character can be encoded as more than three bytes
212 TAction iInputBuffer[EMaxInputBufferSize]; // circular buffer; queue of Unicode characters to be processed
213 TInt iInputBufferStart; // position of first Unicode character to be processed
214 TInt iInputBufferSize; // characters in the input buffer
215 TUint8 iOutputBuffer[EMaxOutputBufferSize]; // circular buffer; queue of compressed bytes to be output
216 TInt iOutputBufferStart; // position of first compressed byte to be output
217 TInt iOutputBufferSize; // characters in the output buffer
218 TInt iDynamicWindowIndex; // index of the current dynamic window
219 RWriteStream* iOutputStream; // if non-null, output is to this stream
220 TUint8* iOutputPointer; // if non-null, output is to memory
221 MUnicodeSource* iInput; // input object
226 A class to hold functions to expand text using the Standard Compression Scheme for Unicode.
228 A note on error handling and leaving.
230 Although all the public functions except the constructor can leave, it is possible to guarantee success: that is,
231 guarantee that a call will not leave, and that expansion will be completed. To do this, (i) supply a MUnicodeSink
232 object with a non-leaving WriteUnicodeValueL function, such as a TMemoryUnicodeSink; (ii) read input from a RReadStream
233 with a non-leaving ReadL function; (iii) supply a big enough buffer to write the ouput; you can find out how big by
234 calling ExpandedSizeL, using methods (i) and (ii) to guarantee success.
236 This guarantee of success is particularly useful when expanding from one memory buffer to another.
238 class TUnicodeExpander: public TUnicodeCompressionState
241 IMPORT_C TUnicodeExpander();
242 IMPORT_C void ExpandL(MUnicodeSink& aOutput,RReadStream& aInput,
243 TInt aMaxOutputWords = KMaxTInt,TInt aMaxInputBytes = KMaxTInt,
244 TInt* aOutputWords = NULL,TInt* aInputBytes = NULL);
245 IMPORT_C void ExpandL(MUnicodeSink& aOutput,const TUint8* aInput,
246 TInt aMaxOutputWords = KMaxTInt,TInt aMaxInputBytes = KMaxTInt,
247 TInt* aOutputWords = NULL,TInt* aInputBytes = NULL);
248 IMPORT_C TInt FlushL(MUnicodeSink& aOutput,TInt aMaxOutputWords,TInt& aOutputWords);
249 IMPORT_C static TInt ExpandedSizeL(RReadStream& aInput,TInt aInputBytes);
250 IMPORT_C static TInt ExpandedSizeL(const TUint8* aInput,TInt aInputBytes);
253 void DoExpandL(MUnicodeSink* aOutput,RReadStream* aInputStream,const TUint8* aInputPointer,
254 TInt aMaxOutputWords,TInt aMaxInputBytes,
255 TInt* aOutputWords,TInt* aInputBytes);
257 void FlushOutputBufferL();
258 TBool HandleSByteL(TUint8 aByte);
259 TBool HandleUByteL(TUint8 aByte);
260 TBool ReadByteL(TUint8& aByte);
261 TBool QuoteUnicodeL();
262 TBool DefineWindowL(TInt aIndex);
263 TBool DefineExpansionWindowL();
264 void WriteChar(TText aChar);
265 void WriteChar32(TUint aChar);
269 EMaxInputBufferSize = 3, // no Unicode character can be encoded as more than 3 bytes
270 EMaxOutputBufferSize = 2 // no byte can be expanded into more than 2 Unicode characters
272 TUint8 iInputBuffer[EMaxInputBufferSize]; // buffer containing a group of compressed bytes representing
273 // a single operation; when an input source ends in the
274 // middle of an operation, this buffer enables the next
275 // expansion to start in the correct state
276 TInt iInputBufferStart; // next read position in the input buffer
277 TInt iInputBufferSize; // bytes in the input buffer
278 TUint16 iOutputBuffer[EMaxOutputBufferSize]; // circular buffer; queue of Unicode characters to be output
279 TInt iOutputBufferStart; // position of first Unicode character to be output
280 TInt iOutputBufferSize; // characters in the output buffer
281 MUnicodeSink* iOutput; // output object
282 RReadStream* iInputStream; // if non-null, input is from this stream
283 const TUint8* iInputPointer; // if non-null, input is from memory
286 // inline functions start here
288 inline TMemoryUnicodeSource::TMemoryUnicodeSource(const TUint16* aPtr):
293 inline TUint16 TMemoryUnicodeSource::ReadUnicodeValueL()
298 inline TMemoryStreamUnicodeSource::TMemoryStreamUnicodeSource(RReadStream& aStream):
303 inline TUint16 TMemoryStreamUnicodeSource::ReadUnicodeValueL()
306 iStream.ReadL((TUint8*)&x,sizeof(TUint16));
310 inline TMemoryUnicodeSink::TMemoryUnicodeSink(TUint16* aPtr):
315 inline void TMemoryUnicodeSink::WriteUnicodeValueL(TUint16 aValue)
320 inline TMemoryStreamUnicodeSink::TMemoryStreamUnicodeSink(RWriteStream& aStream):
325 inline void TMemoryStreamUnicodeSink::WriteUnicodeValueL(TUint16 aValue)
327 iStream.WriteL((TUint8*)&aValue,sizeof(TUint16));
330 inline TUnicodeCompressor::TAction::TAction():
332 iTreatment(EPlainUnicode)
338 #endif // __S32UCMP_H__