sl@0
|
1 |
// Copyright (c) 2006-2009 Nokia Corporation and/or its subsidiary(-ies).
|
sl@0
|
2 |
// All rights reserved.
|
sl@0
|
3 |
// This component and the accompanying materials are made available
|
sl@0
|
4 |
// under the terms of "Eclipse Public License v1.0"
|
sl@0
|
5 |
// which accompanies this distribution, and is available
|
sl@0
|
6 |
// at the URL "http://www.eclipse.org/legal/epl-v10.html".
|
sl@0
|
7 |
//
|
sl@0
|
8 |
// Initial Contributors:
|
sl@0
|
9 |
// Nokia Corporation - initial contribution.
|
sl@0
|
10 |
//
|
sl@0
|
11 |
// Contributors:
|
sl@0
|
12 |
//
|
sl@0
|
13 |
// Description:
|
sl@0
|
14 |
// Classes defined in this file are used for Unicode compression and decompression.
|
sl@0
|
15 |
// Their code is borrowed from Symbian, only with some changes such as the "Panic" function
|
sl@0
|
16 |
// is changed to exit the program. The Symbian coding standard will be kept in the code.
|
sl@0
|
17 |
//
|
sl@0
|
18 |
//
|
sl@0
|
19 |
|
sl@0
|
20 |
|
sl@0
|
21 |
#if !defined(__UNICODECOMPRESSION_H__)
|
sl@0
|
22 |
#define __UNICODECOMPRESSION_H__
|
sl@0
|
23 |
|
sl@0
|
24 |
#include <stdio.h>
|
sl@0
|
25 |
#include <pcstore/pcstoredef.h>
|
sl@0
|
26 |
#include <pcstore/storereadstream.h>
|
sl@0
|
27 |
#include <pcstore/storewritestream.h>
|
sl@0
|
28 |
#include "pcstoreconst.h"
|
sl@0
|
29 |
|
sl@0
|
30 |
namespace PCStore
|
sl@0
|
31 |
{
|
sl@0
|
32 |
/**
|
sl@0
|
33 |
@internalComponent
|
sl@0
|
34 |
*/
|
sl@0
|
35 |
class TUnicodeCompressionState
|
sl@0
|
36 |
{
|
sl@0
|
37 |
public:
|
sl@0
|
38 |
TUnicodeCompressionState();
|
sl@0
|
39 |
void Reset();
|
sl@0
|
40 |
static TInt StaticWindowIndex(TUint16 aCode);
|
sl@0
|
41 |
static TInt DynamicWindowOffsetIndex(TUint16 aCode);
|
sl@0
|
42 |
static TUint32 DynamicWindowBase(TInt aOffsetIndex);
|
sl@0
|
43 |
static TBool EncodeAsIs(TUint16 aCode);
|
sl@0
|
44 |
|
sl@0
|
45 |
enum TPanic
|
sl@0
|
46 |
{
|
sl@0
|
47 |
EUnhandledByte, // expander code fails to handle all possible byte codes
|
sl@0
|
48 |
ENotUnicode, // expander can't handle Unicode values outside range 0x0..0x10FFFF;
|
sl@0
|
49 |
// that is, 16-bit codes plus 32-bit codes that can be expressed using
|
sl@0
|
50 |
// 16-bit surrogates
|
sl@0
|
51 |
EOutputBufferOverflow // output buffer is not big enough
|
sl@0
|
52 |
};
|
sl@0
|
53 |
|
sl@0
|
54 |
static void Panic(TPanic aPanic);
|
sl@0
|
55 |
|
sl@0
|
56 |
protected:
|
sl@0
|
57 |
|
sl@0
|
58 |
enum
|
sl@0
|
59 |
{
|
sl@0
|
60 |
EStaticWindows = 8,
|
sl@0
|
61 |
EDynamicWindows = 8,
|
sl@0
|
62 |
ESpecialBases = 7
|
sl@0
|
63 |
};
|
sl@0
|
64 |
|
sl@0
|
65 |
TBool iUnicodeMode; // TRUE if in Unicode mode as opposed to single-byte mode
|
sl@0
|
66 |
TUint32 iActiveWindowBase; // base of the active window - bases are 32-bit because they
|
sl@0
|
67 |
// can be set to the surrogate area, which represents codes
|
sl@0
|
68 |
// from 0x00010000 to 0x0010FFFF - planes 1-16 of ISO-10646.
|
sl@0
|
69 |
static const TUint32 iStaticWindow[EStaticWindows]; // bases of the static windows
|
sl@0
|
70 |
static const TUint32 iDynamicWindowDefault[EDynamicWindows]; // default bases of the dynamic windows
|
sl@0
|
71 |
static const TUint16 iSpecialBase[ESpecialBases]; // bases for window offsets F9..FF
|
sl@0
|
72 |
|
sl@0
|
73 |
TUint32 iDynamicWindow[EDynamicWindows]; // bases of the dynamic windows
|
sl@0
|
74 |
TInt iUnicodeWords; // Unicode words processed; read by compressor, written by expander
|
sl@0
|
75 |
TInt iMaxUnicodeWords; // maximum number of Unicode words to read or write
|
sl@0
|
76 |
TInt iCompressedBytes; // compressed bytes processed: read by expander, written by compressor
|
sl@0
|
77 |
TInt iMaxCompressedBytes; // maximum number of compressed bytes to read or write
|
sl@0
|
78 |
};
|
sl@0
|
79 |
|
sl@0
|
80 |
/**
|
sl@0
|
81 |
@internalComponent
|
sl@0
|
82 |
*/
|
sl@0
|
83 |
class MUnicodeSource
|
sl@0
|
84 |
{
|
sl@0
|
85 |
public:
|
sl@0
|
86 |
virtual TUint16 ReadUnicodeValueL() = 0;
|
sl@0
|
87 |
};
|
sl@0
|
88 |
|
sl@0
|
89 |
/**
|
sl@0
|
90 |
@internalComponent
|
sl@0
|
91 |
|
sl@0
|
92 |
A class to read Unicode values directly from memory.
|
sl@0
|
93 |
*/
|
sl@0
|
94 |
class TMemoryUnicodeSource: public MUnicodeSource
|
sl@0
|
95 |
{
|
sl@0
|
96 |
public:
|
sl@0
|
97 |
inline TMemoryUnicodeSource(const TUint16* aPtr);
|
sl@0
|
98 |
inline TUint16 ReadUnicodeValueL();
|
sl@0
|
99 |
|
sl@0
|
100 |
private:
|
sl@0
|
101 |
const TUint16* iPtr;
|
sl@0
|
102 |
};
|
sl@0
|
103 |
|
sl@0
|
104 |
/**
|
sl@0
|
105 |
@internalComponent
|
sl@0
|
106 |
|
sl@0
|
107 |
A class to read Unicode values from a stream built on a memory object.
|
sl@0
|
108 |
*/
|
sl@0
|
109 |
class TMemoryStreamUnicodeSource: public MUnicodeSource
|
sl@0
|
110 |
{
|
sl@0
|
111 |
public:
|
sl@0
|
112 |
inline TMemoryStreamUnicodeSource(CStoreReadStream& aStream);
|
sl@0
|
113 |
inline TUint16 ReadUnicodeValueL();
|
sl@0
|
114 |
|
sl@0
|
115 |
private:
|
sl@0
|
116 |
CStoreReadStream& iStream;
|
sl@0
|
117 |
};
|
sl@0
|
118 |
|
sl@0
|
119 |
/**
|
sl@0
|
120 |
@internalComponent
|
sl@0
|
121 |
|
sl@0
|
122 |
*/
|
sl@0
|
123 |
class MUnicodeSink
|
sl@0
|
124 |
{
|
sl@0
|
125 |
public:
|
sl@0
|
126 |
virtual void WriteUnicodeValueL(TUint16 aValue) = 0;
|
sl@0
|
127 |
};
|
sl@0
|
128 |
|
sl@0
|
129 |
/**
|
sl@0
|
130 |
@internalComponent
|
sl@0
|
131 |
|
sl@0
|
132 |
A class to write Unicode values directly to memory.
|
sl@0
|
133 |
*/
|
sl@0
|
134 |
class TMemoryUnicodeSink: public MUnicodeSink
|
sl@0
|
135 |
{
|
sl@0
|
136 |
public:
|
sl@0
|
137 |
inline TMemoryUnicodeSink(TUint16* aPtr);
|
sl@0
|
138 |
inline void WriteUnicodeValueL(TUint16 aValue);
|
sl@0
|
139 |
|
sl@0
|
140 |
private:
|
sl@0
|
141 |
TUint16* iPtr;
|
sl@0
|
142 |
};
|
sl@0
|
143 |
|
sl@0
|
144 |
/**
|
sl@0
|
145 |
@internalComponent
|
sl@0
|
146 |
|
sl@0
|
147 |
A class to write Unicode values to a stream built on a memory object.
|
sl@0
|
148 |
*/
|
sl@0
|
149 |
class TMemoryStreamUnicodeSink: public MUnicodeSink
|
sl@0
|
150 |
{
|
sl@0
|
151 |
public:
|
sl@0
|
152 |
inline TMemoryStreamUnicodeSink(CStoreWriteStream& aStream);
|
sl@0
|
153 |
inline void WriteUnicodeValueL(TUint16 aValue);
|
sl@0
|
154 |
|
sl@0
|
155 |
private:
|
sl@0
|
156 |
CStoreWriteStream& iStream;
|
sl@0
|
157 |
};
|
sl@0
|
158 |
|
sl@0
|
159 |
/**
|
sl@0
|
160 |
@internalComponent
|
sl@0
|
161 |
|
sl@0
|
162 |
A class to hold functions to compress text using the Standard Compression Scheme for Unicode.
|
sl@0
|
163 |
*/
|
sl@0
|
164 |
class TUnicodeCompressor: public TUnicodeCompressionState
|
sl@0
|
165 |
{
|
sl@0
|
166 |
public:
|
sl@0
|
167 |
TUnicodeCompressor();
|
sl@0
|
168 |
void CompressL(CStoreWriteStream& aOutput,MUnicodeSource& aInput,
|
sl@0
|
169 |
TInt aMaxOutputBytes = KMaxTInt,TInt aMaxInputWords = KMaxTInt,
|
sl@0
|
170 |
TInt* aOutputBytes = static_cast<TInt*>(NULL),TInt* aInputWords = static_cast<TInt*>(NULL));
|
sl@0
|
171 |
void CompressL(TUint8* aOutput,MUnicodeSource& aInput,
|
sl@0
|
172 |
TInt aMaxOutputBytes = KMaxTInt,TInt aMaxInputWords = KMaxTInt,
|
sl@0
|
173 |
TInt* aOutputBytes = static_cast<TInt*>(NULL),TInt* aInputWords = static_cast<TInt*>(NULL));
|
sl@0
|
174 |
TInt FlushL(CStoreWriteStream& aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes);
|
sl@0
|
175 |
TInt FlushL(TUint8* aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes);
|
sl@0
|
176 |
static TInt CompressedSizeL(MUnicodeSource& aInput,TInt aInputWords);
|
sl@0
|
177 |
|
sl@0
|
178 |
private:
|
sl@0
|
179 |
|
sl@0
|
180 |
// A structure to store a character and its treatment code
|
sl@0
|
181 |
struct TAction
|
sl@0
|
182 |
{
|
sl@0
|
183 |
// Treatment codes: static and dynamic window numbers, plain ASCII or plain Unicode
|
sl@0
|
184 |
enum
|
sl@0
|
185 |
{
|
sl@0
|
186 |
EPlainUnicode = -2, // character cannot be expressed as ASCII or using static or dynamic windows
|
sl@0
|
187 |
EPlainASCII = -1, // character can be emitted as an ASCII code
|
sl@0
|
188 |
EFirstDynamic = 0, // values 0..255 are for dynamic windows with offsets at these places in the offset table
|
sl@0
|
189 |
ELastDynamic = 255,
|
sl@0
|
190 |
EFirstStatic = 256, // values 256..263 are for static windows 0..7
|
sl@0
|
191 |
ELastStatic = 263
|
sl@0
|
192 |
};
|
sl@0
|
193 |
|
sl@0
|
194 |
inline TAction();
|
sl@0
|
195 |
TAction(TUint16 aCode);
|
sl@0
|
196 |
|
sl@0
|
197 |
TUint16 iCode; // Unicode value of the character
|
sl@0
|
198 |
TInt iTreatment; // treatment code: see above
|
sl@0
|
199 |
};
|
sl@0
|
200 |
|
sl@0
|
201 |
void DoCompressL(CStoreWriteStream* aOutputStream,TUint8* aOutputPointer,MUnicodeSource* aInput,
|
sl@0
|
202 |
TInt aMaxCompressedBytes,TInt aMaxUnicodeWords,
|
sl@0
|
203 |
TInt* aCompressedBytes,TInt* aUnicodeWords);
|
sl@0
|
204 |
void FlushInputBufferL();
|
sl@0
|
205 |
void FlushOutputBufferL();
|
sl@0
|
206 |
void WriteRunL();
|
sl@0
|
207 |
void WriteCharacter(const TAction& aAction);
|
sl@0
|
208 |
void WriteSCharacter(const TAction& aAction);
|
sl@0
|
209 |
void WriteUCharacter(TUint16 aCode);
|
sl@0
|
210 |
void WriteByte(TUint aByte);
|
sl@0
|
211 |
void WriteCharacterFromBuffer();
|
sl@0
|
212 |
void SelectTreatment(TInt aTreatment);
|
sl@0
|
213 |
|
sl@0
|
214 |
enum
|
sl@0
|
215 |
{
|
sl@0
|
216 |
EMaxInputBufferSize = 4,
|
sl@0
|
217 |
EMaxOutputBufferSize = EMaxInputBufferSize * 3 // no Unicode character can be encoded as more than three bytes
|
sl@0
|
218 |
};
|
sl@0
|
219 |
TAction iInputBuffer[EMaxInputBufferSize]; // circular buffer; queue of Unicode characters to be processed
|
sl@0
|
220 |
TInt iInputBufferStart; // position of first Unicode character to be processed
|
sl@0
|
221 |
TInt iInputBufferSize; // characters in the input buffer
|
sl@0
|
222 |
TUint8 iOutputBuffer[EMaxOutputBufferSize]; // circular buffer; queue of compressed bytes to be output
|
sl@0
|
223 |
TInt iOutputBufferStart; // position of first compressed byte to be output
|
sl@0
|
224 |
TInt iOutputBufferSize; // characters in the output buffer
|
sl@0
|
225 |
TInt iDynamicWindowIndex; // index of the current dynamic window
|
sl@0
|
226 |
CStoreWriteStream* iOutputStream; // if non-null, output is to this stream
|
sl@0
|
227 |
TUint8* iOutputPointer; // if non-null, output is to memory
|
sl@0
|
228 |
MUnicodeSource* iInput; // input object
|
sl@0
|
229 |
};
|
sl@0
|
230 |
|
sl@0
|
231 |
/**
|
sl@0
|
232 |
@internalComponent
|
sl@0
|
233 |
|
sl@0
|
234 |
A class to hold functions to expand text using the Standard Compression Scheme for Unicode.
|
sl@0
|
235 |
*/
|
sl@0
|
236 |
class TUnicodeExpander: public TUnicodeCompressionState
|
sl@0
|
237 |
{
|
sl@0
|
238 |
public:
|
sl@0
|
239 |
TUnicodeExpander();
|
sl@0
|
240 |
void ExpandL(MUnicodeSink& aOutput,CStoreReadStream& aInput,
|
sl@0
|
241 |
TInt aMaxOutputWords = KMaxTInt,TInt aMaxInputBytes = KMaxTInt,
|
sl@0
|
242 |
TInt* aOutputWords = static_cast<TInt*>(NULL),TInt* aInputBytes = static_cast<TInt*>(NULL));
|
sl@0
|
243 |
void ExpandL(MUnicodeSink& aOutput,const TUint8* aInput,
|
sl@0
|
244 |
TInt aMaxOutputWords = KMaxTInt,TInt aMaxInputBytes = KMaxTInt,
|
sl@0
|
245 |
TInt* aOutputWords = static_cast<TInt*>(NULL),TInt* aInputBytes = static_cast<TInt*>(NULL));
|
sl@0
|
246 |
TInt FlushL(MUnicodeSink& aOutput,TInt aMaxOutputWords,TInt& aOutputWords);
|
sl@0
|
247 |
static TInt ExpandedSizeL(CStoreReadStream& aInput,TInt aInputBytes);
|
sl@0
|
248 |
static TInt ExpandedSizeL(const TUint8* aInput,TInt aInputBytes);
|
sl@0
|
249 |
|
sl@0
|
250 |
private:
|
sl@0
|
251 |
void DoExpandL(MUnicodeSink* aOutput,CStoreReadStream* aInputStream,const TUint8* aInputPointer,
|
sl@0
|
252 |
TInt aMaxOutputWords,TInt aMaxInputBytes,
|
sl@0
|
253 |
TInt* aOutputWords,TInt* aInputBytes);
|
sl@0
|
254 |
void HandleByteL();
|
sl@0
|
255 |
void FlushOutputBufferL();
|
sl@0
|
256 |
TBool HandleSByteL(TUint8 aByte);
|
sl@0
|
257 |
TBool HandleUByteL(TUint8 aByte);
|
sl@0
|
258 |
TBool ReadByteL(TUint8& aByte);
|
sl@0
|
259 |
TBool QuoteUnicodeL();
|
sl@0
|
260 |
TBool DefineWindowL(TInt aIndex);
|
sl@0
|
261 |
TBool DefineExpansionWindowL();
|
sl@0
|
262 |
void WriteChar(TText aChar);
|
sl@0
|
263 |
void WriteChar32(TUint aChar);
|
sl@0
|
264 |
|
sl@0
|
265 |
enum
|
sl@0
|
266 |
{
|
sl@0
|
267 |
EMaxInputBufferSize = 3, // no Unicode character can be encoded as more than 3 bytes
|
sl@0
|
268 |
EMaxOutputBufferSize = 2 // no byte can be expanded into more than 2 Unicode characters
|
sl@0
|
269 |
};
|
sl@0
|
270 |
TUint8 iInputBuffer[EMaxInputBufferSize]; // buffer containing a group of compressed bytes representing
|
sl@0
|
271 |
// a single operation; when an input source ends in the
|
sl@0
|
272 |
// middle of an operation, this buffer enables the next
|
sl@0
|
273 |
// expansion to start in the correct state
|
sl@0
|
274 |
TInt iInputBufferStart; // next read position in the input buffer
|
sl@0
|
275 |
TInt iInputBufferSize; // bytes in the input buffer
|
sl@0
|
276 |
TUint16 iOutputBuffer[EMaxOutputBufferSize]; // circular buffer; queue of Unicode characters to be output
|
sl@0
|
277 |
TInt iOutputBufferStart; // position of first Unicode character to be output
|
sl@0
|
278 |
TInt iOutputBufferSize; // characters in the output buffer
|
sl@0
|
279 |
MUnicodeSink* iOutput; // output object
|
sl@0
|
280 |
CStoreReadStream* iInputStream; // if non-null, input is from this stream
|
sl@0
|
281 |
const TUint8* iInputPointer; // if non-null, input is from memory
|
sl@0
|
282 |
};
|
sl@0
|
283 |
|
sl@0
|
284 |
// inline functions start here
|
sl@0
|
285 |
|
sl@0
|
286 |
inline TMemoryUnicodeSource::TMemoryUnicodeSource(const TUint16* aPtr):
|
sl@0
|
287 |
iPtr(aPtr)
|
sl@0
|
288 |
{
|
sl@0
|
289 |
}
|
sl@0
|
290 |
|
sl@0
|
291 |
inline TUint16 TMemoryUnicodeSource::ReadUnicodeValueL()
|
sl@0
|
292 |
{
|
sl@0
|
293 |
return *iPtr++;
|
sl@0
|
294 |
}
|
sl@0
|
295 |
|
sl@0
|
296 |
inline TMemoryStreamUnicodeSource::TMemoryStreamUnicodeSource(CStoreReadStream& aStream):
|
sl@0
|
297 |
iStream(aStream)
|
sl@0
|
298 |
{
|
sl@0
|
299 |
}
|
sl@0
|
300 |
|
sl@0
|
301 |
inline TUint16 TMemoryStreamUnicodeSource::ReadUnicodeValueL()
|
sl@0
|
302 |
{
|
sl@0
|
303 |
TUint16 x;
|
sl@0
|
304 |
iStream.Read(reinterpret_cast<TUint8*>(&x),sizeof(TUint16));
|
sl@0
|
305 |
return x;
|
sl@0
|
306 |
}
|
sl@0
|
307 |
|
sl@0
|
308 |
inline TMemoryUnicodeSink::TMemoryUnicodeSink(TUint16* aPtr):
|
sl@0
|
309 |
iPtr(aPtr)
|
sl@0
|
310 |
{
|
sl@0
|
311 |
}
|
sl@0
|
312 |
|
sl@0
|
313 |
inline void TMemoryUnicodeSink::WriteUnicodeValueL(TUint16 aValue)
|
sl@0
|
314 |
{
|
sl@0
|
315 |
*iPtr++ = aValue;
|
sl@0
|
316 |
}
|
sl@0
|
317 |
|
sl@0
|
318 |
inline TMemoryStreamUnicodeSink::TMemoryStreamUnicodeSink(CStoreWriteStream& aStream):
|
sl@0
|
319 |
iStream(aStream)
|
sl@0
|
320 |
{
|
sl@0
|
321 |
}
|
sl@0
|
322 |
|
sl@0
|
323 |
inline void TMemoryStreamUnicodeSink::WriteUnicodeValueL(TUint16 aValue)
|
sl@0
|
324 |
{
|
sl@0
|
325 |
iStream.Write(reinterpret_cast<TUint8*>(&aValue),sizeof(TUint16));
|
sl@0
|
326 |
}
|
sl@0
|
327 |
|
sl@0
|
328 |
inline TUnicodeCompressor::TAction::TAction():
|
sl@0
|
329 |
iCode(0),
|
sl@0
|
330 |
iTreatment(EPlainUnicode)
|
sl@0
|
331 |
{
|
sl@0
|
332 |
}
|
sl@0
|
333 |
}
|
sl@0
|
334 |
#endif // !defined(__UNICODECOMPRESSION_H__)
|