os/persistentdata/persistentstorage/store/pcstore/src/unicodecompression.h
author sl
Tue, 10 Jun 2014 14:32:02 +0200
changeset 1 260cb5ec6c19
permissions -rw-r--r--
Update contrib.
sl@0
     1
// Copyright (c) 2006-2009 Nokia Corporation and/or its subsidiary(-ies).
sl@0
     2
// All rights reserved.
sl@0
     3
// This component and the accompanying materials are made available
sl@0
     4
// under the terms of "Eclipse Public License v1.0"
sl@0
     5
// which accompanies this distribution, and is available
sl@0
     6
// at the URL "http://www.eclipse.org/legal/epl-v10.html".
sl@0
     7
//
sl@0
     8
// Initial Contributors:
sl@0
     9
// Nokia Corporation - initial contribution.
sl@0
    10
//
sl@0
    11
// Contributors:
sl@0
    12
//
sl@0
    13
// Description:
sl@0
    14
// Classes defined in this file are used for Unicode compression and decompression.
sl@0
    15
// Their code is borrowed from Symbian, only with some changes such as the "Panic" function 
sl@0
    16
// is changed to exit the program. The Symbian coding standard will be kept in the code.
sl@0
    17
// 
sl@0
    18
//
sl@0
    19
sl@0
    20
sl@0
    21
#if !defined(__UNICODECOMPRESSION_H__)
sl@0
    22
#define __UNICODECOMPRESSION_H__
sl@0
    23
sl@0
    24
#include <stdio.h>
sl@0
    25
#include <pcstore/pcstoredef.h>
sl@0
    26
#include <pcstore/storereadstream.h>
sl@0
    27
#include <pcstore/storewritestream.h>
sl@0
    28
#include "pcstoreconst.h"
sl@0
    29
sl@0
    30
namespace PCStore
sl@0
    31
{
sl@0
    32
/**
sl@0
    33
@internalComponent
sl@0
    34
*/
sl@0
    35
class TUnicodeCompressionState
sl@0
    36
    {
sl@0
    37
    public:
sl@0
    38
    TUnicodeCompressionState();
sl@0
    39
    void Reset();
sl@0
    40
    static TInt StaticWindowIndex(TUint16 aCode);
sl@0
    41
    static TInt DynamicWindowOffsetIndex(TUint16 aCode);
sl@0
    42
    static TUint32 DynamicWindowBase(TInt aOffsetIndex);
sl@0
    43
    static TBool EncodeAsIs(TUint16 aCode);
sl@0
    44
sl@0
    45
    enum TPanic
sl@0
    46
        {
sl@0
    47
        EUnhandledByte,         // expander code fails to handle all possible byte codes
sl@0
    48
        ENotUnicode,            // expander can't handle Unicode values outside range 0x0..0x10FFFF;
sl@0
    49
                                // that is, 16-bit codes plus 32-bit codes that can be expressed using
sl@0
    50
                                // 16-bit surrogates
sl@0
    51
        EOutputBufferOverflow   // output buffer is not big enough
sl@0
    52
        };
sl@0
    53
sl@0
    54
    static void Panic(TPanic aPanic);
sl@0
    55
sl@0
    56
    protected:
sl@0
    57
sl@0
    58
    enum
sl@0
    59
        {
sl@0
    60
        EStaticWindows = 8,
sl@0
    61
        EDynamicWindows = 8,
sl@0
    62
        ESpecialBases = 7
sl@0
    63
        };
sl@0
    64
sl@0
    65
    TBool iUnicodeMode;                                 // TRUE if in Unicode mode as opposed to single-byte mode
sl@0
    66
    TUint32 iActiveWindowBase;                          // base of the active window - bases are 32-bit because they
sl@0
    67
                                                        // can be set to the surrogate area, which represents codes
sl@0
    68
                                                        // from 0x00010000 to 0x0010FFFF - planes 1-16 of ISO-10646.
sl@0
    69
    static const TUint32 iStaticWindow[EStaticWindows]; // bases of the static windows
sl@0
    70
    static const TUint32 iDynamicWindowDefault[EDynamicWindows];    // default bases of the dynamic windows
sl@0
    71
    static const TUint16 iSpecialBase[ESpecialBases];   // bases for window offsets F9..FF
sl@0
    72
sl@0
    73
    TUint32 iDynamicWindow[EDynamicWindows];            // bases of the dynamic windows
sl@0
    74
    TInt iUnicodeWords;                                 // Unicode words processed; read by compressor, written by expander
sl@0
    75
    TInt iMaxUnicodeWords;                              // maximum number of Unicode words to read or write
sl@0
    76
    TInt iCompressedBytes;                              // compressed bytes processed: read by expander, written by compressor
sl@0
    77
    TInt iMaxCompressedBytes;                           // maximum number of compressed bytes to read or write
sl@0
    78
    };
sl@0
    79
sl@0
    80
/**
sl@0
    81
@internalComponent
sl@0
    82
*/
sl@0
    83
class MUnicodeSource
sl@0
    84
    {
sl@0
    85
    public:
sl@0
    86
    virtual TUint16 ReadUnicodeValueL() = 0;
sl@0
    87
    };
sl@0
    88
sl@0
    89
/**
sl@0
    90
@internalComponent
sl@0
    91
sl@0
    92
A class to read Unicode values directly from memory.
sl@0
    93
*/
sl@0
    94
class TMemoryUnicodeSource: public MUnicodeSource
sl@0
    95
    {
sl@0
    96
    public:
sl@0
    97
    inline TMemoryUnicodeSource(const TUint16* aPtr);
sl@0
    98
    inline TUint16 ReadUnicodeValueL();
sl@0
    99
sl@0
   100
    private:
sl@0
   101
    const TUint16* iPtr;
sl@0
   102
    };
sl@0
   103
sl@0
   104
/**
sl@0
   105
@internalComponent
sl@0
   106
 
sl@0
   107
A class to read Unicode values from a stream built on a memory object.
sl@0
   108
*/
sl@0
   109
class TMemoryStreamUnicodeSource: public MUnicodeSource
sl@0
   110
    {
sl@0
   111
    public:
sl@0
   112
    inline TMemoryStreamUnicodeSource(CStoreReadStream& aStream);
sl@0
   113
    inline TUint16 ReadUnicodeValueL();
sl@0
   114
sl@0
   115
    private:
sl@0
   116
    CStoreReadStream& iStream;
sl@0
   117
    };
sl@0
   118
sl@0
   119
/**
sl@0
   120
@internalComponent
sl@0
   121
 
sl@0
   122
*/
sl@0
   123
class MUnicodeSink
sl@0
   124
    {
sl@0
   125
    public:
sl@0
   126
    virtual void WriteUnicodeValueL(TUint16 aValue) = 0;
sl@0
   127
    };
sl@0
   128
sl@0
   129
/**
sl@0
   130
@internalComponent
sl@0
   131
sl@0
   132
A class to write Unicode values directly to memory.
sl@0
   133
*/
sl@0
   134
class TMemoryUnicodeSink: public MUnicodeSink
sl@0
   135
    {
sl@0
   136
    public:
sl@0
   137
    inline TMemoryUnicodeSink(TUint16* aPtr);
sl@0
   138
    inline void WriteUnicodeValueL(TUint16 aValue);
sl@0
   139
sl@0
   140
    private:
sl@0
   141
    TUint16* iPtr;
sl@0
   142
    };
sl@0
   143
sl@0
   144
/**
sl@0
   145
@internalComponent
sl@0
   146
sl@0
   147
A class to write Unicode values to a stream built on a memory object.
sl@0
   148
*/
sl@0
   149
class TMemoryStreamUnicodeSink: public MUnicodeSink
sl@0
   150
    {
sl@0
   151
    public:
sl@0
   152
    inline TMemoryStreamUnicodeSink(CStoreWriteStream& aStream);
sl@0
   153
    inline void WriteUnicodeValueL(TUint16 aValue);
sl@0
   154
sl@0
   155
    private:
sl@0
   156
    CStoreWriteStream& iStream;
sl@0
   157
    };
sl@0
   158
sl@0
   159
/**
sl@0
   160
@internalComponent
sl@0
   161
 
sl@0
   162
A class to hold functions to compress text using the Standard Compression Scheme for Unicode.
sl@0
   163
*/
sl@0
   164
class TUnicodeCompressor: public TUnicodeCompressionState
sl@0
   165
    {
sl@0
   166
    public:
sl@0
   167
    TUnicodeCompressor();
sl@0
   168
    void CompressL(CStoreWriteStream& aOutput,MUnicodeSource& aInput,
sl@0
   169
                            TInt aMaxOutputBytes = KMaxTInt,TInt aMaxInputWords = KMaxTInt,
sl@0
   170
                            TInt* aOutputBytes = static_cast<TInt*>(NULL),TInt* aInputWords = static_cast<TInt*>(NULL));
sl@0
   171
    void CompressL(TUint8* aOutput,MUnicodeSource& aInput,
sl@0
   172
                            TInt aMaxOutputBytes = KMaxTInt,TInt aMaxInputWords = KMaxTInt,
sl@0
   173
                            TInt* aOutputBytes = static_cast<TInt*>(NULL),TInt* aInputWords = static_cast<TInt*>(NULL));
sl@0
   174
    TInt FlushL(CStoreWriteStream& aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes);
sl@0
   175
    TInt FlushL(TUint8* aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes);
sl@0
   176
    static TInt CompressedSizeL(MUnicodeSource& aInput,TInt aInputWords);
sl@0
   177
sl@0
   178
    private:
sl@0
   179
sl@0
   180
     // A structure to store a character and its treatment code
sl@0
   181
    struct TAction
sl@0
   182
        {
sl@0
   183
        // Treatment codes: static and dynamic window numbers, plain ASCII or plain Unicode
sl@0
   184
        enum
sl@0
   185
            {
sl@0
   186
            EPlainUnicode = -2, // character cannot be expressed as ASCII or using static or dynamic windows
sl@0
   187
            EPlainASCII = -1,   // character can be emitted as an ASCII code
sl@0
   188
            EFirstDynamic = 0,  // values 0..255 are for dynamic windows with offsets at these places in the offset table
sl@0
   189
            ELastDynamic = 255,
sl@0
   190
            EFirstStatic = 256, // values 256..263 are for static windows 0..7
sl@0
   191
            ELastStatic = 263
sl@0
   192
            };
sl@0
   193
sl@0
   194
        inline TAction();
sl@0
   195
        TAction(TUint16 aCode);
sl@0
   196
sl@0
   197
        TUint16 iCode;      // Unicode value of the character
sl@0
   198
        TInt iTreatment;    // treatment code: see above
sl@0
   199
        };
sl@0
   200
sl@0
   201
    void DoCompressL(CStoreWriteStream* aOutputStream,TUint8* aOutputPointer,MUnicodeSource* aInput,
sl@0
   202
                     TInt aMaxCompressedBytes,TInt aMaxUnicodeWords,
sl@0
   203
                     TInt* aCompressedBytes,TInt* aUnicodeWords);
sl@0
   204
    void FlushInputBufferL();
sl@0
   205
    void FlushOutputBufferL();
sl@0
   206
    void WriteRunL();
sl@0
   207
    void WriteCharacter(const TAction& aAction);
sl@0
   208
    void WriteSCharacter(const TAction& aAction);
sl@0
   209
    void WriteUCharacter(TUint16 aCode);
sl@0
   210
    void WriteByte(TUint aByte);
sl@0
   211
    void WriteCharacterFromBuffer();
sl@0
   212
    void SelectTreatment(TInt aTreatment);
sl@0
   213
sl@0
   214
    enum
sl@0
   215
        {
sl@0
   216
        EMaxInputBufferSize = 4,
sl@0
   217
        EMaxOutputBufferSize = EMaxInputBufferSize * 3  // no Unicode character can be encoded as more than three bytes
sl@0
   218
        };
sl@0
   219
    TAction iInputBuffer[EMaxInputBufferSize];          // circular buffer; queue of Unicode characters to be processed
sl@0
   220
    TInt iInputBufferStart;                             // position of first Unicode character to be processed
sl@0
   221
    TInt iInputBufferSize;                              // characters in the input buffer
sl@0
   222
    TUint8 iOutputBuffer[EMaxOutputBufferSize];         // circular buffer; queue of compressed bytes to be output
sl@0
   223
    TInt iOutputBufferStart;                            // position of first compressed byte to be output
sl@0
   224
    TInt iOutputBufferSize;                             // characters in the output buffer
sl@0
   225
    TInt iDynamicWindowIndex;                           // index of the current dynamic window
sl@0
   226
    CStoreWriteStream* iOutputStream;                        // if non-null, output is to this stream
sl@0
   227
    TUint8* iOutputPointer;                             // if non-null, output is to memory
sl@0
   228
    MUnicodeSource* iInput;                             // input object
sl@0
   229
    };
sl@0
   230
sl@0
   231
/**
sl@0
   232
@internalComponent
sl@0
   233
sl@0
   234
A class to hold functions to expand text using the Standard Compression Scheme for Unicode.
sl@0
   235
*/
sl@0
   236
class TUnicodeExpander: public TUnicodeCompressionState
sl@0
   237
    {
sl@0
   238
    public:
sl@0
   239
    TUnicodeExpander();
sl@0
   240
    void ExpandL(MUnicodeSink& aOutput,CStoreReadStream& aInput,
sl@0
   241
                          TInt aMaxOutputWords = KMaxTInt,TInt aMaxInputBytes = KMaxTInt,
sl@0
   242
                          TInt* aOutputWords = static_cast<TInt*>(NULL),TInt* aInputBytes = static_cast<TInt*>(NULL));
sl@0
   243
    void ExpandL(MUnicodeSink& aOutput,const TUint8* aInput,
sl@0
   244
                          TInt aMaxOutputWords = KMaxTInt,TInt aMaxInputBytes = KMaxTInt,
sl@0
   245
                          TInt* aOutputWords = static_cast<TInt*>(NULL),TInt* aInputBytes = static_cast<TInt*>(NULL));
sl@0
   246
    TInt FlushL(MUnicodeSink& aOutput,TInt aMaxOutputWords,TInt& aOutputWords);
sl@0
   247
    static TInt ExpandedSizeL(CStoreReadStream& aInput,TInt aInputBytes);
sl@0
   248
    static TInt ExpandedSizeL(const TUint8* aInput,TInt aInputBytes);
sl@0
   249
sl@0
   250
    private:
sl@0
   251
    void DoExpandL(MUnicodeSink* aOutput,CStoreReadStream* aInputStream,const TUint8* aInputPointer,
sl@0
   252
                   TInt aMaxOutputWords,TInt aMaxInputBytes,
sl@0
   253
                   TInt* aOutputWords,TInt* aInputBytes);
sl@0
   254
    void HandleByteL();
sl@0
   255
    void FlushOutputBufferL();
sl@0
   256
    TBool HandleSByteL(TUint8 aByte);
sl@0
   257
    TBool HandleUByteL(TUint8 aByte);
sl@0
   258
    TBool ReadByteL(TUint8& aByte);
sl@0
   259
    TBool QuoteUnicodeL();
sl@0
   260
    TBool DefineWindowL(TInt aIndex);
sl@0
   261
    TBool DefineExpansionWindowL();
sl@0
   262
    void WriteChar(TText aChar);
sl@0
   263
    void WriteChar32(TUint aChar);
sl@0
   264
sl@0
   265
    enum
sl@0
   266
        {
sl@0
   267
        EMaxInputBufferSize = 3,                        // no Unicode character can be encoded as more than 3 bytes
sl@0
   268
        EMaxOutputBufferSize = 2                        // no byte can be expanded into more than 2 Unicode characters
sl@0
   269
        };
sl@0
   270
    TUint8 iInputBuffer[EMaxInputBufferSize];           // buffer containing a group of compressed bytes representing
sl@0
   271
                                                        // a single operation; when an input source ends in the
sl@0
   272
                                                        // middle of an operation, this buffer enables the next
sl@0
   273
                                                        // expansion to start in the correct state
sl@0
   274
    TInt iInputBufferStart;                             // next read position in the input buffer
sl@0
   275
    TInt iInputBufferSize;                              // bytes in the input buffer
sl@0
   276
    TUint16 iOutputBuffer[EMaxOutputBufferSize];        // circular buffer; queue of Unicode characters to be output
sl@0
   277
    TInt iOutputBufferStart;                            // position of first Unicode character to be output
sl@0
   278
    TInt iOutputBufferSize;                             // characters in the output buffer
sl@0
   279
    MUnicodeSink* iOutput;                              // output object
sl@0
   280
    CStoreReadStream* iInputStream;                          // if non-null, input is from this stream
sl@0
   281
    const TUint8* iInputPointer;                        // if non-null, input is from memory
sl@0
   282
    };
sl@0
   283
sl@0
   284
// inline functions start here
sl@0
   285
sl@0
   286
inline TMemoryUnicodeSource::TMemoryUnicodeSource(const TUint16* aPtr):
sl@0
   287
    iPtr(aPtr)
sl@0
   288
    {
sl@0
   289
    }
sl@0
   290
sl@0
   291
inline TUint16 TMemoryUnicodeSource::ReadUnicodeValueL()
sl@0
   292
    {
sl@0
   293
    return *iPtr++;
sl@0
   294
    }
sl@0
   295
sl@0
   296
inline TMemoryStreamUnicodeSource::TMemoryStreamUnicodeSource(CStoreReadStream& aStream):
sl@0
   297
    iStream(aStream)
sl@0
   298
    {
sl@0
   299
    }
sl@0
   300
sl@0
   301
inline TUint16 TMemoryStreamUnicodeSource::ReadUnicodeValueL()
sl@0
   302
    {
sl@0
   303
    TUint16 x;
sl@0
   304
    iStream.Read(reinterpret_cast<TUint8*>(&x),sizeof(TUint16));
sl@0
   305
    return x;
sl@0
   306
    }
sl@0
   307
sl@0
   308
inline TMemoryUnicodeSink::TMemoryUnicodeSink(TUint16* aPtr):
sl@0
   309
    iPtr(aPtr)
sl@0
   310
    {
sl@0
   311
    }
sl@0
   312
sl@0
   313
inline void TMemoryUnicodeSink::WriteUnicodeValueL(TUint16 aValue)
sl@0
   314
    {
sl@0
   315
    *iPtr++ = aValue;
sl@0
   316
    }
sl@0
   317
sl@0
   318
inline TMemoryStreamUnicodeSink::TMemoryStreamUnicodeSink(CStoreWriteStream& aStream):
sl@0
   319
    iStream(aStream)
sl@0
   320
    {
sl@0
   321
    }
sl@0
   322
sl@0
   323
inline void TMemoryStreamUnicodeSink::WriteUnicodeValueL(TUint16 aValue)
sl@0
   324
    {
sl@0
   325
    iStream.Write(reinterpret_cast<TUint8*>(&aValue),sizeof(TUint16));
sl@0
   326
    }
sl@0
   327
sl@0
   328
inline TUnicodeCompressor::TAction::TAction():
sl@0
   329
    iCode(0),
sl@0
   330
    iTreatment(EPlainUnicode)
sl@0
   331
    {
sl@0
   332
    }
sl@0
   333
}
sl@0
   334
#endif // !defined(__UNICODECOMPRESSION_H__)