Update contrib.
1 // Copyright (c) 2007-2009 Nokia Corporation and/or its subsidiary(-ies).
2 // All rights reserved.
3 // This component and the accompanying materials are made available
4 // under the terms of the License "Eclipse Public License v1.0"
5 // which accompanies this distribution, and is available
6 // at the URL "http://www.eclipse.org/legal/epl-v10.html".
8 // Initial Contributors:
9 // Nokia Corporation - initial contribution.
14 // e32\include\byte_pair_compress.h
15 // This header file contains both the prototype and implementation for the byte pair compressor.
16 // This is done to facilitate sharing the code between the e32 test code and the tools. The
17 // implementation is only included if the macro BYTE_PAIR_COMPRESS_INCLUDE_IMPLEMENTATION is
20 // WARNING: This file contains some APIs which are internal and are subject
21 // to change without notice. Such APIs should therefore not be used
22 // outside the Kernel and Hardware Services package.
25 #ifndef __BYTE_PAIR_COMPRESS_H__
26 #define __BYTE_PAIR_COMPRESS_H__
33 * Compress up to 4096 bytes of data usign the byte-pair compression algorithm.
35 * @param aDest Destination buffer, must be at least four times the size of the source data.
36 * @param aSrc Source data to compress.
37 * @param aSize The size of the source data.
39 extern TInt BytePairCompress(TUint8* aDest, TUint8* aSrc, TInt aSize);
41 #ifdef BYTE_PAIR_COMPRESS_INCLUDE_IMPLEMENTATION
43 const TInt BlockSize = 0x1000;
46 TUint16 PairCount[0x10000];
47 TUint16 PairBuffer[BlockSize*2];
49 TUint16 GlobalPairs[0x10000] = {0};
50 TUint16 GlobalTokenCounts[0x100] = {0};
52 TUint16 ByteCount[0x100+4];
54 void CountBytes(TUint8* data, TInt size)
56 memset(ByteCount,0,sizeof(ByteCount));
57 TUint8* dataEnd = data+size;
62 inline void ByteUsed(TInt b)
64 ByteCount[b] = 0xffff;
67 int TieBreak(int b1,int b2)
69 return -ByteCount[b1]-ByteCount[b2];
72 TInt MostCommonPair(TInt& pair, TUint8* data, TInt size, TInt minFrequency, TInt marker)
74 memset(PairCount,0,sizeof(PairCount));
75 TUint8* dataEnd = data+size-1;
83 // skip marker and following byte
91 // skip marker and following byte
99 // ensure a pair of identical bytes don't get double counted
105 if(PairCount[p]==minFrequency)
106 PairBuffer[pairsFound++] = (TUint16)p;
111 TInt bestTieBreak = 0;
115 p = PairBuffer[pairsFound];
121 bestTieBreak = TieBreak(p&0xff,p>>8);
123 else if(f==bestCount)
125 TInt tieBreak = TieBreak(p&0xff,p>>8);
126 if(tieBreak>bestTieBreak)
130 bestTieBreak = tieBreak;
138 TInt LeastCommonByte(TInt& byte)
140 TInt bestCount = 0xffff;
142 for(TInt b = 0; b<0x100; b++)
144 TInt f = ByteCount[b];
155 TInt BytePairCompress(TUint8* dst, TUint8* src, TInt size)
157 TInt originalSize = size;
158 TUint8* dst2 = dst+size*2;
162 TUint8 tokens[0x100*3];
168 TInt overhead = 1+3+LeastCommonByte(marker);
171 TUint8* inEnd = in+size;
172 TUint8* outStart = out;
186 for(TInt r=256; r>0; --r)
189 TInt byteCount = LeastCommonByte(byte);
191 TInt pairCount = MostCommonPair(pair,in,size,overhead+1,marker);
192 TInt saving = pairCount-byteCount;
200 TUint8* d=tokens+3*tokenCount;
206 *d++ = (TUint8)(pair>>8);
217 *out++ = (TUint8)marker;
222 *out++ = (TUint8)marker;
225 else if(b==(pair&0xff) && in<inEnd && *in==(pair>>8))
250 // sort tokens with a bubble sort...
251 for(TInt x=0; x<tokenCount-1; x++)
252 for(TInt y=x+1; y<tokenCount; y++)
253 if(tokens[x*3]>tokens[y*3])
255 TInt z = tokens[x*3];
256 tokens[x*3] = tokens[y*3];
257 tokens[y*3] = (TUint8)z;
259 tokens[x*3+1] = tokens[y*3+1];
260 tokens[y*3+1] = (TUint8)z;
262 tokens[x*3+2] = tokens[y*3+2];
263 tokens[y*3+2] = (TUint8)z;
266 // check for not being able to compress...
267 if(size>originalSize)
269 *dst++ = 0; // store zero token count
270 memcpy(dst,src,originalSize); // store original data
271 return originalSize+1;
274 // make sure data is in second buffer (dst2)
276 memcpy(dst2,dst,size);
279 TUint8* originalDst = dst;
280 *dst++ = (TUint8)tokenCount;
283 *dst++ = (TUint8)marker;
286 memcpy(dst,tokens,tokenCount*3);
291 TUint8* bitMask = dst;
292 memset(bitMask,0,32);
298 bitMask[t>>3] |= (1<<(t&7));
306 memcpy(dst,dst2,size);
310 ++GlobalTokenCounts[tokenCount];
312 // return total size of compressed data...
313 return dst-originalDst;