Update contrib.
1 // Copyright (c) 1998-2009 Nokia Corporation and/or its subsidiary(-ies).
2 // All rights reserved.
3 // This component and the accompanying materials are made available
4 // under the terms of "Eclipse Public License v1.0"
5 // which accompanies this distribution, and is available
6 // at the URL "http://www.eclipse.org/legal/epl-v10.html".
8 // Initial Contributors:
9 // Nokia Corporation - initial contribution.
14 // Store database compression code
22 #define __EXTRA_DEFLATE
25 // deflation constants
26 const TInt KDeflateMinLength=3;
27 const TInt KDeflateMaxLength=258;
28 const TInt KDeflateMaxDistance=4096;
29 const TInt KDeflateDistCodeBase=0x200;
30 // huffman coding/decoding
31 const TInt KHuffMaxCodeLength=25;
32 const TInt KHuffTerminate=1;
33 const TUint KBitsEmpty=0x80000000u;
34 const TUint KBitsInit=KBitsEmpty>>1;
35 const TUint KBitsFull=KBitsEmpty>>8;
36 const TUint KBitsEOF=KBitsEmpty>>9;
37 const TUint KBitsNext=0x80u;
39 const TInt KDeflateMetaCodes=26;
41 const TUint KDeflateHashMultiplier=0xAC4B9B19u;
42 const TInt KDeflateHashShift=24;
47 static void EncodingL(TUint32* aEncoding,TInt aCodes);
48 static void Decoding(TUint32* aDecoding,TInt aCodes,TInt aBase=0);
50 typedef TUint16 THuff;
63 static void Lengths(TUint32* aLengths,const TNode* aNodes,TInt aNode,TInt aLen);
64 static TUint32* SubTree(TUint32* aPtr,const TUint32* aValue,TUint32** aLevel);
70 THuffEncoder(RWriteStream& aStream);
72 void EncodeL(TUint aCode,TInt aLength);
73 void EncodeL(TUint32 aHuffCode);
76 enum {EBufSize=0x100};
78 TUint8 iBuf[EBufSize];
79 RWriteStream& iStream;
80 TUint32 iCode; // code in production
88 inline static HDeflateHash& NewLC(TInt aLinks);
90 inline TInt First(const TUint8* aPtr,TInt aPos);
91 inline TInt Next(TInt aPos,TInt aOffset) const;
93 inline HDeflateHash();
94 inline static TInt Hash(const TUint8* aPtr);
96 typedef TUint16 TOffset;
99 TOffset iOffset[1]; // or more
105 void DeflateL(const TUint8* aBase,TInt aLength);
107 const TUint8* DoDeflateL(const TUint8* aBase,const TUint8* aEnd,HDeflateHash& aHash);
108 static TInt Match(const TUint8* aPtr,const TUint8* aEnd,TInt aPos,HDeflateHash& aHas);
109 void SegmentL(TInt aLength,TInt aDistance);
110 virtual void LitLenL(TInt aCode) =0;
111 virtual void OffsetL(TInt aCode) =0;
112 virtual void ExtraL(TInt aLen,TUint aBits) =0;
118 TInflater(const TUint8* aIn,const CDbStoreCompression::TEncoding& aDecoding);
120 inline const TUint8* Ptr() const;
121 inline static TInt BufferSize();
125 const TUint8* iRptr; // partial segment
127 const TUint32* iLitLenTree;
128 const TUint32* iDistTree;
129 TUint8 iOut[KDeflateMaxDistance]; // circular buffer for distance matches
132 NONSHARABLE_CLASS(TDeflateStats) : public MDeflater
135 inline TDeflateStats(CDbStoreCompression::TEncoding& aEncoding);
138 void LitLenL(TInt aCode);
139 void OffsetL(TInt aCode);
140 void ExtraL(TInt aLen,TUint aBits);
142 CDbStoreCompression::TEncoding& iEncoding;
145 NONSHARABLE_CLASS(TDeflater) : public MDeflater
148 inline TDeflater(THuffEncoder& aEncoder,const CDbStoreCompression::TEncoding& aEncoding);
151 void LitLenL(TInt aCode);
152 void OffsetL(TInt aCode);
153 void ExtraL(TInt aLen,TUint aBits);
155 THuffEncoder& iEncoder;
156 const CDbStoreCompression::TEncoding& iEncoding;
159 NONSHARABLE_CLASS(HDeflateBuf) : public TBufBuf
162 enum TMode {EAnalysis,EDeflate}; // mirror CDbStoreCompression enum
164 static HDeflateBuf* NewL(MStreamBuf* aHost,CDbStoreCompression::TEncoding& aEncoding,TMode aMode);
166 inline HDeflateBuf(MStreamBuf* aHost,CDbStoreCompression::TEncoding& aEncoding,CBufBase* aBuf,TMode aMode);
167 virtual inline ~HDeflateBuf();
173 CDbStoreCompression::TEncoding& iEncoding;
178 NONSHARABLE_CLASS(HInflateBuf) : public TBufBuf
181 static HInflateBuf* NewL(MStreamBuf* aHost,const CDbStoreCompression::TEncoding& aEncoding);
183 inline HInflateBuf(CBufBase* aBuf);
184 virtual inline ~HInflateBuf();
191 NONSHARABLE_CLASS(CDbStoreTable::CCompressor) : public CBase, public CCluster::MAlter
194 inline CCompressor();
196 void ProcessL(CDbStoreTable* aTable);
198 TUint8* AlterRecordL(TUint8* aWPtr,const TUint8* aRPtr,TInt aLength);
200 CDbStoreTable* iTable;
206 // This class builds a huffman encoding from a frequency table and builds
207 // a decoding tree from a code-lengths table
209 // the encoding generated is based on the rule that given two symbols s1 and s2, with
210 // code length l1 and l2, and huffman codes h1 and h2:
212 // if l1<l2 then h1<h2 when compared lexicographically
213 // if l1==l2 and s1<s2 then h1<h2 ditto
215 // This allows the encoding to be stored compactly as a table of code lengths
218 // recursive function to calculate the code lengths from the node tree
220 void Huffman::Lengths(TUint32* aLengths,const TNode* aNodes,TInt aNode,TInt aLen)
222 __ASSERT(aLen<KHuffMaxCodeLength);
224 const TNode& node=aNodes[aNode];
225 if (node.iLeft&KLeaf)
226 aLengths[node.iLeft&~KLeaf]=aLen;
228 Lengths(aLengths,aNodes,node.iLeft,aLen);
229 if (node.iRight&KLeaf)
230 aLengths[node.iRight&~KLeaf]=aLen;
232 Lengths(aLengths,aNodes,node.iRight,aLen);
236 // write the subtree below aPtr and return the head
238 TUint32* Huffman::SubTree(TUint32* aPtr,const TUint32* aValue,TUint32** aLevel)
240 TUint32* l=*aLevel++;
243 TUint32* sub1=SubTree(aPtr,aValue,aLevel); // 0-tree first
244 aPtr=SubTree(sub1,aValue-(aPtr-sub1)-1,aLevel); // 1-tree
245 TInt branch=(TUint8*)sub1-(TUint8*)aPtr;
250 TUint term0=*aValue--; // 0-term
251 aPtr=SubTree(aPtr,aValue,aLevel); // 1-tree
256 TUint term0=*aValue--; // 0-term
257 TUint term1=*aValue--;
258 *--aPtr=(term1>>16<<16)|(term0>>16);
264 // Build a huffman encoding table from a symbol frequency table
265 // aTable contains frequency data on input for aCodes symbols
266 // aTable contains the huffman encoding on output
268 void Huffman::EncodingL(TUint32* aTable,TInt aCodes)
271 // step 1. Sort the values into decreasing order of frequency
273 TLeaf* leaves=new(ELeave) TLeaf[aCodes];
274 CleanupArrayDeletePushL(leaves);
277 for (ii=0;ii<aCodes;++ii)
281 continue; // no coding for ii
283 for (jj=0;jj<lCount;++jj)
285 if (leaves[jj].iCount<=c)
288 Mem::Move(leaves+jj+1,leaves+jj,sizeof(TLeaf)*(lCount-jj));
290 leaves[jj].iVal=THuff(ii|KLeaf);
294 // Huffman algorithm: pair off least frequent nodes and reorder
295 // result is the code lengths in aTable[]
297 if (lCount==1) // special case for a single value (always encode as "0")
298 aTable[leaves[0].iVal&~KLeaf]=1;
300 { // don't encode for empty coding: leaves in order now
302 TNode* nodes=new(ELeave) TNode[lCount-1];
305 TNode& node=nodes[max];
306 node.iLeft=leaves[lCount-1].iVal;
307 node.iRight=leaves[lCount].iVal;
308 // re-order the leaves now to reflect new combined frequency
309 TUint c=leaves[lCount-1].iCount+leaves[lCount].iCount;
313 if (leaves[jj-1].iCount>=c)
316 Mem::Move(leaves+jj+1,leaves+jj,sizeof(TLeaf)*(lCount-1-jj));
319 leaves[jj].iVal=THuff(max);
322 Lengths(aTable,nodes,leaves[0].iVal,0);
325 CleanupStack::PopAndDestroy(); // leaves
327 // step 3: Generate the coding based on the code lengths
329 TInt lenCount[KHuffMaxCodeLength];
330 Mem::FillZ(lenCount,sizeof(lenCount));
332 for (ii=aCodes;--ii>=0;)
334 TInt len=aTable[ii]-1;
339 TUint nextCode[KHuffMaxCodeLength];
341 for (ii=0;ii<KHuffMaxCodeLength;++ii)
344 code=(code+lenCount[ii])<<1;
347 for (ii=0;ii<aCodes;++ii)
352 aTable[ii] = (nextCode[len-1]<<(KHuffMaxCodeLength-len))|(len<<KHuffMaxCodeLength);
359 // generate the decoding tree from the huffman code length data
360 // output alphabet is [aBase,aBase+aCodes)
362 void Huffman::Decoding(TUint32* aDecoding,TInt aCodes,TInt aBase)
364 TInt counts[KHuffMaxCodeLength];
365 Mem::FillZ(counts,sizeof(counts));
370 TUint len=aDecoding[ii];
371 __ASSERT(len<=(TUint)KHuffMaxCodeLength);
379 TUint32* level[KHuffMaxCodeLength];
380 TUint32* lit=aDecoding+codes;
381 for (ii=0;ii<KHuffMaxCodeLength;++ii)
386 aBase=(aBase<<17)+(KHuffTerminate<<16);
387 for (ii=0;ii<aCodes;++ii)
389 TUint len=TUint8(aDecoding[ii]);
391 *--level[len-1]|=(ii<<17)+aBase;
393 if (codes==1) // codes==1 special case: tree is not complete
394 *aDecoding>>=16; // 0-terminate at root
397 __DEBUG(TUint32* p=) SubTree(aDecoding+codes-1,aDecoding+codes-1,level);
398 __ASSERT(p==aDecoding);
402 // Class HDeflateHash
404 inline HDeflateHash::HDeflateHash()
405 {TInt* p=iHash+256;do *--p=-KDeflateMaxDistance-1; while (p>iHash);}
407 inline HDeflateHash& HDeflateHash::NewLC(TInt aLinks)
409 __ASSERT(!(KDeflateMaxDistance&(KDeflateMaxDistance-1))); // ensure power of two
410 return *new(User::AllocLC(_FOFF(HDeflateHash,iOffset[Min(aLinks,KDeflateMaxDistance)]))) HDeflateHash;
413 inline TInt HDeflateHash::Hash(const TUint8* aPtr)
415 TUint x=aPtr[0]|(aPtr[1]<<8)|(aPtr[2]<<16);
416 return (x*KDeflateHashMultiplier)>>KDeflateHashShift;
419 inline TInt HDeflateHash::First(const TUint8* aPtr,TInt aPos)
422 TInt offset=Min(aPos-iHash[h],KDeflateMaxDistance<<1);
424 iOffset[aPos&(KDeflateMaxDistance-1)]=TOffset(offset);
428 inline TInt HDeflateHash::Next(TInt aPos,TInt aOffset) const
429 {return aOffset+iOffset[(aPos-aOffset)&(KDeflateMaxDistance-1)];}
434 // generic deflation algorithm, can do either statistics and the encoder
436 TInt MDeflater::Match(const TUint8* aPtr,const TUint8* aEnd,TInt aPos,HDeflateHash& aHash)
438 TInt offset=aHash.First(aPtr,aPos);
439 if (offset>KDeflateMaxDistance)
442 aEnd=Min(aEnd,aPtr+KDeflateMaxLength);
446 const TUint8* p=aPtr-offset;
448 { // might be a better match
449 const TUint8* m=aPtr;
456 return ((m-aPtr)<<16)|offset;
461 match=(l<<16)|offset;
465 offset=aHash.Next(aPos,offset);
466 } while (offset<=KDeflateMaxDistance);
471 // Apply the deflation algorithm to the data [aBase,aEnd)
472 // Return a pointer after the last byte that was deflated (which may not be aEnd)
474 const TUint8* MDeflater::DoDeflateL(const TUint8* aBase,const TUint8* aEnd,HDeflateHash& aHash)
476 __ASSERT(aEnd-aBase>KDeflateMinLength);
478 const TUint8* ptr=aBase;
479 #ifdef __EXTRA_DEFLATE
480 TInt prev=0; // the previous deflation match
484 TInt match=Match(ptr,aEnd,ptr-aBase,aHash);
485 #ifdef __EXTRA_DEFLATE
486 // Extra deflation applies two optimisations which double the time taken
487 // 1. If we have a match at p, then test for a better match at p+1 before using it
488 // 2. When we have a match, add the hash links for all the data which will be skipped
489 if (match>>16 < prev>>16)
490 { // use the previous match--it was better
492 SegmentL(len,prev-(len<<16));
493 // fill in missing hash entries for better compression
494 const TUint8* e=ptr+len-2;
498 aHash.First(ptr,ptr-aBase);
502 else if (match<=(KDeflateMinLength<<16))
503 LitLenL(*ptr); // no deflation match here
505 { // save this match and test the next position
506 if (prev) // we had a match at ptr-1, but this is better
512 // Basic deflation will store any match found, and not update the hash links for the
513 // data which is skipped
514 if (match<=(KDeflateMinLength<<16)) // no match
519 SegmentL(len,match-(len<<16));
523 } while (ptr+KDeflateMinLength-1<aEnd);
524 #ifdef __EXTRA_DEFLATE
526 { // emit the stored match
528 SegmentL(len,prev-(len<<16));
536 // The generic deflation algorithm
538 void MDeflater::DeflateL(const TUint8* aBase,TInt aLength)
540 const TUint8* end=aBase+aLength;
541 if (aLength>KDeflateMinLength)
542 { // deflation kicks in if there is enough data
543 HDeflateHash& hash=HDeflateHash::NewLC(aLength);
544 aBase=DoDeflateL(aBase,end,hash);
545 CleanupStack::PopAndDestroy();
547 while (aBase<end) // emit remaining bytes
549 LitLenL(CDbStoreCompression::TEncoding::EEos); // eos marker
553 // Turn a (length,offset) pair into the deflation codes+extra bits before calling
554 // the specific LitLen(), Offset() and Extra() functions.
556 void MDeflater::SegmentL(TInt aLength,TInt aDistance)
558 __ASSERT(aLength>=KDeflateMinLength && aLength<=KDeflateMaxLength);
559 aLength-=KDeflateMinLength;
567 __ASSERT((extralen<<2)+len<CDbStoreCompression::TEncoding::ELengths);
568 LitLenL((extralen<<2)+len+CDbStoreCompression::TEncoding::ELiterals);
570 ExtraL(extralen,TUint(aLength)<<(32-extralen));
572 __ASSERT(aDistance>0 && aDistance<=KDeflateMaxDistance);
575 TUint dist=aDistance;
581 __ASSERT((extralen<<2)+dist<CDbStoreCompression::TEncoding::EDistances);
582 OffsetL((extralen<<2)+dist);
584 ExtraL(extralen,TUint(aDistance)<<(32-extralen));
587 // Class TDeflateStats
589 // This class analyses the data stream to generate the frequency tables
590 // for the deflation algorithm
592 inline TDeflateStats::TDeflateStats(CDbStoreCompression::TEncoding& aEncoding)
593 :iEncoding(aEncoding)
596 void TDeflateStats::LitLenL(TInt aCode)
598 ++iEncoding.iLitLen[aCode];
601 void TDeflateStats::OffsetL(TInt aCode)
603 ++iEncoding.iDistance[aCode];
606 void TDeflateStats::ExtraL(TInt,TUint)
609 // Class THuffEncoder
611 // This class generates the byte stream of huffman codes, writing them out to the stream
613 THuffEncoder::THuffEncoder(RWriteStream& aStream)
614 :iStream(aStream),iCode(0),iBits(-8),iWrite(iBuf)
618 // Store a huffman code generated by Huffman::EncodingL()
620 void THuffEncoder::EncodeL(TUint32 aHuffCode)
622 EncodeL(aHuffCode<<(32-KHuffMaxCodeLength),aHuffCode>>KHuffMaxCodeLength);
626 // Store aLength bits from the most significant bits of aCode
628 void THuffEncoder::EncodeL(TUint aCode,TInt aLength)
631 TUint code=iCode|(aCode>>(bits+8));
635 TUint8* write=iWrite;
638 if (write-EBufSize==iBuf)
640 iStream.WriteL(iBuf,EBufSize);
643 *write++=TUint8(code>>24);
654 // Terminate the huffman coding. The longest code is always 1111111111
656 void THuffEncoder::CompleteL()
659 EncodeL(0xffffffffu,-iBits);
661 iStream.WriteL(iBuf,iWrite-iBuf);
666 // Extends MDeflater to provide huffman encoding of the output
669 // construct for encoding
671 inline TDeflater::TDeflater(THuffEncoder& aEncoder,const CDbStoreCompression::TEncoding& aEncoding)
672 :iEncoder(aEncoder),iEncoding(aEncoding)
675 void TDeflater::LitLenL(TInt aCode)
677 iEncoder.EncodeL(iEncoding.iLitLen[aCode]);
680 void TDeflater::OffsetL(TInt aCode)
682 iEncoder.EncodeL(iEncoding.iDistance[aCode]);
685 void TDeflater::ExtraL(TInt aLen,TUint aBits)
687 iEncoder.EncodeL(aBits,aLen);
692 // The inflation algorithm, complete with huffman decoding
694 TInflater::TInflater(const TUint8* aIn,const CDbStoreCompression::TEncoding& aEncoding)
695 :iIn(aIn),iBits(KBitsInit),iLen(0),iLitLenTree(aEncoding.iLitLen),iDistTree(aEncoding.iDistance)
699 // consume all data lag in the history buffer, then decode to fill up the output buffer
701 TInt TInflater::Inflate()
703 // empty the history buffer into the output
704 const TUint8* data=iIn;
706 const TUint8* from=iRptr;
709 TUint8* const end=out+KDeflateMaxDistance;
720 // get a huffman code
726 if ((bits<<=1)&KBitsEmpty)
727 bits=*data++|KBitsFull;
730 if (huff&(KHuffTerminate<<16))
735 if (huff&KHuffTerminate)
741 node=PtrAdd(node,huff);
744 TInt val=TInt(huff>>17)-CDbStoreCompression::TEncoding::ELiterals;
749 continue; // another literal/length combo
751 if (val==CDbStoreCompression::TEncoding::EEos-CDbStoreCompression::TEncoding::ELiterals)
752 { // eos marker. we're done
756 // get the extra bits for the code
760 TInt xtra=(code>>2)-1;
764 if ((bits<<=1)&KBitsEmpty)
765 bits=*data++|KBitsFull;
771 if (val<KDeflateDistCodeBase-CDbStoreCompression::TEncoding::ELiterals)
772 { // length code... get the code
773 len=code+KDeflateMinLength;
774 __ASSERT(len<=KDeflateMaxLength);
776 continue; // read the huffman code
779 __ASSERT(code<KDeflateMaxDistance);
781 if (from+KDeflateMaxDistance<end)
782 from+=KDeflateMaxDistance;
785 TInt tfr=Min(end-out,len);
791 from-=KDeflateMaxDistance;
802 inline const TUint8* TInflater::Ptr() const
804 inline TInt TInflater::BufferSize()
805 {return KDeflateMaxDistance;}
809 // This stream buffer applies the analysis or deflation and huffman coding
810 // on the entire stream data when it is committed
812 inline HDeflateBuf::HDeflateBuf(MStreamBuf* aHost,CDbStoreCompression::TEncoding& aEncoding,CBufBase* aBuf,TMode aMode)
813 :iHost(aHost),iEncoding(aEncoding),iBuf(aBuf),iMode(aMode)
816 HDeflateBuf* HDeflateBuf::NewL(MStreamBuf* aHost,CDbStoreCompression::TEncoding& aEncoding,TMode aMode)
818 CBufBase* buf=CBufFlat::NewL(512);
819 CleanupStack::PushL(buf);
820 HDeflateBuf* self=new(ELeave) HDeflateBuf(aHost,aEncoding,buf,aMode);
825 inline HDeflateBuf::~HDeflateBuf()
826 {delete iBuf;iHost.Release();}
828 void HDeflateBuf::DoRelease()
834 // This is where it all happens
836 void HDeflateBuf::DoSynchL()
838 if (iMode==EAnalysis)
840 TDeflateStats deflater(iEncoding);
841 deflater.DeflateL(iBuf->Ptr(0).Ptr(),iBuf->Size());
845 THuffEncoder encoder(iHost);
846 TDeflater deflater(encoder,iEncoding);
847 deflater.DeflateL(iBuf->Ptr(0).Ptr(),iBuf->Size());
855 // Inflate the input stream. This is not a filter, it reads all the input, inflates it and
856 // keeps it in a memory buffer.
858 const TInt KInflateBufSize=0x800; // 2K
860 HInflateBuf::HInflateBuf(CBufBase* aBuf)
866 inline HInflateBuf::~HInflateBuf()
869 void HInflateBuf::DoRelease()
874 HInflateBuf* HInflateBuf::NewL(MStreamBuf* aHost,const CDbStoreCompression::TEncoding& aEncoding)
876 CBufFlat* host=CBufFlat::NewL(256);
877 CleanupStack::PushL(host);
878 TUint8 buffer[KInflateBufSize];
881 TInt len=aHost->ReadL(buffer,KInflateBufSize);
883 host->InsertL(host->Size(),buffer,len);
884 if (len<KInflateBufSize)
887 CBufSeg* out=CBufSeg::NewL(256);
888 CleanupStack::PushL(out);
889 TInflater* inflater=new(ELeave) TInflater(host->Ptr(0).Ptr(),aEncoding);
890 CleanupStack::PushL(inflater);
893 TInt len=inflater->Inflate();
895 out->InsertL(out->Size(),inflater->Ptr(),len);
896 if (len<inflater->BufferSize())
899 HInflateBuf* buf=new(ELeave) HInflateBuf(out);
900 CleanupStack::PopAndDestroy(); // inflater
901 CleanupStack::Pop(); // out
902 CleanupStack::PopAndDestroy(); // host
903 aHost->Release(); // don't need this anymore
907 // Class CDbStoreTable::Compressor
909 // This class processes an entire table for analysis or compression, using the
910 // CDbStoreRecords::AlterL() functionality and call back to ensure that all clusters
911 // and BLOBs are read and written.
913 inline CDbStoreTable::CCompressor::CCompressor()
916 CDbStoreTable::CCompressor::~CCompressor()
924 // Walk through every cluster in the table
926 void CDbStoreTable::CCompressor::ProcessL(CDbStoreTable* aTable)
929 CDbStoreRecords& rec=aTable->StoreRecordsL();
930 for (TClusterId cluster=rec.Head();cluster!=KNullClusterId;cluster=rec.AlterL(cluster,*this))
935 // Compress every blob, and transfer the record from aRPtr to aWPtr
937 TUint8* CDbStoreTable::CCompressor::AlterRecordL(TUint8* aWPtr,const TUint8* aRPtr,TInt aLength)
939 if (iTable->Def().Columns().HasLongColumns())
941 iTable->CopyToRowL(iRow,TPtrC8(aRPtr,aLength));
942 CDbBlobSpace* blobs=iTable->BlobsL();
944 HDbColumnSet::TIteratorC iter=iTable->Def().Columns().Begin();
945 const HDbColumnSet::TIteratorC end=iTable->Def().Columns().End();
948 if (!TDbCol::IsLong(iter->Type()))
950 TDbBlob& blob=CONST_CAST(TDbBlob&,TDbColumnC(iRow,col).Blob());
953 // do what has to be done...?
954 TUint8* data=(TUint8*)User::AllocLC(blob.Size());
955 blobs->ReadLC(blob.Id(),iter->Type())->ReadL(data,blob.Size());
956 CleanupStack::PopAndDestroy(); // stream buffer
957 // re-write the Blob to compress it
958 blobs->DeleteL(blob.Id());
959 blob.SetId(blobs->CreateL(iter->Type(),data,blob.Size()));
960 CleanupStack::PopAndDestroy(); // data
961 } while (++col,++iter<end);
962 iTable->CopyFromRow(aWPtr,iRow);
965 Mem::Copy(aWPtr,aRPtr,aLength);
966 return aWPtr+aLength;
969 // Class CDbStoreCompression
971 // This class manages the compression for the database, applying filters as appropriate
972 // It also defines the extrenalisation format for the huffman trees
974 const TInt KDeflationCodes=3*(CDbStoreCompression::TEncoding::ELitLens+CDbStoreCompression::TEncoding::EDistances);
976 inline CDbStoreCompression::CDbStoreCompression()
977 // :iState(EAnalysis)
980 CDbStoreCompression* CDbStoreCompression::NewL()
982 return new(ELeave) CDbStoreCompression;
986 // Build huffman codings from the freqeuncy tables
988 void CDbStoreCompression::EncodeL()
990 //Check the comments in CDbStoreCompression::InternalizeL().
991 //The implementation there is very similar to this one and is commented why the "array overrun"
992 //case is impossible.
993 __ASSERT(iState==EAnalysis);
994 TUint32* p=iEncoding[0].iLitLen;
995 TUint32* end=p+KDeflationCodes;
998 Huffman::EncodingL(p,TEncoding::ELitLens);
999 p+=TEncoding::ELitLens;
1000 //coverity[overrun-local]
1001 Huffman::EncodingL(p,TEncoding::EDistances);
1002 //coverity[overrun-local]
1003 p+=TEncoding::EDistances;
1009 // Store the encoding tables as a sequence of code lengths
1010 // The code lengths (0-25) are themselves huffman coded, and the meta coding is stored first
1012 void CDbStoreCompression::ExternalizeL(RWriteStream& aStream) const
1014 __ASSERT(iState==EEncoding);
1015 const TUint32* base=iEncoding[0].iLitLen;
1016 const TUint32* end=base+KDeflationCodes;
1017 TUint32 codes[KDeflateMetaCodes];
1018 Mem::FillZ(codes,sizeof(codes));
1019 const TUint32* p=base;
1020 do ++codes[*p++>>KHuffMaxCodeLength]; while (p<end);
1021 Huffman::EncodingL(codes,KDeflateMetaCodes);
1022 // save the meta encoding
1023 p=codes+KDeflateMetaCodes;
1028 c0>>=KHuffMaxCodeLength;
1029 c1>>=KHuffMaxCodeLength;
1030 aStream.WriteUint8L((c0<<4)|c1);
1032 // write the encoding
1033 THuffEncoder encoder(aStream);
1035 do encoder.EncodeL(codes[*p++>>KHuffMaxCodeLength]); while (p<end);
1036 encoder.CompleteL();
1040 // Internalize a previous saved encoding
1042 void CDbStoreCompression::InternalizeL(RReadStream& aStream)
1044 __ASSERT(iState!=EEncoding);
1046 // read the meta encoding
1047 TUint32 decode[KDeflateMetaCodes];
1048 TUint32* p=decode+KDeflateMetaCodes;
1051 TUint8 c=aStream.ReadUint8L();
1055 Huffman::Decoding(decode,KDeflateMetaCodes);
1056 // decode the encoding
1057 p=iEncoding[0].iLitLen;
1058 TUint32* end=p+KDeflationCodes;
1059 TUint bits=KBitsInit;
1062 const TUint32* node=decode;
1067 if ((bits<<=1)&KBitsEmpty)
1068 bits=aStream.ReadUint8L()|KBitsFull;
1071 if (huff&(KHuffTerminate<<16))
1076 if (huff&KHuffTerminate)
1082 node=PtrAdd(node,huff);
1087 // convert the length tables into huffman decoding trees
1088 //The iEncoding data member is an array of 3 elements of TEncoding type.
1089 //The TEncoding layout is: TUint32 iLitLen[ELitLens], TUint32 iDistance[EDistances].
1090 //Then the in-memory presentation of iEncoding is:
1091 // ELitLens EDistances
1092 //iEncoding[0] ........ ........
1093 //iEncoding[1] ........ ........
1094 //iEncoding[2] ........ ........
1096 //Bellow, in the loop:
1097 // p+=TEncoding::ELitLens; - moves the pointer to the beginning of iDistance data
1098 // p+=TEncoding::EDistances; - moves the pointer to the beginning of iLitLen data of the next element of iEncoding.
1099 //The loop will process the data until "p<end", and "end" is defined as:
1100 // p=iEncoding[0].iLitLen;
1101 // TUint32* end=p+KDeflationCodes;
1102 //KDeflationCodes value is: 3*(CDbStoreCompression::TEncoding::ELitLens+CDbStoreCompression::TEncoding::EDistances),
1103 //so that is the end of the iEncoding array.
1104 //Conclusion: the code incrementing the "p" pointer in the loop bellow won't cause array overrun.
1105 p=iEncoding[0].iLitLen;
1108 Huffman::Decoding(p,TEncoding::ELitLens);
1109 p+=TEncoding::ELitLens;
1110 //coverity[overrun-local]
1111 Huffman::Decoding(p,TEncoding::EDistances,KDeflateDistCodeBase);
1112 //coverity[overrun-local]
1113 p+=TEncoding::EDistances;
1115 if (iState==EAnalysis)
1120 // Apply an inflation filter to a read stream
1122 MStreamBuf* CDbStoreCompression::FilterL(MStreamBuf* aHost,TUint32,RDbStoreReadStream::TType aType)
1124 if (iState==EDecoding || iState==EInflating)
1125 return HInflateBuf::NewL(aHost,iEncoding[aType]);
1130 // Apply a statistics or inflation filter to a write stream
1132 MStreamBuf* CDbStoreCompression::FilterL(MStreamBuf* aHost,TUint32,RDbStoreWriteStream::TType aType)
1136 __LEAVE(KErrWrite); // read-only database
1137 else if (s!=EInflating)
1139 __ASSERT(TInt(EAnalysis)==TInt(HDeflateBuf::EAnalysis));
1140 __ASSERT(TInt(EEncoding)==TInt(HDeflateBuf::EDeflate));
1141 return HDeflateBuf::NewL(aHost,iEncoding[aType],HDeflateBuf::TMode(s));
1146 // Class CDbStoreDatabase
1148 // Compression related code is maintained in this source file
1151 // Iterate across all tables applying analysis or compression to them
1153 void CDbStoreDatabase::CompressTablesL()
1155 TSglQueIterC<CDbStoreDef> iter(SchemaL());
1156 const CDbStoreDef* def;
1157 while ((def=iter++)!=0)
1159 CDbStoreTable::CCompressor* comp=new(ELeave) CDbStoreTable::CCompressor;
1160 CleanupStack::PushL(comp);
1161 comp->ProcessL(STATIC_CAST(CDbStoreTable*,TableL(*def)));
1162 CleanupStack::PopAndDestroy(); // comp
1167 // Compress or decompress the whole database
1169 void CDbStoreDatabase::CompressL(TStreamId aStreamId,TZipType aZip)
1172 iSchemaId=aStreamId;
1173 // read the databse header for encryption information
1174 RStoreReadStream strm;
1175 strm.OpenLC(Store(),aStreamId);
1177 CleanupStack::PopAndDestroy(); // strm
1180 if (iVersion==EDbStoreCompressed)
1182 iCompression->Inflate();
1184 __LEAVE(KErrArgument); // already compressed
1186 else if (aZip==EInflate)
1187 __LEAVE(KErrArgument); // not compressed
1189 { // deflate pass #1: analyse the database
1190 CompressionL(); // construct the compression filter
1191 Transaction().DDLBeginLC();
1193 iClusterCache->FlushL(); // force through the stats buffer
1194 ReplaceSchemaL(); // force through the stats buffer
1195 CleanupStack::PopAndDestroy(); // rollback after analysis!
1196 iCompression->EncodeL();
1198 // now inflate or deflate the data
1199 Transaction().DDLBeginLC();
1201 iVersion=TUint8(aZip==EDeflate ? EDbStoreCompressed : EDbStoreVersion2);
1202 Transaction().DDLCommitL();
1203 CleanupStack::Pop(); // rollback not required
1206 void CDbStoreDatabase::CompressL(CStreamStore* aStore,TStreamId aStreamId,TZipType aZip)
1208 //It looks like there is a potential memory leak in the next 4 lines of code, because:
1209 //1) CDbStoreDatabase* self=NewLC(aStore) - new CDbStoreDatabase object is created on the heap
1210 //2) CDbObject* db=self->InterfaceL() - new CDbObject is created on the heap
1211 //3) CleanupStack::Pop() - the CDbStoreDatabase object from (1) - out from the cleanup stack
1212 //4) db->PushL() - the CDbObject from (2) - in the cleanup stack
1213 //If one of the DDLPrepareL() or CompressL() leaves, looks like the CDbStoreDatabase object from (1) will be leaked.
1214 //This is not a correct guess, becuse:
1215 // - CDbObject* db=self->InterfaceL() - this call creates a new CInterface object
1216 // on the heap. The CInterface() constructor will store the "this" pointer
1217 // passed from the InterfaceL() (so the "self" pointer),
1218 // into its "iDatabase" private data member.
1219 // In which case, the returned CDbObject, of CInterface type, will have
1220 // its "iDatabase" data member initialized.
1221 // The inheritance tree is:
1222 // CBase <-- CDbObject <-- CDbDatabase <-- CInterface
1223 // - db->PushL() - this call puts on the cleanup stack CDbObject::Destroy().
1224 // The "db" object which real type is CInterface with "iDatabase" data member
1225 // initialized with "self", is on the cleanup stack.
1226 // - If one of the next "L" functions leaves, then CDbObject::Destroy() will be executed.
1227 // - CDbObject::Destroy() will call CInterface::~CInterface() - CBase is at the root of the inheritance tree, with
1228 // virtual ~CBase() destructor.
1229 // - CInterface::~CInterface() implementation calls Database().Close(), so that is CDbStoreDatabase::Close() called on
1230 // the "self" pointer.
1231 // - The CDbStoreDatabase::Close() will call "delete this" when its reference count reaches 0.
1232 // The reference counter is increased by 1 in the InterfaceL() chain of calls.
1233 // -------- Conclusion ---------
1234 // No memory leak will occur in the next lines of code. Coverity errors - disabled.
1235 CDbStoreDatabase* self=NewLC(aStore);
1236 //coverity[alloc_fn]
1237 //coverity[var_assign]
1238 CDbObject* db=self->InterfaceL(); // a reference to the database is required
1239 CleanupStack::Pop(); // self
1240 //coverity[noescape]
1242 //coverity[noescape]
1243 self->Transaction().DDLPrepareL(*db);
1244 self->CompressL(aStreamId,aZip);
1245 CleanupStack::PopAndDestroy(); // db
1246 //coverity[leaked_storage]
1249 // Class RDbStoreDatabase
1251 EXPORT_C void RDbStoreDatabase::CompressL(CStreamStore& aStore,TStreamId aId)
1253 CDbStoreDatabase::CompressL(&aStore,aId,CDbStoreDatabase::EDeflate);
1256 EXPORT_C void RDbStoreDatabase::DecompressL(CStreamStore& aStore,TStreamId aId)
1258 CDbStoreDatabase::CompressL(&aStore,aId,CDbStoreDatabase::EInflate);