First public contribution.
2 * Copyright (c) 1997-2009 Nokia Corporation and/or its subsidiary(-ies).
4 * This component and the accompanying materials are made available
5 * under the terms of "Eclipse Public License v1.0"
6 * which accompanies this distribution, and is available
7 * at the URL "http://www.eclipse.org/legal/epl-v10.html".
9 * Initial Contributors:
10 * Nokia Corporation - initial contribution.
15 * Big-Endian converter
24 #define ARRAY_LENGTH(aArray) (sizeof(aArray)/sizeof((aArray)[0]))
27 GLREF_D const SCnvConversionData unicodeConversionDataBig=
29 SCnvConversionData::EFixedBigEndian,
31 ARRAY_LENGTH(unicodeVariableByteDataRanges),
32 unicodeVariableByteDataRanges
35 ARRAY_LENGTH(unicodeTounicodeDataRanges),
36 unicodeTounicodeDataRanges
39 ARRAY_LENGTH(unicodeTounicodeDataRanges),
40 unicodeTounicodeDataRanges
46 GLREF_C void IsCharacterSetUnicodeBig(TInt& aConfidenceLevel, const TDesC8& aSample)
49 TInt sampleLength = aSample.Length();
56 // The first byte is a possible ByteOrderMark
57 // Try matching the next character
60 // the byte order mark could be 0xFEFF or 0xFFFE depending on
61 // endianness of the sample text.
66 for (TInt i = 0; i < sampleLength-1; ++i)
68 if (aSample[i] == 0x0d)
70 if (aSample[i+1] == 0x0a)
72 // Reduce the confidence level
73 aConfidenceLevel-= 25;
78 // if not 100% confident already, check if most even bytes are 0
79 #define MAX_SAMPLE_LENGTH 2048
80 if ( aConfidenceLevel < 100 )
83 // only check the first 2k if big sample
84 TInt length =( sampleLength > MAX_SAMPLE_LENGTH ? MAX_SAMPLE_LENGTH : sampleLength);
86 // start from 0 and check the even bytes
87 for (TInt i = 0; i < length-1; i+=2)
89 if (aSample[i] == 0x0)
93 // if more than 80% even bytes zero then this IS big Endian
94 if ( (repeat * 100) / (length * 5) >= 8)
95 aConfidenceLevel = 100;
98 aConfidenceLevel =(aConfidenceLevel >0)? ((aConfidenceLevel > 100)? 100: aConfidenceLevel): 0;