Update contrib.
2 * Copyright (c) 1997-2009 Nokia Corporation and/or its subsidiary(-ies).
4 * This component and the accompanying materials are made available
5 * under the terms of "Eclipse Public License v1.0"
6 * which accompanies this distribution, and is available
7 * at the URL "http://www.eclipse.org/legal/epl-v10.html".
9 * Initial Contributors:
10 * Nokia Corporation - initial contribution.
22 #define ARRAY_LENGTH(aArray) (sizeof(aArray)/sizeof((aArray)[0]))
24 LOCAL_D const TUint16 keyedTables16OfIndexedTables16_indexedEntries_codePage1252ToUnicode_1[]=
39 LOCAL_D const TUint16 keyedTables16OfIndexedTables16_indexedEntries_codePage1252ToUnicode_2[]=
55 LOCAL_D const TUint16 keyedTables16OfIndexedTables16_indexedEntries_codePage1252ToUnicode_3[]=
61 LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable16OfIndexedTables16::SKeyedEntry keyedTables16OfIndexedTables16_keyedEntries_codePage1252ToUnicode_1[]=
66 keyedTables16OfIndexedTables16_indexedEntries_codePage1252ToUnicode_1
71 keyedTables16OfIndexedTables16_indexedEntries_codePage1252ToUnicode_2
76 keyedTables16OfIndexedTables16_indexedEntries_codePage1252ToUnicode_3
80 LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable1616::SEntry keyedTable1616_unicodeToCodePage1252_1[]=
192 LOCAL_D const SCnvConversionData::SVariableByteData::SRange codePage1252VariableByteDataRanges[]=
202 LOCAL_D const SCnvConversionData::SOneDirectionData::SRange codePage1252ToUnicodeDataRanges[]=
207 SCnvConversionData::SOneDirectionData::SRange::EDirect,
218 SCnvConversionData::SOneDirectionData::SRange::EDirect,
229 SCnvConversionData::SOneDirectionData::SRange::EOffset,
233 STATIC_CAST(TUint, 8236),
240 SCnvConversionData::SOneDirectionData::SRange::EOffset,
244 STATIC_CAST(TUint, 239),
251 SCnvConversionData::SOneDirectionData::SRange::EKeyedTable16OfIndexedTables16,
255 UData_SKeyedTable16OfIndexedTables16(keyedTables16OfIndexedTables16_keyedEntries_codePage1252ToUnicode_1)
260 LOCAL_D const SCnvConversionData::SOneDirectionData::SRange unicodeToCodePage1252DataRanges[]=
265 SCnvConversionData::SOneDirectionData::SRange::EDirect,
276 SCnvConversionData::SOneDirectionData::SRange::EDirect,
287 SCnvConversionData::SOneDirectionData::SRange::EKeyedTable1616,
291 UData_SKeyedTable1616(keyedTable1616_unicodeToCodePage1252_1)
296 GLREF_D const SCnvConversionData codePage1252ConversionData=
298 SCnvConversionData::EUnspecified,
300 ARRAY_LENGTH(codePage1252VariableByteDataRanges),
301 codePage1252VariableByteDataRanges
304 ARRAY_LENGTH(codePage1252ToUnicodeDataRanges),
305 codePage1252ToUnicodeDataRanges
308 ARRAY_LENGTH(unicodeToCodePage1252DataRanges),
309 unicodeToCodePage1252DataRanges
315 GLREF_C void IsCharacterSetCP1252(TInt& aConfidenceLevel, const TDesC8& aSample)
317 aConfidenceLevel = 60;
318 TInt sampleLength = aSample.Length();
320 for (TInt i=0; i<sampleLength; ++i)
322 // CP1252 includes ASCII as well
323 // first check if the char is in the range 0x80 - 0x9f (controls codes in ISO88591)
324 // If it is in that range then the likelihood that it's CP1252 is a bit higher
325 if ((aSample[i] >= 0x80) && (aSample[i] <= 0x9f))
327 if((aSample[i]==0x81)||(aSample[i]==0x8D)||(aSample[i]==0x8f)||
328 (aSample[i]==0x90)||(aSample[i]==0x9d))
330 // These code values are not supported by the Codepage CP1252
331 aConfidenceLevel = 0;
336 // problem: UTF8 uses the values 0x80-0x9f in more than 50% of it's multibyte representation
337 // so if the text was UTF8 .... the confidence here would hit the roof. Could check to make
338 // sure that this is not UTF8
342 TInt increment1 = i+1;
343 TInt decrement1 = i-1;
344 // 0xf7 is the division symbol in CP1252.
345 // 0xd7 is the division symbol in CP1252.If char on either side of the division
346 // symbol is a number then the confidence that it's ISO88591 increases
347 if( decrement1>= 0 && ((aSample[i]==0xf7) || (aSample[i]==0xd7)) && increment1<sampleLength)
350 if (increment1 >= sampleLength)
352 if ( (aSample[decrement1] >= 0x30) && (aSample[decrement1] <= 0x39) && // char before is a number
353 (aSample[increment1] >= 0x30) && (aSample[increment1] <= 0x39) ) // char after is a number
358 // Can also use the currency symbol to increase confidence if the char after a
359 // currency symbol is numeric
360 if((aSample[i]>=0xa2) && (aSample[i] <= 0xa5) && increment1<sampleLength)
362 if ((aSample[increment1] >= 0x30) && (aSample[increment1] <= 0x39))
368 aConfidenceLevel =(aConfidenceLevel >0)? ((aConfidenceLevel > 100)? 100: aConfidenceLevel): 0;