os/security/cryptoservices/certificateandkeymgmt/asn1/utf8strdec.cpp
author sl@SLION-WIN7.fritz.box
Fri, 15 Jun 2012 03:10:57 +0200
changeset 0 bde4ae8d615e
permissions -rw-r--r--
First public contribution.
sl@0
     1
/*
sl@0
     2
* Copyright (c) 1998-2009 Nokia Corporation and/or its subsidiary(-ies).
sl@0
     3
* All rights reserved.
sl@0
     4
* This component and the accompanying materials are made available
sl@0
     5
* under the terms of the License "Eclipse Public License v1.0"
sl@0
     6
* which accompanies this distribution, and is available
sl@0
     7
* at the URL "http://www.eclipse.org/legal/epl-v10.html".
sl@0
     8
*
sl@0
     9
* Initial Contributors:
sl@0
    10
* Nokia Corporation - initial contribution.
sl@0
    11
*
sl@0
    12
* Contributors:
sl@0
    13
*
sl@0
    14
* Description: 
sl@0
    15
* UTF8STR.CPP
sl@0
    16
* This file contains the implementation of the UTF8 String ASN1 class.
sl@0
    17
* The IA5 string can contain the following characters:
sl@0
    18
* \<character set unknown pending arrival of ITU spec\>
sl@0
    19
*
sl@0
    20
*/
sl@0
    21
sl@0
    22
sl@0
    23
/**
sl@0
    24
 @file
sl@0
    25
*/
sl@0
    26
sl@0
    27
#include <asn1dec.h>
sl@0
    28
sl@0
    29
TInt ConvertToUnicodeFromUtf8(TDes16& aUnicode, const TDesC8& aUtf8);
sl@0
    30
sl@0
    31
EXPORT_C TASN1DecUTF8String::TASN1DecUTF8String(void)
sl@0
    32
	{
sl@0
    33
	}
sl@0
    34
sl@0
    35
EXPORT_C HBufC* TASN1DecUTF8String::DecodeDERL(const TASN1DecGeneric& aSource)
sl@0
    36
	{
sl@0
    37
	return DecodeContentsL(aSource.GetContentDER());
sl@0
    38
	}
sl@0
    39
sl@0
    40
EXPORT_C HBufC* TASN1DecUTF8String::DecodeDERL(const TDesC8& aSource,TInt& aPos)
sl@0
    41
sl@0
    42
	{
sl@0
    43
	TPtrC8 Source=aSource.Mid(aPos);
sl@0
    44
	TASN1DecGeneric gen(Source);
sl@0
    45
	gen.InitL();
sl@0
    46
	HBufC* res = DecodeContentsL(gen.GetContentDER());
sl@0
    47
	aPos+=gen.LengthDER();
sl@0
    48
	return res;
sl@0
    49
	}
sl@0
    50
sl@0
    51
HBufC* TASN1DecUTF8String::DecodeContentsL(const TDesC8& aSource)
sl@0
    52
	{
sl@0
    53
	HBufC* res = HBufC::NewLC(aSource.Length());
sl@0
    54
	TPtr pRes = res->Des();
sl@0
    55
	User::LeaveIfError(ConvertToUnicodeFromUtf8(pRes, aSource));
sl@0
    56
	CleanupStack::Pop(res);
sl@0
    57
	return res;
sl@0
    58
	}
sl@0
    59
sl@0
    60
/**
sl@0
    61
 * Converts text encoded using the Unicode transformation format UTF-8
sl@0
    62
 * into the Unicode UCS-2 character set.
sl@0
    63
 *
sl@0
    64
 * @param aUnicode	On return, contains the Unicode encoded output string.
sl@0
    65
 * @param aUtf8		The UTF-8 encoded input string
sl@0
    66
 * @return			The number of unconverted bytes left at the end of the
sl@0
    67
 *					input descriptor, or one of the error values defined
sl@0
    68
 *					in <code>TError</code>.
sl@0
    69
 */
sl@0
    70
TInt ConvertToUnicodeFromUtf8(TDes16& aUnicode, const TDesC8& aUtf8)
sl@0
    71
	{
sl@0
    72
	if (aUtf8.Length()==0)
sl@0
    73
		{
sl@0
    74
		aUnicode.SetLength(0);
sl@0
    75
		return 0;
sl@0
    76
		}
sl@0
    77
	if (aUnicode.MaxLength()==0)
sl@0
    78
		{
sl@0
    79
		return aUtf8.Length();
sl@0
    80
		}
sl@0
    81
	TUint16* pointerToCurrentUnicodeCharacter=CONST_CAST(TUint16*, aUnicode.Ptr());
sl@0
    82
	const TUint16* pointerToLastUnicodeCharacter=pointerToCurrentUnicodeCharacter+(aUnicode.MaxLength()-1);
sl@0
    83
	const TUint8* pointerToCurrentUtf8Byte=aUtf8.Ptr();
sl@0
    84
	const TUint8* pointerToLastUtf8Byte=pointerToCurrentUtf8Byte+(aUtf8.Length()-1);
sl@0
    85
	TBool inputIsTruncated=EFalse;
sl@0
    86
	TUint16 replacementcharacter = 0xFFFD;
sl@0
    87
	FOREVER
sl@0
    88
		{
sl@0
    89
		//__ASSERT_DEBUG(pointerToCurrentUnicodeCharacter<=pointerToLastUnicodeCharacter, Panic(EPanicBadUnicodePointers8));
sl@0
    90
		//__ASSERT_DEBUG(pointerToCurrentUtf8Byte<=pointerToLastUtf8Byte, Panic(EPanicBadUtf8Pointers3));
sl@0
    91
		TUint currentUtf8Byte=*pointerToCurrentUtf8Byte;
sl@0
    92
		if ((currentUtf8Byte&0x80)==0x00)
sl@0
    93
			{
sl@0
    94
			*pointerToCurrentUnicodeCharacter=STATIC_CAST(TUint16, currentUtf8Byte);
sl@0
    95
			}
sl@0
    96
		else if ((currentUtf8Byte&0xe0)==0xc0)
sl@0
    97
			{
sl@0
    98
			//__ASSERT_DEBUG(pointerToCurrentUtf8Byte<=pointerToLastUtf8Byte, Panic(EPanicBadUtf8Pointers4));
sl@0
    99
			if (pointerToCurrentUtf8Byte>=pointerToLastUtf8Byte)
sl@0
   100
				{
sl@0
   101
				--pointerToCurrentUnicodeCharacter;
sl@0
   102
				--pointerToCurrentUtf8Byte;
sl@0
   103
				inputIsTruncated=ETrue;
sl@0
   104
				break;
sl@0
   105
				}
sl@0
   106
			TUint currentUnicodeCharacter=((currentUtf8Byte&0x1f)<<6);
sl@0
   107
			++pointerToCurrentUtf8Byte;
sl@0
   108
			currentUtf8Byte=*pointerToCurrentUtf8Byte;
sl@0
   109
			if ((currentUtf8Byte&0xc0)==0x80)
sl@0
   110
				{
sl@0
   111
				currentUnicodeCharacter|=(currentUtf8Byte&0x3f);
sl@0
   112
				*pointerToCurrentUnicodeCharacter=STATIC_CAST(TUint16, currentUnicodeCharacter);
sl@0
   113
				}
sl@0
   114
			else
sl@0
   115
				{
sl@0
   116
				*pointerToCurrentUnicodeCharacter=replacementcharacter;
sl@0
   117
				}
sl@0
   118
			}
sl@0
   119
		else if ((currentUtf8Byte&0xf0)==0xe0)
sl@0
   120
			{
sl@0
   121
			//__ASSERT_DEBUG(pointerToCurrentUtf8Byte<=pointerToLastUtf8Byte, Panic(EPanicBadUtf8Pointers5));
sl@0
   122
			if (pointerToLastUtf8Byte-pointerToCurrentUtf8Byte<2)
sl@0
   123
				{
sl@0
   124
				--pointerToCurrentUnicodeCharacter;
sl@0
   125
				--pointerToCurrentUtf8Byte;
sl@0
   126
				inputIsTruncated=ETrue;
sl@0
   127
				break;
sl@0
   128
				}
sl@0
   129
			TUint currentUnicodeCharacter=((currentUtf8Byte&0x0f)<<12);
sl@0
   130
			++pointerToCurrentUtf8Byte;
sl@0
   131
			currentUtf8Byte=*pointerToCurrentUtf8Byte;
sl@0
   132
			if ((currentUtf8Byte&0xc0)==0x80)
sl@0
   133
				{
sl@0
   134
				currentUnicodeCharacter|=((currentUtf8Byte&0x3f)<<6);
sl@0
   135
				++pointerToCurrentUtf8Byte;
sl@0
   136
				currentUtf8Byte=*pointerToCurrentUtf8Byte;
sl@0
   137
				if ((currentUtf8Byte&0xc0)==0x80)
sl@0
   138
					{
sl@0
   139
					currentUnicodeCharacter|=(currentUtf8Byte&0x3f);
sl@0
   140
					*pointerToCurrentUnicodeCharacter=STATIC_CAST(TUint16, currentUnicodeCharacter);
sl@0
   141
					}
sl@0
   142
				else
sl@0
   143
					{
sl@0
   144
					*pointerToCurrentUnicodeCharacter=STATIC_CAST(TUint16, currentUnicodeCharacter);
sl@0
   145
					}
sl@0
   146
				}
sl@0
   147
			else
sl@0
   148
				{
sl@0
   149
				*pointerToCurrentUnicodeCharacter=replacementcharacter;
sl@0
   150
				}
sl@0
   151
			
sl@0
   152
			}
sl@0
   153
		else if ((currentUtf8Byte&0xf8)==0xf0)
sl@0
   154
			{
sl@0
   155
			//__ASSERT_DEBUG(pointerToCurrentUnicodeCharacter<=pointerToLastUnicodeCharacter, Panic(EPanicBadUnicodePointers9));
sl@0
   156
			if (pointerToCurrentUnicodeCharacter>=pointerToLastUnicodeCharacter)
sl@0
   157
				{
sl@0
   158
				--pointerToCurrentUnicodeCharacter;
sl@0
   159
				--pointerToCurrentUtf8Byte;
sl@0
   160
				break;
sl@0
   161
				}
sl@0
   162
			//__ASSERT_DEBUG(pointerToCurrentUtf8Byte<=pointerToLastUtf8Byte, Panic(EPanicBadUtf8Pointers6));
sl@0
   163
			if (pointerToLastUtf8Byte-pointerToCurrentUtf8Byte<3)
sl@0
   164
				{
sl@0
   165
				--pointerToCurrentUnicodeCharacter;
sl@0
   166
				--pointerToCurrentUtf8Byte;
sl@0
   167
				inputIsTruncated=ETrue;
sl@0
   168
				break;
sl@0
   169
				}
sl@0
   170
			TUint currentUnicodeCharacter=((currentUtf8Byte&0x07)<<8);
sl@0
   171
			++pointerToCurrentUtf8Byte;
sl@0
   172
			currentUtf8Byte=*pointerToCurrentUtf8Byte;
sl@0
   173
			if ((currentUtf8Byte&0xc0)==0x80)
sl@0
   174
				{
sl@0
   175
				currentUnicodeCharacter|=((currentUtf8Byte&0x3f)<<2);
sl@0
   176
				if (currentUnicodeCharacter>=0x0040)
sl@0
   177
					{
sl@0
   178
					currentUnicodeCharacter-=0x0040;
sl@0
   179
					if (currentUnicodeCharacter<0x0400)
sl@0
   180
						{
sl@0
   181
						++pointerToCurrentUtf8Byte;
sl@0
   182
						currentUtf8Byte=*pointerToCurrentUtf8Byte;
sl@0
   183
						if ((currentUtf8Byte&0xc0)==0x80)
sl@0
   184
							{
sl@0
   185
							currentUnicodeCharacter|=((currentUtf8Byte&0x30)>>4);
sl@0
   186
							*pointerToCurrentUnicodeCharacter=STATIC_CAST(TUint16, 0xd800|currentUnicodeCharacter);
sl@0
   187
							currentUnicodeCharacter=((currentUtf8Byte&0x0f)<<6);
sl@0
   188
							++pointerToCurrentUtf8Byte;
sl@0
   189
							currentUtf8Byte=*pointerToCurrentUtf8Byte;
sl@0
   190
							if ((currentUtf8Byte&0xc0)==0x80)
sl@0
   191
								{
sl@0
   192
								currentUnicodeCharacter|=(currentUtf8Byte&0x3f);
sl@0
   193
								++pointerToCurrentUnicodeCharacter;
sl@0
   194
								*pointerToCurrentUnicodeCharacter=STATIC_CAST(TUint16, 0xdc00|currentUnicodeCharacter);
sl@0
   195
								}
sl@0
   196
							}
sl@0
   197
						}
sl@0
   198
					}
sl@0
   199
				}
sl@0
   200
			}
sl@0
   201
		else
sl@0
   202
			{
sl@0
   203
			*pointerToCurrentUnicodeCharacter=replacementcharacter;
sl@0
   204
			}
sl@0
   205
		//__ASSERT_DEBUG(pointerToCurrentUtf8Byte<=pointerToLastUtf8Byte, Panic(EPanicBadUtf8Pointers7));
sl@0
   206
		//__ASSERT_DEBUG(pointerToCurrentUnicodeCharacter<=pointerToLastUnicodeCharacter, Panic(EPanicBadUnicodePointers10));
sl@0
   207
		if ((pointerToCurrentUtf8Byte>=pointerToLastUtf8Byte) || (pointerToCurrentUnicodeCharacter>=pointerToLastUnicodeCharacter))
sl@0
   208
			{
sl@0
   209
			break;
sl@0
   210
			}
sl@0
   211
		++pointerToCurrentUnicodeCharacter;
sl@0
   212
		++pointerToCurrentUtf8Byte;
sl@0
   213
		}
sl@0
   214
	if ((pointerToCurrentUtf8Byte<aUtf8.Ptr()) && inputIsTruncated)
sl@0
   215
		{
sl@0
   216
		return KErrArgument;
sl@0
   217
		}
sl@0
   218
	aUnicode.SetLength((pointerToCurrentUnicodeCharacter-aUnicode.Ptr())+1);
sl@0
   219
	return pointerToLastUtf8Byte-pointerToCurrentUtf8Byte;
sl@0
   220
	}
sl@0
   221