os/textandloc/textandlocutils/numbergrouping/src/RegularExpression.cpp
author sl@SLION-WIN7.fritz.box
Fri, 15 Jun 2012 03:10:57 +0200
changeset 0 bde4ae8d615e
permissions -rw-r--r--
First public contribution.
sl@0
     1
/*
sl@0
     2
* Copyright (c) 2002 Nokia Corporation and/or its subsidiary(-ies).
sl@0
     3
* All rights reserved.
sl@0
     4
* This component and the accompanying materials are made available
sl@0
     5
* under the terms of the License "Eclipse Public License v1.0"
sl@0
     6
* which accompanies this distribution, and is available
sl@0
     7
* at the URL "http://www.eclipse.org/legal/epl-v10.html".
sl@0
     8
*
sl@0
     9
* Initial Contributors:
sl@0
    10
* Nokia Corporation - initial contribution.
sl@0
    11
*
sl@0
    12
* Contributors:
sl@0
    13
*
sl@0
    14
* Description: 
sl@0
    15
*
sl@0
    16
*/
sl@0
    17
sl@0
    18
#include "RegularExpression.h"
sl@0
    19
sl@0
    20
#define KNumOfRecognisedChars 13
sl@0
    21
sl@0
    22
// Panic is implemented in NumberGrouping.cpp
sl@0
    23
GLDEF_C void Panic(TNumberGroupingPanic aPanic);
sl@0
    24
sl@0
    25
CRegularExpression::CRegularExpression()
sl@0
    26
{
sl@0
    27
}
sl@0
    28
sl@0
    29
CRegularExpression* CRegularExpression::NewL(RPointerArray<TDesC>* aPatterns)
sl@0
    30
{
sl@0
    31
	CRegularExpression* s = NewLC(aPatterns);
sl@0
    32
	CleanupStack::Pop();
sl@0
    33
	return s;
sl@0
    34
}
sl@0
    35
sl@0
    36
CRegularExpression* CRegularExpression::NewLC(RPointerArray<TDesC>* aPatterns)
sl@0
    37
{
sl@0
    38
	CRegularExpression* s = new(ELeave)CRegularExpression();
sl@0
    39
	CleanupStack::PushL(s);
sl@0
    40
	s->ConstructL(aPatterns);
sl@0
    41
	return s;
sl@0
    42
}
sl@0
    43
sl@0
    44
void CRegularExpression::ConstructL(RPointerArray<TDesC>* aPatterns)
sl@0
    45
{
sl@0
    46
	GenerateStateTablesL(aPatterns);
sl@0
    47
}
sl@0
    48
sl@0
    49
CRegularExpression::~CRegularExpression()
sl@0
    50
{
sl@0
    51
	for(TInt i = 0; i < iStateMachines.Count(); i++)
sl@0
    52
		delete iStateMachines[i];
sl@0
    53
	
sl@0
    54
	iStateMachines.Close();
sl@0
    55
}
sl@0
    56
sl@0
    57
TInt CRegularExpression::Search(const TDesC& aString)
sl@0
    58
{
sl@0
    59
	return SearchFrom(0, aString);
sl@0
    60
}
sl@0
    61
sl@0
    62
TInt CRegularExpression::SearchFrom(TInt aIndex, const TDesC& aString)
sl@0
    63
{
sl@0
    64
	for(TInt i = aIndex; i < iStateMachines.Count(); ++i)
sl@0
    65
	{
sl@0
    66
		if(iStateMachines[i]->Matches(aString))
sl@0
    67
			return i;
sl@0
    68
	}
sl@0
    69
sl@0
    70
	return KErrNotFound;
sl@0
    71
}
sl@0
    72
sl@0
    73
// Do the parsing
sl@0
    74
void CRegularExpression::GenerateStateTablesL(RPointerArray<TDesC>* aPatterns)
sl@0
    75
{	
sl@0
    76
	for(TInt nPatternCount = 0; nPatternCount < aPatterns->Count(); ++nPatternCount)
sl@0
    77
	{
sl@0
    78
		const TDesC& desPattern = *((*aPatterns)[nPatternCount]) ;	// I know it looks horrific, but it makes the
sl@0
    79
																	// rest of the method _so_ much easier to read
sl@0
    80
		
sl@0
    81
		CStateMachine* StateMachine = CStateMachine::NewLC(KNumOfRecognisedChars, desPattern.Length());
sl@0
    82
		User::LeaveIfError(iStateMachines.Append(StateMachine));
sl@0
    83
		CleanupStack::Pop(); // now the ownership transfers to iStateMachines
sl@0
    84
sl@0
    85
		// parse the desPattern
sl@0
    86
sl@0
    87
		enum TParseState
sl@0
    88
		{
sl@0
    89
			EAny,
sl@0
    90
			EOpenBracketFound,
sl@0
    91
			EChoiceOrRange,
sl@0
    92
			EChoice,
sl@0
    93
			ERange,
sl@0
    94
			ELookingForCloseBracket
sl@0
    95
		};
sl@0
    96
sl@0
    97
		TParseState	parseState = EAny;
sl@0
    98
sl@0
    99
		TInt		nPatternIndex = 0;
sl@0
   100
		TInt		nState = 0;
sl@0
   101
sl@0
   102
		TBuf<10>	bufChoice;
sl@0
   103
		bufChoice.Zero();
sl@0
   104
sl@0
   105
		TBuf<20>	bufParsingError = _L("Parsing syntax error");
sl@0
   106
sl@0
   107
		while(nPatternIndex < desPattern.Length() )
sl@0
   108
		{
sl@0
   109
			TChar cChar = desPattern[nPatternIndex];
sl@0
   110
			TBool bEndOfParse = EFalse;
sl@0
   111
sl@0
   112
			if(nPatternIndex == desPattern.Length() - 1) // end of the parse
sl@0
   113
				bEndOfParse = ETrue;
sl@0
   114
		
sl@0
   115
			switch(cChar)
sl@0
   116
			{
sl@0
   117
			case '1':
sl@0
   118
			case '2':
sl@0
   119
			case '3':
sl@0
   120
			case '4':
sl@0
   121
			case '5':
sl@0
   122
			case '6':
sl@0
   123
			case '7':
sl@0
   124
			case '8':
sl@0
   125
			case '9':
sl@0
   126
			case '0':
sl@0
   127
				switch(parseState)
sl@0
   128
				{
sl@0
   129
				case EAny:
sl@0
   130
					iStateMachines[nPatternCount]->AddStateTransistionL(cChar, nState, bEndOfParse?
sl@0
   131
																					KStateMatched:
sl@0
   132
																					(nState + 1)); 
sl@0
   133
					++nState;
sl@0
   134
					break;
sl@0
   135
				case EOpenBracketFound:
sl@0
   136
					bufChoice.Append(cChar);
sl@0
   137
					parseState = EChoiceOrRange;					
sl@0
   138
					break;
sl@0
   139
				case EChoiceOrRange:
sl@0
   140
				case EChoice:
sl@0
   141
					bufChoice.Append(cChar);
sl@0
   142
					parseState = EChoice;
sl@0
   143
					break;
sl@0
   144
				case ERange:
sl@0
   145
					bufChoice.Append(cChar);
sl@0
   146
					parseState = ELookingForCloseBracket;
sl@0
   147
					break;
sl@0
   148
				//case ELookingForCloseBracket:						
sl@0
   149
				default:
sl@0
   150
					User::Panic(bufParsingError, KErrSyntaxError);
sl@0
   151
					break;
sl@0
   152
				}
sl@0
   153
				break;
sl@0
   154
			case '[':
sl@0
   155
				switch(parseState)
sl@0
   156
				{
sl@0
   157
				case EAny:						
sl@0
   158
					bufChoice.Zero();
sl@0
   159
					parseState = EOpenBracketFound;
sl@0
   160
					break;
sl@0
   161
				//case EOpenBracketFound:			
sl@0
   162
				//case EChoiceOrRange:			
sl@0
   163
				//case EChoice:					
sl@0
   164
				//case ERange:					
sl@0
   165
				//case ELookingForCloseBracket:	
sl@0
   166
				default:
sl@0
   167
					User::Panic(bufParsingError, KErrSyntaxError);
sl@0
   168
					break;
sl@0
   169
				
sl@0
   170
    			}	
sl@0
   171
				break;
sl@0
   172
			case ']':
sl@0
   173
				switch(parseState)
sl@0
   174
				{
sl@0
   175
				case EChoice:
sl@0
   176
					{
sl@0
   177
						for(TInt i = 0; i < bufChoice.Length(); ++i)
sl@0
   178
						{
sl@0
   179
							TChar cChar = bufChoice[i];
sl@0
   180
							
sl@0
   181
							iStateMachines[nPatternCount]->AddStateTransistionL(cChar.GetNumericValue(), 
sl@0
   182
																				nState, 
sl@0
   183
																				bEndOfParse?
sl@0
   184
																					KStateMatched:
sl@0
   185
																					(nState + 1));
sl@0
   186
						}
sl@0
   187
						
sl@0
   188
						++nState;
sl@0
   189
						parseState = EAny;
sl@0
   190
					}
sl@0
   191
					break;
sl@0
   192
				case ELookingForCloseBracket:
sl@0
   193
					{
sl@0
   194
						TChar cTopOfRange = bufChoice[1];
sl@0
   195
						TChar cBottomOfRange = bufChoice[0];
sl@0
   196
sl@0
   197
						TInt nTopOfRange = cTopOfRange.GetNumericValue();		// if they're not there then something
sl@0
   198
						TInt nBottomOfRange = cBottomOfRange.GetNumericValue();	// is seriously amiss...
sl@0
   199
						
sl@0
   200
						if(nTopOfRange < nBottomOfRange)
sl@0
   201
							User::Panic(bufParsingError, KErrSyntaxError);
sl@0
   202
					
sl@0
   203
						for(TInt i = nBottomOfRange; i <= nTopOfRange; ++i)
sl@0
   204
						{
sl@0
   205
							iStateMachines[nPatternCount]->AddStateTransistionL(i, nState, bEndOfParse?
sl@0
   206
																							KStateMatched:
sl@0
   207
																							(nState + 1));
sl@0
   208
						}
sl@0
   209
						++nState;
sl@0
   210
						parseState = EAny;
sl@0
   211
					}
sl@0
   212
					break;
sl@0
   213
				//case EAny:						
sl@0
   214
				//case EOpenBracketFound:			
sl@0
   215
				//case EChoiceOrRange:			
sl@0
   216
				//case ERange:		
sl@0
   217
				default:
sl@0
   218
					User::Panic(bufParsingError, KErrSyntaxError);
sl@0
   219
					break;
sl@0
   220
				}	
sl@0
   221
				break;
sl@0
   222
			case '-':
sl@0
   223
				switch(parseState)
sl@0
   224
				{
sl@0
   225
				case EChoiceOrRange:			
sl@0
   226
					parseState = ERange;
sl@0
   227
					break;	
sl@0
   228
				//case EAny:						
sl@0
   229
				//case EOpenBracketFound:			
sl@0
   230
				//case ELookingForCloseBracket:	
sl@0
   231
				//case ERange:					
sl@0
   232
				//case EChoice:
sl@0
   233
				default:
sl@0
   234
					User::Panic(bufParsingError, KErrSyntaxError);
sl@0
   235
					break;
sl@0
   236
				}
sl@0
   237
				break;
sl@0
   238
			case '.':
sl@0
   239
			case '+':
sl@0
   240
				switch(parseState)
sl@0
   241
				{
sl@0
   242
				case EAny:						
sl@0
   243
					iStateMachines[nPatternCount]->AddStateTransistionL(cChar, nState, bEndOfParse?
sl@0
   244
																					KStateMatched:
sl@0
   245
																					(nState + 1));
sl@0
   246
					++nState;
sl@0
   247
					break;
sl@0
   248
				//case EOpenBracketFound:			
sl@0
   249
				//case EChoiceOrRange:			
sl@0
   250
				//case ELookingForCloseBracket:	
sl@0
   251
				//case ERange:					
sl@0
   252
				//case EChoice:
sl@0
   253
				default:
sl@0
   254
					User::Panic(bufParsingError, KErrSyntaxError);
sl@0
   255
					break;					
sl@0
   256
				}
sl@0
   257
				break;
sl@0
   258
			default:
sl@0
   259
				User::Panic(bufParsingError, KErrSyntaxError);
sl@0
   260
				break;
sl@0
   261
			}
sl@0
   262
sl@0
   263
			++nPatternIndex;
sl@0
   264
		}
sl@0
   265
sl@0
   266
		if(parseState != EAny)
sl@0
   267
			User::Panic(bufParsingError, KErrSyntaxError);
sl@0
   268
	}
sl@0
   269
}
sl@0
   270
sl@0
   271
void CRegularExpression::GetWildcardVersionOfPattern( 
sl@0
   272
    TInt aPatternIndex, TText aWildcard, TDes& aWildcardedPattern) const
sl@0
   273
    {
sl@0
   274
    __ASSERT_ALWAYS( (0 <= aPatternIndex) && (aPatternIndex < iStateMachines.Count()),
sl@0
   275
        Panic(ENumberGroupingNoSuchStateMachine) );
sl@0
   276
    iStateMachines[aPatternIndex]->GetWildcardVersionOfPattern( aWildcard, aWildcardedPattern );
sl@0
   277
    }
sl@0
   278
sl@0
   279
// End of File