Update contrib.
1 // Copyright (c) 2003-2009 Nokia Corporation and/or its subsidiary(-ies).
2 // All rights reserved.
3 // This component and the accompanying materials are made available
4 // under the terms of "Eclipse Public License v1.0"
5 // which accompanies this distribution, and is available
6 // at the URL "http://www.eclipse.org/legal/epl-v10.html".
8 // Initial Contributors:
9 // Nokia Corporation - initial contribution.
19 #include "LineBreak.h"
20 #include "LineBreakImp.h"
23 const TText16 KThaiCodePageStart = 0x0E00;
24 const TText16 KThaiCodePageEnd = 0x0E5C;
25 const TUint KNumThaiCharacters = KThaiCodePageEnd - KThaiCodePageStart;
28 Ecanpsulates rules for when Thai character sequence line breaking.
31 class ThaiLinebreakRules
34 enum TCharClassification
59 KOutOfRangeFlag = 1 << EOutOfRange,
60 KConsOAngFlag = 1 << EConsOAng,
61 KConsYoYakFlag = 1 << EConsYoYak,
62 KConsHoHipFlag = 1 << EConsHoHip,
63 KConsWoWeanFlag = 1 << EConsWoWean,
64 KConsDigraphFlag = 1 << EConsDigraph,
65 KConsOtherFlag = 1 << EConsOther,
66 KPostVowelAFlag = 1 << EPostVowelA,
67 KPostVowelAAFlag = 1 << EPostVowelAA,
68 KPostVowelOtherFlag = 1 << EPostVowelOther,
69 KPreVowelFlag = 1 << EPreVowel,
70 KDepMaiHanAkatFlag = 1 << EDepMaiHanAkat,
71 KDepSaraIFlag = 1 << EDepSaraI,
72 KDepOtherFlag = 1 << EDepOther,
74 KSpecialDepFlags = KDepMaiHanAkatFlag | KDepSaraIFlag,
75 KPostVowelFlags = KPostVowelAFlag | KPostVowelAAFlag | KPostVowelOtherFlag,
76 KConsFlags = KConsOtherFlag | KConsDigraphFlag | KConsWoWeanFlag
77 | KConsHoHipFlag | KConsYoYakFlag | KConsOAngFlag,
78 KAllFlags = KOutOfRangeFlag | KConsOAngFlag | KConsYoYakFlag
79 | KConsHoHipFlag | KConsWoWeanFlag | KConsDigraphFlag
80 | KConsOtherFlag | KPostVowelAFlag | KPostVowelAAFlag
81 | KPostVowelOtherFlag | KPreVowelFlag | KDepMaiHanAkatFlag
82 | KDepSaraIFlag | KDepOtherFlag
85 /** Returns the Thai linebreaking class of the character. */
86 static TCharClassification Class(TInt aChar);
87 /** Returns true if aChar is a combining character according to aBreaker. */
88 static TBool IsCombiningChar(TInt aChar, const MLineBreaker& aBreaker);
89 /** Returns the Thai linebreaking class of the character at (*aChar),
90 searching backwards for the base character if it is foreign and of type CM.
91 @param aChar The position of the character within the string.
92 @param aStart The start of the string.
93 @param aBreaker The line breaker to query for line breaking class.
95 static TCharClassification DerivedClass(const TText* aChar,
96 const TText* aStart, const MLineBreaker& aBreaker);
98 Gets the line break rule for the previous and current character pair
99 @param aPrevClass Class of the previous character.
100 @param aClass Class of the current character.
101 @return the rule code corresponding to the input pair.
103 static TBool BreakAllowedBetween(
104 TCharClassification aPrevClass, TCharClassification aClass);
105 /** Returns whether a line break is allowed before the SA character at
107 @param aChar The position of the character within the string.
108 @param aStart The start of the string.
109 @param aBreaker The line breaker to query for line breaking class.
111 static TBool BreakAllowedAt(const TText* aChar,
112 const TText* aStart, const MLineBreaker& aBreaker);
115 Classification of each character
117 static const TUint8 KCharClassifications[KNumThaiCharacters];
120 Rules table of prev to next character
122 static const TUint32 KRules[EMaxClassification];
125 const TUint8 ThaiLinebreakRules::KCharClassifications[KNumThaiCharacters] =
127 EOutOfRange, // 0x0E00
128 EConsOther, // 0x0E01
129 EConsOther, // 0x0E02
130 EConsOther, // 0x0E03
131 EConsOther, // 0x0E04
132 EConsOther, // 0x0E05
133 EConsOther, // 0x0E06
134 EConsDigraph, // 0x0E07
135 EConsOther, // 0x0E08
136 EConsOther, // 0x0E09
137 EConsOther, // 0x0E0A
138 EConsOther, // 0x0E0B
139 EConsOther, // 0x0E0C
140 EConsOther, // 0x0E0D
141 EConsOther, // 0x0E0E
142 EConsOther, // 0x0E0F
144 EConsOther, // 0x0E10
145 EConsOther, // 0x0E11
146 EConsOther, // 0x0E12
147 EConsOther, // 0x0E13
148 EConsOther, // 0x0E14
149 EConsOther, // 0x0E15
150 EConsOther, // 0x0E16
151 EConsOther, // 0x0E17
152 EConsOther, // 0x0E18
153 EConsDigraph, // 0x0E19
154 EConsOther, // 0x0E1A
155 EConsOther, // 0x0E1B
156 EConsOther, // 0x0E1C
157 EConsOther, // 0x0E1D
158 EConsOther, // 0x0E1E
159 EConsOther, // 0x0E1F
161 EConsOther, // 0x0E20
162 EConsDigraph, // 0x0E21
163 EConsYoYak, // 0x0E22
164 EConsDigraph, // 0x0E23
165 EConsOther, // 0x0E24
166 EConsDigraph, // 0x0E25
167 EConsOther, // 0x0E26
168 EConsWoWean, // 0x0E27
169 EConsOther, // 0x0E28
170 EConsOther, // 0x0E29
171 EConsOther, // 0x0E2A
172 EConsHoHip, // 0x0E2B
173 EConsOther, // 0x0E2C
175 EConsOther, // 0x0E2E
176 EOutOfRange, // 0x0E2F
178 EPostVowelA, // 0x0E30
179 EDepMaiHanAkat, // 0x0E31
180 EPostVowelAA, // 0x0E32
181 EPostVowelOther,// 0x0E33
191 EOutOfRange, // 0x0E3B
192 EOutOfRange, // 0x0E3C
193 EOutOfRange, // 0x0E3D
194 EOutOfRange, // 0x0E3E
195 EOutOfRange, // 0x0E3F
203 EPostVowelOther,// 0x0E45
204 EOutOfRange, // 0x0E46
214 EOutOfRange, // 0x0E4F
216 EOutOfRange, // 0x0E50
217 EOutOfRange, // 0x0E51
218 EOutOfRange, // 0x0E52
219 EOutOfRange, // 0x0E53
220 EOutOfRange, // 0x0E54
221 EOutOfRange, // 0x0E55
222 EOutOfRange, // 0x0E56
223 EOutOfRange, // 0x0E57
224 EOutOfRange, // 0x0E58
225 EOutOfRange, // 0x0E59
226 EOutOfRange, // 0x0E5A
227 EOutOfRange // 0x0E5B
230 const TUint32 KNormalBreaksBeforeCons =
231 ThaiLinebreakRules::KPreVowelFlag
232 | ThaiLinebreakRules::KConsOtherFlag
233 | ThaiLinebreakRules::KConsDigraphFlag
234 | ThaiLinebreakRules::KConsHoHipFlag
235 | ThaiLinebreakRules::KOutOfRangeFlag;
236 const TUint32 KNormalBreaksBeforePostVowel =
237 ThaiLinebreakRules::KPreVowelFlag
238 | ThaiLinebreakRules::KPostVowelFlags
239 | ThaiLinebreakRules::KConsFlags
240 | ThaiLinebreakRules::KOutOfRangeFlag;
241 const TUint32 ThaiLinebreakRules::KRules[EMaxClassification] =
243 /* Prev Char EOutOfRange */
244 KAllFlags - KOutOfRangeFlag,
245 /* Prev Char EConsOAng */
246 KNormalBreaksBeforeCons,
247 /* Prev Char EConsYoYak */
248 KNormalBreaksBeforeCons,
249 /* Prev Char EConsHoHip */
250 KNormalBreaksBeforeCons - KConsDigraphFlag,
251 /* Prev Char EConsWoWean */
252 KNormalBreaksBeforeCons - KConsDigraphFlag - KConsHoHipFlag,
253 /* Prev Char EConsDigraph */
254 KNormalBreaksBeforeCons,
255 /* Prev Char EConsOther */
256 KNormalBreaksBeforeCons,
257 /* Prev Char EPostVowelA */
258 KNormalBreaksBeforePostVowel,
259 /* Prev Char EPostVowelAA */
260 KNormalBreaksBeforePostVowel - KPostVowelAFlag,
261 /* Prev Char EPostVowelOther */
262 KNormalBreaksBeforePostVowel,
263 /* Prev Char EPreVowel */
264 KPreVowelFlag | KPostVowelFlags | KOutOfRangeFlag,
265 /* Prev Char EDepMaiHanAkat */
266 KSpecialDepFlags | KPreVowelFlag | KPostVowelAAFlag
267 | KPostVowelAFlag | KOutOfRangeFlag,
268 /* Prev Char EDepSaraI */
269 KSpecialDepFlags | KPreVowelFlag | KPostVowelAAFlag
270 | KPostVowelAFlag | KOutOfRangeFlag,
271 /* Prev Char EDepOther */
272 KSpecialDepFlags | KPreVowelFlag | KPostVowelAAFlag
273 | KPostVowelAFlag | KConsOtherFlag | KConsDigraphFlag
274 | KConsWoWeanFlag | KConsHoHipFlag | KOutOfRangeFlag
277 ThaiLinebreakRules::TCharClassification ThaiLinebreakRules::Class(TInt a)
279 return static_cast<TCharClassification>(
280 (KThaiCodePageStart <= a && a < KThaiCodePageEnd) ?
281 KCharClassifications[a - KThaiCodePageStart] :
285 TBool ThaiLinebreakRules::IsCombiningChar(TInt aChar,
286 const MLineBreaker& aBreaker)
288 TUint dummy1, dummy2;
289 return aBreaker.LineBreakClass(aChar, dummy1, dummy2) == MLineBreaker::ECmLineBreakClass;
292 ThaiLinebreakRules::TCharClassification ThaiLinebreakRules::DerivedClass(
293 const TText* aChar, const TText* aStart, const MLineBreaker& aBreaker)
295 ThaiLinebreakRules::TCharClassification c = Class(*aChar);
296 while (c == EOutOfRange && aChar != aStart
297 && IsCombiningChar(*aChar, aBreaker))
305 TBool ThaiLinebreakRules::BreakAllowedBetween(
306 ThaiLinebreakRules::TCharClassification aClass,
307 ThaiLinebreakRules::TCharClassification aNextClass)
309 return KRules[aClass] & (1 << aNextClass);
312 TBool ThaiLinebreakRules::BreakAllowedAt(const TText* aChar,
313 const TText* aStart, const MLineBreaker& aBreaker)
315 __ASSERT_DEBUG(aStart < aChar, User::Invariant());
316 TCharClassification c = Class(*aChar);
317 if (c == EOutOfRange && IsCombiningChar(*aChar, aBreaker))
319 return BreakAllowedBetween(DerivedClass(aChar - 1, aStart, aBreaker), c);
323 Returns whether a line break is possible within a run of characters all having
324 the class ESaLineBreakClass (Complex content). Languages with Unicocde
325 characters having such a class include: Thai, Lao, Myanmar and Khmer. This
326 default implementation of the GetLineBreakInContext() method only supports the
327 Thai script. Breaks are determined in Thai based on a simple understanding of
328 syllable boundaries. When characters from the other unsupported Sa class
329 languages are found the method exits with EFalse.
331 The text to be searched, which is a contiguous run of characters of class SA
332 (or CM attatched to SA). The break position may be restricted further by
333 aMinBreakPos and aMaxBreakPos, but more text is provided for extra context
336 The start of the text to be considered for line breaks.
338 The end of the text to be considered for line breaks.
340 ETrue if aBreakPos is to be set with the first legal break position,
341 EFalse if aBreakPos is to be set with the last legal break position.
343 If break position found on exit its value is >= Min and <= Max
346 ETrue if and only if a legal break was found, EFalse otherwise.
350 EXPORT_C TBool MLineBreaker::GetLineBreakInContext(const TDesC16& aText,
351 TInt aMinBreakPos, TInt aMaxBreakPos, TBool aForwards,
352 TInt& aBreakPos) const
354 __ASSERT_DEBUG (0 <= aMinBreakPos && aMaxBreakPos <= aText.Length(),
355 Panic(ELineBreakPanic_InvalidInputParam));
357 TInt length = aText.Length();
359 if (aMinBreakPos < 1)
361 if (length - 1 < aMaxBreakPos)
362 aMaxBreakPos = length - 1;
363 if (aMaxBreakPos < aMinBreakPos)
366 const TText16* text = aText.Ptr();
368 if (*text == KZeroWidthSpace)
370 aBreakPos = aMinBreakPos;
373 else if (*(text+length-1) == KZeroWidthSpace)
376 TInt start = aForwards? aMinBreakPos : aMaxBreakPos;
377 TInt end = aForwards? aMaxBreakPos + 1 : aMinBreakPos - 1;
378 TInt direction = aForwards? 1 : -1;
379 for (TInt i = start; i != end; i += direction)
381 if (ThaiLinebreakRules::BreakAllowedAt(text + i, text, *this))