sl@0
|
1 |
#
|
sl@0
|
2 |
# Copyright (c) 1997-2009 Nokia Corporation and/or its subsidiary(-ies).
|
sl@0
|
3 |
# All rights reserved.
|
sl@0
|
4 |
# This component and the accompanying materials are made available
|
sl@0
|
5 |
# under the terms of "Eclipse Public License v1.0"
|
sl@0
|
6 |
# which accompanies this distribution, and is available
|
sl@0
|
7 |
# at the URL "http://www.eclipse.org/legal/epl-v10.html".
|
sl@0
|
8 |
#
|
sl@0
|
9 |
# Initial Contributors:
|
sl@0
|
10 |
# Nokia Corporation - initial contribution.
|
sl@0
|
11 |
#
|
sl@0
|
12 |
# Contributors:
|
sl@0
|
13 |
#
|
sl@0
|
14 |
# Description:
|
sl@0
|
15 |
#
|
sl@0
|
16 |
|
sl@0
|
17 |
use strict;
|
sl@0
|
18 |
use integer;
|
sl@0
|
19 |
|
sl@0
|
20 |
BEGIN
|
sl@0
|
21 |
{
|
sl@0
|
22 |
my $perlScriptPath=$0;
|
sl@0
|
23 |
my $os = $^O; #get the OS type
|
sl@0
|
24 |
#check OS type
|
sl@0
|
25 |
if($os=~/MSWin32/) #Windows OS
|
sl@0
|
26 |
{
|
sl@0
|
27 |
$perlScriptPath=~s/\//\\/g; # replace any forward-slashes with back-slashes
|
sl@0
|
28 |
$perlScriptPath=~s/(\\?)[^\\]+$/$1/; # get rid of this Perl-script's file-name
|
sl@0
|
29 |
}
|
sl@0
|
30 |
else #Unix OS
|
sl@0
|
31 |
{
|
sl@0
|
32 |
$perlScriptPath=~s/\\/\//g; # replace any back-slashes with forward-slashes
|
sl@0
|
33 |
$perlScriptPath=~s/(\/?)[^\/]+$/$1/; # get rid of this Perl-script's file-name
|
sl@0
|
34 |
}
|
sl@0
|
35 |
unshift(@INC, $perlScriptPath); # can't do "use lib $perlScriptPath" here as "use lib" only seems to work with *hard-coded* directory names
|
sl@0
|
36 |
}
|
sl@0
|
37 |
use PARSER;
|
sl@0
|
38 |
use WRITER;
|
sl@0
|
39 |
|
sl@0
|
40 |
$|=1; # ensures that any progress information sent to the screen is displayed immediately and not buffered
|
sl@0
|
41 |
if ((@ARGV==0) || ($ARGV[0]=~/\?/i) || ($ARGV[0]=~/-h/i) || ($ARGV[0]=~/help/i))
|
sl@0
|
42 |
{
|
sl@0
|
43 |
die("\nVersion 021\n\nCharacter-set conversion-table generating tool\nCopyright (c) 2000-2009 Nokia Corporation and/or its subsidiary(-ies).\n\nUsage:\n\n\tcnvtool <control-file> <source-file> <output-file> [options]\n\nwhere the following options are available (each has a short form and a long form which are shown below separated by a '|'):\n\n\t-s | -generateSourceCode\n\t-c | -columns(<a>: <b>, <c>)\n\t-r | -omitReplacementForUnconvertibleUnicodeCharacters\n\t-p | -cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed\n\t-u | -sourceFilesToSubtract(<a>, <b>, ...)\n\n");
|
sl@0
|
44 |
}
|
sl@0
|
45 |
my $generateSourceCode=0;
|
sl@0
|
46 |
my @columns=(2, 1, 2);
|
sl@0
|
47 |
my $omitReplacementForUnconvertibleUnicodeCharacters=0;
|
sl@0
|
48 |
my $cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed=0;
|
sl@0
|
49 |
my @sourceFilesToSubtract=();
|
sl@0
|
50 |
my $flattenHashAndSave=0; # this flag is not published for use outside of the CHARCONV component
|
sl@0
|
51 |
&extractCommandLineFlags(\$generateSourceCode, \@columns, \$omitReplacementForUnconvertibleUnicodeCharacters, \$cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed, \@sourceFilesToSubtract, \$flattenHashAndSave);
|
sl@0
|
52 |
(!$omitReplacementForUnconvertibleUnicodeCharacters || $generateSourceCode) or die("Error: bad combination of flags\n");
|
sl@0
|
53 |
my $controlFile=shift;
|
sl@0
|
54 |
my $sourceFile=shift;
|
sl@0
|
55 |
my $outputFile=shift;
|
sl@0
|
56 |
print("Generating $outputFile...\n");
|
sl@0
|
57 |
my $uid=0;
|
sl@0
|
58 |
my $endiannessAsText='';
|
sl@0
|
59 |
my $endianness=0;
|
sl@0
|
60 |
my $replacementForUnconvertibleUnicodeCharacters='';
|
sl@0
|
61 |
my @foreignVariableByteData=();
|
sl@0
|
62 |
my @foreignToUnicodeData=();
|
sl@0
|
63 |
my @unicodeToForeignData=();
|
sl@0
|
64 |
my %foreignCharacterCodes=();
|
sl@0
|
65 |
my %unicodeCharacterCodes=();
|
sl@0
|
66 |
my %preferredForeignCharacterCodesForConflictResolution=();
|
sl@0
|
67 |
my %preferredUnicodeCharacterCodesForConflictResolution=();
|
sl@0
|
68 |
my %additionalSubsetTables=();
|
sl@0
|
69 |
my %privateUseUnicodeCharacterSlotsUsed=();
|
sl@0
|
70 |
|
sl@0
|
71 |
print(" reading $controlFile...\n");
|
sl@0
|
72 |
open(CONTROL_FILE, "< $controlFile") or die("Error: could not open \"$controlFile\" for reading\n");
|
sl@0
|
73 |
&readHeaderFromControlFile(\*CONTROL_FILE, $controlFile, $generateSourceCode, \$uid, \$endiannessAsText, \$endianness, \$replacementForUnconvertibleUnicodeCharacters, $flattenHashAndSave);
|
sl@0
|
74 |
&readForeignVariableByteDataFromControlFile(\*CONTROL_FILE, $controlFile, \@foreignVariableByteData);
|
sl@0
|
75 |
&readOneDirectionDataFromControlFile(\*CONTROL_FILE, $controlFile, \@foreignToUnicodeData, \%preferredUnicodeCharacterCodesForConflictResolution, \%additionalSubsetTables, 1);
|
sl@0
|
76 |
&readOneDirectionDataFromControlFile(\*CONTROL_FILE, $controlFile, \@unicodeToForeignData, \%preferredForeignCharacterCodesForConflictResolution, \%additionalSubsetTables, 0);
|
sl@0
|
77 |
close(CONTROL_FILE) or die("Error: could not close \"$controlFile\"\n");
|
sl@0
|
78 |
|
sl@0
|
79 |
print(" reading $sourceFile...\n");
|
sl@0
|
80 |
open(SOURCE_FILE, "< $sourceFile") or die("Error: could not open \"$sourceFile\" for reading\n");
|
sl@0
|
81 |
&readSourceFile(\*SOURCE_FILE, $sourceFile, \%foreignCharacterCodes, \%unicodeCharacterCodes, \@columns, $cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed, \%privateUseUnicodeCharacterSlotsUsed, 0);
|
sl@0
|
82 |
close(SOURCE_FILE) or die("Error: could not close \"$sourceFile\"\n");
|
sl@0
|
83 |
|
sl@0
|
84 |
my $sourceFileToSubtract;
|
sl@0
|
85 |
foreach $sourceFileToSubtract (@sourceFilesToSubtract)
|
sl@0
|
86 |
{
|
sl@0
|
87 |
print(" subtracting from $sourceFileToSubtract...\n");
|
sl@0
|
88 |
open(SOURCE_FILE_TO_SUBTRACT, "< $sourceFileToSubtract") or die("Error: could not open \"$sourceFileToSubtract\" for reading\n");
|
sl@0
|
89 |
&readSourceFile(\*SOURCE_FILE_TO_SUBTRACT, $sourceFileToSubtract, \%foreignCharacterCodes, \%unicodeCharacterCodes, \@columns, $cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed, \%privateUseUnicodeCharacterSlotsUsed, 1);
|
sl@0
|
90 |
close(SOURCE_FILE_TO_SUBTRACT) or die("Error: could not close \"$sourceFileToSubtract\"\n");
|
sl@0
|
91 |
}
|
sl@0
|
92 |
|
sl@0
|
93 |
&warnIfAnyPrivateUseUnicodeCharacterSlotsBeingUsed(\%privateUseUnicodeCharacterSlotsUsed);
|
sl@0
|
94 |
&resolveConflictsAndFlattenArraysToScalars(\%foreignCharacterCodes, \%preferredForeignCharacterCodesForConflictResolution, 'Unicode', 'foreign');
|
sl@0
|
95 |
&resolveConflictsAndFlattenArraysToScalars(\%unicodeCharacterCodes, \%preferredUnicodeCharacterCodesForConflictResolution, 'foreign', 'Unicode');
|
sl@0
|
96 |
&checkForeignVariableByteData($endianness, \@foreignVariableByteData, \@foreignToUnicodeData);
|
sl@0
|
97 |
|
sl@0
|
98 |
print(" writing $outputFile...\n");
|
sl@0
|
99 |
open(OUTPUT_FILE, "> $outputFile") or die("Error: could not open \"$outputFile\" for writing\n");
|
sl@0
|
100 |
if ($generateSourceCode)
|
sl@0
|
101 |
{
|
sl@0
|
102 |
my @sourceCodeOfForeignToUnicodeIndexedTables16=();
|
sl@0
|
103 |
my @sourceCodeOfForeignToUnicodeKeyedTables1616=();
|
sl@0
|
104 |
my @sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_indexedEntries=();
|
sl@0
|
105 |
my @sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_keyedEntries=();
|
sl@0
|
106 |
|
sl@0
|
107 |
my @sourceCodeOfUnicodeToForeignIndexedTables16=();
|
sl@0
|
108 |
my @sourceCodeOfUnicodeToForeignKeyedTables1616=();
|
sl@0
|
109 |
my @sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_indexedEntries=();
|
sl@0
|
110 |
my @sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_keyedEntries=();
|
sl@0
|
111 |
|
sl@0
|
112 |
# new for 32 bit encoding begin
|
sl@0
|
113 |
my @sourceCodeOfForeignToUnicodeIndexedTables32=();
|
sl@0
|
114 |
my @sourceCodeOfForeignToUnicodeKeyedTables3232=();
|
sl@0
|
115 |
my @sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_indexedEntries=();
|
sl@0
|
116 |
my @sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_keyedEntries=();
|
sl@0
|
117 |
|
sl@0
|
118 |
my @sourceCodeOfUnicodeToForeignIndexedTables32=();
|
sl@0
|
119 |
my @sourceCodeOfUnicodeToForeignKeyedTables3232=();
|
sl@0
|
120 |
my @sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_indexedEntries=();
|
sl@0
|
121 |
my @sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_keyedEntries=();
|
sl@0
|
122 |
# new for 32 bit endcoding end
|
sl@0
|
123 |
|
sl@0
|
124 |
my @sourceCodeOfTopLevelStructures=();
|
sl@0
|
125 |
|
sl@0
|
126 |
&writeSourceCodeHeader(\*OUTPUT_FILE, $outputFile, $replacementForUnconvertibleUnicodeCharacters);
|
sl@0
|
127 |
&writeSourceCodeForeignVariableByteData(\@sourceCodeOfTopLevelStructures, \@foreignVariableByteData);
|
sl@0
|
128 |
&writeSourceCodeOneDirectionData(\@sourceCodeOfTopLevelStructures,
|
sl@0
|
129 |
\@sourceCodeOfForeignToUnicodeIndexedTables16, \@sourceCodeOfForeignToUnicodeKeyedTables1616, \@sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_indexedEntries, \@sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_keyedEntries,
|
sl@0
|
130 |
\@sourceCodeOfForeignToUnicodeIndexedTables32, \@sourceCodeOfForeignToUnicodeKeyedTables3232, \@sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_indexedEntries, \@sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_keyedEntries,
|
sl@0
|
131 |
\@foreignToUnicodeData, \%unicodeCharacterCodes, 1);
|
sl@0
|
132 |
&writeSourceCodeOneDirectionData(\@sourceCodeOfTopLevelStructures,
|
sl@0
|
133 |
\@sourceCodeOfUnicodeToForeignIndexedTables16, \@sourceCodeOfUnicodeToForeignKeyedTables1616, \@sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_indexedEntries, \@sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_keyedEntries,
|
sl@0
|
134 |
\@sourceCodeOfUnicodeToForeignIndexedTables32, \@sourceCodeOfUnicodeToForeignKeyedTables3232, \@sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_indexedEntries, \@sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_keyedEntries,
|
sl@0
|
135 |
\@unicodeToForeignData, \%foreignCharacterCodes, 0);
|
sl@0
|
136 |
&writeSourceCodeFinalStuff(\*OUTPUT_FILE,
|
sl@0
|
137 |
\@sourceCodeOfForeignToUnicodeIndexedTables16, \@sourceCodeOfForeignToUnicodeKeyedTables1616, \@sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_indexedEntries, \@sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_keyedEntries,
|
sl@0
|
138 |
\@sourceCodeOfUnicodeToForeignIndexedTables16, \@sourceCodeOfUnicodeToForeignKeyedTables1616, \@sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_indexedEntries, \@sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_keyedEntries,
|
sl@0
|
139 |
\@sourceCodeOfForeignToUnicodeIndexedTables32, \@sourceCodeOfForeignToUnicodeKeyedTables3232, \@sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_indexedEntries, \@sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_keyedEntries,
|
sl@0
|
140 |
\@sourceCodeOfUnicodeToForeignIndexedTables32, \@sourceCodeOfUnicodeToForeignKeyedTables3232, \@sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_indexedEntries, \@sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_keyedEntries,
|
sl@0
|
141 |
\@sourceCodeOfTopLevelStructures, $endiannessAsText, \%additionalSubsetTables);
|
sl@0
|
142 |
}
|
sl@0
|
143 |
elsif ($flattenHashAndSave)
|
sl@0
|
144 |
{
|
sl@0
|
145 |
binmode OUTPUT_FILE;
|
sl@0
|
146 |
#instead of calling the writeBinaryHeader, just write the data I need followed by
|
sl@0
|
147 |
# writeBinaryForeignVariableByteData...
|
sl@0
|
148 |
&write8(\*OUTPUT_FILE, $endianness);
|
sl@0
|
149 |
&write8(\*OUTPUT_FILE, length($replacementForUnconvertibleUnicodeCharacters));
|
sl@0
|
150 |
&writeString(\*OUTPUT_FILE, $replacementForUnconvertibleUnicodeCharacters);
|
sl@0
|
151 |
&writeBinaryForeignVariableByteData(\*OUTPUT_FILE, \@foreignVariableByteData);
|
sl@0
|
152 |
#choose %unicodeCharacterCodes and write the data as keypair
|
sl@0
|
153 |
my $key;
|
sl@0
|
154 |
my $rangekey;
|
sl@0
|
155 |
my $limit;
|
sl@0
|
156 |
foreach $key (keys(%unicodeCharacterCodes))
|
sl@0
|
157 |
{
|
sl@0
|
158 |
&write16(\*OUTPUT_FILE,$key);
|
sl@0
|
159 |
&write16(\*OUTPUT_FILE,$unicodeCharacterCodes{$key});
|
sl@0
|
160 |
}
|
sl@0
|
161 |
}
|
sl@0
|
162 |
else
|
sl@0
|
163 |
{
|
sl@0
|
164 |
binmode OUTPUT_FILE;
|
sl@0
|
165 |
&writeBinaryHeader(\*OUTPUT_FILE, $uid, $endianness, $replacementForUnconvertibleUnicodeCharacters);
|
sl@0
|
166 |
&writeBinaryForeignVariableByteData(\*OUTPUT_FILE, \@foreignVariableByteData);
|
sl@0
|
167 |
&writeBinaryOneDirectionData(\*OUTPUT_FILE, \@foreignToUnicodeData, \%unicodeCharacterCodes, 1);
|
sl@0
|
168 |
&writeBinaryOneDirectionData(\*OUTPUT_FILE, \@unicodeToForeignData, \%foreignCharacterCodes, 0);
|
sl@0
|
169 |
}
|
sl@0
|
170 |
close(OUTPUT_FILE) or die("Error: could not close \"$outputFile\"\n");
|
sl@0
|
171 |
print("complete\n\n");
|
sl@0
|
172 |
|
sl@0
|
173 |
sub extractCommandLineFlags()
|
sl@0
|
174 |
{
|
sl@0
|
175 |
my $generateSourceCode=shift;
|
sl@0
|
176 |
my $columns=shift;
|
sl@0
|
177 |
my $omitReplacementForUnconvertibleUnicodeCharacters=shift;
|
sl@0
|
178 |
my $cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed=shift;
|
sl@0
|
179 |
my $sourceFilesToSubtract=shift;
|
sl@0
|
180 |
my $flattenHashAndSave=shift;
|
sl@0
|
181 |
my $i;
|
sl@0
|
182 |
for ($i=0; $i<=$#ARGV;) # (i) not cache-ing $#ARGV into a variable as @ARGV may change length in this loop (ii) iterate forwards as some parameters may occupy more than one element in @ARGV
|
sl@0
|
183 |
{
|
sl@0
|
184 |
if (($ARGV[$i]=~/^-s$/i) || ($ARGV[$i]=~/^-generateSourceCode$/i))
|
sl@0
|
185 |
{
|
sl@0
|
186 |
if ($$flattenHashAndSave==1)
|
sl@0
|
187 |
{
|
sl@0
|
188 |
die ("Error: Cannot have -s and -b flags set at the same time");
|
sl@0
|
189 |
}
|
sl@0
|
190 |
else
|
sl@0
|
191 |
{
|
sl@0
|
192 |
splice(@ARGV, $i, 1);
|
sl@0
|
193 |
$$generateSourceCode=1;
|
sl@0
|
194 |
}
|
sl@0
|
195 |
}
|
sl@0
|
196 |
elsif (($ARGV[$i]=~/^-c\b(.*)$/i) || ($ARGV[$i]=~/^-columns\b(.*)$/i))
|
sl@0
|
197 |
{
|
sl@0
|
198 |
my $columnsData=$1;
|
sl@0
|
199 |
splice(@ARGV, $i, 1);
|
sl@0
|
200 |
for (;;)
|
sl@0
|
201 |
{
|
sl@0
|
202 |
if ($columnsData=~/^\s*\(\s*(\d+)\s*:\s*(\d+)\s*\,?\s*(\d+)\s*\)\s*$/)
|
sl@0
|
203 |
{
|
sl@0
|
204 |
@$columns=($1, $2, $3);
|
sl@0
|
205 |
last;
|
sl@0
|
206 |
}
|
sl@0
|
207 |
($#ARGV>=$i) or die("Error: bad \"-columns\" format\n");
|
sl@0
|
208 |
$columnsData.=(splice(@ARGV, $i, 1))[0];
|
sl@0
|
209 |
}
|
sl@0
|
210 |
}
|
sl@0
|
211 |
elsif (($ARGV[$i]=~/^-r$/i) || ($ARGV[$i]=~/^-omitReplacementForUnconvertibleUnicodeCharacters$/i))
|
sl@0
|
212 |
{
|
sl@0
|
213 |
splice(@ARGV, $i, 1);
|
sl@0
|
214 |
$$omitReplacementForUnconvertibleUnicodeCharacters=1;
|
sl@0
|
215 |
}
|
sl@0
|
216 |
elsif (($ARGV[$i]=~/^-p$/i) || ($ARGV[$i]=~/^-cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed$/i))
|
sl@0
|
217 |
{
|
sl@0
|
218 |
splice(@ARGV, $i, 1);
|
sl@0
|
219 |
$$cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed=1;
|
sl@0
|
220 |
}
|
sl@0
|
221 |
elsif (($ARGV[$i]=~/^-u\b(.*)$/i) || ($ARGV[$i]=~/^-sourceFilesToSubtract\b(.*)$/i))
|
sl@0
|
222 |
{
|
sl@0
|
223 |
my $sourceFilesData=$1;
|
sl@0
|
224 |
splice(@ARGV, $i, 1);
|
sl@0
|
225 |
for (;;)
|
sl@0
|
226 |
{
|
sl@0
|
227 |
if ($sourceFilesData=~/^\s*\(\s*(.+)\)\s*$/)
|
sl@0
|
228 |
{
|
sl@0
|
229 |
my $sourceFilesData=$1;
|
sl@0
|
230 |
@$sourceFilesToSubtract=split(/,/, $sourceFilesData, -1);
|
sl@0
|
231 |
my $j;
|
sl@0
|
232 |
for ($j=$#$sourceFilesToSubtract; $j>=0; --$j)
|
sl@0
|
233 |
{
|
sl@0
|
234 |
$sourceFilesToSubtract->[$j]=~s/^\s+//;
|
sl@0
|
235 |
$sourceFilesToSubtract->[$j]=~s/\s+$//;
|
sl@0
|
236 |
($sourceFilesToSubtract->[$j] ne '') or die("Error: bad \"-sourceFilesToSubtract\" format (1)\n");
|
sl@0
|
237 |
}
|
sl@0
|
238 |
last;
|
sl@0
|
239 |
}
|
sl@0
|
240 |
($#ARGV>=$i) or die("Error: bad \"-sourceFilesToSubtract\" format (2)\n");
|
sl@0
|
241 |
$sourceFilesData.=(splice(@ARGV, $i, 1))[0];
|
sl@0
|
242 |
}
|
sl@0
|
243 |
}
|
sl@0
|
244 |
elsif (($ARGV[$i]=~/^-f$/i) || ($ARGV[$i]=~/^-flattenHashAndSave$/i))
|
sl@0
|
245 |
{
|
sl@0
|
246 |
if ($$generateSourceCode==1)
|
sl@0
|
247 |
{
|
sl@0
|
248 |
die ("Error: Cannot have -s and -b flags set at the same time");
|
sl@0
|
249 |
}
|
sl@0
|
250 |
else
|
sl@0
|
251 |
{
|
sl@0
|
252 |
splice(@ARGV, $i, 1);
|
sl@0
|
253 |
$$flattenHashAndSave=1;
|
sl@0
|
254 |
}
|
sl@0
|
255 |
}
|
sl@0
|
256 |
else
|
sl@0
|
257 |
{
|
sl@0
|
258 |
++$i;
|
sl@0
|
259 |
}
|
sl@0
|
260 |
}
|
sl@0
|
261 |
}
|
sl@0
|
262 |
|
sl@0
|
263 |
sub algorithm
|
sl@0
|
264 |
{
|
sl@0
|
265 |
my $algorithmAsText=shift;
|
sl@0
|
266 |
if ($algorithmAsText=~/^Direct$/i)
|
sl@0
|
267 |
{
|
sl@0
|
268 |
return 0;
|
sl@0
|
269 |
}
|
sl@0
|
270 |
elsif ($algorithmAsText=~/^Offset$/i)
|
sl@0
|
271 |
{
|
sl@0
|
272 |
return 1;
|
sl@0
|
273 |
}
|
sl@0
|
274 |
elsif ($algorithmAsText=~/^IndexedTable16$/i)
|
sl@0
|
275 |
{
|
sl@0
|
276 |
return 2;
|
sl@0
|
277 |
}
|
sl@0
|
278 |
elsif ($algorithmAsText=~/^KeyedTable1616$/i)
|
sl@0
|
279 |
{
|
sl@0
|
280 |
return 3;
|
sl@0
|
281 |
}
|
sl@0
|
282 |
elsif ($algorithmAsText=~/^KeyedTable16OfIndexedTables16$/i)
|
sl@0
|
283 |
{
|
sl@0
|
284 |
return 4;
|
sl@0
|
285 |
}
|
sl@0
|
286 |
elsif ($algorithmAsText=~/^IndexedTable32$/i)
|
sl@0
|
287 |
{
|
sl@0
|
288 |
return 5;
|
sl@0
|
289 |
}
|
sl@0
|
290 |
elsif ($algorithmAsText=~/^KeyedTable3232$/i)
|
sl@0
|
291 |
{
|
sl@0
|
292 |
return 6;
|
sl@0
|
293 |
}
|
sl@0
|
294 |
elsif ($algorithmAsText=~/^KeyedTable32OfIndexedTables32$/i)
|
sl@0
|
295 |
{
|
sl@0
|
296 |
return 7;
|
sl@0
|
297 |
}
|
sl@0
|
298 |
else
|
sl@0
|
299 |
{
|
sl@0
|
300 |
return -1;
|
sl@0
|
301 |
}
|
sl@0
|
302 |
}
|
sl@0
|
303 |
|
sl@0
|
304 |
sub hexadecimalify
|
sl@0
|
305 |
{
|
sl@0
|
306 |
my $string=shift;
|
sl@0
|
307 |
my $result='';
|
sl@0
|
308 |
my $lengthOfString=length($string);
|
sl@0
|
309 |
my $i;
|
sl@0
|
310 |
for ($i=0; $i<$lengthOfString; ++$i)
|
sl@0
|
311 |
{
|
sl@0
|
312 |
$result.=sprintf("\\x%02x", (unpack('C', substr($string, $i, 1)))[0]);
|
sl@0
|
313 |
}
|
sl@0
|
314 |
return $result;
|
sl@0
|
315 |
}
|
sl@0
|
316 |
|
sl@0
|
317 |
sub readSourceFile
|
sl@0
|
318 |
{
|
sl@0
|
319 |
my $fileHandle=shift;
|
sl@0
|
320 |
my $fileName=shift;
|
sl@0
|
321 |
my $foreignCharacterCodes=shift;
|
sl@0
|
322 |
my $unicodeCharacterCodes=shift;
|
sl@0
|
323 |
my $columns=shift;
|
sl@0
|
324 |
my $cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed=shift;
|
sl@0
|
325 |
my $privateUseUnicodeCharacterSlotsUsed=shift;
|
sl@0
|
326 |
my $subtract=shift;
|
sl@0
|
327 |
my $foreignCharacterCodeProcessingCode='';
|
sl@0
|
328 |
if (!(($columns->[0]>0) && ($columns->[1]>0) && ($columns->[2]>0) && ($columns->[1]<=$columns->[0]) && ($columns->[2]<=$columns->[0]) && ($columns->[1]!=$columns->[2])))
|
sl@0
|
329 |
{
|
sl@0
|
330 |
close($fileHandle);
|
sl@0
|
331 |
die("Error: bad \"-columns\" data\n");
|
sl@0
|
332 |
}
|
sl@0
|
333 |
my $patternOfLineContainingCharacterCodes=join('\s+', ('0x([0-9a-f]+)') x $columns->[0]);
|
sl@0
|
334 |
my $line;
|
sl@0
|
335 |
my $strippedDownLine;
|
sl@0
|
336 |
for (;;)
|
sl@0
|
337 |
{
|
sl@0
|
338 |
($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
|
sl@0
|
339 |
if (($strippedDownLine eq '')||(substr($strippedDownLine,0,1) eq chr(26))) # if there are no more lines in the file or if we encountered EOF character
|
sl@0
|
340 |
{
|
sl@0
|
341 |
last;
|
sl@0
|
342 |
}
|
sl@0
|
343 |
if ($strippedDownLine=~/^SET_FOREIGN_CHARACTER_CODE_PROCESSING_CODE\s+(.*)$/i)
|
sl@0
|
344 |
{
|
sl@0
|
345 |
$foreignCharacterCodeProcessingCode=$1;
|
sl@0
|
346 |
}
|
sl@0
|
347 |
elsif ($strippedDownLine=~/^$patternOfLineContainingCharacterCodes$/i)
|
sl@0
|
348 |
{
|
sl@0
|
349 |
no strict 'refs'; # so that we can use symbolic references for $1, $2, etc
|
sl@0
|
350 |
my $foreignCharacterCode=hex(${$columns->[1]});
|
sl@0
|
351 |
my $unicodeCharacterCode=hex(${$columns->[2]});
|
sl@0
|
352 |
use strict 'refs';
|
sl@0
|
353 |
if ($foreignCharacterCodeProcessingCode ne '')
|
sl@0
|
354 |
{
|
sl@0
|
355 |
$foreignCharacterCode=eval($foreignCharacterCodeProcessingCode);
|
sl@0
|
356 |
}
|
sl@0
|
357 |
my $handleConversionPair=1;
|
sl@0
|
358 |
if ((($unicodeCharacterCode>=0xe000) && ($unicodeCharacterCode<=0xf8ff)) || (($unicodeCharacterCode>=0xf0000) && ($unicodeCharacterCode<=0x10ffff)))
|
sl@0
|
359 |
{
|
sl@0
|
360 |
if ($cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed)
|
sl@0
|
361 |
{
|
sl@0
|
362 |
$handleConversionPair=0;
|
sl@0
|
363 |
}
|
sl@0
|
364 |
else
|
sl@0
|
365 |
{
|
sl@0
|
366 |
if ($subtract)
|
sl@0
|
367 |
{
|
sl@0
|
368 |
delete $privateUseUnicodeCharacterSlotsUsed->{$unicodeCharacterCode};
|
sl@0
|
369 |
}
|
sl@0
|
370 |
else
|
sl@0
|
371 |
{
|
sl@0
|
372 |
$privateUseUnicodeCharacterSlotsUsed->{$unicodeCharacterCode}=1;
|
sl@0
|
373 |
}
|
sl@0
|
374 |
}
|
sl@0
|
375 |
}
|
sl@0
|
376 |
if ($handleConversionPair)
|
sl@0
|
377 |
{
|
sl@0
|
378 |
if ($subtract)
|
sl@0
|
379 |
{
|
sl@0
|
380 |
if (!defined($foreignCharacterCodes->{$unicodeCharacterCode}->{$foreignCharacterCode}))
|
sl@0
|
381 |
{
|
sl@0
|
382 |
close($fileHandle);
|
sl@0
|
383 |
die('Error: cannot subtract conversion pair ['.sprintf('foreign 0x%x, Unicode 0x%04x', $foreignCharacterCode, $unicodeCharacterCode)."] as it does not occur in \"$fileName\"\n");
|
sl@0
|
384 |
}
|
sl@0
|
385 |
if (!defined($unicodeCharacterCodes->{$foreignCharacterCode}->{$unicodeCharacterCode}))
|
sl@0
|
386 |
{
|
sl@0
|
387 |
close($fileHandle);
|
sl@0
|
388 |
die('Error: cannot subtract conversion pair ['.sprintf('Unicode 0x%04x, foreign 0x%x', $unicodeCharacterCode, $foreignCharacterCode)."] as it does not occur in \"$fileName\"\n");
|
sl@0
|
389 |
}
|
sl@0
|
390 |
delete $foreignCharacterCodes->{$unicodeCharacterCode}->{$foreignCharacterCode};
|
sl@0
|
391 |
if (keys(%{$foreignCharacterCodes->{$unicodeCharacterCode}})==0)
|
sl@0
|
392 |
{
|
sl@0
|
393 |
delete $foreignCharacterCodes->{$unicodeCharacterCode};
|
sl@0
|
394 |
}
|
sl@0
|
395 |
delete $unicodeCharacterCodes->{$foreignCharacterCode}->{$unicodeCharacterCode};
|
sl@0
|
396 |
if (keys(%{$unicodeCharacterCodes->{$foreignCharacterCode}})==0)
|
sl@0
|
397 |
{
|
sl@0
|
398 |
delete $unicodeCharacterCodes->{$foreignCharacterCode};
|
sl@0
|
399 |
}
|
sl@0
|
400 |
}
|
sl@0
|
401 |
else
|
sl@0
|
402 |
{
|
sl@0
|
403 |
if (defined($foreignCharacterCodes->{$unicodeCharacterCode}->{$foreignCharacterCode}))
|
sl@0
|
404 |
{
|
sl@0
|
405 |
close($fileHandle);
|
sl@0
|
406 |
die('Error: same conversion pair ['.sprintf('foreign 0x%x, Unicode 0x%04x', $foreignCharacterCode, $unicodeCharacterCode)."] occurs more than once in \"$fileName\"\n");
|
sl@0
|
407 |
}
|
sl@0
|
408 |
if (defined($unicodeCharacterCodes->{$foreignCharacterCode}->{$unicodeCharacterCode}))
|
sl@0
|
409 |
{
|
sl@0
|
410 |
close($fileHandle);
|
sl@0
|
411 |
die('Error: same conversion pair ['.sprintf('Unicode 0x%04x, foreign 0x%x', $unicodeCharacterCode, $foreignCharacterCode)."] occurs more than once in \"$fileName\"\n");
|
sl@0
|
412 |
}
|
sl@0
|
413 |
$foreignCharacterCodes->{$unicodeCharacterCode}->{$foreignCharacterCode}=1;
|
sl@0
|
414 |
$unicodeCharacterCodes->{$foreignCharacterCode}->{$unicodeCharacterCode}=1;
|
sl@0
|
415 |
}
|
sl@0
|
416 |
}
|
sl@0
|
417 |
}
|
sl@0
|
418 |
elsif ($line!~/^\s*0x([0-9a-f]+)\s*#\s*undefined.*$/i)
|
sl@0
|
419 |
{
|
sl@0
|
420 |
close($fileHandle);
|
sl@0
|
421 |
die("Error: unexpected line in \"$fileName\":\n $line\n");
|
sl@0
|
422 |
}
|
sl@0
|
423 |
}
|
sl@0
|
424 |
}
|
sl@0
|
425 |
|
sl@0
|
426 |
sub readHeaderFromControlFile
|
sl@0
|
427 |
{
|
sl@0
|
428 |
my $fileHandle=shift;
|
sl@0
|
429 |
my $fileName=shift;
|
sl@0
|
430 |
my $generateSourceCode=shift;
|
sl@0
|
431 |
my $uid=shift;
|
sl@0
|
432 |
my $endiannessAsText=shift;
|
sl@0
|
433 |
my $endianness=shift;
|
sl@0
|
434 |
my $replacementForUnconvertibleUnicodeCharacters=shift;
|
sl@0
|
435 |
my $flattenHashAndSave=shift;
|
sl@0
|
436 |
my $line;
|
sl@0
|
437 |
my $strippedDownLine;
|
sl@0
|
438 |
($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
|
sl@0
|
439 |
if ($strippedDownLine=~/^UID\s+0x([0-9a-f]+)$/i)
|
sl@0
|
440 |
{
|
sl@0
|
441 |
if ($generateSourceCode)
|
sl@0
|
442 |
{
|
sl@0
|
443 |
print(STDERR "Warning: \"UID\" keyword should not be used with \"-generateSourceCode\" flag - specify the UID in the MMP file\n");
|
sl@0
|
444 |
}
|
sl@0
|
445 |
$$uid=hex($1);
|
sl@0
|
446 |
($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
|
sl@0
|
447 |
}
|
sl@0
|
448 |
else
|
sl@0
|
449 |
{
|
sl@0
|
450 |
if (!$generateSourceCode && !$flattenHashAndSave)
|
sl@0
|
451 |
{
|
sl@0
|
452 |
close($fileHandle);
|
sl@0
|
453 |
die("Error: unexpected line in \"$fileName\" (\"UID\" keyword expected):\n $line\n");
|
sl@0
|
454 |
}
|
sl@0
|
455 |
}
|
sl@0
|
456 |
if ($strippedDownLine=~/^Name\s+"(.+?)"$/i)
|
sl@0
|
457 |
{
|
sl@0
|
458 |
print(STDERR "Warning: obsolete keyword \"Name\" used\n");
|
sl@0
|
459 |
($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
|
sl@0
|
460 |
}
|
sl@0
|
461 |
if ($strippedDownLine!~/^Endianness\s+(\w+)$/i)
|
sl@0
|
462 |
{
|
sl@0
|
463 |
close($fileHandle);
|
sl@0
|
464 |
die("Error: unexpected line in \"$fileName\" (\"Endianness\" keyword expected):\n $line\n");
|
sl@0
|
465 |
}
|
sl@0
|
466 |
$$endiannessAsText=$1;
|
sl@0
|
467 |
if ($$endiannessAsText=~/Unspecified/i)
|
sl@0
|
468 |
{
|
sl@0
|
469 |
$$endianness=0; # SCnvConversionData::EUnspecified
|
sl@0
|
470 |
}
|
sl@0
|
471 |
elsif ($$endiannessAsText=~/FixedLittleEndian/i)
|
sl@0
|
472 |
{
|
sl@0
|
473 |
$$endianness=1; # SCnvConversionData::EFixedLittleEndian
|
sl@0
|
474 |
}
|
sl@0
|
475 |
elsif ($$endiannessAsText=~/FixedBigEndian/i)
|
sl@0
|
476 |
{
|
sl@0
|
477 |
$$endianness=2; # SCnvConversionData::EFixedBigEndian
|
sl@0
|
478 |
}
|
sl@0
|
479 |
else
|
sl@0
|
480 |
{
|
sl@0
|
481 |
close($fileHandle);
|
sl@0
|
482 |
die("Error: \"$$endiannessAsText\" is not a legal value for \"Endianness\"\n");
|
sl@0
|
483 |
}
|
sl@0
|
484 |
($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
|
sl@0
|
485 |
if ($strippedDownLine!~/^ReplacementForUnconvertibleUnicodeCharacters\s+(.*?)$/i)
|
sl@0
|
486 |
{
|
sl@0
|
487 |
close($fileHandle);
|
sl@0
|
488 |
die("Error: unexpected line in \"$fileName\" (\"ReplacementForUnconvertibleUnicodeCharacters\" keyword expected):\n $line\n");
|
sl@0
|
489 |
}
|
sl@0
|
490 |
$$replacementForUnconvertibleUnicodeCharacters='';
|
sl@0
|
491 |
my $remainderOfXxx=$1;
|
sl@0
|
492 |
while ($remainderOfXxx ne '')
|
sl@0
|
493 |
{
|
sl@0
|
494 |
if ($remainderOfXxx!~/^0x([0-9a-f]{1,2})\s*(.*)$/i)
|
sl@0
|
495 |
{
|
sl@0
|
496 |
close($fileHandle);
|
sl@0
|
497 |
die("Error: unexpected line in \"$fileName\":\n $line\n");
|
sl@0
|
498 |
}
|
sl@0
|
499 |
$$replacementForUnconvertibleUnicodeCharacters.=pack("C", hex($1));
|
sl@0
|
500 |
$remainderOfXxx=$2;
|
sl@0
|
501 |
}
|
sl@0
|
502 |
my @temp=&nextNonEmptyStrippedDownLine($fileHandle);
|
sl@0
|
503 |
if ($temp[1]=~/^ForeignCharacterCodeProcessingCode/i)
|
sl@0
|
504 |
{
|
sl@0
|
505 |
print(STDERR "Warning: obsolete keyword \"ForeignCharacterCodeProcessingCode\" used\n");
|
sl@0
|
506 |
}
|
sl@0
|
507 |
else
|
sl@0
|
508 |
{
|
sl@0
|
509 |
ungetNonEmptyStrippedDownLine(@temp)
|
sl@0
|
510 |
}
|
sl@0
|
511 |
}
|
sl@0
|
512 |
|
sl@0
|
513 |
sub readForeignVariableByteDataFromControlFile
|
sl@0
|
514 |
{
|
sl@0
|
515 |
my $fileHandle=shift;
|
sl@0
|
516 |
my $fileName=shift;
|
sl@0
|
517 |
my $foreignVariableByteData=shift;
|
sl@0
|
518 |
my $line;
|
sl@0
|
519 |
my $strippedDownLine;
|
sl@0
|
520 |
($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
|
sl@0
|
521 |
if ($strippedDownLine!~/^StartForeignVariableByteData$/i)
|
sl@0
|
522 |
{
|
sl@0
|
523 |
close($fileHandle);
|
sl@0
|
524 |
die("Error: unexpected line in \"$fileName\":\n $line\n");
|
sl@0
|
525 |
}
|
sl@0
|
526 |
|
sl@0
|
527 |
for (;;)
|
sl@0
|
528 |
{
|
sl@0
|
529 |
($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
|
sl@0
|
530 |
if ($strippedDownLine=~/^EndForeignVariableByteData$/i)
|
sl@0
|
531 |
{
|
sl@0
|
532 |
last;
|
sl@0
|
533 |
}
|
sl@0
|
534 |
if ($strippedDownLine!~/^0x([0-9a-f]+)\s+0x([0-9a-f]+)\s+(\d+)$/i)
|
sl@0
|
535 |
{
|
sl@0
|
536 |
close($fileHandle);
|
sl@0
|
537 |
die("Error: unexpected line in \"$fileName\":\n $line\n");
|
sl@0
|
538 |
}
|
sl@0
|
539 |
my $firstInitialByteValueInRange=hex($1);
|
sl@0
|
540 |
my $lastInitialByteValueInRange=hex($2);
|
sl@0
|
541 |
my $numberOfSubsequentBytes=$3;
|
sl@0
|
542 |
if ($firstInitialByteValueInRange>0xff)
|
sl@0
|
543 |
{
|
sl@0
|
544 |
close($fileHandle);
|
sl@0
|
545 |
die("Error: firstInitialByteValueInRange ".sprintf("0x%02x", $firstInitialByteValueInRange)." does not fit in a single byte\n");
|
sl@0
|
546 |
}
|
sl@0
|
547 |
if ($lastInitialByteValueInRange>0xff)
|
sl@0
|
548 |
{
|
sl@0
|
549 |
close($fileHandle);
|
sl@0
|
550 |
die("Error: lastInitialByteValueInRange ".sprintf("0x%02x", $lastInitialByteValueInRange)." does not fit in a single byte\n");
|
sl@0
|
551 |
}
|
sl@0
|
552 |
if ($lastInitialByteValueInRange<$firstInitialByteValueInRange)
|
sl@0
|
553 |
{
|
sl@0
|
554 |
close($fileHandle);
|
sl@0
|
555 |
die("Error: lastInitialByteValueInRange ".sprintf("0x%02x", $lastInitialByteValueInRange)." is less than firstInitialByteValueInRange ".sprintf("0x%02x", $firstInitialByteValueInRange)."\n");
|
sl@0
|
556 |
}
|
sl@0
|
557 |
push(@$foreignVariableByteData, [$firstInitialByteValueInRange, $lastInitialByteValueInRange, $numberOfSubsequentBytes]);
|
sl@0
|
558 |
}
|
sl@0
|
559 |
}
|
sl@0
|
560 |
|
sl@0
|
561 |
sub readOneDirectionDataFromControlFile
|
sl@0
|
562 |
{
|
sl@0
|
563 |
my $fileHandle=shift;
|
sl@0
|
564 |
my $fileName=shift;
|
sl@0
|
565 |
my $oneDirectionData=shift;
|
sl@0
|
566 |
my $preferredCharacterCodesForConflictResolution=shift;
|
sl@0
|
567 |
my $additionalSubsetTables=shift;
|
sl@0
|
568 |
my $outputIsUnicode=shift;
|
sl@0
|
569 |
my $source=$outputIsUnicode? 'foreign': 'Unicode';
|
sl@0
|
570 |
my $target=$outputIsUnicode? 'Unicode': 'foreign';
|
sl@0
|
571 |
my $middlePortionOfKeyWords=$outputIsUnicode? "ForeignToUnicode": "UnicodeToForeign";
|
sl@0
|
572 |
my $extraPatternToMatch=$outputIsUnicode? '()': '\s+(\d+)';
|
sl@0
|
573 |
my $line;
|
sl@0
|
574 |
my $strippedDownLine;
|
sl@0
|
575 |
($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
|
sl@0
|
576 |
if ($strippedDownLine!~/^Start${middlePortionOfKeyWords}Data$/i)
|
sl@0
|
577 |
{
|
sl@0
|
578 |
close($fileHandle);
|
sl@0
|
579 |
die("Error: unexpected line in \"$fileName\":\n $line\n");
|
sl@0
|
580 |
}
|
sl@0
|
581 |
my $doingConflictResolution=0;
|
sl@0
|
582 |
for (;;)
|
sl@0
|
583 |
{
|
sl@0
|
584 |
($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
|
sl@0
|
585 |
if ($strippedDownLine=~/^End${middlePortionOfKeyWords}Data$/i)
|
sl@0
|
586 |
{
|
sl@0
|
587 |
last;
|
sl@0
|
588 |
}
|
sl@0
|
589 |
if ($strippedDownLine=~/^ConflictResolution$/i)
|
sl@0
|
590 |
{
|
sl@0
|
591 |
$doingConflictResolution=1;
|
sl@0
|
592 |
}
|
sl@0
|
593 |
elsif ($doingConflictResolution)
|
sl@0
|
594 |
{
|
sl@0
|
595 |
if ($strippedDownLine!~/^0x([0-9a-f]+)\s+0x([0-9a-f]+)$/i)
|
sl@0
|
596 |
{
|
sl@0
|
597 |
close($fileHandle);
|
sl@0
|
598 |
die("Error: unexpected line in \"$fileName\":\n $line\n");
|
sl@0
|
599 |
}
|
sl@0
|
600 |
my $sourceCharacterCodeToResolve=hex($1);
|
sl@0
|
601 |
my $targetCharacterCodePreferred=hex($2);
|
sl@0
|
602 |
$preferredCharacterCodesForConflictResolution->{$sourceCharacterCodeToResolve}=$targetCharacterCodePreferred;
|
sl@0
|
603 |
}
|
sl@0
|
604 |
elsif ($strippedDownLine=~/^(Start|End)AdditionalSubsetTable\s+(.*)$/i)
|
sl@0
|
605 |
{
|
sl@0
|
606 |
my $prefix=$1;
|
sl@0
|
607 |
my $nameOfAdditionalSubsetTable=$2;
|
sl@0
|
608 |
my $index=$prefix=~(/^Start$/i)? 0: 1;
|
sl@0
|
609 |
if (!$outputIsUnicode)
|
sl@0
|
610 |
{
|
sl@0
|
611 |
$index+=2;
|
sl@0
|
612 |
}
|
sl@0
|
613 |
if (defined($additionalSubsetTables{$nameOfAdditionalSubsetTable}->[$index]))
|
sl@0
|
614 |
{
|
sl@0
|
615 |
close($fileHandle);
|
sl@0
|
616 |
die("Error: multiple redefinition of \"${prefix}AdditionalSubsetTable $nameOfAdditionalSubsetTable\"\n");
|
sl@0
|
617 |
}
|
sl@0
|
618 |
$additionalSubsetTables{$nameOfAdditionalSubsetTable}->[$index]=@$oneDirectionData;
|
sl@0
|
619 |
}
|
sl@0
|
620 |
else
|
sl@0
|
621 |
{
|
sl@0
|
622 |
if ($strippedDownLine!~/^(\d+)\s+(\d+)\s+0x([0-9a-f]+)\s+0x([0-9a-f]+)\s+(\w+)$extraPatternToMatch\s+\{(.*?)\}$/i)
|
sl@0
|
623 |
{
|
sl@0
|
624 |
close($fileHandle);
|
sl@0
|
625 |
die("Error: unexpected line in \"$fileName\":\n $line\n");
|
sl@0
|
626 |
}
|
sl@0
|
627 |
my $includePriority=$1;
|
sl@0
|
628 |
my $searchPriority=$2;
|
sl@0
|
629 |
my $firstInputCharacterCodeInRange=hex($3);
|
sl@0
|
630 |
my $lastInputCharacterCodeInRange=hex($4);
|
sl@0
|
631 |
my $algorithmAsText=$5;
|
sl@0
|
632 |
my $sizeOfOutputCharacterCodeInBytes=$6;
|
sl@0
|
633 |
my $parameters=$7;
|
sl@0
|
634 |
if ($lastInputCharacterCodeInRange<$firstInputCharacterCodeInRange)
|
sl@0
|
635 |
{
|
sl@0
|
636 |
close($fileHandle);
|
sl@0
|
637 |
die("Error: lastInputCharacterCodeInRange ".sprintf("0x%02x", $lastInputCharacterCodeInRange)." is less than firstInputCharacterCodeInRange ".sprintf("0x%02x", $firstInputCharacterCodeInRange)."\n");
|
sl@0
|
638 |
}
|
sl@0
|
639 |
my $algorithm=&algorithm($algorithmAsText);
|
sl@0
|
640 |
if ($algorithm<0)
|
sl@0
|
641 |
{
|
sl@0
|
642 |
close($fileHandle);
|
sl@0
|
643 |
die("Error: unexpected algorithm \"$algorithmAsText\"\n");
|
sl@0
|
644 |
}
|
sl@0
|
645 |
my $rangeData=[$includePriority, $searchPriority, $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange, $algorithm];
|
sl@0
|
646 |
if (!$outputIsUnicode)
|
sl@0
|
647 |
{
|
sl@0
|
648 |
push(@$rangeData, $sizeOfOutputCharacterCodeInBytes);
|
sl@0
|
649 |
}
|
sl@0
|
650 |
push(@$rangeData, $parameters);
|
sl@0
|
651 |
push(@$oneDirectionData, $rangeData);
|
sl@0
|
652 |
}
|
sl@0
|
653 |
}
|
sl@0
|
654 |
}
|
sl@0
|
655 |
|
sl@0
|
656 |
sub warnIfAnyPrivateUseUnicodeCharacterSlotsBeingUsed
|
sl@0
|
657 |
{
|
sl@0
|
658 |
my $privateUseUnicodeCharacterSlotsUsed=shift;
|
sl@0
|
659 |
my @sortedPrivateUseUnicodeCharacterSlotsUsed=sort({$a<=>$b} keys(%$privateUseUnicodeCharacterSlotsUsed));
|
sl@0
|
660 |
if (@sortedPrivateUseUnicodeCharacterSlotsUsed>0)
|
sl@0
|
661 |
{
|
sl@0
|
662 |
my $lastPrivateUseUnicodeCharacterSlotUsed=$sortedPrivateUseUnicodeCharacterSlotsUsed[0];
|
sl@0
|
663 |
my $asText=sprintf('0x%04x', $lastPrivateUseUnicodeCharacterSlotUsed);
|
sl@0
|
664 |
my @asText=($asText);
|
sl@0
|
665 |
my $i;
|
sl@0
|
666 |
for ($i=1; $i<@sortedPrivateUseUnicodeCharacterSlotsUsed; ++$i) # this loop starts from 1 not 0 as we have already dealt with $sortedPrivateUseUnicodeCharacterSlotsUsed[0]
|
sl@0
|
667 |
{
|
sl@0
|
668 |
($sortedPrivateUseUnicodeCharacterSlotsUsed[$i]>$lastPrivateUseUnicodeCharacterSlotUsed) or die("Error: internal error 1\n");
|
sl@0
|
669 |
if ($sortedPrivateUseUnicodeCharacterSlotsUsed[$i]>$lastPrivateUseUnicodeCharacterSlotUsed+1)
|
sl@0
|
670 |
{
|
sl@0
|
671 |
$asText=sprintf('0x%04x', $lastPrivateUseUnicodeCharacterSlotUsed);
|
sl@0
|
672 |
if ($asText[-1] ne $asText)
|
sl@0
|
673 |
{
|
sl@0
|
674 |
$asText[-1].='-'.$asText;
|
sl@0
|
675 |
}
|
sl@0
|
676 |
push(@asText, sprintf('0x%04x', $sortedPrivateUseUnicodeCharacterSlotsUsed[$i]));
|
sl@0
|
677 |
}
|
sl@0
|
678 |
$lastPrivateUseUnicodeCharacterSlotUsed=$sortedPrivateUseUnicodeCharacterSlotsUsed[$i];
|
sl@0
|
679 |
}
|
sl@0
|
680 |
$asText=sprintf('0x%04x', $lastPrivateUseUnicodeCharacterSlotUsed);
|
sl@0
|
681 |
if ($asText[-1] ne $asText)
|
sl@0
|
682 |
{
|
sl@0
|
683 |
$asText[-1].='-'.$asText;
|
sl@0
|
684 |
}
|
sl@0
|
685 |
print(STDERR 'Warning: the following private-use Unicode character slots were used: ['.join(', ', @asText)."]\n");
|
sl@0
|
686 |
}
|
sl@0
|
687 |
}
|
sl@0
|
688 |
|
sl@0
|
689 |
sub resolveConflictsAndFlattenArraysToScalars
|
sl@0
|
690 |
{
|
sl@0
|
691 |
my $characterCodes=shift;
|
sl@0
|
692 |
my $preferredCharacterCodesForConflictResolution=shift;
|
sl@0
|
693 |
my $source=shift;
|
sl@0
|
694 |
my $target=shift;
|
sl@0
|
695 |
my $sourceCharacterCode;
|
sl@0
|
696 |
my $candidateTargetCharacterCodes;
|
sl@0
|
697 |
while (($sourceCharacterCode, $candidateTargetCharacterCodes)=each(%$characterCodes))
|
sl@0
|
698 |
{
|
sl@0
|
699 |
my @candidateTargetCharacterCodes=keys(%$candidateTargetCharacterCodes);
|
sl@0
|
700 |
if (@candidateTargetCharacterCodes<1)
|
sl@0
|
701 |
{
|
sl@0
|
702 |
die("Error: internal error 2\n");
|
sl@0
|
703 |
}
|
sl@0
|
704 |
if (@candidateTargetCharacterCodes==1)
|
sl@0
|
705 |
{
|
sl@0
|
706 |
$characterCodes->{$sourceCharacterCode}=$candidateTargetCharacterCodes[0];
|
sl@0
|
707 |
}
|
sl@0
|
708 |
else
|
sl@0
|
709 |
{
|
sl@0
|
710 |
if (!defined($preferredCharacterCodesForConflictResolution->{$sourceCharacterCode}))
|
sl@0
|
711 |
{
|
sl@0
|
712 |
die("Error: no preferred $target character code is specified for conflict resolution for the $source character code ".sprintf("0x%08x", $sourceCharacterCode)."\n");
|
sl@0
|
713 |
}
|
sl@0
|
714 |
my $preferredCharacterCodeIsNotACandidateForConflictResolution=1;
|
sl@0
|
715 |
my $candidateTargetCharacterCode;
|
sl@0
|
716 |
foreach $candidateTargetCharacterCode (@candidateTargetCharacterCodes)
|
sl@0
|
717 |
{
|
sl@0
|
718 |
if ($preferredCharacterCodesForConflictResolution->{$sourceCharacterCode}==$candidateTargetCharacterCode)
|
sl@0
|
719 |
{
|
sl@0
|
720 |
$preferredCharacterCodeIsNotACandidateForConflictResolution=0;
|
sl@0
|
721 |
last;
|
sl@0
|
722 |
}
|
sl@0
|
723 |
}
|
sl@0
|
724 |
if ($preferredCharacterCodeIsNotACandidateForConflictResolution)
|
sl@0
|
725 |
{
|
sl@0
|
726 |
die("Error: the preferred $target character code ".sprintf("0x%08x", $preferredCharacterCodesForConflictResolution->{$sourceCharacterCode})." is not a candidate for conflict resolution for the $source character code ".sprintf("0x%08x", $sourceCharacterCode)."\n");
|
sl@0
|
727 |
}
|
sl@0
|
728 |
$characterCodes->{$sourceCharacterCode}=$preferredCharacterCodesForConflictResolution->{$sourceCharacterCode};
|
sl@0
|
729 |
delete $preferredCharacterCodesForConflictResolution->{$sourceCharacterCode};
|
sl@0
|
730 |
}
|
sl@0
|
731 |
}
|
sl@0
|
732 |
my $numberOfPreferredCharacterCodesForConflictResolution=keys(%$preferredCharacterCodesForConflictResolution);
|
sl@0
|
733 |
if ($numberOfPreferredCharacterCodesForConflictResolution!=0)
|
sl@0
|
734 |
{
|
sl@0
|
735 |
print(STDERR "Warning: there are $numberOfPreferredCharacterCodesForConflictResolution $target preferred character codes specified for which there are no conflicts to resolve\n");
|
sl@0
|
736 |
}
|
sl@0
|
737 |
}
|
sl@0
|
738 |
|
sl@0
|
739 |
sub checkForeignVariableByteData
|
sl@0
|
740 |
{
|
sl@0
|
741 |
my $endianness=shift;
|
sl@0
|
742 |
my $foreignVariableByteData=shift;
|
sl@0
|
743 |
my $foreignToUnicodeData=shift;
|
sl@0
|
744 |
my $rangeData;
|
sl@0
|
745 |
my %initialForeignBytes=();
|
sl@0
|
746 |
foreach $rangeData (@$foreignVariableByteData)
|
sl@0
|
747 |
{
|
sl@0
|
748 |
my $initialByte;
|
sl@0
|
749 |
for ($initialByte=$rangeData->[0]; $initialByte<=$rangeData->[1]; ++$initialByte)
|
sl@0
|
750 |
{
|
sl@0
|
751 |
if (defined($initialForeignBytes{$initialByte}))
|
sl@0
|
752 |
{
|
sl@0
|
753 |
die("Error: the number of bytes subsequent to the initial foreign-byte $initialForeignBytes{$initialByte} is defined more than once\n");
|
sl@0
|
754 |
}
|
sl@0
|
755 |
$initialForeignBytes{$initialByte}=1;
|
sl@0
|
756 |
}
|
sl@0
|
757 |
}
|
sl@0
|
758 |
# if ($endianness!=0) # unfortunately, nothing can be checked if the $endianness is 0 (SCnvConversionData::EUnspecified)
|
sl@0
|
759 |
# {
|
sl@0
|
760 |
# foreach $rangeData (@$foreignToUnicodeData)
|
sl@0
|
761 |
# {
|
sl@0
|
762 |
# my $inputCharacterCode;
|
sl@0
|
763 |
# for ($inputCharacterCode=$rangeData->[2]; $inputCharacterCode<=$rangeData->[3]; ++$inputCharacterCode)
|
sl@0
|
764 |
# {
|
sl@0
|
765 |
# my $initialByte;
|
sl@0
|
766 |
# if ($endianness==1) # SCnvConversionData::EFixedLittleEndian
|
sl@0
|
767 |
# {
|
sl@0
|
768 |
# $initialByte=($inputCharacterCode&0xff);
|
sl@0
|
769 |
# }
|
sl@0
|
770 |
# elsif ($endianness==2) # SCnvConversionData::EFixedBigEndian
|
sl@0
|
771 |
# {
|
sl@0
|
772 |
# $initialByte=($inputCharacterCode&0xff00)>>8; ## this is hard-coded and needs to be done properly!
|
sl@0
|
773 |
# }
|
sl@0
|
774 |
# else
|
sl@0
|
775 |
# {
|
sl@0
|
776 |
# die("Error: internal error ??\n");
|
sl@0
|
777 |
# }
|
sl@0
|
778 |
# if (!defined($initialForeignBytes{$initialByte}))
|
sl@0
|
779 |
# {
|
sl@0
|
780 |
# die("Error: no number-of-subsequent-bytes is specified for the initial byte $initialByte\n");
|
sl@0
|
781 |
# }
|
sl@0
|
782 |
# }
|
sl@0
|
783 |
# }
|
sl@0
|
784 |
# }
|
sl@0
|
785 |
}
|
sl@0
|
786 |
|
sl@0
|
787 |
sub writeSourceCodeHeader
|
sl@0
|
788 |
{
|
sl@0
|
789 |
my $fileHandle=shift;
|
sl@0
|
790 |
my $fileName=shift;
|
sl@0
|
791 |
my $replacementForUnconvertibleUnicodeCharacters=shift;
|
sl@0
|
792 |
while ($fileName=~/^.*\\(.*)$/i)
|
sl@0
|
793 |
{
|
sl@0
|
794 |
$fileName=$1;
|
sl@0
|
795 |
}
|
sl@0
|
796 |
print($fileHandle "// $fileName\n//\n// Copyright (c) Nokia Corporation and/or its subsidiary(-ies) ".(1900+(gmtime(time))[5]).". All rights reserved.\n//\n\n");
|
sl@0
|
797 |
print($fileHandle "#include <e32std.h>\n#include <convdata.h>\n#include <convgeneratedcpp.h>\n\n#define ARRAY_LENGTH(aArray) (sizeof(aArray)/sizeof((aArray)\[0\]))\n\n#pragma warning (disable: 4049) // compiler limit : terminating line number emission\n\n");
|
sl@0
|
798 |
if (!$omitReplacementForUnconvertibleUnicodeCharacters)
|
sl@0
|
799 |
{
|
sl@0
|
800 |
print($fileHandle "_LIT8(KLit8ReplacementForUnconvertibleUnicodeCharacters, \"".&hexadecimalify($replacementForUnconvertibleUnicodeCharacters)."\");\n\n");
|
sl@0
|
801 |
print($fileHandle "GLDEF_C const TDesC8& ReplacementForUnconvertibleUnicodeCharacters_internal()\n\t{\n\treturn KLit8ReplacementForUnconvertibleUnicodeCharacters;\n\t}\n\n");
|
sl@0
|
802 |
}
|
sl@0
|
803 |
}
|
sl@0
|
804 |
|
sl@0
|
805 |
sub writeSourceCodeForeignVariableByteData
|
sl@0
|
806 |
{
|
sl@0
|
807 |
my $sourceCodeOfTopLevelStructures=shift;
|
sl@0
|
808 |
my $foreignVariableByteData=shift;
|
sl@0
|
809 |
push(@$sourceCodeOfTopLevelStructures, "LOCAL_D const SCnvConversionData::SVariableByteData::SRange foreignVariableByteDataRanges[]=\n\t\{\n");
|
sl@0
|
810 |
my $indexOfLastRange=$#$foreignVariableByteData;
|
sl@0
|
811 |
my $i;
|
sl@0
|
812 |
for ($i=0; $i<=$indexOfLastRange; ++$i)
|
sl@0
|
813 |
{
|
sl@0
|
814 |
my $rangeData=$foreignVariableByteData->[$i];
|
sl@0
|
815 |
if (@$rangeData!=3)
|
sl@0
|
816 |
{
|
sl@0
|
817 |
die("Error: internal error 3\n");
|
sl@0
|
818 |
}
|
sl@0
|
819 |
my $firstInitialByteValueInRange=$rangeData->[0];
|
sl@0
|
820 |
my $lastInitialByteValueInRange=$rangeData->[1];
|
sl@0
|
821 |
if ($lastInitialByteValueInRange<$firstInitialByteValueInRange)
|
sl@0
|
822 |
{
|
sl@0
|
823 |
die("Error: internal error 4\n");
|
sl@0
|
824 |
}
|
sl@0
|
825 |
my $numberOfSubsequentBytes=$rangeData->[2];
|
sl@0
|
826 |
push(@$sourceCodeOfTopLevelStructures, "\t\t\{\n\t\t".sprintf("0x%02x", $firstInitialByteValueInRange).",\n\t\t".sprintf("0x%02x", $lastInitialByteValueInRange).",\n\t\t$numberOfSubsequentBytes,\n\t\t0\n\t\t\}");
|
sl@0
|
827 |
if ($i<$indexOfLastRange)
|
sl@0
|
828 |
{
|
sl@0
|
829 |
push(@$sourceCodeOfTopLevelStructures, ',');
|
sl@0
|
830 |
}
|
sl@0
|
831 |
push(@$sourceCodeOfTopLevelStructures, "\n");
|
sl@0
|
832 |
}
|
sl@0
|
833 |
push(@$sourceCodeOfTopLevelStructures, "\t\};\n\n");
|
sl@0
|
834 |
}
|
sl@0
|
835 |
|
sl@0
|
836 |
sub writeSourceCodeOneDirectionData
|
sl@0
|
837 |
{
|
sl@0
|
838 |
my $sourceCodeOfTopLevelStructures=shift;
|
sl@0
|
839 |
my $sourceCodeOfOneDirectionIndexedTables16=shift;
|
sl@0
|
840 |
my $sourceCodeOfOneDirectionKeyedTables1616=shift;
|
sl@0
|
841 |
my $sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_indexedEntries=shift;
|
sl@0
|
842 |
my $sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_keyedEntries=shift;
|
sl@0
|
843 |
# new for 32 bit encoding begin
|
sl@0
|
844 |
my $sourceCodeOfOneDirectionIndexedTables32=shift;
|
sl@0
|
845 |
my $sourceCodeOfOneDirectionKeyedTables3232=shift;
|
sl@0
|
846 |
my $sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_indexedEntries=shift;
|
sl@0
|
847 |
my $sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_keyedEntries=shift;
|
sl@0
|
848 |
# new for 32 bit encoding end
|
sl@0
|
849 |
|
sl@0
|
850 |
my $oneDirectionData=shift;
|
sl@0
|
851 |
my $characterCodes=shift;
|
sl@0
|
852 |
my $outputIsUnicode=shift;
|
sl@0
|
853 |
push(@$sourceCodeOfTopLevelStructures, 'LOCAL_D const SCnvConversionData::SOneDirectionData::SRange '.($outputIsUnicode? 'foreignToUnicodeDataRanges': 'unicodeToForeignDataRanges')."[]=\n\t\{\n");
|
sl@0
|
854 |
my $formatForInputCharacters=$outputIsUnicode? '0x%02x': '0x%04x';
|
sl@0
|
855 |
my $formatForOutputCharacters=$outputIsUnicode? '0x%04x': '0x%02x';
|
sl@0
|
856 |
my $indexOfLastRange=$#$oneDirectionData;
|
sl@0
|
857 |
my $i;
|
sl@0
|
858 |
for ($i=0; $i<=$indexOfLastRange; ++$i)
|
sl@0
|
859 |
{
|
sl@0
|
860 |
my $rangeData=$oneDirectionData->[$i];
|
sl@0
|
861 |
# $rangeData is $includePriority, $searchPriority, $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange, $algorithm[, $sizeOfOutputCharacterCodeInBytes], $parameters
|
sl@0
|
862 |
if (scalar(@$rangeData)!=($outputIsUnicode? 6: 7))
|
sl@0
|
863 |
{
|
sl@0
|
864 |
die("Error: internal error 5\n");
|
sl@0
|
865 |
}
|
sl@0
|
866 |
my $firstInputCharacterCodeInRange=$rangeData->[2];
|
sl@0
|
867 |
my $lastInputCharacterCodeInRange=$rangeData->[3];
|
sl@0
|
868 |
if ($lastInputCharacterCodeInRange<$firstInputCharacterCodeInRange)
|
sl@0
|
869 |
{
|
sl@0
|
870 |
die("Error: internal error 6\n");
|
sl@0
|
871 |
}
|
sl@0
|
872 |
my $algorithmAsText=''; # set by the if-elsif stuff below
|
sl@0
|
873 |
my $sizeOfOutputCharacterCodeInBytesIfForeign=$outputIsUnicode? 0: $rangeData->[5];
|
sl@0
|
874 |
my $parameters=$rangeData->[$outputIsUnicode? 5: 6];
|
sl@0
|
875 |
my $word1=0; # set by the if-elsif stuff below
|
sl@0
|
876 |
my $algorithm=$rangeData->[4];
|
sl@0
|
877 |
if ($algorithm==0) # Direct
|
sl@0
|
878 |
{
|
sl@0
|
879 |
$algorithmAsText='Direct';
|
sl@0
|
880 |
my $characterCode;
|
sl@0
|
881 |
for ($characterCode=$firstInputCharacterCodeInRange; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode)
|
sl@0
|
882 |
{
|
sl@0
|
883 |
if (!defined($characterCodes->{$characterCode}))
|
sl@0
|
884 |
{
|
sl@0
|
885 |
die("Error: There is no conversion defined for ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)."\n");
|
sl@0
|
886 |
}
|
sl@0
|
887 |
if ($characterCodes->{$characterCode}!=$characterCode)
|
sl@0
|
888 |
{
|
sl@0
|
889 |
die("Error: the conversion from ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)." to ".($outputIsUnicode? 'Unicode': 'foreign')." character code ".sprintf("0x%08x", $characterCodes->{$characterCode})." is not a direct conversion\n");
|
sl@0
|
890 |
}
|
sl@0
|
891 |
delete $characterCodes->{$characterCode};
|
sl@0
|
892 |
}
|
sl@0
|
893 |
}
|
sl@0
|
894 |
elsif ($algorithm==1) # Offset
|
sl@0
|
895 |
{
|
sl@0
|
896 |
$algorithmAsText='Offset';
|
sl@0
|
897 |
my $offset=$characterCodes->{$firstInputCharacterCodeInRange}-$firstInputCharacterCodeInRange;
|
sl@0
|
898 |
delete $characterCodes->{$firstInputCharacterCodeInRange};
|
sl@0
|
899 |
my $characterCode;
|
sl@0
|
900 |
for ($characterCode=$firstInputCharacterCodeInRange+1; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode)
|
sl@0
|
901 |
{
|
sl@0
|
902 |
if (!defined($characterCodes->{$characterCode}))
|
sl@0
|
903 |
{
|
sl@0
|
904 |
die("Error: There is no conversion defined for ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x (0x%08x-0x%08x)", $characterCode, $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange)."\n");
|
sl@0
|
905 |
}
|
sl@0
|
906 |
if ($characterCodes->{$characterCode}-$characterCode!=$offset)
|
sl@0
|
907 |
{
|
sl@0
|
908 |
die("Error: the conversion from ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)." to ".($outputIsUnicode? 'Unicode': 'foreign')." character code ".sprintf("0x%08x", $characterCodes->{$characterCode})." has a different offset from the previous one in the range\n");
|
sl@0
|
909 |
}
|
sl@0
|
910 |
delete $characterCodes->{$characterCode};
|
sl@0
|
911 |
}
|
sl@0
|
912 |
$word1="STATIC_CAST(TUint, $offset)";
|
sl@0
|
913 |
}
|
sl@0
|
914 |
elsif ($algorithm==2) # IndexedTable16
|
sl@0
|
915 |
{
|
sl@0
|
916 |
$algorithmAsText='IndexedTable16';
|
sl@0
|
917 |
my $nameOfNextOneDirectionIndexedTable16='indexedTable16_'.($outputIsUnicode? 'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionIndexedTables16+2);
|
sl@0
|
918 |
my $sourceCodeOfNextOneDirectionIndexedTable16=[];
|
sl@0
|
919 |
push(@$sourceCodeOfNextOneDirectionIndexedTable16, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SIndexedTable16::SEntry $nameOfNextOneDirectionIndexedTable16\[\]=\n\t\{\n");
|
sl@0
|
920 |
my $characterCode;
|
sl@0
|
921 |
for ($characterCode=$firstInputCharacterCodeInRange; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode)
|
sl@0
|
922 |
{
|
sl@0
|
923 |
if (!defined($characterCodes->{$characterCode}))
|
sl@0
|
924 |
{
|
sl@0
|
925 |
die("Error: There is no conversion defined for ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)."\n");
|
sl@0
|
926 |
}
|
sl@0
|
927 |
push(@$sourceCodeOfNextOneDirectionIndexedTable16, "\t\t\{\n\t\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode})."\n\t\t\}");
|
sl@0
|
928 |
if ($characterCode<$lastInputCharacterCodeInRange)
|
sl@0
|
929 |
{
|
sl@0
|
930 |
push(@$sourceCodeOfNextOneDirectionIndexedTable16, ',');
|
sl@0
|
931 |
}
|
sl@0
|
932 |
push(@$sourceCodeOfNextOneDirectionIndexedTable16, "\n");
|
sl@0
|
933 |
delete $characterCodes->{$characterCode};
|
sl@0
|
934 |
}
|
sl@0
|
935 |
push(@$sourceCodeOfNextOneDirectionIndexedTable16, "\t\};\n\n");
|
sl@0
|
936 |
push(@$sourceCodeOfOneDirectionIndexedTables16, $sourceCodeOfNextOneDirectionIndexedTable16);
|
sl@0
|
937 |
$word1="UData_S$algorithmAsText($nameOfNextOneDirectionIndexedTable16)";
|
sl@0
|
938 |
}
|
sl@0
|
939 |
elsif ($algorithm==3) # KeyedTable1616
|
sl@0
|
940 |
{
|
sl@0
|
941 |
$algorithmAsText='KeyedTable1616';
|
sl@0
|
942 |
my $nameOfNextOneDirectionKeyedTable1616='keyedTable1616_'.($outputIsUnicode? 'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables1616+2);
|
sl@0
|
943 |
my $sourceCodeOfNextOneDirectionKeyedTable1616=[];
|
sl@0
|
944 |
push(@$sourceCodeOfNextOneDirectionKeyedTable1616, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable1616::SEntry $nameOfNextOneDirectionKeyedTable1616\[\]=\n\t\{\n");
|
sl@0
|
945 |
my @characterCodes=grep(($_>=$firstInputCharacterCodeInRange) && ($_<=$lastInputCharacterCodeInRange), sort({$a<=>$b} keys(%$characterCodes)));
|
sl@0
|
946 |
if (@characterCodes==0)
|
sl@0
|
947 |
{
|
sl@0
|
948 |
die("Error: There are no ".($outputIsUnicode? 'foreign': 'Unicode').'-to-'.($outputIsUnicode? 'Unicode': 'foreign')." characters to convert using KeyedTable1616 (range ".sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).").\n");
|
sl@0
|
949 |
}
|
sl@0
|
950 |
if ($characterCodes[0]!=$firstInputCharacterCodeInRange)
|
sl@0
|
951 |
{
|
sl@0
|
952 |
print(STDERR 'Warning: the specified start of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf("$formatForInputCharacters", $characterCodes[0])."\n");
|
sl@0
|
953 |
}
|
sl@0
|
954 |
if ($characterCodes[-1]!=$lastInputCharacterCodeInRange)
|
sl@0
|
955 |
{
|
sl@0
|
956 |
print(STDERR 'Warning: the specified end of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf("$formatForInputCharacters", $characterCodes[-1])."\n");
|
sl@0
|
957 |
}
|
sl@0
|
958 |
my $characterCode;
|
sl@0
|
959 |
foreach $characterCode (@characterCodes)
|
sl@0
|
960 |
{
|
sl@0
|
961 |
if (defined($characterCodes->{$characterCode}))
|
sl@0
|
962 |
{
|
sl@0
|
963 |
push(@$sourceCodeOfNextOneDirectionKeyedTable1616, "\t\t\{\n\t\t".sprintf($formatForInputCharacters, $characterCode).",\n\t\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode})."\n\t\t\}");
|
sl@0
|
964 |
if ($characterCode<$characterCodes[-1])
|
sl@0
|
965 |
{
|
sl@0
|
966 |
push(@$sourceCodeOfNextOneDirectionKeyedTable1616, ',');
|
sl@0
|
967 |
}
|
sl@0
|
968 |
push(@$sourceCodeOfNextOneDirectionKeyedTable1616, "\n");
|
sl@0
|
969 |
delete $characterCodes->{$characterCode};
|
sl@0
|
970 |
}
|
sl@0
|
971 |
}
|
sl@0
|
972 |
push(@$sourceCodeOfNextOneDirectionKeyedTable1616, "\t\};\n\n");
|
sl@0
|
973 |
push(@$sourceCodeOfOneDirectionKeyedTables1616, $sourceCodeOfNextOneDirectionKeyedTable1616);
|
sl@0
|
974 |
$word1="UData_S$algorithmAsText($nameOfNextOneDirectionKeyedTable1616)";
|
sl@0
|
975 |
}
|
sl@0
|
976 |
elsif ($algorithm==4) # KeyedTable16OfIndexedTables16
|
sl@0
|
977 |
{
|
sl@0
|
978 |
$algorithmAsText='KeyedTable16OfIndexedTables16';
|
sl@0
|
979 |
my $nameOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries='keyedTables16OfIndexedTables16_keyedEntries_'.($outputIsUnicode? 'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_keyedEntries+2);
|
sl@0
|
980 |
my $sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries=[];
|
sl@0
|
981 |
push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable16OfIndexedTables16::SKeyedEntry $nameOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries\[\]=\n\t\{\n");
|
sl@0
|
982 |
my @characterCodes=grep(($_>=$firstInputCharacterCodeInRange) && ($_<=$lastInputCharacterCodeInRange), sort({$a<=>$b} keys(%$characterCodes)));
|
sl@0
|
983 |
if (@characterCodes==0)
|
sl@0
|
984 |
{
|
sl@0
|
985 |
die("Error: There are no ".($outputIsUnicode? 'foreign': 'Unicode').'-to-'.($outputIsUnicode? 'Unicode': 'foreign')." characters to convert using KeyedTable16OfIndexedTables16 (range ".sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).").\n");
|
sl@0
|
986 |
}
|
sl@0
|
987 |
if ($characterCodes[0]!=$firstInputCharacterCodeInRange)
|
sl@0
|
988 |
{
|
sl@0
|
989 |
print(STDERR 'Warning: the specified start of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf("$formatForInputCharacters", $characterCodes[0])."\n");
|
sl@0
|
990 |
}
|
sl@0
|
991 |
if ($characterCodes[-1]!=$lastInputCharacterCodeInRange)
|
sl@0
|
992 |
{
|
sl@0
|
993 |
print(STDERR 'Warning: the specified end of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf("$formatForInputCharacters", $characterCodes[-1])."\n");
|
sl@0
|
994 |
}
|
sl@0
|
995 |
my @characterCodeRanges=();
|
sl@0
|
996 |
my $minimumNumberOfEntriesPerIndexedTable=($parameters ne '')? $parameters: 0;
|
sl@0
|
997 |
my $firstInputCharacterCodeInIndexedTable=$characterCodes[0];
|
sl@0
|
998 |
my $previousCharacterCode=$firstInputCharacterCodeInIndexedTable;
|
sl@0
|
999 |
my $characterCode;
|
sl@0
|
1000 |
foreach $characterCode (@characterCodes)
|
sl@0
|
1001 |
{
|
sl@0
|
1002 |
($characterCode>=$previousCharacterCode) or die("Error: internal error 7\n");
|
sl@0
|
1003 |
if ($characterCode>$previousCharacterCode+1)
|
sl@0
|
1004 |
{
|
sl@0
|
1005 |
if (($previousCharacterCode-$firstInputCharacterCodeInIndexedTable)+1>=$minimumNumberOfEntriesPerIndexedTable)
|
sl@0
|
1006 |
{
|
sl@0
|
1007 |
push(@characterCodeRanges, [$firstInputCharacterCodeInIndexedTable, $previousCharacterCode]);
|
sl@0
|
1008 |
}
|
sl@0
|
1009 |
$firstInputCharacterCodeInIndexedTable=$characterCode;
|
sl@0
|
1010 |
}
|
sl@0
|
1011 |
$previousCharacterCode=$characterCode;
|
sl@0
|
1012 |
}
|
sl@0
|
1013 |
push(@characterCodeRanges, [$firstInputCharacterCodeInIndexedTable, $previousCharacterCode]);
|
sl@0
|
1014 |
@characterCodes=();
|
sl@0
|
1015 |
my $characterCodeRange;
|
sl@0
|
1016 |
foreach $characterCodeRange (@characterCodeRanges)
|
sl@0
|
1017 |
{
|
sl@0
|
1018 |
my $nameOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries='keyedTables16OfIndexedTables16_indexedEntries_'.($outputIsUnicode? 'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_indexedEntries+2);
|
sl@0
|
1019 |
my $sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries=[];
|
sl@0
|
1020 |
push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, "LOCAL_D const TUint16 $nameOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries\[\]=\n\t\{\n");
|
sl@0
|
1021 |
my $characterCode;
|
sl@0
|
1022 |
my $lastInputCharacterCodeInIndexedTable=$characterCodeRange->[1];
|
sl@0
|
1023 |
for ($characterCode=$characterCodeRange->[0]; $characterCode<=$lastInputCharacterCodeInIndexedTable; ++$characterCode)
|
sl@0
|
1024 |
{
|
sl@0
|
1025 |
if (!defined($characterCodes->{$characterCode}))
|
sl@0
|
1026 |
{
|
sl@0
|
1027 |
die("Error: internal error 8\n");
|
sl@0
|
1028 |
}
|
sl@0
|
1029 |
push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, "\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode}));
|
sl@0
|
1030 |
if ($characterCode<$lastInputCharacterCodeInIndexedTable)
|
sl@0
|
1031 |
{
|
sl@0
|
1032 |
push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, ',');
|
sl@0
|
1033 |
}
|
sl@0
|
1034 |
push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, "\n");
|
sl@0
|
1035 |
delete $characterCodes->{$characterCode};
|
sl@0
|
1036 |
}
|
sl@0
|
1037 |
push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, "\t\};\n\n");
|
sl@0
|
1038 |
push(@$sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, $sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries);
|
sl@0
|
1039 |
push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, "\t\t\{\n\t\t".sprintf($formatForInputCharacters, $characterCodeRange->[0]).",\n\t\t".sprintf($formatForInputCharacters, $characterCodeRange->[1]).",\n\t\t$nameOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries\n\t\t\}");
|
sl@0
|
1040 |
if ($characterCodeRange->[1]<$characterCodeRanges[-1]->[1])
|
sl@0
|
1041 |
{
|
sl@0
|
1042 |
push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, ',');
|
sl@0
|
1043 |
}
|
sl@0
|
1044 |
push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, "\n");
|
sl@0
|
1045 |
}
|
sl@0
|
1046 |
push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, "\t\};\n\n");
|
sl@0
|
1047 |
push(@$sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, $sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries);
|
sl@0
|
1048 |
$word1="UData_S$algorithmAsText($nameOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries)";
|
sl@0
|
1049 |
}
|
sl@0
|
1050 |
elsif ($algorithm==5) # IndexedTable32
|
sl@0
|
1051 |
{
|
sl@0
|
1052 |
$algorithmAsText='IndexedTable32';
|
sl@0
|
1053 |
my $nameOfNextOneDirectionIndexedTable32='indexedTable32_'.($outputIsUnicode? 'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionIndexedTables32+2);
|
sl@0
|
1054 |
my $sourceCodeOfNextOneDirectionIndexedTable32=[];
|
sl@0
|
1055 |
push(@$sourceCodeOfNextOneDirectionIndexedTable32, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SIndexedTable32::SEntry $nameOfNextOneDirectionIndexedTable32\[\]=\n\t\{\n");
|
sl@0
|
1056 |
my $characterCode;
|
sl@0
|
1057 |
for ($characterCode=$firstInputCharacterCodeInRange; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode)
|
sl@0
|
1058 |
{
|
sl@0
|
1059 |
if (!defined($characterCodes->{$characterCode}))
|
sl@0
|
1060 |
{
|
sl@0
|
1061 |
die("Error: There is no conversion defined for ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)."\n");
|
sl@0
|
1062 |
}
|
sl@0
|
1063 |
push(@$sourceCodeOfNextOneDirectionIndexedTable32, "\t\t\{\n\t\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode})."\n\t\t\}");
|
sl@0
|
1064 |
if ($characterCode<$lastInputCharacterCodeInRange)
|
sl@0
|
1065 |
{
|
sl@0
|
1066 |
push(@$sourceCodeOfNextOneDirectionIndexedTable32, ',');
|
sl@0
|
1067 |
}
|
sl@0
|
1068 |
push(@$sourceCodeOfNextOneDirectionIndexedTable32, "\n");
|
sl@0
|
1069 |
delete $characterCodes->{$characterCode};
|
sl@0
|
1070 |
}
|
sl@0
|
1071 |
push(@$sourceCodeOfNextOneDirectionIndexedTable32, "\t\};\n\n");
|
sl@0
|
1072 |
push(@$sourceCodeOfOneDirectionIndexedTables32, $sourceCodeOfNextOneDirectionIndexedTable32);
|
sl@0
|
1073 |
$word1="UData_S$algorithmAsText($nameOfNextOneDirectionIndexedTable32)";
|
sl@0
|
1074 |
}
|
sl@0
|
1075 |
elsif ($algorithm==6) # KeyedTable3232
|
sl@0
|
1076 |
{
|
sl@0
|
1077 |
$algorithmAsText='KeyedTable3232';
|
sl@0
|
1078 |
my $nameOfNextOneDirectionKeyedTable3232='keyedTable3232_'.($outputIsUnicode? 'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables3232+2);
|
sl@0
|
1079 |
my $sourceCodeOfNextOneDirectionKeyedTable3232=[];
|
sl@0
|
1080 |
push(@$sourceCodeOfNextOneDirectionKeyedTable3232, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable3232::SEntry $nameOfNextOneDirectionKeyedTable3232\[\]=\n\t\{\n");
|
sl@0
|
1081 |
my @characterCodes=grep(($_>=$firstInputCharacterCodeInRange) && ($_<=$lastInputCharacterCodeInRange), sort({$a<=>$b} keys(%$characterCodes)));
|
sl@0
|
1082 |
if (@characterCodes==0)
|
sl@0
|
1083 |
{
|
sl@0
|
1084 |
die("Error: There are no ".($outputIsUnicode? 'foreign': 'Unicode').'-to-'.($outputIsUnicode? 'Unicode': 'foreign')." characters to convert using KeyedTable3232 (range ".sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).").\n");
|
sl@0
|
1085 |
}
|
sl@0
|
1086 |
if ($characterCodes[0]!=$firstInputCharacterCodeInRange)
|
sl@0
|
1087 |
{
|
sl@0
|
1088 |
print(STDERR 'Warning: the specified start of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf($formatForInputCharacters, $characterCodes[0])."\n");
|
sl@0
|
1089 |
}
|
sl@0
|
1090 |
if ($characterCodes[-1]!=$lastInputCharacterCodeInRange)
|
sl@0
|
1091 |
{
|
sl@0
|
1092 |
print(STDERR 'Warning: the specified end of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf($formatForInputCharacters, $characterCodes[-1])."\n");
|
sl@0
|
1093 |
}
|
sl@0
|
1094 |
my $characterCode;
|
sl@0
|
1095 |
foreach $characterCode (@characterCodes)
|
sl@0
|
1096 |
{
|
sl@0
|
1097 |
if (defined($characterCodes->{$characterCode}))
|
sl@0
|
1098 |
{
|
sl@0
|
1099 |
push(@$sourceCodeOfNextOneDirectionKeyedTable3232, "\t\t\{\n\t\t".sprintf($formatForInputCharacters, $characterCode).",\n\t\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode})."\n\t\t\}");
|
sl@0
|
1100 |
if ($characterCode<$characterCodes[-1])
|
sl@0
|
1101 |
{
|
sl@0
|
1102 |
push(@$sourceCodeOfNextOneDirectionKeyedTable3232, ',');
|
sl@0
|
1103 |
}
|
sl@0
|
1104 |
push(@$sourceCodeOfNextOneDirectionKeyedTable3232, "\n");
|
sl@0
|
1105 |
delete $characterCodes->{$characterCode};
|
sl@0
|
1106 |
}
|
sl@0
|
1107 |
}
|
sl@0
|
1108 |
push(@$sourceCodeOfNextOneDirectionKeyedTable3232, "\t\};\n\n");
|
sl@0
|
1109 |
push(@$sourceCodeOfOneDirectionKeyedTables3232, $sourceCodeOfNextOneDirectionKeyedTable3232);
|
sl@0
|
1110 |
$word1="UData_S$algorithmAsText($nameOfNextOneDirectionKeyedTable3232)";
|
sl@0
|
1111 |
}
|
sl@0
|
1112 |
elsif ($algorithm==7) # KeyedTable32OfIndexedTables32
|
sl@0
|
1113 |
{
|
sl@0
|
1114 |
$algorithmAsText='KeyedTable32OfIndexedTables32';
|
sl@0
|
1115 |
my $nameOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries='keyedTables32OfIndexedTables32_keyedEntries_'.($outputIsUnicode? 'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_keyedEntries+2);
|
sl@0
|
1116 |
my $sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries=[];
|
sl@0
|
1117 |
push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable32OfIndexedTables32::SKeyedEntry $nameOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries\[\]=\n\t\{\n");
|
sl@0
|
1118 |
my @characterCodes=grep(($_>=$firstInputCharacterCodeInRange) && ($_<=$lastInputCharacterCodeInRange), sort({$a<=>$b} keys(%$characterCodes)));
|
sl@0
|
1119 |
if (@characterCodes==0)
|
sl@0
|
1120 |
{
|
sl@0
|
1121 |
die("Error: There are no ".($outputIsUnicode? 'foreign': 'Unicode').'-to-'.($outputIsUnicode? 'Unicode': 'foreign')." characters to convert using KeyedTable32OfIndexedTables32 (range ".sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).").\n");
|
sl@0
|
1122 |
}
|
sl@0
|
1123 |
if ($characterCodes[0]!=$firstInputCharacterCodeInRange)
|
sl@0
|
1124 |
{
|
sl@0
|
1125 |
print(STDERR 'Warning: the specified start of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf("$formatForInputCharacters", $characterCodes[0])."\n");
|
sl@0
|
1126 |
}
|
sl@0
|
1127 |
if ($characterCodes[-1]!=$lastInputCharacterCodeInRange)
|
sl@0
|
1128 |
{
|
sl@0
|
1129 |
print(STDERR 'Warning: the specified end of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf("$formatForInputCharacters", $characterCodes[-1])."\n");
|
sl@0
|
1130 |
}
|
sl@0
|
1131 |
my @characterCodeRanges=();
|
sl@0
|
1132 |
my $minimumNumberOfEntriesPerIndexedTable=($parameters ne '')? $parameters: 0;
|
sl@0
|
1133 |
my $firstInputCharacterCodeInIndexedTable=$characterCodes[0];
|
sl@0
|
1134 |
my $previousCharacterCode=$firstInputCharacterCodeInIndexedTable;
|
sl@0
|
1135 |
my $characterCode;
|
sl@0
|
1136 |
foreach $characterCode (@characterCodes)
|
sl@0
|
1137 |
{
|
sl@0
|
1138 |
($characterCode>=$previousCharacterCode) or die("Error: internal error 7\n");
|
sl@0
|
1139 |
if ($characterCode>$previousCharacterCode+1)
|
sl@0
|
1140 |
{
|
sl@0
|
1141 |
if (($previousCharacterCode-$firstInputCharacterCodeInIndexedTable)+1>=$minimumNumberOfEntriesPerIndexedTable)
|
sl@0
|
1142 |
{
|
sl@0
|
1143 |
push(@characterCodeRanges, [$firstInputCharacterCodeInIndexedTable, $previousCharacterCode]);
|
sl@0
|
1144 |
}
|
sl@0
|
1145 |
$firstInputCharacterCodeInIndexedTable=$characterCode;
|
sl@0
|
1146 |
}
|
sl@0
|
1147 |
$previousCharacterCode=$characterCode;
|
sl@0
|
1148 |
}
|
sl@0
|
1149 |
push(@characterCodeRanges, [$firstInputCharacterCodeInIndexedTable, $previousCharacterCode]);
|
sl@0
|
1150 |
@characterCodes=();
|
sl@0
|
1151 |
my $characterCodeRange;
|
sl@0
|
1152 |
foreach $characterCodeRange (@characterCodeRanges)
|
sl@0
|
1153 |
{
|
sl@0
|
1154 |
my $nameOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries='keyedTables32OfIndexedTables32_indexedEntries_'.($outputIsUnicode? 'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_indexedEntries+2);
|
sl@0
|
1155 |
my $sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries=[];
|
sl@0
|
1156 |
push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, "LOCAL_D const TUint32 $nameOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries\[\]=\n\t\{\n");
|
sl@0
|
1157 |
my $characterCode;
|
sl@0
|
1158 |
my $lastInputCharacterCodeInIndexedTable=$characterCodeRange->[1];
|
sl@0
|
1159 |
for ($characterCode=$characterCodeRange->[0]; $characterCode<=$lastInputCharacterCodeInIndexedTable; ++$characterCode)
|
sl@0
|
1160 |
{
|
sl@0
|
1161 |
if (!defined($characterCodes->{$characterCode}))
|
sl@0
|
1162 |
{
|
sl@0
|
1163 |
die("Error: internal error 8\n");
|
sl@0
|
1164 |
}
|
sl@0
|
1165 |
push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, "\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode}));
|
sl@0
|
1166 |
if ($characterCode<$lastInputCharacterCodeInIndexedTable)
|
sl@0
|
1167 |
{
|
sl@0
|
1168 |
push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, ',');
|
sl@0
|
1169 |
}
|
sl@0
|
1170 |
push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, "\n");
|
sl@0
|
1171 |
delete $characterCodes->{$characterCode};
|
sl@0
|
1172 |
}
|
sl@0
|
1173 |
push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, "\t\};\n\n");
|
sl@0
|
1174 |
push(@$sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, $sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries);
|
sl@0
|
1175 |
push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, "\t\t\{\n\t\t".sprintf($formatForInputCharacters, $characterCodeRange->[0]).",\n\t\t".sprintf($formatForInputCharacters, $characterCodeRange->[1]).",\n\t\t$nameOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries\n\t\t\}");
|
sl@0
|
1176 |
if ($characterCodeRange->[1]<$characterCodeRanges[-1]->[1])
|
sl@0
|
1177 |
{
|
sl@0
|
1178 |
push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, ',');
|
sl@0
|
1179 |
}
|
sl@0
|
1180 |
push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, "\n");
|
sl@0
|
1181 |
}
|
sl@0
|
1182 |
push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, "\t\};\n\n");
|
sl@0
|
1183 |
push(@$sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, $sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries);
|
sl@0
|
1184 |
$word1="UData_S$algorithmAsText($nameOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries)";
|
sl@0
|
1185 |
}
|
sl@0
|
1186 |
else
|
sl@0
|
1187 |
{
|
sl@0
|
1188 |
die("Error: internal error 9\n");
|
sl@0
|
1189 |
}
|
sl@0
|
1190 |
push(@$sourceCodeOfTopLevelStructures, "\t\t\{\n\t\t".sprintf($formatForInputCharacters, $firstInputCharacterCodeInRange).",\n\t\t".sprintf($formatForInputCharacters, $lastInputCharacterCodeInRange).",\n\t\tSCnvConversionData::SOneDirectionData::SRange::E$algorithmAsText,\n\t\t".$sizeOfOutputCharacterCodeInBytesIfForeign.",\n\t\t0,\n\t\t\t\{\n\t\t\t".$word1."\n\t\t\t\}\n\t\t\}");
|
sl@0
|
1191 |
if ($i<$indexOfLastRange)
|
sl@0
|
1192 |
{
|
sl@0
|
1193 |
push(@$sourceCodeOfTopLevelStructures, ',');
|
sl@0
|
1194 |
}
|
sl@0
|
1195 |
push(@$sourceCodeOfTopLevelStructures, "\n");
|
sl@0
|
1196 |
}
|
sl@0
|
1197 |
my @characterCodes=sort({$a<=>$b} keys(%$characterCodes));
|
sl@0
|
1198 |
if (@characterCodes>0)
|
sl@0
|
1199 |
{
|
sl@0
|
1200 |
die('The following '.($outputIsUnicode? 'foreign': 'Unicode').' characters have no conversion algorithm specified: ['.join(', ', map(sprintf($formatForInputCharacters, $_), @characterCodes))."\]\n");
|
sl@0
|
1201 |
}
|
sl@0
|
1202 |
push(@$sourceCodeOfTopLevelStructures, "\t\};\n\n");
|
sl@0
|
1203 |
}
|
sl@0
|
1204 |
|
sl@0
|
1205 |
sub writeSourceCodeFinalStuff
|
sl@0
|
1206 |
{
|
sl@0
|
1207 |
my $fileHandle=shift;
|
sl@0
|
1208 |
my $sourceCodeOfForeignToUnicodeIndexedTables16=shift;
|
sl@0
|
1209 |
my $sourceCodeOfForeignToUnicodeKeyedTables1616=shift;
|
sl@0
|
1210 |
my $sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_indexedEntries=shift;
|
sl@0
|
1211 |
my $sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_keyedEntries=shift;
|
sl@0
|
1212 |
my $sourceCodeOfUnicodeToForeignIndexedTables16=shift;
|
sl@0
|
1213 |
my $sourceCodeOfUnicodeToForeignKeyedTables1616=shift;
|
sl@0
|
1214 |
my $sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_indexedEntries=shift;
|
sl@0
|
1215 |
my $sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_keyedEntries=shift;
|
sl@0
|
1216 |
|
sl@0
|
1217 |
my $sourceCodeOfForeignToUnicodeIndexedTables32=shift;
|
sl@0
|
1218 |
my $sourceCodeOfForeignToUnicodeKeyedTables3232=shift;
|
sl@0
|
1219 |
my $sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_indexedEntries=shift;
|
sl@0
|
1220 |
my $sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_keyedEntries=shift;
|
sl@0
|
1221 |
my $sourceCodeOfUnicodeToForeignIndexedTables32=shift;
|
sl@0
|
1222 |
my $sourceCodeOfUnicodeToForeignKeyedTables3232=shift;
|
sl@0
|
1223 |
my $sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_indexedEntries=shift;
|
sl@0
|
1224 |
my $sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_keyedEntries=shift;
|
sl@0
|
1225 |
|
sl@0
|
1226 |
my $sourceCodeOfTopLevelStructures=shift;
|
sl@0
|
1227 |
my $endiannessAsText=shift;
|
sl@0
|
1228 |
my $additionalSubsetTables=shift;
|
sl@0
|
1229 |
my $sourceCodeChunk;
|
sl@0
|
1230 |
my $arrayOfSourceCodeChunks;
|
sl@0
|
1231 |
|
sl@0
|
1232 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeIndexedTables16)
|
sl@0
|
1233 |
{
|
sl@0
|
1234 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1235 |
{
|
sl@0
|
1236 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1237 |
}
|
sl@0
|
1238 |
}
|
sl@0
|
1239 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeKeyedTables1616)
|
sl@0
|
1240 |
{
|
sl@0
|
1241 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1242 |
{
|
sl@0
|
1243 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1244 |
}
|
sl@0
|
1245 |
}
|
sl@0
|
1246 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_indexedEntries)
|
sl@0
|
1247 |
{
|
sl@0
|
1248 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1249 |
{
|
sl@0
|
1250 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1251 |
}
|
sl@0
|
1252 |
}
|
sl@0
|
1253 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_keyedEntries)
|
sl@0
|
1254 |
{
|
sl@0
|
1255 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1256 |
{
|
sl@0
|
1257 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1258 |
}
|
sl@0
|
1259 |
}
|
sl@0
|
1260 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignIndexedTables16)
|
sl@0
|
1261 |
{
|
sl@0
|
1262 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1263 |
{
|
sl@0
|
1264 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1265 |
}
|
sl@0
|
1266 |
}
|
sl@0
|
1267 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables1616)
|
sl@0
|
1268 |
{
|
sl@0
|
1269 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1270 |
{
|
sl@0
|
1271 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1272 |
}
|
sl@0
|
1273 |
}
|
sl@0
|
1274 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_indexedEntries)
|
sl@0
|
1275 |
{
|
sl@0
|
1276 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1277 |
{
|
sl@0
|
1278 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1279 |
}
|
sl@0
|
1280 |
}
|
sl@0
|
1281 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_keyedEntries)
|
sl@0
|
1282 |
{
|
sl@0
|
1283 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1284 |
{
|
sl@0
|
1285 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1286 |
}
|
sl@0
|
1287 |
}
|
sl@0
|
1288 |
# for 32 bit encoding begin
|
sl@0
|
1289 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeIndexedTables32)
|
sl@0
|
1290 |
{
|
sl@0
|
1291 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1292 |
{
|
sl@0
|
1293 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1294 |
}
|
sl@0
|
1295 |
}
|
sl@0
|
1296 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeKeyedTables3232)
|
sl@0
|
1297 |
{
|
sl@0
|
1298 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1299 |
{
|
sl@0
|
1300 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1301 |
}
|
sl@0
|
1302 |
}
|
sl@0
|
1303 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_indexedEntries)
|
sl@0
|
1304 |
{
|
sl@0
|
1305 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1306 |
{
|
sl@0
|
1307 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1308 |
}
|
sl@0
|
1309 |
}
|
sl@0
|
1310 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_keyedEntries)
|
sl@0
|
1311 |
{
|
sl@0
|
1312 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1313 |
{
|
sl@0
|
1314 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1315 |
}
|
sl@0
|
1316 |
}
|
sl@0
|
1317 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignIndexedTables32)
|
sl@0
|
1318 |
{
|
sl@0
|
1319 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1320 |
{
|
sl@0
|
1321 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1322 |
}
|
sl@0
|
1323 |
}
|
sl@0
|
1324 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables3232)
|
sl@0
|
1325 |
{
|
sl@0
|
1326 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1327 |
{
|
sl@0
|
1328 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1329 |
}
|
sl@0
|
1330 |
}
|
sl@0
|
1331 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_indexedEntries)
|
sl@0
|
1332 |
{
|
sl@0
|
1333 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1334 |
{
|
sl@0
|
1335 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1336 |
}
|
sl@0
|
1337 |
}
|
sl@0
|
1338 |
foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_keyedEntries)
|
sl@0
|
1339 |
{
|
sl@0
|
1340 |
foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks)
|
sl@0
|
1341 |
{
|
sl@0
|
1342 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1343 |
}
|
sl@0
|
1344 |
}
|
sl@0
|
1345 |
# for 32 bit encoding end
|
sl@0
|
1346 |
foreach $sourceCodeChunk (@$sourceCodeOfTopLevelStructures)
|
sl@0
|
1347 |
{
|
sl@0
|
1348 |
print($fileHandle $sourceCodeChunk);
|
sl@0
|
1349 |
}
|
sl@0
|
1350 |
|
sl@0
|
1351 |
print($fileHandle "GLDEF_D const SCnvConversionData conversionData=\n\t\{\n\tSCnvConversionData::E$endiannessAsText,\n\t\t\{\n\t\tARRAY_LENGTH(foreignVariableByteDataRanges),\n\t\tforeignVariableByteDataRanges\n\t\t\},\n\t\t\{\n\t\tARRAY_LENGTH(foreignToUnicodeDataRanges),\n\t\tforeignToUnicodeDataRanges\n\t\t\},\n\t\t\{\n\t\tARRAY_LENGTH(unicodeToForeignDataRanges),\n\t\tunicodeToForeignDataRanges\n\t\t\},\n\tNULL,\n\tNULL\n\t\};\n\n");
|
sl@0
|
1352 |
|
sl@0
|
1353 |
my $additionalSubsetTableName;
|
sl@0
|
1354 |
my $additionalSubsetTableData;
|
sl@0
|
1355 |
while (($additionalSubsetTableName, $additionalSubsetTableData)=each(%$additionalSubsetTables))
|
sl@0
|
1356 |
{
|
sl@0
|
1357 |
(defined($additionalSubsetTableData->[0]) && defined($additionalSubsetTableData->[1]) && defined($additionalSubsetTableData->[2]) && defined($additionalSubsetTableData->[3])) or die("Error: incomplete definition of \"$additionalSubsetTableName\"\n");
|
sl@0
|
1358 |
print($fileHandle "GLREF_D const SCnvConversionData $additionalSubsetTableName;\n");
|
sl@0
|
1359 |
print($fileHandle "GLDEF_D const SCnvConversionData $additionalSubsetTableName=\n\t\{\n\tSCnvConversionData::E$endiannessAsText,\n\t\t\{\n\t\tARRAY_LENGTH(foreignVariableByteDataRanges),\n\t\tforeignVariableByteDataRanges\n\t\t\},\n\t\t\{\n\t\t$additionalSubsetTableData->[1]-$additionalSubsetTableData->[0],\n\t\tforeignToUnicodeDataRanges+$additionalSubsetTableData->[0]\n\t\t\},\n\t\t\{\n\t\t$additionalSubsetTableData->[3]-$additionalSubsetTableData->[2],\n\t\tunicodeToForeignDataRanges+$additionalSubsetTableData->[2]\n\t\t\}\n\t\};\n\n");
|
sl@0
|
1360 |
}
|
sl@0
|
1361 |
}
|
sl@0
|
1362 |
|
sl@0
|
1363 |
sub writeBinaryHeader
|
sl@0
|
1364 |
{
|
sl@0
|
1365 |
my $fileHandle=shift;
|
sl@0
|
1366 |
my $uid=shift;
|
sl@0
|
1367 |
my $endianness=shift;
|
sl@0
|
1368 |
my $replacementForUnconvertibleUnicodeCharacters=shift;
|
sl@0
|
1369 |
&writeUids($fileHandle, 0x100011bd, $uid, 0);
|
sl@0
|
1370 |
&write32($fileHandle, 1); # version number of the file format
|
sl@0
|
1371 |
&write32($fileHandle, 0); # not currently used
|
sl@0
|
1372 |
&write8($fileHandle, 0); # number of Unicode characters in the name (which is now derived from the file-name, hence why this is zero)
|
sl@0
|
1373 |
&write8($fileHandle, $endianness);
|
sl@0
|
1374 |
&write8($fileHandle, length($replacementForUnconvertibleUnicodeCharacters));
|
sl@0
|
1375 |
&writeString($fileHandle, $replacementForUnconvertibleUnicodeCharacters);
|
sl@0
|
1376 |
}
|
sl@0
|
1377 |
|
sl@0
|
1378 |
sub writeBinaryForeignVariableByteData
|
sl@0
|
1379 |
{
|
sl@0
|
1380 |
my $fileHandle=shift;
|
sl@0
|
1381 |
my $foreignVariableByteData=shift;
|
sl@0
|
1382 |
&writePositiveIntegerCompacted30($fileHandle, scalar(@$foreignVariableByteData));
|
sl@0
|
1383 |
my $rangeData;
|
sl@0
|
1384 |
foreach $rangeData (@$foreignVariableByteData)
|
sl@0
|
1385 |
{
|
sl@0
|
1386 |
if (@$rangeData!=3)
|
sl@0
|
1387 |
{
|
sl@0
|
1388 |
die("Error: internal error 10\n");
|
sl@0
|
1389 |
}
|
sl@0
|
1390 |
my $firstInitialByteValueInRange=$rangeData->[0];
|
sl@0
|
1391 |
my $lastInitialByteValueInRange=$rangeData->[1];
|
sl@0
|
1392 |
if ($lastInitialByteValueInRange<$firstInitialByteValueInRange)
|
sl@0
|
1393 |
{
|
sl@0
|
1394 |
die("Error: internal error 11\n");
|
sl@0
|
1395 |
}
|
sl@0
|
1396 |
&write8($fileHandle, $firstInitialByteValueInRange);
|
sl@0
|
1397 |
&write8($fileHandle, $lastInitialByteValueInRange);
|
sl@0
|
1398 |
&write8($fileHandle, $rangeData->[2]); # numberOfSubsequentBytes
|
sl@0
|
1399 |
}
|
sl@0
|
1400 |
}
|
sl@0
|
1401 |
|
sl@0
|
1402 |
sub writeBinaryOneDirectionData
|
sl@0
|
1403 |
{
|
sl@0
|
1404 |
my $fileHandle=shift;
|
sl@0
|
1405 |
my $oneDirectionData=shift;
|
sl@0
|
1406 |
my $characterCodes=shift;
|
sl@0
|
1407 |
my $outputIsUnicode=shift;
|
sl@0
|
1408 |
&writePositiveIntegerCompacted30($fileHandle, scalar(@$oneDirectionData));
|
sl@0
|
1409 |
my $rangeData;
|
sl@0
|
1410 |
foreach $rangeData (@$oneDirectionData)
|
sl@0
|
1411 |
{
|
sl@0
|
1412 |
## $rangeData is $includePriority, $searchPriority, $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange, $algorithm[, $sizeOfOutputCharacterCodeInBytes], $parameters
|
sl@0
|
1413 |
if (scalar(@$rangeData)!=($outputIsUnicode? 6: 7))
|
sl@0
|
1414 |
{
|
sl@0
|
1415 |
die("Error: internal error 12\n");
|
sl@0
|
1416 |
}
|
sl@0
|
1417 |
my $firstInputCharacterCodeInRange=$rangeData->[2];
|
sl@0
|
1418 |
my $lastInputCharacterCodeInRange=$rangeData->[3];
|
sl@0
|
1419 |
if ($lastInputCharacterCodeInRange<$firstInputCharacterCodeInRange)
|
sl@0
|
1420 |
{
|
sl@0
|
1421 |
die("Error: internal error 13\n");
|
sl@0
|
1422 |
}
|
sl@0
|
1423 |
&writePositiveIntegerCompacted30($fileHandle, $firstInputCharacterCodeInRange);
|
sl@0
|
1424 |
&writePositiveIntegerCompacted30($fileHandle, $lastInputCharacterCodeInRange);
|
sl@0
|
1425 |
my $algorithm=$rangeData->[4];
|
sl@0
|
1426 |
&write8($fileHandle, $algorithm);
|
sl@0
|
1427 |
if (!$outputIsUnicode)
|
sl@0
|
1428 |
{
|
sl@0
|
1429 |
&write8($fileHandle, $rangeData->[5]); # sizeOfOutputCharacterCodeInBytesIfForeign
|
sl@0
|
1430 |
}
|
sl@0
|
1431 |
if ($algorithm==0) # Direct
|
sl@0
|
1432 |
{
|
sl@0
|
1433 |
my $characterCode;
|
sl@0
|
1434 |
for ($characterCode=$firstInputCharacterCodeInRange; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode)
|
sl@0
|
1435 |
{
|
sl@0
|
1436 |
if (!defined($characterCodes->{$characterCode}))
|
sl@0
|
1437 |
{
|
sl@0
|
1438 |
die("Error: There is no conversion defined for ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)."\n");
|
sl@0
|
1439 |
}
|
sl@0
|
1440 |
if ($characterCodes->{$characterCode}!=$characterCode)
|
sl@0
|
1441 |
{
|
sl@0
|
1442 |
die("Error: the conversion from ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)." to ".($outputIsUnicode? 'Unicode': 'foreign')." character code ".sprintf("0x%08x", $characterCodes->{$characterCode})." is not a direct conversion\n");
|
sl@0
|
1443 |
}
|
sl@0
|
1444 |
delete $characterCodes->{$characterCode};
|
sl@0
|
1445 |
}
|
sl@0
|
1446 |
}
|
sl@0
|
1447 |
elsif ($algorithm==1) # Offset
|
sl@0
|
1448 |
{
|
sl@0
|
1449 |
my $offset=$characterCodes->{$firstInputCharacterCodeInRange}-$firstInputCharacterCodeInRange;
|
sl@0
|
1450 |
delete $characterCodes->{$firstInputCharacterCodeInRange};
|
sl@0
|
1451 |
my $characterCode;
|
sl@0
|
1452 |
for ($characterCode=$firstInputCharacterCodeInRange+1; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode)
|
sl@0
|
1453 |
{
|
sl@0
|
1454 |
if (!defined($characterCodes->{$characterCode}))
|
sl@0
|
1455 |
{
|
sl@0
|
1456 |
die("Error: There is no conversion defined for ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x (0x%08x-0x%08x)", $characterCode, $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange)."\n");
|
sl@0
|
1457 |
}
|
sl@0
|
1458 |
if ($characterCodes->{$characterCode}-$characterCode!=$offset)
|
sl@0
|
1459 |
{
|
sl@0
|
1460 |
die("Error: the conversion from ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)." to ".($outputIsUnicode? 'Unicode': 'foreign')." character code ".sprintf("0x%08x", $characterCodes->{$characterCode})." has a different offset from the previous one in the range\n");
|
sl@0
|
1461 |
}
|
sl@0
|
1462 |
delete $characterCodes->{$characterCode};
|
sl@0
|
1463 |
}
|
sl@0
|
1464 |
&writeSignedIntegerCompacted29($fileHandle, $offset);
|
sl@0
|
1465 |
}
|
sl@0
|
1466 |
elsif ($algorithm==2) # IndexedTable16
|
sl@0
|
1467 |
{
|
sl@0
|
1468 |
my $characterCode;
|
sl@0
|
1469 |
for ($characterCode=$firstInputCharacterCodeInRange; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode)
|
sl@0
|
1470 |
{
|
sl@0
|
1471 |
if (!defined($characterCodes->{$characterCode}))
|
sl@0
|
1472 |
{
|
sl@0
|
1473 |
die("Error: There is no conversion defined for ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)."\n");
|
sl@0
|
1474 |
}
|
sl@0
|
1475 |
&write16($fileHandle, $characterCodes->{$characterCode});
|
sl@0
|
1476 |
delete $characterCodes->{$characterCode};
|
sl@0
|
1477 |
}
|
sl@0
|
1478 |
}
|
sl@0
|
1479 |
elsif ($algorithm==3) # KeyedTable1616
|
sl@0
|
1480 |
{
|
sl@0
|
1481 |
my $characterCode;
|
sl@0
|
1482 |
my @table=();
|
sl@0
|
1483 |
for ($characterCode=$firstInputCharacterCodeInRange; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode)
|
sl@0
|
1484 |
{
|
sl@0
|
1485 |
if (defined($characterCodes->{$characterCode}))
|
sl@0
|
1486 |
{
|
sl@0
|
1487 |
push(@table, [$characterCode, $characterCodes->{$characterCode}]);
|
sl@0
|
1488 |
delete $characterCodes->{$characterCode};
|
sl@0
|
1489 |
}
|
sl@0
|
1490 |
}
|
sl@0
|
1491 |
my $firstIteration=1;
|
sl@0
|
1492 |
my $lastKey;
|
sl@0
|
1493 |
&writePositiveIntegerCompacted30($fileHandle, scalar(@table));
|
sl@0
|
1494 |
if ($table[0][0]!=$firstInputCharacterCodeInRange)
|
sl@0
|
1495 |
{
|
sl@0
|
1496 |
die("Error: no conversion is specified for the first ".($outputIsUnicode? 'foreign': 'Unicode')." character code in the KeyedTable1616 range ".sprintf("0x%08x to 0x%08x", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange)."\n");
|
sl@0
|
1497 |
}
|
sl@0
|
1498 |
my $pair;
|
sl@0
|
1499 |
foreach $pair (@table)
|
sl@0
|
1500 |
{
|
sl@0
|
1501 |
my $key=$pair->[0];
|
sl@0
|
1502 |
if ($firstIteration)
|
sl@0
|
1503 |
{
|
sl@0
|
1504 |
$firstIteration=0;
|
sl@0
|
1505 |
}
|
sl@0
|
1506 |
else
|
sl@0
|
1507 |
{
|
sl@0
|
1508 |
if ($key<=$lastKey)
|
sl@0
|
1509 |
{
|
sl@0
|
1510 |
die("Error: internal error 14\n");
|
sl@0
|
1511 |
}
|
sl@0
|
1512 |
&writePositiveIntegerCompacted15($fileHandle, $key-$lastKey);
|
sl@0
|
1513 |
}
|
sl@0
|
1514 |
&write16($fileHandle, $pair->[1]);
|
sl@0
|
1515 |
$lastKey=$key;
|
sl@0
|
1516 |
}
|
sl@0
|
1517 |
}
|
sl@0
|
1518 |
elsif ($algorithm==4) # KeyedTable16OfIndexedTables16
|
sl@0
|
1519 |
{
|
sl@0
|
1520 |
die("Error: \"KeyedTable16OfIndexedTables16\" is only supported if generating source code\n");
|
sl@0
|
1521 |
}
|
sl@0
|
1522 |
else
|
sl@0
|
1523 |
{
|
sl@0
|
1524 |
die("Error: internal error 15\n");
|
sl@0
|
1525 |
}
|
sl@0
|
1526 |
}
|
sl@0
|
1527 |
my @characterCodes=sort({$a<=>$b} keys(%$characterCodes));
|
sl@0
|
1528 |
if (@characterCodes>0)
|
sl@0
|
1529 |
{
|
sl@0
|
1530 |
die('The following '.($outputIsUnicode? 'foreign': 'Unicode').'characters have no conversion algorithm specified: ['.join(', ', map({sprintf('0x%x', $_)} @characterCodes))."\]\n");
|
sl@0
|
1531 |
}
|
sl@0
|
1532 |
}
|
sl@0
|
1533 |
|