#
# Copyright (c) 1997-2009 Nokia Corporation and/or its subsidiary(-ies).
# All rights reserved.
# This component and the accompanying materials are made available
# under the terms of "Eclipse Public License v1.0"
# which accompanies this distribution, and is available
# at the URL "http://www.eclipse.org/legal/epl-v10.html".
#
# Initial Contributors:
# Nokia Corporation - initial contribution.
#
# Contributors:
#
# Description:
# Character-set conversion-table generating tool.  Reads a control file and a
# source file of character-code pairs and writes either generated source code,
# a binary conversion table, or a flattened key/value dump.
#

use strict;
use integer;

BEGIN
{
    # Put the directory holding this script at the front of @INC so that the
    # PARSER and WRITER modules are looked up next to it.
    my $perlScriptPath=$0;
    my $os = $^O; #get the OS type
    #check OS type
    if($os=~/MSWin32/) #Windows OS
    {
        $perlScriptPath=~s/\//\\/g; # replace any forward-slashes with back-slashes
        $perlScriptPath=~s/(\\?)[^\\]+$/$1/; # get rid of this Perl-script's file-name
    }
    else #Unix OS
    {
        $perlScriptPath=~s/\\/\//g; # replace any back-slashes with forward-slashes
        $perlScriptPath=~s/(\/?)[^\/]+$/$1/; # get rid of this Perl-script's file-name
    }
    unshift(@INC, $perlScriptPath); # can't do "use lib $perlScriptPath" here as "use lib" only seems to work with *hard-coded* directory names
}
use PARSER;
use WRITER;

$|=1; # ensures that any progress information sent to the screen is displayed immediately and not buffered

# Show the usage text when run without arguments or when the first argument is
# a help request.  The match is anchored on the whole argument so that a file
# path which merely contains "-h", "help" or "?" is not mistaken for one.
if ((@ARGV==0) || ($ARGV[0]=~/^[-\/]*(?:\?|h|help)$/i))
{
    die("\nVersion 021\n\n".
        "Character-set conversion-table generating tool\n".
        "Copyright (c) 2000-2009 Nokia Corporation and/or its subsidiary(-ies).\n\n".
        "Usage:\n\n".
        "\tcnvtool [options] <control-file> <source-file> <output-file>\n\n".
        "where the following options are available (each has a short form and a long form which are shown below separated by a '|'):\n\n".
        "\t-s | -generateSourceCode\n".
        "\t-c | -columns(<number-of-columns>: <foreign-column>, <Unicode-column>)\n".
        "\t-r | -omitReplacementForUnconvertibleUnicodeCharacters\n".
        "\t-p | -cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed\n".
        "\t-u | -sourceFilesToSubtract(<file1>, <file2>, ...)\n\n");
}
my $generateSourceCode=0;
my @columns=(2, 1, 2);
my $omitReplacementForUnconvertibleUnicodeCharacters=0;
my $cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed=0;
my @sourceFilesToSubtract=();
my $flattenHashAndSave=0; # this flag is not published for use outside of the CHARCONV component
&extractCommandLineFlags(\$generateSourceCode, \@columns, \$omitReplacementForUnconvertibleUnicodeCharacters, \$cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed, \@sourceFilesToSubtract, \$flattenHashAndSave);
(!$omitReplacementForUnconvertibleUnicodeCharacters || $generateSourceCode) or die("Error: bad combination of flags\n");
# Once the flags have been removed, the three file names must remain.
(@ARGV>=3) or die("Error: expected <control-file> <source-file> <output-file> after the options\n");
my $controlFile=shift;
my $sourceFile=shift;
my $outputFile=shift;
print("Generating $outputFile...\n");
my $uid=0;
my $endiannessAsText='';
my $endianness=0;
my $replacementForUnconvertibleUnicodeCharacters='';
my @foreignVariableByteData=();
my @foreignToUnicodeData=();
my @unicodeToForeignData=();
my %foreignCharacterCodes=();
my %unicodeCharacterCodes=();
my %preferredForeignCharacterCodesForConflictResolution=();
my %preferredUnicodeCharacterCodesForConflictResolution=();
my %additionalSubsetTables=();
my %privateUseUnicodeCharacterSlotsUsed=();

print(" reading $controlFile...\n");
# Three-argument open: the file name is never interpreted as part of the mode.
open(CONTROL_FILE, '<', $controlFile) or die("Error: could not open \"$controlFile\" for reading\n");
&readHeaderFromControlFile(\*CONTROL_FILE, $controlFile, $generateSourceCode, \$uid, \$endiannessAsText, \$endianness, \$replacementForUnconvertibleUnicodeCharacters, $flattenHashAndSave);
&readForeignVariableByteDataFromControlFile(\*CONTROL_FILE, $controlFile, \@foreignVariableByteData);
&readOneDirectionDataFromControlFile(\*CONTROL_FILE, $controlFile, \@foreignToUnicodeData, \%preferredUnicodeCharacterCodesForConflictResolution, \%additionalSubsetTables, 1);
&readOneDirectionDataFromControlFile(\*CONTROL_FILE, $controlFile, \@unicodeToForeignData, \%preferredForeignCharacterCodesForConflictResolution, \%additionalSubsetTables, 0);
close(CONTROL_FILE) or die("Error: could not close \"$controlFile\"\n");

print(" reading $sourceFile...\n");
open(SOURCE_FILE, '<', $sourceFile) or die("Error: could not open \"$sourceFile\" for reading\n");
&readSourceFile(\*SOURCE_FILE, $sourceFile, \%foreignCharacterCodes, \%unicodeCharacterCodes, \@columns, $cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed, \%privateUseUnicodeCharacterSlotsUsed, 0);
close(SOURCE_FILE) or die("Error: could not close \"$sourceFile\"\n");

my $sourceFileToSubtract;
foreach $sourceFileToSubtract (@sourceFilesToSubtract)
{
    print(" subtracting from $sourceFileToSubtract...\n");
    open(SOURCE_FILE_TO_SUBTRACT, '<', $sourceFileToSubtract) or die("Error: could not open \"$sourceFileToSubtract\" for reading\n");
    &readSourceFile(\*SOURCE_FILE_TO_SUBTRACT, $sourceFileToSubtract, \%foreignCharacterCodes, \%unicodeCharacterCodes, \@columns, $cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed, \%privateUseUnicodeCharacterSlotsUsed, 1);
    close(SOURCE_FILE_TO_SUBTRACT) or die("Error: could not close \"$sourceFileToSubtract\"\n");
}

&warnIfAnyPrivateUseUnicodeCharacterSlotsBeingUsed(\%privateUseUnicodeCharacterSlotsUsed);
&resolveConflictsAndFlattenArraysToScalars(\%foreignCharacterCodes, \%preferredForeignCharacterCodesForConflictResolution, 'Unicode', 'foreign');
&resolveConflictsAndFlattenArraysToScalars(\%unicodeCharacterCodes, \%preferredUnicodeCharacterCodesForConflictResolution, 'foreign', 'Unicode');
&checkForeignVariableByteData($endianness, \@foreignVariableByteData, \@foreignToUnicodeData);

print(" writing $outputFile...\n");
open(OUTPUT_FILE, '>', $outputFile) or die("Error: could not open \"$outputFile\" for writing\n");
if ($generateSourceCode)
{
    my @sourceCodeOfForeignToUnicodeIndexedTables16=();
    my @sourceCodeOfForeignToUnicodeKeyedTables1616=();
    my @sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_indexedEntries=();
    my @sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_keyedEntries=();

    my @sourceCodeOfUnicodeToForeignIndexedTables16=();
    my @sourceCodeOfUnicodeToForeignKeyedTables1616=();
    my @sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_indexedEntries=();
    my @sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_keyedEntries=();

    # new for 32 bit encoding begin
    my @sourceCodeOfForeignToUnicodeIndexedTables32=();
    my @sourceCodeOfForeignToUnicodeKeyedTables3232=();
    my @sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_indexedEntries=();
    my @sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_keyedEntries=();

    my @sourceCodeOfUnicodeToForeignIndexedTables32=();
    my @sourceCodeOfUnicodeToForeignKeyedTables3232=();
    my @sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_indexedEntries=();
    my @sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_keyedEntries=();
    # new for 32 bit encoding end

    my @sourceCodeOfTopLevelStructures=();

    &writeSourceCodeHeader(\*OUTPUT_FILE, $outputFile, $replacementForUnconvertibleUnicodeCharacters);
    &writeSourceCodeForeignVariableByteData(\@sourceCodeOfTopLevelStructures, \@foreignVariableByteData);
    &writeSourceCodeOneDirectionData(\@sourceCodeOfTopLevelStructures,
        \@sourceCodeOfForeignToUnicodeIndexedTables16, \@sourceCodeOfForeignToUnicodeKeyedTables1616, \@sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_indexedEntries, \@sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_keyedEntries,
        \@sourceCodeOfForeignToUnicodeIndexedTables32, \@sourceCodeOfForeignToUnicodeKeyedTables3232, \@sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_indexedEntries, \@sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_keyedEntries,
        \@foreignToUnicodeData, \%unicodeCharacterCodes, 1);
    &writeSourceCodeOneDirectionData(\@sourceCodeOfTopLevelStructures,
        \@sourceCodeOfUnicodeToForeignIndexedTables16, \@sourceCodeOfUnicodeToForeignKeyedTables1616, \@sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_indexedEntries, \@sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_keyedEntries,
        \@sourceCodeOfUnicodeToForeignIndexedTables32, \@sourceCodeOfUnicodeToForeignKeyedTables3232, \@sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_indexedEntries, \@sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_keyedEntries,
        \@unicodeToForeignData, \%foreignCharacterCodes, 0);
    &writeSourceCodeFinalStuff(\*OUTPUT_FILE,
        \@sourceCodeOfForeignToUnicodeIndexedTables16, \@sourceCodeOfForeignToUnicodeKeyedTables1616, \@sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_indexedEntries, \@sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_keyedEntries,
        \@sourceCodeOfUnicodeToForeignIndexedTables16, \@sourceCodeOfUnicodeToForeignKeyedTables1616, \@sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_indexedEntries, \@sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_keyedEntries,
        \@sourceCodeOfForeignToUnicodeIndexedTables32, \@sourceCodeOfForeignToUnicodeKeyedTables3232, \@sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_indexedEntries, \@sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_keyedEntries,
        \@sourceCodeOfUnicodeToForeignIndexedTables32, \@sourceCodeOfUnicodeToForeignKeyedTables3232, \@sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_indexedEntries, \@sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_keyedEntries,
        \@sourceCodeOfTopLevelStructures, $endiannessAsText, \%additionalSubsetTables);
}
elsif ($flattenHashAndSave)
{
    binmode OUTPUT_FILE;
    #instead of calling the writeBinaryHeader, just write the data I need followed by
    # writeBinaryForeignVariableByteData...
    &write8(\*OUTPUT_FILE, $endianness);
    &write8(\*OUTPUT_FILE, length($replacementForUnconvertibleUnicodeCharacters));
    &writeString(\*OUTPUT_FILE, $replacementForUnconvertibleUnicodeCharacters);
    &writeBinaryForeignVariableByteData(\*OUTPUT_FILE, \@foreignVariableByteData);
    #choose %unicodeCharacterCodes and write the data as keypair
    # The keys are written in ascending numeric order so that the output is
    # the same from run to run (hash iteration order is not stable).
    my $key;
    foreach $key (sort({$a<=>$b} keys(%unicodeCharacterCodes)))
    {
        &write16(\*OUTPUT_FILE,$key);
        &write16(\*OUTPUT_FILE,$unicodeCharacterCodes{$key});
    }
}
else
{
    binmode OUTPUT_FILE;
    &writeBinaryHeader(\*OUTPUT_FILE, $uid, $endianness, $replacementForUnconvertibleUnicodeCharacters);
    &writeBinaryForeignVariableByteData(\*OUTPUT_FILE, \@foreignVariableByteData);
    &writeBinaryOneDirectionData(\*OUTPUT_FILE, \@foreignToUnicodeData, \%unicodeCharacterCodes, 1);
    &writeBinaryOneDirectionData(\*OUTPUT_FILE, \@unicodeToForeignData, \%foreignCharacterCodes, 0);
}
close(OUTPUT_FILE) or die("Error: could not close \"$outputFile\"\n");
print("complete\n\n");

# Removes every recognised option from @ARGV and records it through the
# references passed in, leaving only the positional arguments behind.
#
# Parameters (all references, in this order):
#   \$generateSourceCode, \@columns,
#   \$omitReplacementForUnconvertibleUnicodeCharacters,
#   \$cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed,
#   \@sourceFilesToSubtract, \$flattenHashAndSave
#
# Dies when -s and -f are combined or when a "-columns(...)" /
# "-sourceFilesToSubtract(...)" option is malformed.
sub extractCommandLineFlags
{
    my $generateSourceCode=shift;
    my $columns=shift;
    my $omitReplacementForUnconvertibleUnicodeCharacters=shift;
    my $cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed=shift;
    my $sourceFilesToSubtract=shift;
    my $flattenHashAndSave=shift;
    my $i;
    for ($i=0; $i<=$#ARGV;) # (i) not cache-ing $#ARGV into a variable as @ARGV may change length in this loop (ii) iterate forwards as some parameters may occupy more than one element in @ARGV
    {
        if (($ARGV[$i]=~/^-s$/i) || ($ARGV[$i]=~/^-generateSourceCode$/i))
        {
            if ($$flattenHashAndSave==1)
            {
                die("Error: Cannot have -s and -f flags set at the same time\n");
            }
            splice(@ARGV, $i, 1);
            $$generateSourceCode=1;
        }
        elsif (($ARGV[$i]=~/^-c\b(.*)$/i) || ($ARGV[$i]=~/^-columns\b(.*)$/i))
        {
            my $columnsData=$1;
            splice(@ARGV, $i, 1);
            # The shell may have split "(a: b, c)" over several arguments, so
            # keep appending the following arguments until the text parses.
            for (;;)
            {
                if ($columnsData=~/^\s*\(\s*(\d+)\s*:\s*(\d+)\s*\,?\s*(\d+)\s*\)\s*$/)
                {
                    @$columns=($1, $2, $3);
                    last;
                }
                ($#ARGV>=$i) or die("Error: bad \"-columns\" format\n");
                $columnsData.=(splice(@ARGV, $i, 1))[0];
            }
        }
        elsif (($ARGV[$i]=~/^-r$/i) || ($ARGV[$i]=~/^-omitReplacementForUnconvertibleUnicodeCharacters$/i))
        {
            splice(@ARGV, $i, 1);
            $$omitReplacementForUnconvertibleUnicodeCharacters=1;
        }
        elsif (($ARGV[$i]=~/^-p$/i) || ($ARGV[$i]=~/^-cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed$/i))
        {
            splice(@ARGV, $i, 1);
            $$cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed=1;
        }
        elsif (($ARGV[$i]=~/^-u\b(.*)$/i) || ($ARGV[$i]=~/^-sourceFilesToSubtract\b(.*)$/i))
        {
            my $sourceFilesData=$1;
            splice(@ARGV, $i, 1);
            # Same re-joining of shell-split arguments as for "-columns".
            for (;;)
            {
                if ($sourceFilesData=~/^\s*\(\s*(.+)\)\s*$/)
                {
                    my $listOfSourceFiles=$1;
                    @$sourceFilesToSubtract=split(/,/, $listOfSourceFiles, -1);
                    my $j;
                    for ($j=$#$sourceFilesToSubtract; $j>=0; --$j)
                    {
                        $sourceFilesToSubtract->[$j]=~s/^\s+//;
                        $sourceFilesToSubtract->[$j]=~s/\s+$//;
                        ($sourceFilesToSubtract->[$j] ne '') or die("Error: bad \"-sourceFilesToSubtract\" format (1)\n");
                    }
                    last;
                }
                ($#ARGV>=$i) or die("Error: bad \"-sourceFilesToSubtract\" format (2)\n");
                $sourceFilesData.=(splice(@ARGV, $i, 1))[0];
            }
        }
        elsif (($ARGV[$i]=~/^-f$/i) || ($ARGV[$i]=~/^-flattenHashAndSave$/i))
        {
            if ($$generateSourceCode==1)
            {
                die("Error: Cannot have -s and -f flags set at the same time\n");
            }
            splice(@ARGV, $i, 1);
            $$flattenHashAndSave=1;
        }
        else
        {
            ++$i; # not an option: leave it in @ARGV and move on
        }
    }
}

# Maps an algorithm name from the control file (case-insensitive) to its
# numeric code, or returns -1 when the name is not recognised.
sub algorithm
{
    my $algorithmAsText=shift;
    # The table lives inside the sub because the top-level script calls this
    # sub before execution would reach any file-level initialiser placed here.
    my %codeOfAlgorithm=(
        'direct'                        => 0,
        'offset'                        => 1,
        'indexedtable16'                => 2,
        'keyedtable1616'                => 3,
        'keyedtable16ofindexedtables16' => 4,
        'indexedtable32'                => 5,
        'keyedtable3232'                => 6,
        'keyedtable32ofindexedtables32' => 7,
    );
    my $key=defined($algorithmAsText)? lc($algorithmAsText): '';
    return exists($codeOfAlgorithm{$key})? $codeOfAlgorithm{$key}: -1;
}

# Returns the string with each character rendered as a "\xNN" escape
# (two lower-case hexadecimal digits).
sub hexadecimalify
{
    my $string=shift;
    return join('', map({sprintf("\\x%02x", $_)} unpack('C*', $string)));
}

# Reads conversion pairs from a source file into (or, when $subtract is true,
# removes them from) the two cross-reference hashes.
#
# Parameters:
#   $fileHandle, $fileName  - the open source file and its name (for messages)
#   $foreignCharacterCodes  - hash ref: {Unicode code}{foreign code} => 1
#   $unicodeCharacterCodes  - hash ref: {foreign code}{Unicode code} => 1
#   $columns                - array ref [number of 0x.. fields per line,
#                             1-based field holding the foreign code,
#                             1-based field holding the Unicode code]
#   $cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed
#                           - true to skip pairs whose Unicode code is private-use
#   $privateUseUnicodeCharacterSlotsUsed
#                           - hash ref recording the private-use codes seen
#   $subtract               - true to remove the pairs instead of adding them
#
# Dies on bad column data, on an unexpected line, on a duplicate pair (adding)
# or on a pair that is not present (subtracting).
sub readSourceFile
{
    my $fileHandle=shift;
    my $fileName=shift;
    my $foreignCharacterCodes=shift;
    my $unicodeCharacterCodes=shift;
    my $columns=shift;
    my $cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed=shift;
    my $privateUseUnicodeCharacterSlotsUsed=shift;
    my $subtract=shift;
    my $foreignCharacterCodeProcessingCode='';
    if (!(($columns->[0]>0) && ($columns->[1]>0) && ($columns->[2]>0) && ($columns->[1]<=$columns->[0]) && ($columns->[2]<=$columns->[0]) && ($columns->[1]!=$columns->[2])))
    {
        close($fileHandle);
        die("Error: bad \"-columns\" data\n");
    }
    # One capture group per column, so that column N ends up in $N.
    my $patternOfLineContainingCharacterCodes=join('\s+', ('0x([0-9a-f]+)') x $columns->[0]);
    my $line;
    my $strippedDownLine;
    for (;;)
    {
        ($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
        if (($strippedDownLine eq '')||(substr($strippedDownLine,0,1) eq chr(26))) # if there are no more lines in the file or if we encountered EOF character
        {
            last;
        }
        if ($strippedDownLine=~/^SET_FOREIGN_CHARACTER_CODE_PROCESSING_CODE\s+(.*)$/i)
        {
            $foreignCharacterCodeProcessingCode=$1;
        }
        elsif ($strippedDownLine=~/^$patternOfLineContainingCharacterCodes$/i)
        {
            no strict 'refs'; # so that we can use symbolic references for $1, $2, etc
            my $foreignCharacterCode=hex(${$columns->[1]});
            my $unicodeCharacterCode=hex(${$columns->[2]});
            use strict 'refs';
            if ($foreignCharacterCodeProcessingCode ne '')
            {
                # SECURITY NOTE: this evaluates Perl code taken verbatim from
                # the source file, so only trusted source files must be used.
                $foreignCharacterCode=eval($foreignCharacterCodeProcessingCode);
            }
            my $handleConversionPair=1;
            # Private-use ranges: U+E000..U+F8FF and U+F0000..U+10FFFF.
            if ((($unicodeCharacterCode>=0xe000) && ($unicodeCharacterCode<=0xf8ff)) || (($unicodeCharacterCode>=0xf0000) && ($unicodeCharacterCode<=0x10ffff)))
            {
                if ($cutOutAnyPrivateUseUnicodeCharacterSlotsBeingUsed)
                {
                    $handleConversionPair=0;
                }
                elsif ($subtract)
                {
                    delete $privateUseUnicodeCharacterSlotsUsed->{$unicodeCharacterCode};
                }
                else
                {
                    $privateUseUnicodeCharacterSlotsUsed->{$unicodeCharacterCode}=1;
                }
            }
            if ($handleConversionPair)
            {
                if ($subtract)
                {
                    if (!defined($foreignCharacterCodes->{$unicodeCharacterCode}->{$foreignCharacterCode}))
                    {
                        close($fileHandle);
                        die('Error: cannot subtract conversion pair ['.sprintf('foreign 0x%x, Unicode 0x%04x', $foreignCharacterCode, $unicodeCharacterCode)."] as it does not occur in \"$fileName\"\n");
                    }
                    if (!defined($unicodeCharacterCodes->{$foreignCharacterCode}->{$unicodeCharacterCode}))
                    {
                        close($fileHandle);
                        die('Error: cannot subtract conversion pair ['.sprintf('Unicode 0x%04x, foreign 0x%x', $unicodeCharacterCode, $foreignCharacterCode)."] as it does not occur in \"$fileName\"\n");
                    }
                    # Remove the pair from both directions, dropping any
                    # inner hash that becomes empty.
                    delete $foreignCharacterCodes->{$unicodeCharacterCode}->{$foreignCharacterCode};
                    if (keys(%{$foreignCharacterCodes->{$unicodeCharacterCode}})==0)
                    {
                        delete $foreignCharacterCodes->{$unicodeCharacterCode};
                    }
                    delete $unicodeCharacterCodes->{$foreignCharacterCode}->{$unicodeCharacterCode};
                    if (keys(%{$unicodeCharacterCodes->{$foreignCharacterCode}})==0)
                    {
                        delete $unicodeCharacterCodes->{$foreignCharacterCode};
                    }
                }
                else
                {
                    if (defined($foreignCharacterCodes->{$unicodeCharacterCode}->{$foreignCharacterCode}))
                    {
                        close($fileHandle);
                        die('Error: same conversion pair ['.sprintf('foreign 0x%x, Unicode 0x%04x', $foreignCharacterCode, $unicodeCharacterCode)."] occurs more than once in \"$fileName\"\n");
                    }
                    if (defined($unicodeCharacterCodes->{$foreignCharacterCode}->{$unicodeCharacterCode}))
                    {
                        close($fileHandle);
                        die('Error: same conversion pair ['.sprintf('Unicode 0x%04x, foreign 0x%x', $unicodeCharacterCode, $foreignCharacterCode)."] occurs more than once in \"$fileName\"\n");
                    }
                    $foreignCharacterCodes->{$unicodeCharacterCode}->{$foreignCharacterCode}=1;
                    $unicodeCharacterCodes->{$foreignCharacterCode}->{$unicodeCharacterCode}=1;
                }
            }
        }
        elsif ($line!~/^\s*0x([0-9a-f]+)\s*#\s*undefined.*$/i)
        {
            # Lines of the form "0x.. # undefined" are tolerated; anything
            # else is an error.
            close($fileHandle);
            die("Error: unexpected line in \"$fileName\":\n $line\n");
        }
    }
}

# Reads the header of the control file: an optional "UID" line, an optional
# (obsolete) "Name" line, the "Endianness" line, the
# "ReplacementForUnconvertibleUnicodeCharacters" line and an optional
# (obsolete) "ForeignCharacterCodeProcessingCode" line.
#
# Parameters:
#   $fileHandle, $fileName - the open control file and its name (for messages)
#   $generateSourceCode    - true when generating source code
#   $uid, $endiannessAsText, $endianness,
#   $replacementForUnconvertibleUnicodeCharacters
#                          - scalar refs that receive the parsed values
#   $flattenHashAndSave    - true when writing the flattened dump
#
# Dies when an expected keyword is missing or a value is malformed.
sub readHeaderFromControlFile
{
    my $fileHandle=shift;
    my $fileName=shift;
    my $generateSourceCode=shift;
    my $uid=shift;
    my $endiannessAsText=shift;
    my $endianness=shift;
    my $replacementForUnconvertibleUnicodeCharacters=shift;
    my $flattenHashAndSave=shift;
    my $line;
    my $strippedDownLine;
    ($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
    if ($strippedDownLine=~/^UID\s+0x([0-9a-f]+)$/i)
    {
        if ($generateSourceCode)
        {
            print(STDERR "Warning: \"UID\" keyword should not be used with \"-generateSourceCode\" flag - specify the UID in the MMP file\n");
        }
        $$uid=hex($1);
        ($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
    }
    elsif (!$generateSourceCode && !$flattenHashAndSave)
    {
        # The UID is mandatory only for the plain binary output.
        close($fileHandle);
        die("Error: unexpected line in \"$fileName\" (\"UID\" keyword expected):\n $line\n");
    }
    if ($strippedDownLine=~/^Name\s+"(.+?)"$/i)
    {
        print(STDERR "Warning: obsolete keyword \"Name\" used\n");
        ($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
    }
    if ($strippedDownLine!~/^Endianness\s+(\w+)$/i)
    {
        close($fileHandle);
        die("Error: unexpected line in \"$fileName\" (\"Endianness\" keyword expected):\n $line\n");
    }
    $$endiannessAsText=$1;
    if ($$endiannessAsText=~/Unspecified/i)
    {
        $$endianness=0; # SCnvConversionData::EUnspecified
    }
    elsif ($$endiannessAsText=~/FixedLittleEndian/i)
    {
        $$endianness=1; # SCnvConversionData::EFixedLittleEndian
    }
    elsif ($$endiannessAsText=~/FixedBigEndian/i)
    {
        $$endianness=2; # SCnvConversionData::EFixedBigEndian
    }
    else
    {
        close($fileHandle);
        die("Error: \"$$endiannessAsText\" is not a legal value for \"Endianness\"\n");
    }
    ($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
    if ($strippedDownLine!~/^ReplacementForUnconvertibleUnicodeCharacters\s+(.*?)$/i)
    {
        close($fileHandle);
        die("Error: unexpected line in \"$fileName\" (\"ReplacementForUnconvertibleUnicodeCharacters\" keyword expected):\n $line\n");
    }
    $$replacementForUnconvertibleUnicodeCharacters='';
    # The value is a sequence of "0xNN" bytes; consume them one at a time.
    my $remainderOfXxx=$1;
    while ($remainderOfXxx ne '')
    {
        if ($remainderOfXxx!~/^0x([0-9a-f]{1,2})\s*(.*)$/i)
        {
            close($fileHandle);
            die("Error: unexpected line in \"$fileName\":\n $line\n");
        }
        $$replacementForUnconvertibleUnicodeCharacters.=pack("C", hex($1));
        $remainderOfXxx=$2;
    }
    # Peek at the next line: swallow the obsolete keyword if present,
    # otherwise hand the line back for the next reader.
    my @temp=&nextNonEmptyStrippedDownLine($fileHandle);
    if ($temp[1]=~/^ForeignCharacterCodeProcessingCode/i)
    {
        print(STDERR "Warning: obsolete keyword \"ForeignCharacterCodeProcessingCode\" used\n");
    }
    else
    {
        ungetNonEmptyStrippedDownLine(@temp);
    }
}

# Reads the "StartForeignVariableByteData" ... "EndForeignVariableByteData"
# section of the control file and appends one
# [first initial byte, last initial byte, number of subsequent bytes]
# triple per line to @$foreignVariableByteData.
#
# Dies on an unexpected line, on a byte value above 0xff, or on a range whose
# last value is less than its first.
sub readForeignVariableByteDataFromControlFile
{
    my $fileHandle=shift;
    my $fileName=shift;
    my $foreignVariableByteData=shift;
    my $line;
    my $strippedDownLine;
    ($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
    if ($strippedDownLine!~/^StartForeignVariableByteData$/i)
    {
        close($fileHandle);
        die("Error: unexpected line in \"$fileName\":\n $line\n");
    }

    for (;;)
    {
        ($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
        if ($strippedDownLine=~/^EndForeignVariableByteData$/i)
        {
            last;
        }
        if ($strippedDownLine!~/^0x([0-9a-f]+)\s+0x([0-9a-f]+)\s+(\d+)$/i)
        {
            close($fileHandle);
            die("Error: unexpected line in \"$fileName\":\n $line\n");
        }
        my $firstInitialByteValueInRange=hex($1);
        my $lastInitialByteValueInRange=hex($2);
        my $numberOfSubsequentBytes=$3;
        if ($firstInitialByteValueInRange>0xff)
        {
            close($fileHandle);
            die("Error: firstInitialByteValueInRange ".sprintf("0x%02x", $firstInitialByteValueInRange)." does not fit in a single byte\n");
        }
        if ($lastInitialByteValueInRange>0xff)
        {
            close($fileHandle);
            die("Error: lastInitialByteValueInRange ".sprintf("0x%02x", $lastInitialByteValueInRange)." does not fit in a single byte\n");
        }
        if ($lastInitialByteValueInRange<$firstInitialByteValueInRange)
        {
            close($fileHandle);
            die("Error: lastInitialByteValueInRange ".sprintf("0x%02x", $lastInitialByteValueInRange)." is less than firstInitialByteValueInRange ".sprintf("0x%02x", $firstInitialByteValueInRange)."\n");
        }
        push(@$foreignVariableByteData, [$firstInitialByteValueInRange, $lastInitialByteValueInRange, $numberOfSubsequentBytes]);
    }
}

# Reads one "Start<Dir>Data" ... "End<Dir>Data" section of the control file,
# where <Dir> is "ForeignToUnicode" when $outputIsUnicode is true and
# "UnicodeToForeign" otherwise.
#
# Parameters:
#   $fileHandle, $fileName - the open control file and its name (for messages)
#   $oneDirectionData      - array ref; one array ref of range data is
#                            appended per range line
#   $preferredCharacterCodesForConflictResolution
#                          - hash ref filled from the lines that follow a
#                            "ConflictResolution" line (source => preferred target)
#   $additionalSubsetTables
#                          - hash ref: {table name}[index] receives the number
#                            of ranges read so far when a Start/End
#                            "AdditionalSubsetTable" line is met (index 0/1 for
#                            Start/End when the output is Unicode, 2/3 otherwise)
#   $outputIsUnicode       - selects the direction
#
# Dies on an unexpected line, an inverted range, an unknown algorithm or a
# repeated AdditionalSubsetTable marker.
sub readOneDirectionDataFromControlFile
{
    my $fileHandle=shift;
    my $fileName=shift;
    my $oneDirectionData=shift;
    my $preferredCharacterCodesForConflictResolution=shift;
    my $additionalSubsetTables=shift;
    my $outputIsUnicode=shift;
    my $middlePortionOfKeyWords=$outputIsUnicode? "ForeignToUnicode": "UnicodeToForeign";
    # Unicode-to-foreign ranges carry an extra decimal field; the empty group
    # keeps the capture numbering the same for both directions.
    my $extraPatternToMatch=$outputIsUnicode? '()': '\s+(\d+)';
    my $line;
    my $strippedDownLine;
    ($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
    if ($strippedDownLine!~/^Start${middlePortionOfKeyWords}Data$/i)
    {
        close($fileHandle);
        die("Error: unexpected line in \"$fileName\":\n $line\n");
    }
    my $doingConflictResolution=0;
    for (;;)
    {
        ($line, $strippedDownLine)=&nextNonEmptyStrippedDownLine($fileHandle);
        if ($strippedDownLine=~/^End${middlePortionOfKeyWords}Data$/i)
        {
            last;
        }
        if ($strippedDownLine=~/^ConflictResolution$/i)
        {
            $doingConflictResolution=1;
        }
        elsif ($doingConflictResolution)
        {
            if ($strippedDownLine!~/^0x([0-9a-f]+)\s+0x([0-9a-f]+)$/i)
            {
                close($fileHandle);
                die("Error: unexpected line in \"$fileName\":\n $line\n");
            }
            my $sourceCharacterCodeToResolve=hex($1);
            my $targetCharacterCodePreferred=hex($2);
            $preferredCharacterCodesForConflictResolution->{$sourceCharacterCodeToResolve}=$targetCharacterCodePreferred;
        }
        elsif ($strippedDownLine=~/^(Start|End)AdditionalSubsetTable\s+(.*)$/i)
        {
            my $prefix=$1;
            my $nameOfAdditionalSubsetTable=$2;
            my $index=($prefix=~/^Start$/i)? 0: 1;
            if (!$outputIsUnicode)
            {
                $index+=2;
            }
            # Use the hash passed in by reference rather than reaching for the
            # file-level variable of the same name.
            if (defined($additionalSubsetTables->{$nameOfAdditionalSubsetTable}->[$index]))
            {
                close($fileHandle);
                die("Error: multiple redefinition of \"${prefix}AdditionalSubsetTable $nameOfAdditionalSubsetTable\"\n");
            }
            $additionalSubsetTables->{$nameOfAdditionalSubsetTable}->[$index]=scalar(@$oneDirectionData);
        }
        else
        {
            if ($strippedDownLine!~/^(\d+)\s+(\d+)\s+0x([0-9a-f]+)\s+0x([0-9a-f]+)\s+(\w+)$extraPatternToMatch\s+\{(.*?)\}$/i)
            {
                close($fileHandle);
                die("Error: unexpected line in \"$fileName\":\n $line\n");
            }
            my $includePriority=$1;
            my $searchPriority=$2;
            my $firstInputCharacterCodeInRange=hex($3);
            my $lastInputCharacterCodeInRange=hex($4);
            my $algorithmAsText=$5;
            my $sizeOfOutputCharacterCodeInBytes=$6;
            my $parameters=$7;
            if ($lastInputCharacterCodeInRange<$firstInputCharacterCodeInRange)
            {
                close($fileHandle);
                die("Error: lastInputCharacterCodeInRange ".sprintf("0x%02x", $lastInputCharacterCodeInRange)." is less than firstInputCharacterCodeInRange ".sprintf("0x%02x", $firstInputCharacterCodeInRange)."\n");
            }
            my $algorithm=&algorithm($algorithmAsText);
            if ($algorithm<0)
            {
                close($fileHandle);
                die("Error: unexpected algorithm \"$algorithmAsText\"\n");
            }
            my $rangeData=[$includePriority, $searchPriority, $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange, $algorithm];
            if (!$outputIsUnicode)
            {
                push(@$rangeData, $sizeOfOutputCharacterCodeInBytes);
            }
            push(@$rangeData, $parameters);
            push(@$oneDirectionData, $rangeData);
        }
    }
}

# Prints a warning to STDERR listing the private-use Unicode codes recorded in
# %$privateUseUnicodeCharacterSlotsUsed, with runs of consecutive codes
# collapsed into "first-last" ranges.  Prints nothing when the hash is empty.
sub warnIfAnyPrivateUseUnicodeCharacterSlotsBeingUsed
{
    my $privateUseUnicodeCharacterSlotsUsed=shift;
    my @sortedPrivateUseUnicodeCharacterSlotsUsed=sort({$a<=>$b} keys(%$privateUseUnicodeCharacterSlotsUsed));
    if (@sortedPrivateUseUnicodeCharacterSlotsUsed>0)
    {
        my $lastPrivateUseUnicodeCharacterSlotUsed=$sortedPrivateUseUnicodeCharacterSlotsUsed[0];
        my $asText=sprintf('0x%04x', $lastPrivateUseUnicodeCharacterSlotUsed);
        my @asText=($asText);
        my $i;
        for ($i=1; $i<@sortedPrivateUseUnicodeCharacterSlotsUsed; ++$i) # this loop starts from 1 not 0 as we have already dealt with $sortedPrivateUseUnicodeCharacterSlotsUsed[0]
        {
            ($sortedPrivateUseUnicodeCharacterSlotsUsed[$i]>$lastPrivateUseUnicodeCharacterSlotUsed) or die("Error: internal error 1\n");
            if ($sortedPrivateUseUnicodeCharacterSlotsUsed[$i]>$lastPrivateUseUnicodeCharacterSlotUsed+1)
            {
                # A gap: close the current run (if it is longer than one code)
                # and start a new one.
                $asText=sprintf('0x%04x', $lastPrivateUseUnicodeCharacterSlotUsed);
                if ($asText[-1] ne $asText)
                {
                    $asText[-1].='-'.$asText;
                }
                push(@asText, sprintf('0x%04x', $sortedPrivateUseUnicodeCharacterSlotsUsed[$i]));
            }
            $lastPrivateUseUnicodeCharacterSlotUsed=$sortedPrivateUseUnicodeCharacterSlotsUsed[$i];
        }
        # Close the final run.
        $asText=sprintf('0x%04x', $lastPrivateUseUnicodeCharacterSlotUsed);
        if ($asText[-1] ne $asText)
        {
            $asText[-1].='-'.$asText;
        }
        print(STDERR 'Warning: the following private-use Unicode character slots were used: ['.join(', ', @asText)."]\n");
    }
}

# Replaces each inner hash of candidate target codes in %$characterCodes with
# a single scalar target code.  A source code with exactly one candidate takes
# that candidate; a source code with several takes the one named in
# %$preferredCharacterCodesForConflictResolution (whose entry is then removed).
#
# $source and $target are the words ('foreign' / 'Unicode') used in messages.
#
# Dies when a conflict has no preferred code or the preferred code is not one
# of the candidates; warns when preferred codes are left over.
sub resolveConflictsAndFlattenArraysToScalars
{
    my $characterCodes=shift;
    my $preferredCharacterCodesForConflictResolution=shift;
    my $source=shift;
    my $target=shift;
    my $sourceCharacterCode;
    my $candidateTargetCharacterCodes;
    while (($sourceCharacterCode, $candidateTargetCharacterCodes)=each(%$characterCodes))
    {
        my @candidateTargetCharacterCodes=keys(%$candidateTargetCharacterCodes);
        if (@candidateTargetCharacterCodes<1)
        {
            die("Error: internal error 2\n");
        }
        if (@candidateTargetCharacterCodes==1)
        {
            $characterCodes->{$sourceCharacterCode}=$candidateTargetCharacterCodes[0];
        }
        else
        {
            if (!defined($preferredCharacterCodesForConflictResolution->{$sourceCharacterCode}))
            {
                die("Error: no preferred $target character code is specified for conflict resolution for the $source character code ".sprintf("0x%08x", $sourceCharacterCode)."\n");
            }
            my $preferredCharacterCodeIsNotACandidateForConflictResolution=1;
            my $candidateTargetCharacterCode;
            foreach $candidateTargetCharacterCode (@candidateTargetCharacterCodes)
            {
                if ($preferredCharacterCodesForConflictResolution->{$sourceCharacterCode}==$candidateTargetCharacterCode)
                {
                    $preferredCharacterCodeIsNotACandidateForConflictResolution=0;
                    last;
                }
            }
            if ($preferredCharacterCodeIsNotACandidateForConflictResolution)
            {
                die("Error: the preferred $target character code ".sprintf("0x%08x", $preferredCharacterCodesForConflictResolution->{$sourceCharacterCode})." is not a candidate for conflict resolution for the $source character code ".sprintf("0x%08x", $sourceCharacterCode)."\n");
            }
            $characterCodes->{$sourceCharacterCode}=$preferredCharacterCodesForConflictResolution->{$sourceCharacterCode};
            delete $preferredCharacterCodesForConflictResolution->{$sourceCharacterCode};
        }
    }
    my $numberOfPreferredCharacterCodesForConflictResolution=keys(%$preferredCharacterCodesForConflictResolution);
    if ($numberOfPreferredCharacterCodesForConflictResolution!=0)
    {
        print(STDERR "Warning: there are $numberOfPreferredCharacterCodesForConflictResolution $target preferred character codes specified for which there are no conflicts to resolve\n");
    }
}

# Checks that no initial foreign byte is covered by more than one range in
# @$foreignVariableByteData; dies naming the byte otherwise.
# $endianness and $foreignToUnicodeData are only used by the disabled check
# kept in the comment below.
sub checkForeignVariableByteData
{
    my $endianness=shift;
    my $foreignVariableByteData=shift;
    my $foreignToUnicodeData=shift;
    my $rangeData;
    my %initialForeignBytes=();
    foreach $rangeData (@$foreignVariableByteData)
    {
        my $initialByte;
        for ($initialByte=$rangeData->[0]; $initialByte<=$rangeData->[1]; ++$initialByte)
        {
            if (defined($initialForeignBytes{$initialByte}))
            {
                # Report the byte itself (the hash value is only a marker).
                die("Error: the number of bytes subsequent to the initial foreign-byte ".sprintf("0x%02x", $initialByte)." is defined more than once\n");
            }
            $initialForeignBytes{$initialByte}=1;
        }
    }
#   if ($endianness!=0) # unfortunately, nothing can be checked if the $endianness is 0 (SCnvConversionData::EUnspecified)
#   {
#       foreach $rangeData (@$foreignToUnicodeData)
#       {
#           my $inputCharacterCode;
#           for ($inputCharacterCode=$rangeData->[2]; $inputCharacterCode<=$rangeData->[3]; ++$inputCharacterCode)
#           {
#               my $initialByte;
#               if ($endianness==1) # SCnvConversionData::EFixedLittleEndian
#               {
#                   $initialByte=($inputCharacterCode&0xff);
#               }
#               elsif ($endianness==2) # SCnvConversionData::EFixedBigEndian
#               {
#                   $initialByte=($inputCharacterCode&0xff00)>>8; ## this is hard-coded and needs to be done properly!
#               }
#               else
#               {
#                   die("Error: internal error ??\n");
#               }
#               if (!defined($initialForeignBytes{$initialByte}))
#               {
#                   die("Error: no number-of-subsequent-bytes is specified for the initial byte $initialByte\n");
#               }
#           }
#       }
#   }
}

# Writes the opening of the generated source file: a banner comment with the
# output file's base name and the current year, the #include / #define /
# #pragma preamble and, unless the file-level flag
# $omitReplacementForUnconvertibleUnicodeCharacters is set, the replacement
# descriptor and its accessor function.
#
# Parameters: $fileHandle, $fileName (output path),
#             $replacementForUnconvertibleUnicodeCharacters (byte string).
sub writeSourceCodeHeader
{
    my $fileHandle=shift;
    my $fileName=shift;
    my $replacementForUnconvertibleUnicodeCharacters=shift;
    # Keep only the base name, whichever directory separator the path uses
    # (the BEGIN block likewise caters for both Windows and Unix paths).
    $fileName=~s/^.*[\\\/]//;
    print($fileHandle "// $fileName\n//\n// Copyright (c) Nokia Corporation and/or its subsidiary(-ies) ".(1900+(gmtime(time))[5]).". All rights reserved.\n//\n\n");
    # NOTE(review): the three "#include" directives below have no header
    # names; they look as if <...> text was stripped when this listing was
    # extracted.  Left exactly as found - restore the names from the upstream
    # copy of this script.
    print($fileHandle "#include \n#include \n#include \n\n#define ARRAY_LENGTH(aArray) (sizeof(aArray)/sizeof((aArray)\[0\]))\n\n#pragma warning (disable: 4049) // compiler limit : terminating line number emission\n\n");
    # $omitReplacementForUnconvertibleUnicodeCharacters is the file-level flag
    # set from the command line, not a parameter of this sub.
    if (!$omitReplacementForUnconvertibleUnicodeCharacters)
    {
        print($fileHandle "_LIT8(KLit8ReplacementForUnconvertibleUnicodeCharacters, \"".&hexadecimalify($replacementForUnconvertibleUnicodeCharacters)."\");\n\n");
        print($fileHandle "GLDEF_C const TDesC8& ReplacementForUnconvertibleUnicodeCharacters_internal()\n\t{\n\treturn KLit8ReplacementForUnconvertibleUnicodeCharacters;\n\t}\n\n");
    }
}

# Appends to @$sourceCodeOfTopLevelStructures the source text of the
# "foreignVariableByteDataRanges" array, one initialiser per entry of
# @$foreignVariableByteData.  Dies on an entry that does not have exactly
# three elements or whose range is inverted.
sub writeSourceCodeForeignVariableByteData
{
    my $sourceCodeOfTopLevelStructures=shift;
    my $foreignVariableByteData=shift;
    push(@$sourceCodeOfTopLevelStructures, "LOCAL_D const SCnvConversionData::SVariableByteData::SRange foreignVariableByteDataRanges[]=\n\t\{\n");
    my $indexOfLastRange=$#$foreignVariableByteData;
    my $i;
    for ($i=0; $i<=$indexOfLastRange; ++$i)
    {
        my $rangeData=$foreignVariableByteData->[$i];
        if (@$rangeData!=3)
        {
            die("Error: internal error 3\n");
        }
        my $firstInitialByteValueInRange=$rangeData->[0];
        my $lastInitialByteValueInRange=$rangeData->[1];
        if ($lastInitialByteValueInRange<$firstInitialByteValueInRange)
        {
            die("Error: internal error 4\n");
        }
        my $numberOfSubsequentBytes=$rangeData->[2];
        push(@$sourceCodeOfTopLevelStructures, "\t\t\{\n\t\t".sprintf("0x%02x", $firstInitialByteValueInRange).",\n\t\t".sprintf("0x%02x", $lastInitialByteValueInRange).",\n\t\t$numberOfSubsequentBytes,\n\t\t0\n\t\t\}");
        if ($i<$indexOfLastRange)
        {
            push(@$sourceCodeOfTopLevelStructures, ','); # separator between initialisers, none after the last
        }
        push(@$sourceCodeOfTopLevelStructures, "\n");
    }
    push(@$sourceCodeOfTopLevelStructures, "\t\};\n\n");
}

sub writeSourceCodeOneDirectionData
{
    my $sourceCodeOfTopLevelStructures=shift;
    my $sourceCodeOfOneDirectionIndexedTables16=shift;
    my $sourceCodeOfOneDirectionKeyedTables1616=shift;
    my $sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_indexedEntries=shift;
    my $sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_keyedEntries=shift;
    # new for 32 bit encoding begin
    my $sourceCodeOfOneDirectionIndexedTables32=shift;
    my $sourceCodeOfOneDirectionKeyedTables3232=shift;
    my $sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_indexedEntries=shift;
    my $sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_keyedEntries=shift;
    # new for 32 bit encoding end

    my $oneDirectionData=shift;
    my $characterCodes=shift;
    my $outputIsUnicode=shift;
    push(@$sourceCodeOfTopLevelStructures, 'LOCAL_D const SCnvConversionData::SOneDirectionData::SRange '.($outputIsUnicode? 'foreignToUnicodeDataRanges': 'unicodeToForeignDataRanges')."[]=\n\t\{\n");
    my $formatForInputCharacters=$outputIsUnicode? '0x%02x': '0x%04x';
    my $formatForOutputCharacters=$outputIsUnicode? 
'0x%04x': '0x%02x'; sl@0: my $indexOfLastRange=$#$oneDirectionData; sl@0: my $i; sl@0: for ($i=0; $i<=$indexOfLastRange; ++$i) sl@0: { sl@0: my $rangeData=$oneDirectionData->[$i]; sl@0: # $rangeData is $includePriority, $searchPriority, $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange, $algorithm[, $sizeOfOutputCharacterCodeInBytes], $parameters sl@0: if (scalar(@$rangeData)!=($outputIsUnicode? 6: 7)) sl@0: { sl@0: die("Error: internal error 5\n"); sl@0: } sl@0: my $firstInputCharacterCodeInRange=$rangeData->[2]; sl@0: my $lastInputCharacterCodeInRange=$rangeData->[3]; sl@0: if ($lastInputCharacterCodeInRange<$firstInputCharacterCodeInRange) sl@0: { sl@0: die("Error: internal error 6\n"); sl@0: } sl@0: my $algorithmAsText=''; # set by the if-elsif stuff below sl@0: my $sizeOfOutputCharacterCodeInBytesIfForeign=$outputIsUnicode? 0: $rangeData->[5]; sl@0: my $parameters=$rangeData->[$outputIsUnicode? 5: 6]; sl@0: my $word1=0; # set by the if-elsif stuff below sl@0: my $algorithm=$rangeData->[4]; sl@0: if ($algorithm==0) # Direct sl@0: { sl@0: $algorithmAsText='Direct'; sl@0: my $characterCode; sl@0: for ($characterCode=$firstInputCharacterCodeInRange; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode) sl@0: { sl@0: if (!defined($characterCodes->{$characterCode})) sl@0: { sl@0: die("Error: There is no conversion defined for ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)."\n"); sl@0: } sl@0: if ($characterCodes->{$characterCode}!=$characterCode) sl@0: { sl@0: die("Error: the conversion from ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)." to ".($outputIsUnicode? 'Unicode': 'foreign')." character code ".sprintf("0x%08x", $characterCodes->{$characterCode})." 
is not a direct conversion\n"); sl@0: } sl@0: delete $characterCodes->{$characterCode}; sl@0: } sl@0: } sl@0: elsif ($algorithm==1) # Offset sl@0: { sl@0: $algorithmAsText='Offset'; sl@0: my $offset=$characterCodes->{$firstInputCharacterCodeInRange}-$firstInputCharacterCodeInRange; sl@0: delete $characterCodes->{$firstInputCharacterCodeInRange}; sl@0: my $characterCode; sl@0: for ($characterCode=$firstInputCharacterCodeInRange+1; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode) sl@0: { sl@0: if (!defined($characterCodes->{$characterCode})) sl@0: { sl@0: die("Error: There is no conversion defined for ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x (0x%08x-0x%08x)", $characterCode, $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange)."\n"); sl@0: } sl@0: if ($characterCodes->{$characterCode}-$characterCode!=$offset) sl@0: { sl@0: die("Error: the conversion from ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)." to ".($outputIsUnicode? 'Unicode': 'foreign')." character code ".sprintf("0x%08x", $characterCodes->{$characterCode})." has a different offset from the previous one in the range\n"); sl@0: } sl@0: delete $characterCodes->{$characterCode}; sl@0: } sl@0: $word1="STATIC_CAST(TUint, $offset)"; sl@0: } sl@0: elsif ($algorithm==2) # IndexedTable16 sl@0: { sl@0: $algorithmAsText='IndexedTable16'; sl@0: my $nameOfNextOneDirectionIndexedTable16='indexedTable16_'.($outputIsUnicode? 
'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionIndexedTables16+2); sl@0: my $sourceCodeOfNextOneDirectionIndexedTable16=[]; sl@0: push(@$sourceCodeOfNextOneDirectionIndexedTable16, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SIndexedTable16::SEntry $nameOfNextOneDirectionIndexedTable16\[\]=\n\t\{\n"); sl@0: my $characterCode; sl@0: for ($characterCode=$firstInputCharacterCodeInRange; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode) sl@0: { sl@0: if (!defined($characterCodes->{$characterCode})) sl@0: { sl@0: die("Error: There is no conversion defined for ".($outputIsUnicode? 'foreign': 'Unicode')." character code ".sprintf("0x%08x", $characterCode)."\n"); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionIndexedTable16, "\t\t\{\n\t\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode})."\n\t\t\}"); sl@0: if ($characterCode<$lastInputCharacterCodeInRange) sl@0: { sl@0: push(@$sourceCodeOfNextOneDirectionIndexedTable16, ','); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionIndexedTable16, "\n"); sl@0: delete $characterCodes->{$characterCode}; sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionIndexedTable16, "\t\};\n\n"); sl@0: push(@$sourceCodeOfOneDirectionIndexedTables16, $sourceCodeOfNextOneDirectionIndexedTable16); sl@0: $word1="UData_S$algorithmAsText($nameOfNextOneDirectionIndexedTable16)"; sl@0: } sl@0: elsif ($algorithm==3) # KeyedTable1616 sl@0: { sl@0: $algorithmAsText='KeyedTable1616'; sl@0: my $nameOfNextOneDirectionKeyedTable1616='keyedTable1616_'.($outputIsUnicode? 
'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables1616+2); sl@0: my $sourceCodeOfNextOneDirectionKeyedTable1616=[]; sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTable1616, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable1616::SEntry $nameOfNextOneDirectionKeyedTable1616\[\]=\n\t\{\n"); sl@0: my @characterCodes=grep(($_>=$firstInputCharacterCodeInRange) && ($_<=$lastInputCharacterCodeInRange), sort({$a<=>$b} keys(%$characterCodes))); sl@0: if (@characterCodes==0) sl@0: { sl@0: die("Error: There are no ".($outputIsUnicode? 'foreign': 'Unicode').'-to-'.($outputIsUnicode? 'Unicode': 'foreign')." characters to convert using KeyedTable1616 (range ".sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).").\n"); sl@0: } sl@0: if ($characterCodes[0]!=$firstInputCharacterCodeInRange) sl@0: { sl@0: print(STDERR 'Warning: the specified start of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf("$formatForInputCharacters", $characterCodes[0])."\n"); sl@0: } sl@0: if ($characterCodes[-1]!=$lastInputCharacterCodeInRange) sl@0: { sl@0: print(STDERR 'Warning: the specified end of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' 
could actually be '.sprintf("$formatForInputCharacters", $characterCodes[-1])."\n"); sl@0: } sl@0: my $characterCode; sl@0: foreach $characterCode (@characterCodes) sl@0: { sl@0: if (defined($characterCodes->{$characterCode})) sl@0: { sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTable1616, "\t\t\{\n\t\t".sprintf($formatForInputCharacters, $characterCode).",\n\t\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode})."\n\t\t\}"); sl@0: if ($characterCode<$characterCodes[-1]) sl@0: { sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTable1616, ','); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTable1616, "\n"); sl@0: delete $characterCodes->{$characterCode}; sl@0: } sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTable1616, "\t\};\n\n"); sl@0: push(@$sourceCodeOfOneDirectionKeyedTables1616, $sourceCodeOfNextOneDirectionKeyedTable1616); sl@0: $word1="UData_S$algorithmAsText($nameOfNextOneDirectionKeyedTable1616)"; sl@0: } sl@0: elsif ($algorithm==4) # KeyedTable16OfIndexedTables16 sl@0: { sl@0: $algorithmAsText='KeyedTable16OfIndexedTables16'; sl@0: my $nameOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries='keyedTables16OfIndexedTables16_keyedEntries_'.($outputIsUnicode? 'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_keyedEntries+2); sl@0: my $sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries=[]; sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable16OfIndexedTables16::SKeyedEntry $nameOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries\[\]=\n\t\{\n"); sl@0: my @characterCodes=grep(($_>=$firstInputCharacterCodeInRange) && ($_<=$lastInputCharacterCodeInRange), sort({$a<=>$b} keys(%$characterCodes))); sl@0: if (@characterCodes==0) sl@0: { sl@0: die("Error: There are no ".($outputIsUnicode? 
'foreign': 'Unicode').'-to-'.($outputIsUnicode? 'Unicode': 'foreign')." characters to convert using KeyedTable16OfIndexedTables16 (range ".sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).").\n"); sl@0: } sl@0: if ($characterCodes[0]!=$firstInputCharacterCodeInRange) sl@0: { sl@0: print(STDERR 'Warning: the specified start of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf("$formatForInputCharacters", $characterCodes[0])."\n"); sl@0: } sl@0: if ($characterCodes[-1]!=$lastInputCharacterCodeInRange) sl@0: { sl@0: print(STDERR 'Warning: the specified end of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf("$formatForInputCharacters", $characterCodes[-1])."\n"); sl@0: } sl@0: my @characterCodeRanges=(); sl@0: my $minimumNumberOfEntriesPerIndexedTable=($parameters ne '')? 
$parameters: 0; sl@0: my $firstInputCharacterCodeInIndexedTable=$characterCodes[0]; sl@0: my $previousCharacterCode=$firstInputCharacterCodeInIndexedTable; sl@0: my $characterCode; sl@0: foreach $characterCode (@characterCodes) sl@0: { sl@0: ($characterCode>=$previousCharacterCode) or die("Error: internal error 7\n"); sl@0: if ($characterCode>$previousCharacterCode+1) sl@0: { sl@0: if (($previousCharacterCode-$firstInputCharacterCodeInIndexedTable)+1>=$minimumNumberOfEntriesPerIndexedTable) sl@0: { sl@0: push(@characterCodeRanges, [$firstInputCharacterCodeInIndexedTable, $previousCharacterCode]); sl@0: } sl@0: $firstInputCharacterCodeInIndexedTable=$characterCode; sl@0: } sl@0: $previousCharacterCode=$characterCode; sl@0: } sl@0: push(@characterCodeRanges, [$firstInputCharacterCodeInIndexedTable, $previousCharacterCode]); sl@0: @characterCodes=(); sl@0: my $characterCodeRange; sl@0: foreach $characterCodeRange (@characterCodeRanges) sl@0: { sl@0: my $nameOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries='keyedTables16OfIndexedTables16_indexedEntries_'.($outputIsUnicode? 
'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_indexedEntries+2); sl@0: my $sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries=[]; sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, "LOCAL_D const TUint16 $nameOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries\[\]=\n\t\{\n"); sl@0: my $characterCode; sl@0: my $lastInputCharacterCodeInIndexedTable=$characterCodeRange->[1]; sl@0: for ($characterCode=$characterCodeRange->[0]; $characterCode<=$lastInputCharacterCodeInIndexedTable; ++$characterCode) sl@0: { sl@0: if (!defined($characterCodes->{$characterCode})) sl@0: { sl@0: die("Error: internal error 8\n"); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, "\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode})); sl@0: if ($characterCode<$lastInputCharacterCodeInIndexedTable) sl@0: { sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, ','); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, "\n"); sl@0: delete $characterCodes->{$characterCode}; sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, "\t\};\n\n"); sl@0: push(@$sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_indexedEntries, $sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries); sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, "\t\t\{\n\t\t".sprintf($formatForInputCharacters, $characterCodeRange->[0]).",\n\t\t".sprintf($formatForInputCharacters, $characterCodeRange->[1]).",\n\t\t$nameOfNextOneDirectionKeyedTables16OfIndexedTables16_indexedEntries\n\t\t\}"); sl@0: if ($characterCodeRange->[1]<$characterCodeRanges[-1]->[1]) sl@0: { sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, ','); sl@0: } 
sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, "\n"); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, "\t\};\n\n"); sl@0: push(@$sourceCodeOfOneDirectionKeyedTables16OfIndexedTables16_keyedEntries, $sourceCodeOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries); sl@0: $word1="UData_S$algorithmAsText($nameOfNextOneDirectionKeyedTables16OfIndexedTables16_keyedEntries)"; sl@0: } sl@0: elsif ($algorithm==5) # IndexedTable32 sl@0: { sl@0: $algorithmAsText='IndexedTable32'; sl@0: my $nameOfNextOneDirectionIndexedTable32='indexedTable32_'.($outputIsUnicode? 'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionIndexedTables32+2); sl@0: my $sourceCodeOfNextOneDirectionIndexedTable32=[]; sl@0: push(@$sourceCodeOfNextOneDirectionIndexedTable32, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SIndexedTable32::SEntry $nameOfNextOneDirectionIndexedTable32\[\]=\n\t\{\n"); sl@0: my $characterCode; sl@0: for ($characterCode=$firstInputCharacterCodeInRange; $characterCode<=$lastInputCharacterCodeInRange; ++$characterCode) sl@0: { sl@0: if (!defined($characterCodes->{$characterCode})) sl@0: { sl@0: die("Error: There is no conversion defined for ".($outputIsUnicode? 'foreign': 'Unicode')." 
character code ".sprintf("0x%08x", $characterCode)."\n"); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionIndexedTable32, "\t\t\{\n\t\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode})."\n\t\t\}"); sl@0: if ($characterCode<$lastInputCharacterCodeInRange) sl@0: { sl@0: push(@$sourceCodeOfNextOneDirectionIndexedTable32, ','); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionIndexedTable32, "\n"); sl@0: delete $characterCodes->{$characterCode}; sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionIndexedTable32, "\t\};\n\n"); sl@0: push(@$sourceCodeOfOneDirectionIndexedTables32, $sourceCodeOfNextOneDirectionIndexedTable32); sl@0: $word1="UData_S$algorithmAsText($nameOfNextOneDirectionIndexedTable32)"; sl@0: } sl@0: elsif ($algorithm==6) # KeyedTable3232 sl@0: { sl@0: $algorithmAsText='KeyedTable3232'; sl@0: my $nameOfNextOneDirectionKeyedTable3232='keyedTable3232_'.($outputIsUnicode? 'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables3232+2); sl@0: my $sourceCodeOfNextOneDirectionKeyedTable3232=[]; sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTable3232, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable3232::SEntry $nameOfNextOneDirectionKeyedTable3232\[\]=\n\t\{\n"); sl@0: my @characterCodes=grep(($_>=$firstInputCharacterCodeInRange) && ($_<=$lastInputCharacterCodeInRange), sort({$a<=>$b} keys(%$characterCodes))); sl@0: if (@characterCodes==0) sl@0: { sl@0: die("Error: There are no ".($outputIsUnicode? 'foreign': 'Unicode').'-to-'.($outputIsUnicode? 'Unicode': 'foreign')." characters to convert using KeyedTable3232 (range ".sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).").\n"); sl@0: } sl@0: if ($characterCodes[0]!=$firstInputCharacterCodeInRange) sl@0: { sl@0: print(STDERR 'Warning: the specified start of the '.($outputIsUnicode? 'foreign': 'Unicode').' 
range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf($formatForInputCharacters, $characterCodes[0])."\n"); sl@0: } sl@0: if ($characterCodes[-1]!=$lastInputCharacterCodeInRange) sl@0: { sl@0: print(STDERR 'Warning: the specified end of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf($formatForInputCharacters, $characterCodes[-1])."\n"); sl@0: } sl@0: my $characterCode; sl@0: foreach $characterCode (@characterCodes) sl@0: { sl@0: if (defined($characterCodes->{$characterCode})) sl@0: { sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTable3232, "\t\t\{\n\t\t".sprintf($formatForInputCharacters, $characterCode).",\n\t\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode})."\n\t\t\}"); sl@0: if ($characterCode<$characterCodes[-1]) sl@0: { sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTable3232, ','); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTable3232, "\n"); sl@0: delete $characterCodes->{$characterCode}; sl@0: } sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTable3232, "\t\};\n\n"); sl@0: push(@$sourceCodeOfOneDirectionKeyedTables3232, $sourceCodeOfNextOneDirectionKeyedTable3232); sl@0: $word1="UData_S$algorithmAsText($nameOfNextOneDirectionKeyedTable3232)"; sl@0: } sl@0: elsif ($algorithm==7) # KeyedTable32OfIndexedTables32 sl@0: { sl@0: $algorithmAsText='KeyedTable32OfIndexedTables32'; sl@0: my $nameOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries='keyedTables32OfIndexedTables32_keyedEntries_'.($outputIsUnicode? 
'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_keyedEntries+2); sl@0: my $sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries=[]; sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, "LOCAL_D const SCnvConversionData::SOneDirectionData::SRange::UData::SKeyedTable32OfIndexedTables32::SKeyedEntry $nameOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries\[\]=\n\t\{\n"); sl@0: my @characterCodes=grep(($_>=$firstInputCharacterCodeInRange) && ($_<=$lastInputCharacterCodeInRange), sort({$a<=>$b} keys(%$characterCodes))); sl@0: if (@characterCodes==0) sl@0: { sl@0: die("Error: There are no ".($outputIsUnicode? 'foreign': 'Unicode').'-to-'.($outputIsUnicode? 'Unicode': 'foreign')." characters to convert using KeyedTable32OfIndexedTables32 (range ".sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).").\n"); sl@0: } sl@0: if ($characterCodes[0]!=$firstInputCharacterCodeInRange) sl@0: { sl@0: print(STDERR 'Warning: the specified start of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf("$formatForInputCharacters", $characterCodes[0])."\n"); sl@0: } sl@0: if ($characterCodes[-1]!=$lastInputCharacterCodeInRange) sl@0: { sl@0: print(STDERR 'Warning: the specified end of the '.($outputIsUnicode? 'foreign': 'Unicode').' range '.sprintf("$formatForInputCharacters-$formatForInputCharacters", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange).' could actually be '.sprintf("$formatForInputCharacters", $characterCodes[-1])."\n"); sl@0: } sl@0: my @characterCodeRanges=(); sl@0: my $minimumNumberOfEntriesPerIndexedTable=($parameters ne '')? 
$parameters: 0; sl@0: my $firstInputCharacterCodeInIndexedTable=$characterCodes[0]; sl@0: my $previousCharacterCode=$firstInputCharacterCodeInIndexedTable; sl@0: my $characterCode; sl@0: foreach $characterCode (@characterCodes) sl@0: { sl@0: ($characterCode>=$previousCharacterCode) or die("Error: internal error 7\n"); sl@0: if ($characterCode>$previousCharacterCode+1) sl@0: { sl@0: if (($previousCharacterCode-$firstInputCharacterCodeInIndexedTable)+1>=$minimumNumberOfEntriesPerIndexedTable) sl@0: { sl@0: push(@characterCodeRanges, [$firstInputCharacterCodeInIndexedTable, $previousCharacterCode]); sl@0: } sl@0: $firstInputCharacterCodeInIndexedTable=$characterCode; sl@0: } sl@0: $previousCharacterCode=$characterCode; sl@0: } sl@0: push(@characterCodeRanges, [$firstInputCharacterCodeInIndexedTable, $previousCharacterCode]); sl@0: @characterCodes=(); sl@0: my $characterCodeRange; sl@0: foreach $characterCodeRange (@characterCodeRanges) sl@0: { sl@0: my $nameOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries='keyedTables32OfIndexedTables32_indexedEntries_'.($outputIsUnicode? 
'foreignToUnicode': 'unicodeToForeign').'_'.($#$sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_indexedEntries+2); sl@0: my $sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries=[]; sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, "LOCAL_D const TUint32 $nameOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries\[\]=\n\t\{\n"); sl@0: my $characterCode; sl@0: my $lastInputCharacterCodeInIndexedTable=$characterCodeRange->[1]; sl@0: for ($characterCode=$characterCodeRange->[0]; $characterCode<=$lastInputCharacterCodeInIndexedTable; ++$characterCode) sl@0: { sl@0: if (!defined($characterCodes->{$characterCode})) sl@0: { sl@0: die("Error: internal error 8\n"); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, "\t".sprintf($formatForOutputCharacters, $characterCodes->{$characterCode})); sl@0: if ($characterCode<$lastInputCharacterCodeInIndexedTable) sl@0: { sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, ','); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, "\n"); sl@0: delete $characterCodes->{$characterCode}; sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, "\t\};\n\n"); sl@0: push(@$sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_indexedEntries, $sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries); sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, "\t\t\{\n\t\t".sprintf($formatForInputCharacters, $characterCodeRange->[0]).",\n\t\t".sprintf($formatForInputCharacters, $characterCodeRange->[1]).",\n\t\t$nameOfNextOneDirectionKeyedTables32OfIndexedTables32_indexedEntries\n\t\t\}"); sl@0: if ($characterCodeRange->[1]<$characterCodeRanges[-1]->[1]) sl@0: { sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, ','); sl@0: } 
sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, "\n"); sl@0: } sl@0: push(@$sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, "\t\};\n\n"); sl@0: push(@$sourceCodeOfOneDirectionKeyedTables32OfIndexedTables32_keyedEntries, $sourceCodeOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries); sl@0: $word1="UData_S$algorithmAsText($nameOfNextOneDirectionKeyedTables32OfIndexedTables32_keyedEntries)"; sl@0: } sl@0: else sl@0: { sl@0: die("Error: internal error 9\n"); sl@0: } sl@0: push(@$sourceCodeOfTopLevelStructures, "\t\t\{\n\t\t".sprintf($formatForInputCharacters, $firstInputCharacterCodeInRange).",\n\t\t".sprintf($formatForInputCharacters, $lastInputCharacterCodeInRange).",\n\t\tSCnvConversionData::SOneDirectionData::SRange::E$algorithmAsText,\n\t\t".$sizeOfOutputCharacterCodeInBytesIfForeign.",\n\t\t0,\n\t\t\t\{\n\t\t\t".$word1."\n\t\t\t\}\n\t\t\}"); sl@0: if ($i<$indexOfLastRange) sl@0: { sl@0: push(@$sourceCodeOfTopLevelStructures, ','); sl@0: } sl@0: push(@$sourceCodeOfTopLevelStructures, "\n"); sl@0: } sl@0: my @characterCodes=sort({$a<=>$b} keys(%$characterCodes)); sl@0: if (@characterCodes>0) sl@0: { sl@0: die('The following '.($outputIsUnicode? 'foreign': 'Unicode').' 
characters have no conversion algorithm specified: ['.join(', ', map(sprintf($formatForInputCharacters, $_), @characterCodes))."\]\n"); sl@0: } sl@0: push(@$sourceCodeOfTopLevelStructures, "\t\};\n\n"); sl@0: } sl@0: sl@0: sub writeSourceCodeFinalStuff sl@0: { sl@0: my $fileHandle=shift; sl@0: my $sourceCodeOfForeignToUnicodeIndexedTables16=shift; sl@0: my $sourceCodeOfForeignToUnicodeKeyedTables1616=shift; sl@0: my $sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_indexedEntries=shift; sl@0: my $sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_keyedEntries=shift; sl@0: my $sourceCodeOfUnicodeToForeignIndexedTables16=shift; sl@0: my $sourceCodeOfUnicodeToForeignKeyedTables1616=shift; sl@0: my $sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_indexedEntries=shift; sl@0: my $sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_keyedEntries=shift; sl@0: sl@0: my $sourceCodeOfForeignToUnicodeIndexedTables32=shift; sl@0: my $sourceCodeOfForeignToUnicodeKeyedTables3232=shift; sl@0: my $sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_indexedEntries=shift; sl@0: my $sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_keyedEntries=shift; sl@0: my $sourceCodeOfUnicodeToForeignIndexedTables32=shift; sl@0: my $sourceCodeOfUnicodeToForeignKeyedTables3232=shift; sl@0: my $sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_indexedEntries=shift; sl@0: my $sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_keyedEntries=shift; sl@0: sl@0: my $sourceCodeOfTopLevelStructures=shift; sl@0: my $endiannessAsText=shift; sl@0: my $additionalSubsetTables=shift; sl@0: my $sourceCodeChunk; sl@0: my $arrayOfSourceCodeChunks; sl@0: sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeIndexedTables16) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks 
(@$sourceCodeOfForeignToUnicodeKeyedTables1616) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_indexedEntries) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeKeyedTables16OfIndexedTables16_keyedEntries) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignIndexedTables16) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables1616) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_indexedEntries) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables16OfIndexedTables16_keyedEntries) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: # for 32 bit encoding begin sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeIndexedTables32) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeKeyedTables3232) sl@0: { sl@0: foreach 
$sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_indexedEntries) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfForeignToUnicodeKeyedTables32OfIndexedTables32_keyedEntries) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignIndexedTables32) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables3232) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_indexedEntries) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: foreach $arrayOfSourceCodeChunks (@$sourceCodeOfUnicodeToForeignKeyedTables32OfIndexedTables32_keyedEntries) sl@0: { sl@0: foreach $sourceCodeChunk (@$arrayOfSourceCodeChunks) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: } sl@0: # for 32 bit encoding end sl@0: foreach $sourceCodeChunk (@$sourceCodeOfTopLevelStructures) sl@0: { sl@0: print($fileHandle $sourceCodeChunk); sl@0: } sl@0: sl@0: print($fileHandle "GLDEF_D const SCnvConversionData 
conversionData=\n\t\{\n\tSCnvConversionData::E$endiannessAsText,\n\t\t\{\n\t\tARRAY_LENGTH(foreignVariableByteDataRanges),\n\t\tforeignVariableByteDataRanges\n\t\t\},\n\t\t\{\n\t\tARRAY_LENGTH(foreignToUnicodeDataRanges),\n\t\tforeignToUnicodeDataRanges\n\t\t\},\n\t\t\{\n\t\tARRAY_LENGTH(unicodeToForeignDataRanges),\n\t\tunicodeToForeignDataRanges\n\t\t\},\n\tNULL,\n\tNULL\n\t\};\n\n"); sl@0: sl@0: my $additionalSubsetTableName; sl@0: my $additionalSubsetTableData; sl@0: while (($additionalSubsetTableName, $additionalSubsetTableData)=each(%$additionalSubsetTables)) sl@0: { sl@0: (defined($additionalSubsetTableData->[0]) && defined($additionalSubsetTableData->[1]) && defined($additionalSubsetTableData->[2]) && defined($additionalSubsetTableData->[3])) or die("Error: incomplete definition of \"$additionalSubsetTableName\"\n"); sl@0: print($fileHandle "GLREF_D const SCnvConversionData $additionalSubsetTableName;\n"); sl@0: print($fileHandle "GLDEF_D const SCnvConversionData $additionalSubsetTableName=\n\t\{\n\tSCnvConversionData::E$endiannessAsText,\n\t\t\{\n\t\tARRAY_LENGTH(foreignVariableByteDataRanges),\n\t\tforeignVariableByteDataRanges\n\t\t\},\n\t\t\{\n\t\t$additionalSubsetTableData->[1]-$additionalSubsetTableData->[0],\n\t\tforeignToUnicodeDataRanges+$additionalSubsetTableData->[0]\n\t\t\},\n\t\t\{\n\t\t$additionalSubsetTableData->[3]-$additionalSubsetTableData->[2],\n\t\tunicodeToForeignDataRanges+$additionalSubsetTableData->[2]\n\t\t\}\n\t\};\n\n"); sl@0: } sl@0: }

# Writes the header of a binary conversion-data file.
#
# Arguments (positional):
#   $fileHandle - output handle, passed straight through to the write* helpers
#   $uid        - second value handed to writeUids
#   $endianness - numeric endianness code, emitted as one byte
#   $replacementForUnconvertibleUnicodeCharacters - string emitted after a
#                 one-byte length prefix
#
# NOTE(review): the length prefix is emitted with write8, so the replacement
# string presumably has to be shorter than 256 bytes - confirm against write8.
sub writeBinaryHeader
{
	my ($fileHandle, $uid, $endianness, $replacementForUnconvertibleUnicodeCharacters)=@_;
	&writeUids($fileHandle, 0x100011bd, $uid, 0);
	&write32($fileHandle, 1); # version number of the file format
	&write32($fileHandle, 0); # not currently used
	&write8($fileHandle, 0); # number of Unicode characters in the name (which is now derived from the file-name, hence why this is zero)
	&write8($fileHandle, $endianness);
	&write8($fileHandle, length($replacementForUnconvertibleUnicodeCharacters));
	&writeString($fileHandle, $replacementForUnconvertibleUnicodeCharacters);
}

# Writes the foreign variable-byte table: a compacted count followed by three
# bytes per range (first initial byte, last initial byte, number of subsequent
# bytes).
#
# Arguments (positional):
#   $fileHandle              - output handle
#   $foreignVariableByteData - reference to an array of 3-element array
#                              references [first, last, numberOfSubsequentBytes]
#
# Dies with "internal error 10" if a range does not have exactly three
# elements and with "internal error 11" if last < first.
sub writeBinaryForeignVariableByteData
{
	my ($fileHandle, $foreignVariableByteData)=@_;
	&writePositiveIntegerCompacted30($fileHandle, scalar(@$foreignVariableByteData));
	foreach my $rangeData (@$foreignVariableByteData)
	{
		if (@$rangeData!=3)
		{
			die("Error: internal error 10\n");
		}
		my ($firstInitialByteValueInRange, $lastInitialByteValueInRange, $numberOfSubsequentBytes)=@$rangeData;
		if ($lastInitialByteValueInRange<$firstInitialByteValueInRange)
		{
			die("Error: internal error 11\n");
		}
		&write8($fileHandle, $firstInitialByteValueInRange);
		&write8($fileHandle, $lastInitialByteValueInRange);
		&write8($fileHandle, $numberOfSubsequentBytes);
	}
}

# Writes the conversion ranges for one direction (foreign->Unicode or
# Unicode->foreign) in binary form, validating each range against the
# character-code map as it goes.
#
# Arguments (positional):
#   $fileHandle       - output handle
#   $oneDirectionData - reference to an array of range descriptions; each is an
#                       array reference holding $includePriority,
#                       $searchPriority, $firstInputCharacterCodeInRange,
#                       $lastInputCharacterCodeInRange, $algorithm
#                       [, $sizeOfOutputCharacterCodeInBytes], $parameters
#                       (6 elements when the output is Unicode, 7 otherwise)
#   $characterCodes   - reference to a hash mapping input character code to
#                       output character code; entries are DELETED from the
#                       caller's hash as the ranges consume them
#   $outputIsUnicode  - true when converting foreign->Unicode
#
# Dies if a range is malformed, if a range's algorithm does not fit the
# mappings it covers, or if any character code is left over that no range
# claimed.
sub writeBinaryOneDirectionData
{
	my ($fileHandle, $oneDirectionData, $characterCodes, $outputIsUnicode)=@_;
	# Names of the two character sets as they appear in diagnostics.
	my $inputKind=$outputIsUnicode? 'foreign': 'Unicode';
	my $outputKind=$outputIsUnicode? 'Unicode': 'foreign';
	my $expectedNumberOfFields=$outputIsUnicode? 6: 7;
	&writePositiveIntegerCompacted30($fileHandle, scalar(@$oneDirectionData));
	foreach my $rangeData (@$oneDirectionData)
	{
		if (scalar(@$rangeData)!=$expectedNumberOfFields)
		{
			die("Error: internal error 12\n");
		}
		my $firstInputCharacterCodeInRange=$rangeData->[2];
		my $lastInputCharacterCodeInRange=$rangeData->[3];
		if ($lastInputCharacterCodeInRange<$firstInputCharacterCodeInRange)
		{
			die("Error: internal error 13\n");
		}
		&writePositiveIntegerCompacted30($fileHandle, $firstInputCharacterCodeInRange);
		&writePositiveIntegerCompacted30($fileHandle, $lastInputCharacterCodeInRange);
		my $algorithm=$rangeData->[4];
		&write8($fileHandle, $algorithm);
		if (!$outputIsUnicode)
		{
			&write8($fileHandle, $rangeData->[5]); # sizeOfOutputCharacterCodeInBytesIfForeign
		}
		if ($algorithm==0) # Direct
		{
			# Every code in the range must map to itself; nothing extra is written.
			foreach my $characterCode ($firstInputCharacterCodeInRange..$lastInputCharacterCodeInRange)
			{
				if (!defined($characterCodes->{$characterCode}))
				{
					die("Error: There is no conversion defined for ".$inputKind." character code ".sprintf("0x%08x", $characterCode)."\n");
				}
				if ($characterCodes->{$characterCode}!=$characterCode)
				{
					die("Error: the conversion from ".$inputKind." character code ".sprintf("0x%08x", $characterCode)." to ".$outputKind." character code ".sprintf("0x%08x", $characterCodes->{$characterCode})." is not a direct conversion\n");
				}
				delete $characterCodes->{$characterCode};
			}
		}
		elsif ($algorithm==1) # Offset
		{
			# The first code defines the offset, so it must have a mapping too;
			# without this check a missing mapping would silently yield an
			# offset of -$firstInputCharacterCodeInRange.
			if (!defined($characterCodes->{$firstInputCharacterCodeInRange}))
			{
				die("Error: There is no conversion defined for ".$inputKind." character code ".sprintf("0x%08x (0x%08x-0x%08x)", $firstInputCharacterCodeInRange, $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange)."\n");
			}
			my $offset=$characterCodes->{$firstInputCharacterCodeInRange}-$firstInputCharacterCodeInRange;
			delete $characterCodes->{$firstInputCharacterCodeInRange};
			foreach my $characterCode ($firstInputCharacterCodeInRange+1..$lastInputCharacterCodeInRange)
			{
				if (!defined($characterCodes->{$characterCode}))
				{
					die("Error: There is no conversion defined for ".$inputKind." character code ".sprintf("0x%08x (0x%08x-0x%08x)", $characterCode, $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange)."\n");
				}
				if ($characterCodes->{$characterCode}-$characterCode!=$offset)
				{
					die("Error: the conversion from ".$inputKind." character code ".sprintf("0x%08x", $characterCode)." to ".$outputKind." character code ".sprintf("0x%08x", $characterCodes->{$characterCode})." has a different offset from the previous one in the range\n");
				}
				delete $characterCodes->{$characterCode};
			}
			&writeSignedIntegerCompacted29($fileHandle, $offset);
		}
		elsif ($algorithm==2) # IndexedTable16
		{
			# One 16-bit output value per input code, with no gaps allowed.
			foreach my $characterCode ($firstInputCharacterCodeInRange..$lastInputCharacterCodeInRange)
			{
				if (!defined($characterCodes->{$characterCode}))
				{
					die("Error: There is no conversion defined for ".$inputKind." character code ".sprintf("0x%08x", $characterCode)."\n");
				}
				&write16($fileHandle, $characterCodes->{$characterCode});
				delete $characterCodes->{$characterCode};
			}
		}
		elsif ($algorithm==3) # KeyedTable1616
		{
			# Collect the (key, value) pairs that exist in the range; gaps are allowed.
			my @table=();
			foreach my $characterCode ($firstInputCharacterCodeInRange..$lastInputCharacterCodeInRange)
			{
				if (defined($characterCodes->{$characterCode}))
				{
					push(@table, [$characterCode, $characterCodes->{$characterCode}]);
					delete $characterCodes->{$characterCode};
				}
			}
			&writePositiveIntegerCompacted30($fileHandle, scalar(@table));
			# The first key is never written (it is implied by the start of the
			# range), so the range must begin with a mapped code.  An empty
			# table is rejected explicitly rather than by comparing undef.
			if ((@table==0) || ($table[0][0]!=$firstInputCharacterCodeInRange))
			{
				die("Error: no conversion is specified for the first ".$inputKind." character code in the KeyedTable1616 range ".sprintf("0x%08x to 0x%08x", $firstInputCharacterCodeInRange, $lastInputCharacterCodeInRange)."\n");
			}
			my $lastKey;
			foreach my $pair (@table)
			{
				my $key=$pair->[0];
				if (defined($lastKey))
				{
					# Subsequent keys are stored as deltas from the previous key.
					if ($key<=$lastKey)
					{
						die("Error: internal error 14\n");
					}
					&writePositiveIntegerCompacted15($fileHandle, $key-$lastKey);
				}
				&write16($fileHandle, $pair->[1]);
				$lastKey=$key;
			}
		}
		elsif ($algorithm==4) # KeyedTable16OfIndexedTables16
		{
			die("Error: \"KeyedTable16OfIndexedTables16\" is only supported if generating source code\n");
		}
		else
		{
			die("Error: internal error 15\n");
		}
	}
	# Anything still in the hash was not covered by any range.
	my @characterCodes=sort({$a<=>$b} keys(%$characterCodes));
	if (@characterCodes>0)
	{
		die('The following '.$inputKind.' characters have no conversion algorithm specified: ['.join(', ', map({sprintf('0x%x', $_)} @characterCodes))."]\n");
	}
}