os/textandloc/charconvfw/fatfilenameconversionplugins/group/cp54936_allbmp_fromunicode.pl
1.1 --- /dev/null Thu Jan 01 00:00:00 1970 +0000
1.2 +++ b/os/textandloc/charconvfw/fatfilenameconversionplugins/group/cp54936_allbmp_fromunicode.pl Fri Jun 15 03:10:57 2012 +0200
1.3 @@ -0,0 +1,154 @@
1.4 +#
1.5 +# Copyright (c) 2008-2009 Nokia Corporation and/or its subsidiary(-ies).
1.6 +# All rights reserved.
1.7 +# This component and the accompanying materials are made available
1.8 +# under the terms of "Eclipse Public License v1.0"
1.9 +# which accompanies this distribution, and is available
1.10 +# at the URL "http://www.eclipse.org/legal/epl-v10.html".
1.11 +#
1.12 +# Initial Contributors:
1.13 +# Nokia Corporation - initial contribution.
1.14 +#
1.15 +# Contributors:
1.16 +#
1.17 +# Description:
1.18 +# See line 99 of this file.
1.19 +#
1.20 +
1.21 +if (@ARGV != 2 && @ARGV != 3)
1.22 + {
1.23 + print <<EOD;
1.24 +Usage: cp54936_allbmp_fromunicode.pl cp54936_2byte.txt cp54936_4byte.txt cp54936_allbmp_fromunicode.cpp
1.25 +EOD
1.26 + exit(1);
1.27 + }
1.28 +
1.29 +my $root = "cp54936_allbmp_fromunicode.cpp";
1.30 +if (@ARGV == 3)
1.31 + {
1.32 + $root = $ARGV[3];
1.33 + }
1.34 +
1.35 +
1.36 +my %lines; # the hash table to hold all characters with key=unicode(dec) and value=foreign(string)
1.37 +
1.38 +
1.39 +# read 2 byte input file
1.40 +open (IN2, "<$ARGV[0]") or die ("Error: $ARGV[0] $!");
1.41 +my $lineNumber = 0;
1.42 +my $acceptLineNumber = 0;
1.43 +while (!eof(IN2))
1.44 + {
1.45 + my $line = <IN2>;
1.46 + $lineNumber++;
1.47 + if ($line =~ /^(0[xX][\da-fA-F]{1,4})\s*(0[xX][\da-fA-F]{1,4}).*/)
1.48 + {
1.49 + $acceptLineNumber++;
1.50 + my $foreign = $1;
1.51 + my $unicode = hex($2);
1.52 + if (exists ($lines{$unicode}))
1.53 + {
1.54 + print "ERROR: Unicode $unicode is reused by $lines{$unicode} and $foreign.\n";
1.55 + exit(1);
1.56 + }
1.57 + $lines{$unicode} = $foreign;
1.58 + }
1.59 + else
1.60 + {
1.61 + #print "Ignore line: $line";
1.62 + }
1.63 + }
1.64 +close IN2;
1.65 +print "\nRead $ARGV[0] done.\n";
1.66 +print "$acceptLineNumber of $lineNumber lines accepted.\n\n";
1.67 +
1.68 +
1.69 +# read 4 byte input file
1.70 +open (IN4, "<$ARGV[1]") or die ("Error: $ARGV[1] $!");
1.71 +$lineNumber = 0;
1.72 +$acceptLineNumber = 0;
1.73 +while (!eof(IN4))
1.74 + {
1.75 + my $line = <IN4>;
1.76 + $lineNumber++;
1.77 + if ($line =~ /^(0[xX]8[1-4]3\d[\da-fA-F]{2}3\d)\s*(0[xX][\da-fA-F]{4}).*/)
1.78 + {
1.79 + $acceptLineNumber++;
1.80 + my $foreign = $1;
1.81 + my $unicode = hex($2);
1.82 + if (exists ($lines{$unicode}))
1.83 + {
1.84 + print "ERROR: Unicode $unicode is reused by $lines{$unicode} and $foreign.\n";
1.85 + exit(1);
1.86 + }
1.87 + $lines{$unicode} = $foreign;
1.88 + }
1.89 + else
1.90 + {
1.91 + #print "Ignore line: $line";
1.92 + }
1.93 + }
1.94 +close IN4;
1.95 +print "Read $ARGV[1] done.\n";
1.96 +print "$acceptLineNumber of $lineNumber lines accepted.\n\n";
1.97 +
1.98 +
1.99 +# write to output file
1.100 +print "Write to $root...\n";
1.101 +open (CPP, ">$root") or die ("Error: Can't open cpp file");
1.102 +print CPP <<EOD;
1.103 +// Copyright (c) 2008-2009 Nokia Corporation and/or its subsidiary(-ies).
1.104 +// All rights reserved.
1.105 +// This component and the accompanying materials are made available
1.106 +// under the terms of the License "Eclipse Public License v1.0"
1.107 +// which accompanies this distribution, and is available
1.108 +// at the URL "http://www.eclipse.org/legal/epl-v10.html".
1.109 +//
1.110 +// Initial Contributors:
1.111 +// Nokia Corporation - initial contribution.
1.112 +//
1.113 +// Contributors:
1.114 +//
1.115 +// Description:
1.116 +//
1.117 +// Generated by the cp54936_allbmp_fromunicode.pl tool - Do not edit!!!
1.118 +// Generated with \"perl -w ..\\group\\cp54936_allbmp_fromunicode.pl cp54936_2byte.txt cp54936_4byte.txt\".
1.119 +//
1.120 +
1.121 +#include <e32std.h>
1.122 +#include <e32def.h>
1.123 +#include "cp54936.h"
1.124 +
1.125 +const TUint8 KForeignReplacement = 0x5F;
1.126 +
1.127 +EOD
1.128 +print CPP "const TUint32 KMappingTableUnicodeBmp2CP54936\[65536\] = \n";
1.129 +print CPP "\t\{\n\t";
1.130 +
1.131 +my $bytecount = 0;
1.132 +my $expectUnicode = 0;
1.133 +while ($expectUnicode <= 0xFFFF)
1.134 + {
1.135 + if (exists ($lines{$expectUnicode}))
1.136 + {
1.137 + print CPP "$lines{$expectUnicode}, ";
1.138 + }
1.139 + else
1.140 + {
1.141 + print CPP "KForeignReplacement, ";
1.142 + }
1.143 + $bytecount += 4;
1.144 + $expectUnicode++;
1.145 + if (($expectUnicode % 16) == 0)
1.146 + {
1.147 + print CPP sprintf("// %04X - %04X\n\t", $expectUnicode-16, $expectUnicode-1);
1.148 + }
1.149 + }
1.150 +print CPP "};\t";
1.151 +
1.152 +$bytecount += 8;
1.153 +print CPP "// total byte count = $bytecount\n";
1.154 +print "\nTotal byte count: $bytecount.\n";
1.155 +close CPP;
1.156 +
1.157 +print "\nDone.";