os/textandloc/charconvfw/fatfilenameconversionplugins/group/cp54936_allbmp_fromunicode.pl
author sl@SLION-WIN7.fritz.box
Fri, 15 Jun 2012 03:10:57 +0200
changeset 0 bde4ae8d615e
permissions -rw-r--r--
First public contribution.
sl@0
     1
#
sl@0
     2
# Copyright (c) 2008-2009 Nokia Corporation and/or its subsidiary(-ies).
sl@0
     3
# All rights reserved.
sl@0
     4
# This component and the accompanying materials are made available
sl@0
     5
# under the terms of "Eclipse Public License v1.0"
sl@0
     6
# which accompanies this distribution, and is available
sl@0
     7
# at the URL "http://www.eclipse.org/legal/epl-v10.html".
sl@0
     8
#
sl@0
     9
# Initial Contributors:
sl@0
    10
# Nokia Corporation - initial contribution.
sl@0
    11
#
sl@0
    12
# Contributors:
sl@0
    13
#
sl@0
    14
# Description: 
sl@0
    15
# See line 99 of this file.
sl@0
    16
#
sl@0
    17
sl@0
    18
if (@ARGV != 2 && @ARGV != 3)
sl@0
    19
	{
sl@0
    20
	print <<EOD;
sl@0
    21
Usage: cp54936_allbmp_fromunicode.pl cp54936_2byte.txt cp54936_4byte.txt cp54936_allbmp_fromunicode.cpp
sl@0
    22
EOD
sl@0
    23
	exit(1);
sl@0
    24
	}
sl@0
    25
sl@0
    26
my $root = "cp54936_allbmp_fromunicode.cpp";
sl@0
    27
if (@ARGV == 3)
sl@0
    28
	{
sl@0
    29
	$root = $ARGV[3];
sl@0
    30
	}
sl@0
    31
sl@0
    32
sl@0
    33
my %lines;	# the hash table to hold all characters with key=unicode(dec) and value=foreign(string)
sl@0
    34
sl@0
    35
sl@0
    36
# read 2 byte input file
sl@0
    37
open (IN2, "<$ARGV[0]") or die ("Error: $ARGV[0] $!");
sl@0
    38
my $lineNumber = 0;
sl@0
    39
my $acceptLineNumber = 0;
sl@0
    40
while (!eof(IN2))
sl@0
    41
	{
sl@0
    42
	my $line = <IN2>;
sl@0
    43
	$lineNumber++;
sl@0
    44
	if ($line =~ /^(0[xX][\da-fA-F]{1,4})\s*(0[xX][\da-fA-F]{1,4}).*/)
sl@0
    45
		{
sl@0
    46
		$acceptLineNumber++;
sl@0
    47
		my $foreign = $1;
sl@0
    48
		my $unicode = hex($2);
sl@0
    49
		if (exists ($lines{$unicode}))
sl@0
    50
			{
sl@0
    51
			print "ERROR: Unicode $unicode is reused by $lines{$unicode} and $foreign.\n";
sl@0
    52
			exit(1);
sl@0
    53
			}
sl@0
    54
		$lines{$unicode} = $foreign;
sl@0
    55
		}
sl@0
    56
	else
sl@0
    57
		{
sl@0
    58
		#print "Ignore line: $line";
sl@0
    59
		}
sl@0
    60
	}
sl@0
    61
close IN2;
sl@0
    62
print "\nRead $ARGV[0] done.\n";
sl@0
    63
print "$acceptLineNumber of $lineNumber lines accepted.\n\n";
sl@0
    64
sl@0
    65
sl@0
    66
# read 4 byte input file
sl@0
    67
open (IN4, "<$ARGV[1]") or die ("Error: $ARGV[1] $!");
sl@0
    68
$lineNumber = 0;
sl@0
    69
$acceptLineNumber = 0;
sl@0
    70
while (!eof(IN4))
sl@0
    71
	{
sl@0
    72
	my $line = <IN4>;
sl@0
    73
	$lineNumber++;
sl@0
    74
	if ($line =~ /^(0[xX]8[1-4]3\d[\da-fA-F]{2}3\d)\s*(0[xX][\da-fA-F]{4}).*/)
sl@0
    75
		{
sl@0
    76
		$acceptLineNumber++;
sl@0
    77
		my $foreign = $1;
sl@0
    78
		my $unicode = hex($2);
sl@0
    79
		if (exists ($lines{$unicode}))
sl@0
    80
			{
sl@0
    81
			print "ERROR: Unicode $unicode is reused by $lines{$unicode} and $foreign.\n";
sl@0
    82
			exit(1);
sl@0
    83
			}
sl@0
    84
		$lines{$unicode} = $foreign;
sl@0
    85
		}
sl@0
    86
	else
sl@0
    87
		{
sl@0
    88
		#print "Ignore line: $line";
sl@0
    89
		}
sl@0
    90
	}
sl@0
    91
close IN4;
sl@0
    92
print "Read $ARGV[1] done.\n";
sl@0
    93
print "$acceptLineNumber of $lineNumber lines accepted.\n\n";
sl@0
    94
sl@0
    95
sl@0
    96
# write to output file
sl@0
    97
print "Write to $root...\n";
sl@0
    98
open (CPP, ">$root") or die ("Error: Can't open cpp file");
sl@0
    99
print CPP <<EOD;
sl@0
   100
// Copyright (c) 2008-2009 Nokia Corporation and/or its subsidiary(-ies).
sl@0
   101
// All rights reserved.
sl@0
   102
// This component and the accompanying materials are made available
sl@0
   103
// under the terms of the License "Eclipse Public License v1.0"
sl@0
   104
// which accompanies this distribution, and is available
sl@0
   105
// at the URL "http://www.eclipse.org/legal/epl-v10.html".
sl@0
   106
//
sl@0
   107
// Initial Contributors:
sl@0
   108
// Nokia Corporation - initial contribution.
sl@0
   109
//
sl@0
   110
// Contributors:
sl@0
   111
//
sl@0
   112
// Description:
sl@0
   113
//
sl@0
   114
// Generated by the cp54936_allbmp_fromunicode.pl tool - Do not edit!!!
sl@0
   115
// Generated with \"perl -w ..\\group\\cp54936_allbmp_fromunicode.pl cp54936_2byte.txt cp54936_4byte.txt\".
sl@0
   116
//
sl@0
   117
sl@0
   118
#include <e32std.h>
sl@0
   119
#include <e32def.h>
sl@0
   120
#include "cp54936.h"
sl@0
   121
sl@0
   122
const TUint8 KForeignReplacement = 0x5F;
sl@0
   123
sl@0
   124
EOD
sl@0
   125
print CPP "const TUint32 KMappingTableUnicodeBmp2CP54936\[65536\] = \n";
sl@0
   126
print CPP "\t\{\n\t";
sl@0
   127
sl@0
   128
my $bytecount = 0;
sl@0
   129
my $expectUnicode = 0;
sl@0
   130
while ($expectUnicode <= 0xFFFF)
sl@0
   131
	{
sl@0
   132
	if (exists ($lines{$expectUnicode}))
sl@0
   133
		{
sl@0
   134
		print CPP "$lines{$expectUnicode}, ";
sl@0
   135
		}
sl@0
   136
	else
sl@0
   137
		{
sl@0
   138
		print CPP "KForeignReplacement, ";
sl@0
   139
		}
sl@0
   140
	$bytecount += 4;
sl@0
   141
	$expectUnicode++;
sl@0
   142
	if (($expectUnicode % 16) == 0)
sl@0
   143
		{
sl@0
   144
		print CPP sprintf("// %04X - %04X\n\t", $expectUnicode-16, $expectUnicode-1);
sl@0
   145
		}
sl@0
   146
	}
sl@0
   147
print CPP "};\t";
sl@0
   148
sl@0
   149
$bytecount += 8;
sl@0
   150
print CPP "// total byte count = $bytecount\n";
sl@0
   151
print "\nTotal byte count: $bytecount.\n";
sl@0
   152
close CPP;
sl@0
   153
sl@0
   154
print "\nDone.";