mirror of
https://github.com/mozilla/gecko-dev.git
synced 2024-12-06 12:43:53 +00:00
fd06eca99b
Tools written by Anthony (anthony@thizlinux.com) to generate the new conversion table for hkscs. Not part of the build, just put here for future reference.
93 lines
2.6 KiB
Perl
93 lines
2.6 KiB
Perl
#!/usr/bin/perl
|
|
# parse-mozilla-encoding-table.pl, version 0.6
|
|
#
|
|
# Script to deassemble existing Mozilla *.uf or *.ut files
|
|
# back to source conversion tables.
|
|
# by Anthony Fok <anthony@thizlinux.com>, ThizLinux Laboratory Ltd., 2002/11/27
|
|
# License: GNU General Public License, version 2 or newer
|
|
#
|
|
# Used for verifying HKSCS-1999 hkscs.uf and hkscs.ut so that I can make
|
|
# new ones for HKSCS-2001. This script is quick-and-dirty and not very
|
|
# robust, so if the debug output of fromu/tou ever changes, this script
|
|
# will need to be modified too. :-)
|
|
|
|
my %data = ();
|
|
my $mappingPos = 0;
|
|
my $filename = shift;
|
|
my $mode;
|
|
if ($filename =~ /\.(ut|uf)$/) {
|
|
print $filename, "\n";
|
|
$mode = $1;
|
|
} else {
|
|
die;
|
|
}
|
|
|
|
open(INFILE, "<$filename") or die;
|
|
|
|
# Quick-and-dirty routine to populate %data
|
|
while (<INFILE>) {
|
|
if (/^Begin of Item ([[:xdigit:]]+)/) {
|
|
die if defined($itemId) and hex($itemId) + 1 != hex($1);
|
|
$itemId = $1;
|
|
<INFILE> =~ /Format ([012])/ or die;
|
|
$format = $1;
|
|
<INFILE> =~ /srcBegin = ([[:xdigit:]]+)/ or die;
|
|
$srcBegin = $1;
|
|
|
|
if ($format == 0) { # Range
|
|
<INFILE> =~ /srcEnd = ([[:xdigit:]]+)/ or die;
|
|
$srcEnd = $1;
|
|
<INFILE> =~ /destBegin = ([[:xdigit:]]+)/ or die;
|
|
$destBegin = $1;
|
|
|
|
for ($i = hex($srcBegin); $i <= hex($srcEnd); $i++) {
|
|
$data{sprintf("%04X",$i)} = sprintf("%04X",
|
|
hex($destBegin) + $i - hex($srcBegin));
|
|
}
|
|
|
|
<INFILE> =~ /^End of Item $itemId\s*$/ or die;
|
|
}
|
|
elsif ($format == 1) { # Mapping
|
|
<INFILE> =~ /srcEnd = ([[:xdigit:]]+)/ or die;
|
|
$srcEnd = $1;
|
|
<INFILE> =~ /mappingOffset = ([[:xdigit:]]+)/ or die;
|
|
$mappingOffset = hex($1);
|
|
die unless $mappingOffset == $mappingPos;
|
|
<INFILE> =~ /Mapping =\s*$/ or die;
|
|
until ($_ = <INFILE>, /^End of Item/) {
|
|
chop;
|
|
for $i (split ' ') {
|
|
$key = sprintf("%04X", hex($srcBegin) - $mappingOffset + $mappingPos++);
|
|
next if $i eq "FFFD";
|
|
if (defined($data{$key})) {
|
|
print "Error: doubly defined. $key was $data{$key}, and now $i.\n";
|
|
} else {
|
|
$data{$key} = $i;
|
|
}
|
|
}
|
|
}
|
|
die unless $mappingPos - $mappingOffset == hex($srcEnd) - hex($srcBegin) + 1;
|
|
/^End of Item $itemId\s*$/ or die;
|
|
}
|
|
else { # Single ($format == 2)
|
|
<INFILE> =~ /destBegin = ([[:xdigit:]]+)/ or die;
|
|
$destBegin = $1;
|
|
$data{$srcBegin} = $destBegin;
|
|
<INFILE> =~ /^End of Item $itemId\s*$/ or die;
|
|
}
|
|
}
|
|
}
|
|
|
|
# Generate conversion table
|
|
for $key (sort keys %data) {
|
|
if ($mode eq "ut") {
|
|
print "0x$key\t0x$data{$key}\n";
|
|
} elsif ($mode eq "uf") {
|
|
print "0x$data{$key}\t0x$key\n";
|
|
} else {
|
|
die;
|
|
}
|
|
}
|
|
|
|
close INFILE;
|