summaryrefslogtreecommitdiffstats
path: root/intl/uconv/tools/cp936tocdx.pl
diff options
context:
space:
mode:
Diffstat (limited to 'intl/uconv/tools/cp936tocdx.pl')
-rw-r--r--intl/uconv/tools/cp936tocdx.pl133
1 files changed, 133 insertions, 0 deletions
diff --git a/intl/uconv/tools/cp936tocdx.pl b/intl/uconv/tools/cp936tocdx.pl
new file mode 100644
index 000000000..b85972b04
--- /dev/null
+++ b/intl/uconv/tools/cp936tocdx.pl
@@ -0,0 +1,133 @@
+#!/user/local/bin/perl
+# -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*-
+#
+# This Source Code Form is subject to the terms of the Mozilla Public
+# License, v. 2.0. If a copy of the MPL was not distributed with this
+# file, You can obtain one at http://mozilla.org/MPL/2.0/.
+$rowwidth = ((0xff - 0x80)+(0x7f - 0x40));
+sub cp936tonum()
+{
+ my($cp936) = (@_);
+ my($first,$second,$jnum);
+ $first = hex(substr($cp936,2,2));
+ $second = hex(substr($cp936,4,2));
+ $jnum = ($first - 0x81 ) * $rowwidth;
+ if($second >= 0x80)
+ {
+ $jnum += $second - 0x80 + (0x7f-0x40);
+ }
+ else
+ {
+ $jnum += $second - 0x40;
+ }
+ return $jnum;
+}
+
+@map = {};
+sub readtable()
+{
+open(CP936, "<gbkcommon.txt") || die "cannot open gbkcommon.txt";
+while(<CP936>)
+{
+ if(! /^#/) {
+ chop();
+ ($j, $u, $r) = split(/\t/,$_);
+ if(length($j) > 4)
+ {
+ $n = &cp936tonum($j);
+ $map{$n} = $u;
+ }
+ }
+}
+}
+
+
+sub printtable()
+{
+ for($i=0;$i<126;$i++)
+ {
+ printf ( "/* 0x%2XXX */\n", ( $i + 0x81));
+ for($j=0;$j<(0x7f-0x40);$j++)
+ {
+ if("" eq ($map{($i * $rowwidth + $j)}))
+ {
+ printf "0xFFFD,"
+ }
+ else
+ {
+ printf $map{($i * $rowwidth + $j)} . ",";
+ }
+ if( 0 == (($j + 1) % 8))
+ {
+ printf "/* 0x%2X%1X%1X*/\n", $i+0x81, 4+($j/16), (7==($j%16))?0:8;
+ }
+ }
+
+ print "0xFFFD,";
+
+ printf "/* 0x%2X%1X%1X*/\n", $i+0x81, 4+($j/16),(7==($j%16))?0:8;
+ for($j=0;$j < (0xff-0x80);$j++)
+ {
+ if("" eq ($map{($i * $rowwidth + $j + 0x3f)})) # user defined chars map to 0xFFFD
+ {
+
+ if ( ( $i == 125 ) and ( $j == (0xff - 0x80 - 1 )))
+ {
+ printf "0xFFFD"; #has no ',' followed last item
+ }
+ else
+ {
+ printf "0xFFFD,";
+ }
+ }
+ else
+ {
+ if ( ( $i == 125 ) and ( $j == (0xff - 0x80 - 1 )))
+ {
+ printf $map{($i * $rowwidth + $j + 0x3f)}; #has no ',' followed last item
+ }
+ else
+ {
+ printf $map{($i * $rowwidth + $j + 0x3f)} . ",";
+ }
+ }
+
+ if( 0 == (($j + 1) % 8))
+ {
+ printf "/* 0x%2X%1X%1X*/\n", $i+0x81, 8+($j/16), (7==($j%16))?0:8;
+ }
+ }
+ printf " /* 0x%2X%1X%1X*/\n", $i+0x81, 8+($j/16),(7==($j%16))?0:8;
+ }
+}
+sub printnpl()
+{
+$npl = <<END_OF_NPL;
+/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
+/* This Source Code Form is subject to the terms of the Mozilla Public
+ * License, v. 2.0. If a copy of the MPL was not distributed with this
+ * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
+END_OF_NPL
+print $npl;
+}
+sub printdontmodify()
+{
+$dont_modify = <<END_OF_DONT_MODIFY;
+/*
+ This file is generated by mozilla/intl/uconv/tools/cp936tocdx.pl
+ Please do not modify this file by hand
+ Instead, you should download CP936.TXT from
+ http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/WINDOWS/
+ and put under mozilla/intl/uconv/toools
+ and run perl cp936tocdx.pl > ../ucvcn/cp936map.h
+ If you have question, mailto:ftan\@netscape.com
+ */
+END_OF_DONT_MODIFY
+print $dont_modify;
+}
+
+&readtable();
+&printnpl();
+&printdontmodify();
+&printtable();
+