diff options
Diffstat (limited to 'intl/uconv/tools/cp936tocdx.pl')
-rw-r--r-- | intl/uconv/tools/cp936tocdx.pl | 133 |
1 files changed, 133 insertions, 0 deletions
diff --git a/intl/uconv/tools/cp936tocdx.pl b/intl/uconv/tools/cp936tocdx.pl new file mode 100644 index 000000000..b85972b04 --- /dev/null +++ b/intl/uconv/tools/cp936tocdx.pl @@ -0,0 +1,133 @@ +#!/user/local/bin/perl +# -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- +# +# This Source Code Form is subject to the terms of the Mozilla Public +# License, v. 2.0. If a copy of the MPL was not distributed with this +# file, You can obtain one at http://mozilla.org/MPL/2.0/. +$rowwidth = ((0xff - 0x80)+(0x7f - 0x40)); +sub cp936tonum() +{ + my($cp936) = (@_); + my($first,$second,$jnum); + $first = hex(substr($cp936,2,2)); + $second = hex(substr($cp936,4,2)); + $jnum = ($first - 0x81 ) * $rowwidth; + if($second >= 0x80) + { + $jnum += $second - 0x80 + (0x7f-0x40); + } + else + { + $jnum += $second - 0x40; + } + return $jnum; +} + +@map = {}; +sub readtable() +{ +open(CP936, "<gbkcommon.txt") || die "cannot open gbkcommon.txt"; +while(<CP936>) +{ + if(! /^#/) { + chop(); + ($j, $u, $r) = split(/\t/,$_); + if(length($j) > 4) + { + $n = &cp936tonum($j); + $map{$n} = $u; + } + } +} +} + + +sub printtable() +{ + for($i=0;$i<126;$i++) + { + printf ( "/* 0x%2XXX */\n", ( $i + 0x81)); + for($j=0;$j<(0x7f-0x40);$j++) + { + if("" eq ($map{($i * $rowwidth + $j)})) + { + printf "0xFFFD," + } + else + { + printf $map{($i * $rowwidth + $j)} . ","; + } + if( 0 == (($j + 1) % 8)) + { + printf "/* 0x%2X%1X%1X*/\n", $i+0x81, 4+($j/16), (7==($j%16))?0:8; + } + } + + print "0xFFFD,"; + + printf "/* 0x%2X%1X%1X*/\n", $i+0x81, 4+($j/16),(7==($j%16))?0:8; + for($j=0;$j < (0xff-0x80);$j++) + { + if("" eq ($map{($i * $rowwidth + $j + 0x3f)})) # user defined chars map to 0xFFFD + { + + if ( ( $i == 125 ) and ( $j == (0xff - 0x80 - 1 ))) + { + printf "0xFFFD"; #has no ',' followed last item + } + else + { + printf "0xFFFD,"; + } + } + else + { + if ( ( $i == 125 ) and ( $j == (0xff - 0x80 - 1 ))) + { + printf $map{($i * $rowwidth + $j + 0x3f)}; #has no ',' followed last item + } + else + { + printf $map{($i * $rowwidth + $j + 0x3f)} . ","; + } + } + + if( 0 == (($j + 1) % 8)) + { + printf "/* 0x%2X%1X%1X*/\n", $i+0x81, 8+($j/16), (7==($j%16))?0:8; + } + } + printf " /* 0x%2X%1X%1X*/\n", $i+0x81, 8+($j/16),(7==($j%16))?0:8; + } +} +sub printnpl() +{ +$npl = <<END_OF_NPL; +/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */ +/* This Source Code Form is subject to the terms of the Mozilla Public + * License, v. 2.0. If a copy of the MPL was not distributed with this + * file, You can obtain one at http://mozilla.org/MPL/2.0/. */ +END_OF_NPL +print $npl; +} +sub printdontmodify() +{ +$dont_modify = <<END_OF_DONT_MODIFY; +/* + This file is generated by mozilla/intl/uconv/tools/cp936tocdx.pl + Please do not modify this file by hand + Instead, you should download CP936.TXT from + http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/WINDOWS/ + and put under mozilla/intl/uconv/toools + and run perl cp936tocdx.pl > ../ucvcn/cp936map.h + If you have question, mailto:ftan\@netscape.com + */ +END_OF_DONT_MODIFY +print $dont_modify; +} + +&readtable(); +&printnpl(); +&printdontmodify(); +&printtable(); + |