123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134 |
- #!/user/local/bin/perl
- # -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*-
- #
- # This Source Code Form is subject to the terms of the Mozilla Public
- # License, v. 2.0. If a copy of the MPL was not distributed with this
- # file, You can obtain one at http://mozilla.org/MPL/2.0/.
- $rowwidth = ((0xff - 0x80)+(0x7f - 0x40));
- sub cp936tonum()
- {
- my($cp936) = (@_);
- my($first,$second,$jnum);
- $first = hex(substr($cp936,2,2));
- $second = hex(substr($cp936,4,2));
- $jnum = ($first - 0x81 ) * $rowwidth;
- if($second >= 0x80)
- {
- $jnum += $second - 0x80 + (0x7f-0x40);
- }
- else
- {
- $jnum += $second - 0x40;
- }
- return $jnum;
- }
- @map = {};
- sub readtable()
- {
- open(CP936, "<gbkcommon.txt") || die "cannot open gbkcommon.txt";
- while(<CP936>)
- {
- if(! /^#/) {
- chop();
- ($j, $u, $r) = split(/\t/,$_);
- if(length($j) > 4)
- {
- $n = &cp936tonum($j);
- $map{$n} = $u;
- }
- }
- }
- }
- sub printtable()
- {
- for($i=0;$i<126;$i++)
- {
- printf ( "/* 0x%2XXX */\n", ( $i + 0x81));
- for($j=0;$j<(0x7f-0x40);$j++)
- {
- if("" eq ($map{($i * $rowwidth + $j)}))
- {
- printf "0xFFFD,"
- }
- else
- {
- printf $map{($i * $rowwidth + $j)} . ",";
- }
- if( 0 == (($j + 1) % 8))
- {
- printf "/* 0x%2X%1X%1X*/\n", $i+0x81, 4+($j/16), (7==($j%16))?0:8;
- }
- }
-
- print "0xFFFD,";
- printf "/* 0x%2X%1X%1X*/\n", $i+0x81, 4+($j/16),(7==($j%16))?0:8;
- for($j=0;$j < (0xff-0x80);$j++)
- {
- if("" eq ($map{($i * $rowwidth + $j + 0x3f)})) # user defined chars map to 0xFFFD
- {
- if ( ( $i == 125 ) and ( $j == (0xff - 0x80 - 1 )))
- {
- printf "0xFFFD"; #has no ',' followed last item
- }
- else
- {
- printf "0xFFFD,";
- }
- }
- else
- {
- if ( ( $i == 125 ) and ( $j == (0xff - 0x80 - 1 )))
- {
- printf $map{($i * $rowwidth + $j + 0x3f)}; #has no ',' followed last item
- }
- else
- {
- printf $map{($i * $rowwidth + $j + 0x3f)} . ",";
- }
- }
-
- if( 0 == (($j + 1) % 8))
- {
- printf "/* 0x%2X%1X%1X*/\n", $i+0x81, 8+($j/16), (7==($j%16))?0:8;
- }
- }
- printf " /* 0x%2X%1X%1X*/\n", $i+0x81, 8+($j/16),(7==($j%16))?0:8;
- }
- }
- sub printnpl()
- {
- $npl = <<END_OF_NPL;
- /* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
- /* This Source Code Form is subject to the terms of the Mozilla Public
- * License, v. 2.0. If a copy of the MPL was not distributed with this
- * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
- END_OF_NPL
- print $npl;
- }
- sub printdontmodify()
- {
- $dont_modify = <<END_OF_DONT_MODIFY;
- /*
- This file is generated by mozilla/intl/uconv/tools/cp936tocdx.pl
- Please do not modify this file by hand
- Instead, you should download CP936.TXT from
- http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/WINDOWS/
- and put under mozilla/intl/uconv/toools
- and run perl cp936tocdx.pl > ../ucvcn/cp936map.h
- If you have question, mailto:ftan\@netscape.com
- */
- END_OF_DONT_MODIFY
- print $dont_modify;
- }
- &readtable();
- &printnpl();
- &printdontmodify();
- &printtable();
|