diff options
author | Matt A. Tobin <mattatobin@localhost.localdomain> | 2018-02-02 04:16:08 -0500 |
---|---|---|
committer | Matt A. Tobin <mattatobin@localhost.localdomain> | 2018-02-02 04:16:08 -0500 |
commit | 5f8de423f190bbb79a62f804151bc24824fa32d8 (patch) | |
tree | 10027f336435511475e392454359edea8e25895d /intl/chardet/tools/charfreq.pl | |
parent | 49ee0794b5d912db1f95dce6eb52d781dc210db5 (diff) | |
download | UXP-5f8de423f190bbb79a62f804151bc24824fa32d8.tar UXP-5f8de423f190bbb79a62f804151bc24824fa32d8.tar.gz UXP-5f8de423f190bbb79a62f804151bc24824fa32d8.tar.lz UXP-5f8de423f190bbb79a62f804151bc24824fa32d8.tar.xz UXP-5f8de423f190bbb79a62f804151bc24824fa32d8.zip |
Add m-esr52 at 52.6.0
Diffstat (limited to 'intl/chardet/tools/charfreq.pl')
-rw-r--r-- | intl/chardet/tools/charfreq.pl | 50 |
1 files changed, 50 insertions, 0 deletions
#!/usr/bin/perl
#
# This Source Code Form is subject to the terms of the Mozilla Public
# License, v. 2.0. If a copy of the MPL was not distributed with this
# file, You can obtain one at http://mozilla.org/MPL/2.0/.
#
# charfreq.pl (intl/chardet/tools/charfreq.pl)
#
# Usage: charfreq.pl DATAFILE < INPUT
#
# Maintains a frequency table of two-byte sequences.
#
#   1. DATAFILE seeds the table. Each line is "<key> <count>", separated by
#      whitespace. Blank lines are ignored; a key without a count is seeded
#      with 0.
#   2. INPUT (STDIN) is scanned line by line, whitespace removed, one byte at
#      a time. Whenever a byte > 0xa0 is immediately followed by another byte
#      > 0xa0, the two bytes form a key whose count is incremented, and
#      "<key> <count>" is printed right away.
#   3. After INPUT is exhausted the whole table is printed, sorted by key,
#      one "<key> <count>" per line.
#
# NOTE(review): the 0x80 / 0xa0 thresholds presumably correspond to the
# lead/trail byte ranges of an EUC-style double-byte encoding -- confirm.

use strict;
use warnings;

# Scanner states (the numeric values match the original script).
my $ST_START = 0;    # waiting for the first byte of a pair
my $ST_SKIP  = 1;    # unexpected byte seen; rest of the line is ignored
my $ST_TRAIL = 2;    # first byte stored, waiting for the second byte

my $stat_file = $ARGV[0];
defined $stat_file
    or die "usage: $0 datafile < input\n";

# Three-arg open with a lexical handle: the file name can no longer be
# interpreted as a mode, and the OS error is reported via $!.
open(my $stat_fh, '<', $stat_file)
    or die " cannot open data file $stat_file: $!\n";

# The data is raw bytes; make sure no I/O layer translates it.
binmode($stat_fh);
binmode(STDIN);

# Frequency table: two-byte key => count.
my %count;

while (my $line = <$stat_fh>) {
    # split ' ' ignores leading whitespace, so indented lines keep their key
    # and blank lines yield no fields at all.
    my ($key, $n) = split ' ', $line;
    next unless defined $key;
    $count{$key} = defined $n ? $n : 0;
}
close($stat_fh);

while (my $line = <STDIN>) {
    # Drop all whitespace (including the line terminator) before scanning.
    (my $bytes = $line) =~ s/\s+//g;

    my $state = $ST_START;
    my $lead  = '';

    # Visit EVERY byte of the line. The original loop stopped one element
    # short of the end, so a pair terminating a line was never counted.
    for my $byte (split //, $bytes) {
        my $code = unpack('C', $byte);

        if ($state == $ST_START) {
            next if $code <= 0x80;          # low byte: stay in start state
            if ($code > 0xa0) {
                $lead  = $byte;             # candidate first byte of a pair
                $state = $ST_TRAIL;
            } else {
                $state = $ST_SKIP;          # byte in 0x81..0xa0
            }
        } elsif ($state == $ST_TRAIL) {
            if ($code > 0xa0) {
                my $pair = $lead . $byte;
                $count{$pair}++;
                print $pair . " " . $count{$pair} . "\n";
                $state = $ST_START;
            } else {
                $state = $ST_SKIP;
            }
        }
        # $ST_SKIP: intentionally no action. The state is only reset at the
        # start of the next line, exactly as in the original script.
        # NOTE(review): presumably this abandons a line after an unexpected
        # byte -- confirm that resynchronising is not wanted here.
    }
}

# Final dump of the complete table in key order.
for my $key (sort keys %count) {
    print $key . " " . $count{$key} . "\n";
}