annotate findUnicode.pl @ 6:4ed010b4a017

batsu
author Shinji KONO <kono@ie.u-ryukyu.ac.jp>
date Thu, 26 Dec 2013 09:01:31 +0900
parents 8da43f287516
children b86def18da67
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
1 #!/usr/bin/perl
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
2
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
3 # find used unicode
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
4 use strict;
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
5 use utf8;
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
6 use open qw(:std :utf8); # input/output default encoding will be UTF-8, it looks like default
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
7
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
8 my %used;
6
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
9 my @fonts = <1[0-9]*.bdf> ;
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
10
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
11 use Getopt::Std;
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
12 our ($opt_f);
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
13
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
14 getopts('f:');
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
15
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
16 if ($opt_f) {
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
17 @fonts = ($opt_f);
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
18 }
1
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
19
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
20 while(<>) {
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
21 for my $ch ( /(.)/g ) {
2
7f5d4dad9d6b merge operation
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 1
diff changeset
22 next if (ord($ch)<128);
4
8da43f287516 make file and merge
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 2
diff changeset
23 # next if (ord($ch)>=12288); # ignore CJKV
1
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
24 $used{ord($ch)}++;
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
25 }
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
26 }
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
27
6
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
28 for my $bdf ( @fonts ) {
1
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
29 open(my $f,"<",$bdf);
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
30 my %has;
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
31 while(<$f>) {
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
32 if (/^ENCODING\s+(\d+)/) {
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
33 my $encoding=$1;
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
34 $has{$encoding} = 1;
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
35 }
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
36 }
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
37 my %no;
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
38 for my $ch ( keys %used ) {
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
39 $no{$ch} ++ if (! defined $has{$ch}) ;
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
40 }
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
41 for my $ch ( sort {$a<=>$b} keys %no ) {
2
7f5d4dad9d6b merge operation
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 1
diff changeset
42 my $hex = sprintf("%x",$ch);
7f5d4dad9d6b merge operation
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 1
diff changeset
43 print chr($ch)," $ch 0x$hex is not in $bdf\n";
1
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
44 }
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents:
diff changeset
45 }