Changeset 189 in lab
- Timestamp:
- Jan 24, 2013 9:17:01 PM (11 years ago)
- File:
-
- 1 copied
Legend:
- Unmodified
- Added
- Removed
-
trunk/misc/findnonsjis.pl
r188 r189 6 6 use encoding 'utf-8'; 7 7 8 use Unicode::Normalize qw(NFC NFKC); 8 use Unicode::Japanese qw(unijp); 9 9 10 10 my $top = shift @ARGV || exit; … … 16 16 my $str = shift @_; 17 17 18 if ($str ne NFC($str)) { 19 return 1; 20 } 21 if ($str ne NFKC($str)) { 18 my $sjis = unijp($str)->sjis; 19 if ($sjis =~ /&#\d{4,};/) { 22 20 return 1; 23 21 } … … 38 36 next if ($entry =~ /^\.+$/); 39 37 if (match($entry)) { 40 print "'$target/$entry' can be composed\n"; 38 print "'$target/$entry' contains non Shift_JIS character\n"; 41 39 next; 42 40 }
Note: See TracChangeset
for help on using the changeset viewer.