7 use open OUT => ':utf8', ':std';
8 use List::Util 'reduce';
9 use File::Basename 'basename';
12 our $VERSION = '1.00';
15 my $incsuffix = '.inc.pl';
16 for my $fontfile (glob 'ttfsupport/*'.$incsuffix) {
17 my ($fontid) = basename($fontfile, $incsuffix);
18 my ($fontmeta, @fontrange) = do $fontfile or next;
20 -id => $fontmeta->{id} || $fontid,
21 -name => $fontmeta->{name},
22 map { (chr $_ => 1) } @fontrange
28 my $chartables = do 'unicode-table.inc.pl' or warn $@ || $!;
30 while (my ($tablegroup, $grouprow) = each %{$chartables}) {
31 while (my ($tablename, $chars) = each %{$grouprow}) {
32 next if $tablename =~ /^-/;
33 my $includerows; # ignore rows before body row
35 $includerows ||= m/^[.]/ or next;
37 next if $_ eq '>' or $_ eq '=';
39 push @{ $charlist{table}->{"$tablegroup/$tablename"} }, $_;
40 push @{ $charlist{table}->{$tablegroup} }, $_;
43 # if ($tablegroup eq 'ipa') {
44 # @chars = grep { !m/[a-zA-Z]/ } @chars;
50 require HTML::Entities;
52 HTML::Entities->import('%char2entity');
53 while (my ($char, $entity) = each %char2entity) {
54 $entity =~ /[a-zA-Z]/ or next; # only actual aliases
55 push @{ $charlist{table}->{html} }, $char;
58 } or warn "Could not include count for html entities: $@";
60 use Unicode::UCD 'charinfo';
61 for my $code (0 .. 256**2) {
62 my $charinfo = charinfo($code) or next;
63 next if $charinfo->{category} =~ /^[MC]/; # ignore Marks and "other" Control chars
64 push @{ $charlist{$_}->{ $charinfo->{$_} } }, chr $code
65 for qw( script category block );
68 for (values %charlist) {
69 for my $chars (values %{$_}) {
71 my $fontcover = $font{$_};
72 ($_ => scalar grep { $fontcover->{$_} } @{$chars});
74 $row{-count} = scalar @{$chars};
77 my @query = map { ord } sort @{$chars};
84 last if $query[$j] != $v;
88 splice(@query, $i, $j - $i, "$query[$i]-$query[$j-1]");
92 return join '+', @query;
99 say "# automatically generated by $0";
101 say '+'.pp(\%charlist);
107 mkfontinfo - Prepare font coverage of various character groups
111 mkfontinfo > unicode-cover.inc.pl
113 Test by finding the number of cyrillic characters in DejaVu Sans:
115 perl -E'$f = do "unicode-cover.inc.pl"; say $f->{Cyrillic}->{dvsans}'
119 Mischa POSLAWSKY <perl@shiar.org>
123 Licensed under the GNU Affero General Public License version 3.