use Shiar_Sheet::FormatChar;
my $glyphs = Shiar_Sheet::FormatChar->new;
+my %oslist = (
+ win95 => [qw( arial ariuni verdana times )], # microsoft
+ mac10 => [qw( )], # apple
+ android => [qw( droidsans )], # google
+ oss => [qw( dvsans c2k unifont )],
+);
+my @ossel = qw( win95 oss android );
+
my $tables = do 'unicode-table.inc.pl' or die $@ || $!;
my (%font, @fontlist);
-for my $fontid (qw(d tnr a dv dvs c2k u)) {
- my ($fontmeta, @fontrange) = do "ttfsupport/$fontid.inc.pl";
- push @fontlist, $fontid;
- $font{$fontid} = {
- -name => $fontmeta->{name},
- map { (chr $_ => 1) } @fontrange
- };
+for my $os (@ossel) {
+ my $osfonts = $oslist{$os};
+ for my $fontid (@{$osfonts}) {
+ push @fontlist, $fontid;
+ my ($fontmeta, @fontrange) = do "ttfsupport/$fontid.inc.pl";
+ $fontmeta or next;
+ $font{$fontid} = {
+ -id => $fontmeta->{id} || $fontid,
+ -name => $fontmeta->{name},
+ map { (chr $_ => 1) } @fontrange
+ };
+ }
}
-my @config = qw(
- punctuation/common punctuation/marks
- latin/sample
- symbols/signs1
-);
-$_ and m{/*+(.+)} and @config = split /[ ]/, $1 for $ENV{PATH_INFO}, $get{q};
-@config = qw(ipa/cons ipa/vowels) if 0;
-
-for (@config) {
- my ($tablegroup, $tablename) = split m{/}, $_, 2;
-
- print '<table>';
- printf '<caption>%s</caption>', "$tablegroup: $tablename";
- say '';
- my $table = $tables->{$tablegroup}->{$tablename};
-
- for my $chr (@$table) {
- $chr =~ m/^\./ .. 1 or next;
- given ($chr) {
- when (/^[.]/) {
- print "<tbody style=\"border-bottom:3px double #AAA\">\n";
- next;
- }
- when ([qw(> - =)]) {
- next;
+# parse input
+
+my @chars;
+my @querydesc;
+
+my $query = $ENV{PATH_INFO} || $get{q} || 'ipa';
+for ($query) {
+ s{^/}{};
+ when (qr{^[a-z]+(?:/|\z)}) {
+ for (split / /) {
+ push @querydesc, "preset group $_";
+ my ($tablegroup, $tablename) = split m{/}, $_, 2;
+ my @tables = $tablename ? $tables->{$tablegroup}->{$tablename}
+ : sort values %{ $tables->{$tablegroup} };
+ for (@tables) {
+ my $includerows; # ignore rows before body row
+ for (@{$_}) {
+ $includerows ||= m/^[.]/ or next;
+ next if /^[.-]/;
+ next if $_ eq '>' or $_ eq '=';
+ push @chars, $_;
+ }
}
}
-
- my $ex = s/^-//;
- my $codepoint = ord $chr;
- my $ascii = $codepoint <= 127;
-
- print "<tr><th>$chr\n";
- my $info = $glyphs->glyph_info($codepoint);
- my ($class, $name, $mnem, $html, $string) = @$info;
- print "<td>$_" for $codepoint, EscapeHTML($name);
- printf '<td class="%s">%s', @$_ for (
- [$ascii ? 'l0' : defined $mnem ? 'l4' : 'l1', $mnem // ''],
- [$ascii ? 'l0' : defined $html ? 'l4' : 'l1', $html // ''],
- (map { $font{$_}->{$chr} ? [l4 => $font{$_}->{-name}] : [l1 => ''] }
- @fontlist),
- );
}
- say "</table>\n";
+ when (qr{[\d,;\s+-]+}) {
+ push @querydesc, "character codepoints $_";
+ for (map { split /[^\d-]/ } $_) {
+ my ($charnum, $range) = split /-/, $_;
+ push @chars, chr $_ for $charnum .. ($range // $charnum);
+ }
+ }
+ when (qr{[A-Z]}) {
+ push @querydesc, "unicode match $_";
+ eval {
+ my $match = qr/\A\p{$_}\z/;
+ push @chars, grep { m/$match/ } map { chr $_ }
+ 0..0xD7FF, 0xE000..0xFDCF, 0xFDF0..0xFFFD;
+ } or die "invalid unicode match: $_\n";
+ }
+ default {
+ die "unknown parameter: $_\n";
+ }
}
-:></div>
-<script type="text/javascript" src="/clipboard.js"></script>
+@chars <= 1500 or die sprintf(
+ 'too many matches (%d) for %s'."\n",
+ scalar @chars, join(', ', @querydesc),
+);
+
+# output character list
+
+print '<table class=mapped>';
+say '<caption>'.EscapeHTML(join ', ', @querydesc).'</caption>';
+print '<col>' x 3;
+print "<colgroup span=$_>" for 2, map { scalar @{$oslist{$_}} } @ossel;
+
+print '<thead><tr>';
+print '<td colspan=3>character';
+print '<td colspan=2>input';
+printf '<td colspan=%d>%s fonts', scalar @{ $oslist{$_} }, $_
+ for @ossel;
+
+print '<tr>';
+print '<td colspan=2>unicode';
+print '<td>name';
+print '<td><a href="/digraphs" title="digraph">di</a><td>html';
+printf '<td title="%s">%s', $font{$_}->{-name}, $font{$_}->{-id} // $_
+ for @fontlist;
+say '</thead>';
+
+for my $chr (@chars) {
+ my $codepoint = ord $chr;
+ my $ascii = $codepoint <= 127;
+
+ print "<tr><th>$chr\n";
+ my $info = $glyphs->glyph_info($codepoint);
+ my ($class, $name, $mnem, $html, $string) = @$info;
+ print "<td>$_" for sprintf('%X', $codepoint), EscapeHTML($name || '?');
+ printf '<td class="%s">%s', @$_ for (
+ [$ascii ? 'l0' : defined $mnem ? 'l4' : 'l1', $mnem // ''],
+ [$ascii ? 'l0' : defined $html ? 'l4' : 'l1', $html // ''],
+ (map {
+ !$font{$_}->{-id} ? [l0 => '?'] :
+ $font{$_}->{$chr} ? [l4 => '✔'] : [l1 => '✘']
+ } @fontlist),
+ );
+}
+
+say "</table>\n";
+
+:></div>