package Shiar_Sheet::FormatChar;
+use 5.010;
use strict;
use warnings;
my ($self, $char) = @_;
my $codepoint = ord $char;
my $info = $self->glyph_info($codepoint);
- my ($class, $name, $mnem, $string) = @$info;
+ my ($class, $name, $mnem, $html, $string) = @$info;
my $cell = EscapeHTML($string || $char);
my $title = sprintf 'U+%04X%s', $codepoint, $name && " ($name)";
$cell = "<span>$cell</span>" if $class =~ /\bZs\b/;
$cell = ' ' if $cell eq '';
- return ($cell, EscapeHTML($title), "X $class", $mnem);
+ return ($cell, EscapeHTML($title), "X $class", $mnem, $html);
}
sub glyphs_html {
sub cell {
my ($self, $input, $html) = @_;
- my (@class, $title, $cell, $mnem);
+ my (@class, $title, $cell, $mnem, $entity);
if ($input eq '-') {
$cell = '';
push @class, 'u-invalid';
$cell = '';
}
- else {
+ else {{
push @class, 'X';
if ($input =~ s/^-//) {
}
$input =~ s/^\\//; # escaped char
- ($cell, $title, my $class, $mnem) = $self->glyphs_html($input);
+ ($cell, $title, my $class, $mnem, $entity) = $self->glyphs_html($input);
+ my $codepoint = ord(substr $input, 0, 1);
+
+ if ($self->{style} eq 'univer') {
+ if ($input =~ /\p{age=unassigned}/) {
+ # check include for assignments after unicode 6.0 (perl v5.14)
+ state $agemap = do 'unicode-age.inc.pl';
+ my $version = $agemap->{$codepoint};
+ push @class, $version ? 'l2' : 'l1';
+ }
+ elsif ($input =~ /^\p{in=1.1}*$/) {
+ push @class, 'l5'; # first release 1993
+ }
+ elsif ($input =~ /^\p{in=3.0}*$/) {
+ push @class, 'l4'; # 20th century
+ }
+ elsif ($input =~ /^\p{in=4.1}*$/) {
+ push @class, 'l4'; # over 10 years ago
+ }
+ elsif ($input =~ /^\p{in=6.0}*$/) {
+ push @class, 'l3'; # before 2012
+ }
+ else {
+ push @class, 'l2'; # more recent
+ }
+ next;
+ }
- if ($self->{style} = 'di') {
+ if ($self->{style} eq 'di') {
if ($class =~ /\bu-di\b/) {
- push @class, ('l3', 'u-di'); # standard digraph
+ push @class, ('l4', 'u-di'); # standard digraph
}
elsif ($class =~ /\bu-prop\b/) {
- push @class, ('l2', 'u-prop'); # unofficial
+ push @class, ('l3', 'u-prop'); # unofficial
+ }
+ }
+ elsif ($self->{style} eq 'html') {
+ if (defined $entity) {
+ push @class, ($codepoint <= 0xFF ? 'l4' : 'l3', 'u-html');
}
}
else {
- my $codepoint = ord(substr $input, 0, 1);
if ($codepoint <= 0xFF) {
- push @class, 'l3', 'u-lat1'; # latin1
+ push @class, 'l4', 'u-lat1'; # latin1
}
elsif ($codepoint <= 0xD7FF) {
- push @class, 'l2', 'u-bmp'; # bmp
+ push @class, 'l3', 'u-bmp'; # bmp
}
}
if ($input =~ /[ -~]/) {
- push @class, 'l4', 'u-ascii'; # ascii
+ push @class, 'l5', 'u-ascii'; # ascii
+ }
+ elsif ($input =~ /^\p{in=6.0}+$/) {
+ push @class, 'l2'; # in unicode 6.0
}
else {
- push @class, 'l1'; # basic unicode
+ push @class, 'l1'; # any unicode
}
- }
+ }}
my $anno = '';
if ($cell ne '') {
for (@{ $self->{anno} }) {
if (/html$/) {
- require HTML::Entities;
- if (my $entity = $HTML::Entities::char2entity{$cell}) {
- $entity = substr($entity, 1, -1) unless /^&/;
+ if (defined $entity) {
+ $entity = "&$entity;" if /^&/;
$anno = sprintf(' <small class="digraph">%s</small>', EscapeHTML($entity));
last;
}
if ($cell =~ s/^>//) {
# header cell text follows
$cell =~ s/_/ /g; # underscores may be used instead of whitespace (for qw//ability)
- $rows[-1] .= '<th>'.($cell || ' ');
+ my $class = $cell =~ s/^-// && ' class="ex"';
+ $rows[-1] .= "<th$class>".($cell || ' ');
}
next;
}