common: drop leading 'v' in version numbers

[sheet.git] / chars.plp
diff --git a/chars.plp b/chars.plp

index b081ac2749567468c920a663f81b52ffafed1372..943bf8c818453e07ea933ffb2a39e2315f377bb7 100644 (file)
--- a/chars.plp
+++ b/chars.plp
@@ -2,125 +2,112 @@
  
  Html({
         title => 'character support sheet',
-       version => 'v1.0',
+       version => '1.0',
         keywords => [qw'
                 unicode glyph char character reference common ipa symbol sign mark table digraph
         '],
         stylesheet => [qw'light dark mono circus red'],
-       data => [qw'unicode-table.inc.pl unicode-char.inc.pl'],
+       data => [qw( unicode-cover.inc.pl ttfsupport unicode-char.inc.pl )],
  });
  
-:>
-<h1>Character support</h1>
-
-<p>
-Selected characters from Unicode <a href="/unicode">preset</a>
-or <a href="/charset">range</a>.
-</p>
-
-<div>
-
-<:
  use 5.010;
  use Shiar_Sheet::FormatChar;
  my $glyphs = Shiar_Sheet::FormatChar->new;
  
-my %oslist = (
-       win95   => [qw( arial ariuni verdana times )],  # microsoft
-       mac10   => [qw( )],  # apple
-       android => [qw( droidsans )],  # google
-       oss     => [qw( dvsans c2k unifont )],
-);
-my @ossel = qw( win95 oss android );
-
-my $tables = do 'unicode-table.inc.pl' or die $@ || $!;
-my (%font, @fontlist);
-for my $os (@ossel) {
-       my $osfonts = $oslist{$os};
-       for my $fontid (@{$osfonts}) {
-               push @fontlist, $fontid;
+my $groupinfo = do 'unicode-cover.inc.pl' or die $@ || $!;
+
+my @ossel = @{ $groupinfo->{osdefault} };
+my @fontlist = map { $_->{file} }
+       @{ $groupinfo->{fonts} }[ map { @{ $groupinfo->{os}->{$_} } } @ossel ];
+
+my %font;
+for my $fontid (@fontlist) {
                 my ($fontmeta, @fontrange) = do "ttfsupport/$fontid.inc.pl";
                 $fontmeta or next;
                 $font{$fontid} = {
-                       -id   => $fontmeta->{id} || $fontid,
-                       -name => $fontmeta->{name},
+                       (map { (-$_ => $fontmeta->{$_}) } keys %{$fontmeta}),
                         map { (chr $_ => 1) } @fontrange
                 };
-       }
  }
  
  # parse input
  
-my @chars;
-my @querydesc;
-
-my $query = $ENV{PATH_INFO} || $get{q} || 'ipa';
-for ($query) {
-       s{^/}{};
-       when (qr{^[a-z]+(?:/|\z)}) {
-               for (split / /) {
-                       push @querydesc, "preset group $_";
-                       my ($tablegroup, $tablename) = split m{/}, $_, 2;
-                       my @tables = $tablename ? $tables->{$tablegroup}->{$tablename}
-                                  : sort values %{ $tables->{$tablegroup} };
-                       for (@tables) {
-                               my $includerows;  # ignore rows before body row
-                               for (@{$_}) {
-                                       $includerows ||= m/^[.]/ or next;
-                                       next if /^[.-]/;
-                                       next if $_ eq '>' or $_ eq '=';
-                                       push @chars, $_;
-                               }
-                       }
-               }
-               when ('ipa') {
-                       @chars = grep { !m/[a-zA-Z]/ } @chars;
-               }
-       }
-       when (qr{[\d,;\s+-]+}) {
-               push @querydesc, "character codepoints $_";
-               for (map { split /[^\d-]/ } $_) {
-                       my ($charnum, $range) = split /-/, $_;
-                       push @chars, chr $_ for $charnum .. ($range // $charnum);
+my ($title, $parent) = ('Character overview');
+my $query = eval {
+       for ($ENV{PATH_INFO} || ()) {
+               s{^/}{};
+               return $_ if m{^[0-9 +-]+$};
+
+               my ($cat, $name) = split m{/}, $_, 2 or die "invalid query\n";
+               if (!$name) {
+                       ($cat, $name) = ('table', $cat);
                 }
+
+               my $row = $groupinfo->{$cat}->{$name}
+                       or die "unknown character group $cat/$name\n";
+
+               $title = ucfirst EscapeHTML($name).' characters';
+               $parent = $cat;
+               return EscapeHTML($row->{query});
         }
-       when (qr{[A-Z]}) {
-               push @querydesc, "unicode match $_";
-               eval {
-                       my $match = qr/\A\p{$_}\z/;
-                       push @chars, grep { m/$match/ } map { chr $_ }
-                               0..0xD7FF, 0xE000..0xFDCF, 0xFDF0..0xFFFD;
-               } or die "invalid unicode match: $_\n";
-       }
-       default {
-               die "unknown parameter: $_\n";
-       }
+} || $get{q};
+
+say "<h1>$title</h1>";
+
+if (!$query) {
+       say "<p>Unicode group not specified: $@</p>";
+       exit;
+};
+
+for ($parent || 'Unicode range') {
+       my %CATDESC = (
+               block    => '<a href="/charset/unicode">Unicode block</a>',
+               script   => 'Unicode script',
+               category => 'Unicode category',
+               table    => '<a href="/unicode">Unicode preset group</a>',
+       );
+       say sprintf('<p>List %s in selected %s.</p>',
+               'characters and <a href="/font">font support</a>',
+               $CATDESC{$parent} || $parent,
+       );
+}
+
+my @chars;
+for (map { split /[^\d-]/ } $query) {
+       my @range = split /-/, $_, 2;
+       m/^[0-9]+$/ or die "Invalid code point $_ in query $query\n" for @range;
+       push @chars, chr $_ for $range[0] .. ($range[1] // $range[0]);
  }
  
+@chars or die "No match for query $query\n";
+
  @chars <= 1500 or die sprintf(
-       'too many matches (%d) for %s'."\n",
-       scalar @chars, join(', ', @querydesc),
+       'Too many matches (%d) for query %s'."\n",
+       scalar @chars, $query,
  );
  
  # output character list
  
+say '<div>';
  print '<table class=mapped>';
-say '<caption>'.EscapeHTML(join ', ', @querydesc).'</caption>';
  print '<col>' x 3;
-print "<colgroup span=$_>" for 2, map { scalar @{$oslist{$_}} } @ossel;
+print "<colgroup span=$_>"
+       for 2, map { scalar @{ $groupinfo->{os}->{$_} } } @ossel;
  
  print '<thead><tr>';
  print '<td colspan=3>character';
  print '<td colspan=2>input';
-printf '<td colspan=%d>%s fonts', scalar @{ $oslist{$_} }, $_
+printf '<td colspan=%d>%s', scalar @{ $groupinfo->{os}->{$_} }, $_
         for @ossel;
  
  print '<tr>';
  print '<td colspan=2>unicode';
  print '<td>name';
  print '<td><a href="/digraphs" title="digraph">di</a><td>html';
-printf '<td title="%s">%s', $font{$_}->{-name}, $font{$_}->{-id} // $_
-       for @fontlist;
+printf('<td title="%s">%s', map { EscapeHTML($_) }
+       join("\n", $font{$_}->{-name}, $font{$_}->{-description}),
+       $font{$_}->{-abbr},
+) for @fontlist;
  say '</thead>';
  
  for my $chr (@chars) {
@@ -132,16 +119,16 @@ for my $chr (@chars) {
         my ($class, $name, $mnem, $html, $string) = @$info;
         print "<td>$_" for sprintf('%X', $codepoint), EscapeHTML($name || '?');
         printf '<td class="%s">%s', @$_ for (
-               [$ascii ? 'l0' : defined $mnem ? $class =~ /\bu-di\b/ ? 'l4' : 'l3' : 'l1', $mnem // ''],
+               [$ascii ? 'l0' : defined $mnem ? $class =~ /\bu-di\b/ ? 'l4' : 'l3' : 'l1',
+                       EscapeHTML($mnem) // ''],
                 [$ascii ? 'l0' : defined $html ? 'l4' : 'l1', $html // ''],
                 (map {
-                       !$font{$_}->{-id} ? [l0 => '?'] :
+                       !defined $font{$_}->{-name} ? [l0 => '?'] :
                         $font{$_}->{$chr} ? [l4 => '✔'] : [l1 => '✘']
                 } @fontlist),
         );
  }
  
  say "</table>\n";
-
-:></div>
+say "</div>\n";