digraphs: map private use characters to modern equivalents
[sheet.git] / digraphs.plp
index 9a20f580dd8d405c30d8076618765fb78405c5ac..a8f681d959b80a8b450ba7b62188dcd28e5c2663 100644 (file)
@@ -15,34 +15,12 @@ $header{content_type} = 'text/html; charset=utf-8';
 <head>
 <title>digraph cheat sheet</title>
 <meta http-equiv="content-type" content="utf-8">
-<style>
-h1 {
-       text-align: center;
-       margin: 0 auto 0.2em;
-}
-table {
-       border-collapse: collapse;
-       table-layout: fixed; /* prevent resizing, notably in msie6 */
-}
-thead th, td {
-       width: 1.2em; /* msie only looks at the first row */
-       min-width: 1em; /* prevents gecko from restricting to page width */
-}
-th, td {
-       text-align: center;
-}
-td {
-       border: 1px solid #888;
-       background: #DDD;
-}
-td.any {
-       background: #FFF;
-}
-</style>
+<link rel="stylesheet" type="text/css" media="all" href="digraphs.css">
 </head>
 
 <body>
 <h1>RFC-1345 Digraphs</h1>
+
 <:
 my $di = do 'digraphs.inc.pl';
 
@@ -54,28 +32,94 @@ sub quote {
        return $_;
 }
 
-my @chars = ((map {chr} ord '!' .. ord 'Z'), 'a'..'z');
-splice @chars, $_, 1, () for 2, 3-1, 5-2, 31-3;  # remove character exceptions # $ & @
-print '<table>';
-print '<thead><tr><th>&nbsp;';
-print "<th>$_" for @chars, '_';
-print '<tbody>';
-for my $c1 (@chars) {
-       print "<tr><th>$c1";
-       for my $c2 (@chars, '_') {
-               my $mnem = $c1 . $c2;
-               if (not defined $di->{$mnem}) {
-                       print '<td>';
-                       next;
-               }
-               my $chr = $di->{$mnem};
+my @chars = (  # digraph characters, grouped; each group becomes its own <tbody>/<colgroup>
+       [qw{! " % ' ( ) * + , - . /}],
+       ['0'..'9'], [qw{: ; < = > ?}],
+       ['A'..'M'], ['N'..'Z'],
+       ['a'..'m'], ['n'..'z'],
+);
+my @chars2 = (@chars, ['_']);  # trailing character (extended set)
+
+print '<table><col>';  # single <col> for the row-header column
+print qq'<colgroup span="$_">' for map {scalar @$_} @chars2;  # one colgroup per group, spanning its size
+print "\n";
+for my $section (qw{thead tfoot}) {  # same header row is emitted as both thead and tfoot
+       print "<$section><tr><th>&nbsp;";
+       print "<th>$_" for map {@$_} @chars2;
+}
+for my $c1group (@chars) {  # one <tbody> per group of first characters
+       print '<tbody>';
+       for my $c1 (@$c1group) {
+               print "<tr><th>$c1";
+               for my $c2 (map {@$_} @chars2) {  # every second character, groups flattened
+                       my $mnem = $c1 . $c2;
+                       if (not defined $di->{$mnem}) {  # no entry for this pair: empty cell
+                               print '<td>';
+                               next;
+                       }
+                       if (ref $di->{$mnem} ne 'ARRAY') {  # non-array entry (meaning not visible here): empty cell, mnemonic as title
+                               printf '<td class="X Xr" title="%s">', quote($mnem);
+                               next;
+                       }
+                       my ($codepoint, $name, $prop, $script) = @{ $di->{$mnem} };
+
+                       my $glyph = chr $codepoint;
+                       utf8::upgrade($glyph);  # prevent latin1 output
+                       my $desc = $mnem . ($name && " ($name)");  # tooltip: mnemonic, plus the name when set
+                       my @class = ('X', grep {$_} $prop, $script);  # 'X' plus whichever of $prop/$script are true
 
-               my @class = 'any';
+                       $glyph = quote($glyph);  # quote() is defined outside this hunk (presumably HTML escaping - confirm)
+                       $glyph = "<span>$glyph</span>" if $prop eq 'Zs';  # Zs (labelled "spacing" in the legend) gets a span
 
-               printf '<td class="%s" title="%s">%s',
-                       join(' ', @class), quote($mnem), quote(chr $chr);
+                       printf "\n".'<td class="%s" title="%s">%s',
+                               join(' ', @class), quote($desc), $glyph;
+               }
+               print "\n<th>$c1\n";  # repeat the row header at the end of the row
        }
-       print "\n";
 }
 print "</table>\n";
+:>
+<div id="legend">
+       <table><tr>
+       <td class="X Cc">control
+       <td class="X Zs"><span>spacing</span>
+       <td class="X Mn">modifier
+       <td class="X Sk">spacing modifier
+       <td class="X Pf">quote
+       <td class="X Po">punctuation
+       <td class="X So">symbol
+       <td class="X Sm">math
+       <td class="X Sc">currency
+       <td class="X No">numeric
+       <td class="X Greek">greek
+       <td class="X Cyrillic">cyrillic
+       <td class="X Latin">latin
+       <td class="X Hebrew">hebrew
+       <td class="X Arabic">arabic
+       <td class="X Hangul">korean
+       <td class="X Hiragana">japanese
+       <td class="X Bopomofo">chinese
+       </table>
+
+       <table><tr>
+       <td class="X">unicode
+       <td class="X Xl">latin1
+       <td class="X Xa">ascii
+       <td class="X Co">private
+       <td class="X Xz">proposed
+       </table>
+</div>
+
+<p id="footer">
+       <a href="http://vi.shiar.net/digraphs">vi.<strong>shiar.net</strong>/digraphs</a>
+       <a href="git://dev.shiar.net/vi-cheat"><:= "v$VERSION" :></a>
+       created by Shiar •
+       <a title="Licensed under the GNU Affero General Public License, version 3"
+          href="http://www.fsf.org/licensing/licenses/agpl-3.0.html">AGPLv3</a> •
+       last update <:
+               use Time::Format qw(time_format);
+               print time_format('yyyy-mm-dd', (stat 'digraphs.inc.pl')[9]);  # stat field 9 is the file's mtime
+       :>
+</p>
 
+</html>