X-Git-Url: http://git.shiar.nl/sheet.git/blobdiff_plain/04d963b223ec1e49784c96a1b6b36cddf6cd29f0..29b407ddf91b653e6e8380f73e221628a392376f:/digraphs.plp diff --git a/digraphs.plp b/digraphs.plp index 67d2a1a..44f93e6 100644 --- a/digraphs.plp +++ b/digraphs.plp @@ -1,148 +1,156 @@ -<: -use utf8; -use strict; -use warnings; -use open IO => ':utf8'; - -our $VERSION = '1.0'; - -$header{content_type} = 'text/html; charset=utf-8'; - -:> - - - -digraph cheat sheet - - - - - -

RFC-1345 Digraphs

+:> +

<:= $modename :> Digraphs

+ +

Character mnemonics following compose key ⎄<: +say join("\n", + $mode ? ( + ' in the X Window System (Shift+AltGr by default).', + 'Differences from RFC-1345 are indicated.', + ) : (':', + 'i^k in Vim,', + '^u^\ in Emacs,', + '^a^v in Screen.', + 'Similar but different from X.Org.', + ), + 'Also see common Unicode.

', +); +say '

Unofficial proposals', + ' are available as ex commands.' if not $mode; +:> <: -my $di = do 'digraphs.inc.pl'; - -sub quote { - local $_ = shift; - s/"/"/g; - s//>/g; - return $_; +my $di = do 'digraphs.inc.pl' + or die "Error loading digraphs data: ", $@ // $!; + +if (exists $get{v}) { + # show characters for inverted mnemonics (vim alternatives) + $di->{ substr($_, 1, 1) . substr($_, 0, 1) } ||= + [ $di->{$_}->[0], '', 'l0 ex', '', $di->{$_}->[4] ] + for grep { ref $di->{$_} } keys %{$di}; } -my @chars = ((map {chr} ord '!' .. ord 'Z'), 'a'..'z'); -splice @chars, $_, 1, () for 2, 3-1, 5-2, 31-3; # remove character exceptions # $ & @ -my @chars2 = (@chars, '_'); # trailing character (extended set) +my @chars = ( + [qw{! " % ' ( ) * + , - . /}], + ['0'..'9'], [qw{: ; < = > ?}], + ['A'..'M'], ['N'..'Z'], + ['a'..'m'], ['n'..'z'], +); +my @chars2 = (['_'], @chars); # trailing character (extended set) +my @columns = !exists $get{split} ? \@chars2 : + ([@chars2[0, 1, 3, 4, 6]], [@chars2[2, 5, 7]]); + +if ($mode) { + my $xorg = do 'data/digraphs-xorg.inc.pl' + or die "Error loading Xorg data: ", $@ // $!; + $_ = [ord $_] for values %{$xorg}; + $xorg->{$_}->[2] = # class = compatibility + $di->{$_} ? $di->{$_}->[0] != $xorg->{$_}->[0] ? 'l1' : # conflict + $di->{$_}->[2] =~ /\bu-di\b/ ? 'l5' : 'l3' : 'l2' # rfc|any|none + for keys %{$xorg}; + + for my $cp (map {$_->[0]} values %{$xorg}) { + next if (state $seen = {})->{$cp}++; # List::MoreUtils::uniq + + # find multiple equivalent mnemonics + my @equiv = grep {$cp eq $_->[0]} + map {$xorg->{$_}} sort keys %{$xorg}; # values ordered by mnem. + + # search for the most compatible match + my ($compat) = sort { + $equiv[$b]->[2] cmp $equiv[$a]->[2] # highest level + || $b <=> $a # fallback to last mnemonic + } 0 .. $#equiv; + + # reclassify all but one as level 0 (omitted) + splice @equiv, $compat // -1, 1, (); + $_->[2] = 'l0 ex' for @equiv; + } + + $chars2[0] = [qw( # ^ _ ` ~ )]; + @chars = @chars2; + $di = $xorg; +} -print ''; +for my $colchars (@columns) { +print '
'; +print qq'' for map {scalar @$_} @{$colchars}; +say ''; for my $section (qw{thead tfoot}) { - print "<$section>'; -for my $c1 (@chars) { - print "'; + for my $c1 (@$c1group) { + print '
 "; - print "$_" for @chars2; + print "<$section>
↳"; + print '', EscapeHTML($_) for map {@$_} @{$colchars}; + say ' '; } -print '
$c1"; - for my $c2 (@chars2) { - my $mnem = $c1 . $c2; - if (not defined $di->{$mnem}) { - print ''; - next; +for my $c1group (@chars) { + print '
', EscapeHTML($c1); + for my $c2 (map {@$_} @$colchars) { + my $mnem = $c1 . $c2; + if (not defined $di->{$mnem}) { + print ''; + next; + } + if (ref $di->{$mnem} ne 'ARRAY') { + printf '', EscapeHTML($mnem); + next; + } + my ($codepoint, $name, $support, $script, $string) = @{ $di->{$mnem} }; + + my $glyph = $string || chr $codepoint; + utf8::upgrade($glyph); # prevent latin1 output + my $desc = $mnem . ($name && " ($name)"); + my @class = ('X', grep {$_} $support && "u-$support", $script); + + $glyph = EscapeHTML($glyph); + $glyph = "$glyph" if $script =~ /\bZs\b/; + + printf "\n".'%s', + join(' ', @class), EscapeHTML($desc), $glyph; } - my ($codepoint, $name, $prop, $script) = @{ $di->{$mnem} }; - - my $glyph = chr $codepoint; - utf8::upgrade($glyph); # prevent latin1 output - my $desc = $mnem . ($name && " ($name)"); - my @class = ('X', grep {$_} $prop, $script); - - $glyph = quote($glyph); - $glyph = "$glyph" if $prop eq 'Zs'; - - printf "\n".'%s', - join(' ', @class), quote($desc), $glyph; + say "\n", EscapeHTML($c1); } - print "\n$c1\n"; } -print "
\n"; +say ''; +print '


' if exists $get{split}; +} + +if ($mode) { :> -
- +
+
+
matching RFC-1345 + matching proposal + unique to Xorg + conflict + duplicate +
+
+<: } else { :> +
+
control - spacing - modifier - spacing modifier + space + combining + spacing modifier quote punctuation symbol @@ -154,17 +162,18 @@ print "
\n"; latin hebrew arabic + korean japanese chinese - -
unicode - ascii - latin1 - private - proposed + +
full support + vim extension + vim v8.0 + proposal + not in vim
- +<: }