digraph cheat sheet

Character mnemonics following compose key â<: +say join("\n", + $mode ? ( + ' in the X Window System (Shift+AltGr by default).', + 'Differences from RFC-1345 are indicated.', + ) : (':', + 'i^k in Vim,', + '^u^\ in Emacs,', + '^a^v in Screen.', + 'Similar but different from X.Org.', + ), + 'Also see common Unicode.

Unofficial proposals', + ' are available as ex commands.' if not $mode; +:> <: -my $di = do 'digraphs.inc.pl'; - -sub quote { - local $_ = shift; - s/"/"/g; - s//>/g; - return $_; +my $di = do 'digraphs.inc.pl' + or die "Error loading digraphs data: ", $@ // $!; + +if (exists $get{v}) { + # show characters for inverted mnemonics (vim alternatives) + $di->{ substr($_, 1, 1) . substr($_, 0, 1) } ||= + [ $di->{$_}->[0], '', 'l0 ex', '', $di->{$_}->[4] ] + for grep { ref $di->{$_} } keys %{$di}; } -my @chars = ((map {chr} ord '!' .. ord 'Z'), 'a'..'z'); -splice @chars, $_, 1, () for 2, 3-1, 5-2, 31-3; # remove character exceptions # $ & @ -my @chars2 = (@chars, '_'); # trailing character (extended set) +my @chars = ( + [qw{! " % ' ( ) * + , - . /}], + ['0'..'9'], [qw{: ; < = > ?}], + ['A'..'M'], ['N'..'Z'], + ['a'..'m'], ['n'..'z'], +); +my @chars2 = (['_'], @chars); # trailing character (extended set) +my @columns = !exists $get{split} ? \@chars2 : + ([@chars2[0, 1, 3, 4, 6]], [@chars2[2, 5, 7]]); + +if ($mode) { + my $xorg = do 'data/digraphs-xorg.inc.pl' + or die "Error loading Xorg data: ", $@ // $!; + $_ = [ord $_] for values %{$xorg}; + $xorg->{$_}->[2] = # class = compatibility + $di->{$_} ? $di->{$_}->[0] != $xorg->{$_}->[0] ? 'l1' : # conflict + $di->{$_}->[2] =~ /\bu-di\b/ ? 'l5' : 'l3' : 'l2' # rfc|any|none + for keys %{$xorg}; + + for my $cp (map {$_->[0]} values %{$xorg}) { + next if (state $seen = {})->{$cp}++; # List::MoreUtils::uniq + + # find multiple equivalent mnemonics + my @equiv = grep {$cp eq $_->[0]} + map {$xorg->{$_}} sort keys %{$xorg}; # values ordered by mnem. + + # search for the most compatible match + my ($compat) = sort { + $equiv[$b]->[2] cmp $equiv[$a]->[2] # highest level + || $b <=> $a # fallback to last mnemonic + } 0 .. $#equiv; + + # reclassify all but one as level 0 (omitted) + splice @equiv, $compat // -1, 1, (); + $_->[2] = 'l0 ex' for @equiv; + } + + $chars2[0] = [qw( # ^ _ ` ~ )]; + @chars = @chars2; + $di = $xorg; +} -print ''; +for my $colchars (@columns) { +print '

'; +print qq'' for map {scalar @$_} @{$colchars}; +say ''; for my $section (qw{thead tfoot}) { - print "<$section>'; -for my $c1 (@chars) { - print "'; + for my $c1 (@$c1group) { + print '

"; - print "	$_" for @chars2; + print "<$section>
â³"; + print '	', EscapeHTML($_) for map {@$_} @{$colchars}; + say '	'; } -print '
$c1"; - for my $c2 (@chars2) { - my $mnem = $c1 . $c2; - if (not defined $di->{$mnem}) { - print '	'; - next; +for my $c1group (@chars) { + print '
', EscapeHTML($c1); + for my $c2 (map {@$_} @$colchars) { + my $mnem = $c1 . $c2; + if (not defined $di->{$mnem}) { + print '	'; + next; + } + if (ref $di->{$mnem} ne 'ARRAY') { + printf '	', EscapeHTML($mnem); + next; + } + my ($codepoint, $name, $support, $script, $string) = @{ $di->{$mnem} }; + + my $glyph = $string \|\| chr $codepoint; + utf8::upgrade($glyph); # prevent latin1 output + my $desc = $mnem . ($name && " ($name)"); + my @class = ('X', grep {$_} $support && "u-$support", $script); + + $glyph = EscapeHTML($glyph); + $glyph = "$glyph" if $script =~ /\bZs\b/; + + printf "\n".'	%s', + join(' ', @class), EscapeHTML($desc), $glyph; } - my ($codepoint, $name, $prop, $script) = @{ $di->{$mnem} }; - - my $glyph = chr $codepoint; - utf8::upgrade($glyph); # prevent latin1 output - my $desc = $mnem . ($name && " ($name)"); - my @class = ('X', grep {$_} $prop, $script); - - $glyph = quote($glyph); - $glyph = "$glyph" if $prop eq 'Zs'; - - printf "\n".'	%s', - join(' ', @class), quote($desc), $glyph; + say "\n	", EscapeHTML($c1); } - print "\n	$c1\n"; } -print "

\n"; +say ''; +print '

- +

matching RFC-1345
+	matching proposal
+	unique to Xorg
+	conflict
+	duplicate
+	

control -

spacing -

modifier -

spacing modifier +

space +

combining +

spacing modifier

quote

punctuation

symbol @@ -154,17 +162,18 @@ print "

\n"; latin hebrew arabic + korean japanese chinese - -

unicode -

ascii -

latin1 -

private -

proposed + +

full support +

vim extension +

vim v8.0 +

proposal +

not in vim

- +<: }

RFC-1345 Digraphs

<:= $modename :> Digraphs