charset cheat sheet

Character encoding

Encoding $input unknown

$input

$name"; } -my @nibble = (0..9, 'A'..'F'); for my $row (@request) { + my $cols = $row->{cols}; + my $colsize = $row->{cell} && $row->{cell}->{colsize} || 1; + my $coldigits = ceil(log($colsize * $cols) / log(16)); # uniform length of hexadecimal header + my $rowdiv = 16 ** $coldigits; # row divide for column digits + $rowdiv = 1 if $rowdiv != $cols * $colsize; # divide only if all columns are matched + my $offset = 0; + my $endpoint = $offset + (length($row->{table}) || 256) * $colsize; + printf '

', !$row->{cell} && ' charmap'; - printf '', $row->{set}; - print '' x 17; + my $title = $row->{set}; + $title .= " " for $row->{setnote} // (); + printf '', $title; + print '' x ($cols + 1); for my $section (qw{thead}) { - print "<$section>'; - for my $msb (0 .. (length($row->{table}) || 256) - 1 >> 4) { - printf '

%s
â±"; - print '	', $_ for @nibble; + print "<$section>
", $rowdiv == 1 ? '+' : 'â±'; + printf '	%0X', $coldigits, $_ $colsize for 0 .. $cols - 1; print "\n"; } print '
%X', $msb + ($row->{offset} >> 4); - for my $lsb (0 .. $#nibble) { + while ($offset < $endpoint - 1) { + print '
'; + { + if (my $rowmod = $offset % $rowdiv) { + # offset in column units + printf '+%X', $rowmod; + } + else { + # divided row offset + printf '%X', ($offset + $row->{offset}) / $rowdiv; + } + } + for (1 .. $cols) { if ($row->{cell}) { - print $row->{cell}->(($msb<<4) + $lsb); + print range_cell($row, $offset); next; } - my $glyph = substr $row->{table}, ($msb<<4) + $lsb, 1; + my $glyph = substr $row->{table}, $offset, 1; if ($glyph eq $NOCHAR) { print '	'; next; } - my $info = [ord $glyph]; - if (defined (my $mnem = $di{ord $glyph})) { - $info = $diinfo->{$mnem}; - } - else { - require Unicode::UCD; - my $fullinfo = Unicode::UCD::charinfo(ord $glyph); - $info = [@$fullinfo{qw/code name category script string/}] if $fullinfo; - } - my ($codepoint, $name, $prop, $script, $string) = @$info; - - $glyph = quote($string \|\| $glyph); - my $desc = sprintf 'U+%04X%s', $codepoint, $name && " ($name)"; - my @class = ('X', grep {$_} $prop, $script); - - $glyph = "$glyph" if $prop eq 'Zs'; - - printf "\n".'	%s', - join(' ', @class), quote($desc), $glyph; + print "\n".$glyphs->glyph_cell($glyph); + } + continue { + $offset += $colsize; } print "\n"; } - print "

\n"; + say ''; } :> @@ -195,7 +270,7 @@ for my $row (@request) { -

unicode 5.0 +

unicode 7.0

proposed

deprecated

unassigned @@ -203,14 +278,3 @@ for my $row (@request) {

- - -