X-Git-Url: http://git.shiar.nl/sheet.git/blobdiff_plain/130c94fc7747fd586b677f48fbabd2ecf10297c5..1d6eab5fa03b9b245c50637bae352344f9f53ef5:/charset-ucplanes.inc.pl

Reviewer summary (derived only from the hunk below):
  * Removed: the flat %uniblock list and the anonymous sub that returned
    $uniblock{$_[0]}, or an empty list when that entry was undefined.
  * Added: a single anonymous hash (the leading "+" in "+{" is Perl's
    unary plus in front of the brace) holding a "colsize" entry plus one
    array per range, keyed by a hexadecimal start value.
  * In every added row, key + first array element equals the key of the
    next row (0x00000 .. 0x1FA00 + 0x0600 = 0x20000), so the first
    element looks like the size of the range.  The remaining strings are
    presumably a class list, a short label and an optional long label;
    confirm against the code that includes this file.
  * Indentation inside the hunk was lost in extraction; a single tab per
    entry is assumed here.

diff --git a/charset-ucplanes.inc.pl b/charset-ucplanes.inc.pl
index 607f8be..8042f70 100644
--- a/charset-ucplanes.inc.pl
+++ b/charset-ucplanes.inc.pl
@@ -1,83 +1,106 @@
 use utf8;
 
-my %uniblock = (
-	0x0000, 'ascii',
-	0x0008, 'latin',
-#	0x0028, 'spacing modifier',
-	0x0028, 'comb',
-	0x0038, 'grk',
-	0x0040, 'cyr',
-	0x0050, 'arm',
-	0x0058, 'heb',
-	0x0060, 'arabic',
-	0x0070, 'aram',
-	0x0080, 'aramaic',
-	0x0090, 'brahmic',
-	0x0100, 'mm',
-	0x0108, 'geor',
-	0x0110, 'jamo',
-	0x0120, 'ethiopic',
-	0x0138, 'aboriginal',
-	0x0168, 'ger',
-	0x0170, 'brahm',
-	0x0180, 'mon',
-	0x0188, 'can',
-	0x0190, 'brahmic',
-	0x01D0, 'extensions',
-	0x01F0, 'greek',
-	0x0200, '·…',
-	0x0208, 'symbols',
-	0x0220, 'maths',
-	0x0230, 'technical',
-	0x0248, '()',
-	0x0250, 'draw',
-	0x0260, 'symbols',
-	0x0280, 'braille',
-	0x0290, 'arr',
-	0x0298, 'maths',
-	0x02B0, 'misc',
-	0x02C0, 'ancient',
-	0x02D0, 'ext',
-	0x02E0, '·+',
-	0x02E8, 'radicals',
-	0x0300, 'japanese',
-	0x0310, 'cjk+',
-	0x0330, 'compat',
-	0x0340, '',
-	0x0380, 'cjk ideographs A', #+2
-	0x04E0, 'cjk unified ideographs',
-	0x0A00, 'yi',
-	0x0A48, 'lisu',
-	0x0A50, 'vai',
-	0x0A60, 'cyr',
-	0x0A68, 'bam',
-	0x0A70, 'lat-D',
-	0x0A80, 'brahmic',
-	0x0AB0, 'ext',
-	0x0AC0, '',
-	0x0B00, 'hangeul syllables',
-	0x0D80, 'surrogates',
-	0x0E00, 'private use',
-	0x0F80, '',
-	0x0F90, 'cjk compat',
-	0x0FB0, 'presentation',
-	0x0FF0, 'width',
-	0x7D80, 'presentation',
-	0x7DA8, '',
-	0x7E00, 'arabic presentation forms A',
-	0x7E80, '',
-	0x7EE8, '?',
-	0x7EF8, '',
-	0x7F00, 'var',
-	0x7F08, 'ver',
-	0x7F10, '½',
-	0x7F18, 'comp',
-	0x7F28, 'small',
-	0x7F38, 'arabic presentation B',
-	0x7F80, 'halfwidth & fullwidth forms',
-	0x7FF8, 'sp',
-);
-
-sub {
-	return defined $uniblock{$_[0]} ? $uniblock{$_[0]} : ();
-}
++{
+	colsize => 0x80,
+	0x00000 => [0x0080, 'X Po', 'ascii'],
+	0x00080 => [0x0200, 'X L Latin', 'latin'],
+	0x00280 => [0x0100, 'X Mn', 'diac', 'diacritics'], # also spacing Sk
+	0x00380 => [0x0080, 'X L Greek', 'grk', 'greek'],
+	0x00400 => [0x0100, 'X L Cyrillic', 'cyr', 'cyrillic'],
+	0x00500 => [0x0080, 'X L Armenian', 'arm', 'armenian'],
+	0x00580 => [0x0080, 'X L Aramaic', 'heb', 'hebrew'],
+	0x00600 => [0x0100, 'X L Arabic', 'arabic'],
+	0x00700 => [0x0200, 'X L African', 'rtl', 'various right-to-left scripts'],
+	0x00900 => [0x0500, 'X L Brahmic', 'brahmic'],
+	0x00E00 => [0x0100, 'X L Brahmic Khmer', 's-br', 'south brahmic: lao and thai'],
+	0x00F00 => [0x0100, 'X L Brahmic', 'tibet', 'tibetan'],
+	0x01000 => [0x0080, 'X L Brahmic', 'mm', 'myanmar'],
+	0x01080 => [0x0080, 'X L Aramaic', 'geor', 'georgian'],
+	0x01100 => [0x0100, 'X L Hangul', 'jamo'],
+	0x01200 => [0x0180, 'X L African', 'ethiopic'],
+	0x01380 => [0x0300, 'X L Syllabic', 'aboriginal', 'cherokee and canadian syllabics'],
+	0x01680 => [0x0080, 'X L Alpha', 'ger', 'germanic runes'],
+	0x01700 => [0x0100, 'X L Brahmic', 'brahm', 'various brahmic'],
+	0x01800 => [0x0080, 'X L Aramaic', 'mon', 'mongolian'],
+	0x01880 => [0x0080, 'X L Syllabic', 'can', 'canadian supplement'],
+	0x01900 => [0x0400, 'X L Brahmic', 'brahmic'],
+	0x01D00 => [0x0200, 'X L Latin', 'extensions'],
+	0x01F00 => [0x0100, 'X L Greek', 'greek'],
+	0x02000 => [0x0080, 'X Po', '·…', 'punctuation'],
+	0x02080 => [0x0180, 'X So', 'symbols'],
+	0x02200 => [0x0100, 'X Sm', 'maths'],
+	0x02300 => [0x0180, 'X So', 'technical'],
+	0x02480 => [0x0080, 'X Latin', '()', 'enclosed alphanumerics'],
+	0x02500 => [0x0100, 'X So', 'draw', 'box drawing and shapes'],
+	0x02600 => [0x0200, 'X So', 'symbols'],
+	0x02800 => [0x0100, 'X L Alpha', 'braille'],
+	0x02900 => [0x0080, 'X So', 'arr', 'arrows'],
+	0x02980 => [0x0180, 'X Sm', 'maths'],
+	0x02B00 => [0x0100, 'X So', 'misc', 'miscellaneous symbols'],
+	0x02C00 => [0x0100, 'X L Greek', 'ancient', 'glagolitic, latin, coptic'],
+	0x02D00 => [0x0100, 'X L Alpha', 'ext', 'extensions of various alphabets'],
+	0x02E00 => [0x0080, 'X Po', '·+', 'punctuation'],
+	0x02E80 => [0x0180, 'X L Han', 'radicals'],
+	0x03000 => [0x0100, 'X L Katakana', 'japanese'],
+	0x03100 => [0x0200, 'X L Han', 'cjk+'],
+	0x03300 => [0x0100, 'X Xd L Han', 'compat', 'cjk compatibility'],
+	0x03400 => [0x1A00, 'X L Han', 'cjk ideographs A'],
+	0x04E00 => [0x5200, 'X L Han', 'cjk unified ideographs'],
+	0x0A000 => [0x0480, 'X L Syllabic', 'yi'],
+	0x0A480 => [0x0080, 'X L Latin', 'lisu'],
+	0x0A500 => [0x0100, 'X L Syllabic', 'vai'],
+	0x0A600 => [0x0080, 'X L Cyrillic', 'cyr', 'cyrillic ext-B'],
+	0x0A680 => [0x0080, 'X L Syllabic', 'bam', 'bamum'],
+	0x0A700 => [0x0100, 'X L Latin', 'lat-D'],
+	0x0A800 => [0x0300, 'X L Brahmic', 'brahmic'],
+	0x0AB00 => [0x0100, 'X L Alpha', 'ext', 'various extensions'],
+	0x0AC00 => [0x2C00, 'X L Hangul', 'hangeul syllables'],
+	0x0D800 => [0x0800, 'X Cs', 'surrogates'],
+	0x0E000 => [0x1000, 'X Co', 'private use'],
+	0x0F000 => [0x0900, 'X Co', 'corporate use'],
+	0x0F900 => [0x0200, 'X L Han', 'cjk compat'],
+	0x0FB00 => [0x0400, 'X L Arabic', 'presentation'],
+	0x0FF00 => [0x0100, 'X L Latin', 'width'],
+	0x10000 => [0x0100, 'X L Syllabic', 'linear B'],
+	0x10100 => [0x0100, 'X No', 'a num'],
+	0x10200 => [0x0400, 'X L Alpha', 'ltr'],
+	0x10600 => [0x0180, 'X L Syllabic', 'linear A'],
+	0x10780 => [0x0080, 'X L Alpha', 'ltr'],
+	0x10800 => [0x0800, 'X L Aramaic', 'rtl'],
+	0x11000 => [0x1000, 'X L Brahmic', 'brahmic'],
+	0x12000 => [0x0600, 'X L Syllabic', 'cuneiform'],
+	0x12600 => [0x0800, 'X L Syllabic', 'proto-cuneiform'],
+	0x12E00 => [0x0200, 'X L Syllabic', 'indus'],
+	0x13000 => [0x1400, 'X L Syllabic', 'egyptian hieroglyphs'],
+	0x14400 => [0x0280, 'X L Syllabic', 'anatolian'],
+	0x14680 => [0x0980, 'X L Syllabic', 'egyptian'],
+	0x15000 => [0x0080, 'X L Brahmic', 'bra', 'brahmic'],
+	0x15080 => [0x0480, 'X L Syllabic', 'mandombe'],
+	0x15500 => [0x0B00, 'X L Syllabic', 'american hieroglyphs'],
+	0x16000 => [0x1000, 'X L Alpha', 'recent'],
+	0x17000 => [0x1B00, 'X L Syllabic', 'tangut'],
+	0x18B00 => [0x0B00, 'X L Han', 'khitan'],
+	0x19600 => [0x0600, 'X L Han', 'jurchen'],
+	0x19C00 => [0x1400, 'X L Han', 'southeast asian'],
+	0x1B000 => [0x0180, 'X L Hiragana', 'kana'],
+	0x1B180 => [0x0180, 'X L Han', 'nushu'],
+	0x1B300 => [0x0200, 'X L Han', 'shuishu'],
+	0x1B500 => [0x0700, 'X L Syllabic', 'proto-elamite'],
+	0x1BC00 => [0x0400, 'X L Alpha', 'shorthands'],
+	0x1C000 => [0x0B00, 'X L Syllabic', 'micmac hieroglyphs'],
+	0x1CB00 => [0x0300, 'X L Syllabic', 'rongorongo'],
+	0x1CE00 => [0x0200, '', 'large scripts'],
+	0x1D000 => [0x0380, 'X So', 'notational systems'],
+	0x1D380 => [0x0480, 'X Sm', 'math alphanumeric'],
+	0x1D800 => [0x0400, 'X L Alpha', 'sutton signs'],
+	0x1DC00 => [0x0400, '', 'notational'],
+	0x1E000 => [0x0800, 'X L Alpha', 'ltr'],
+	0x1E800 => [0x0600, 'X L Alpha', 'rtl'],
+	0x1EE00 => [0x0200, 'X L Arabic', 'arabic math'],
+	0x1F000 => [0x0100, 'X So', 'game'],
+	0x1F100 => [0x0200, 'X L So', 'enclosed'],
+	0x1F300 => [0x0500, 'X So', 'pictographic'],
+	0x1F800 => [0x0100, 'X So', 'arrows'],
+	0x1F900 => [0x0100, 'X So', 'pict', 'supplemental pictographs'],
+	0x1FA00 => [0x0600, '', 'unassigned'],
+};