charset: unicode block allocations for plane 1
author Mischa POSLAWSKY <perl@shiar.org>
Fri, 13 Mar 2015 09:50:31 +0000 (10:50 +0100)
committer Mischa POSLAWSKY <perl@shiar.org>
Tue, 9 Jun 2015 03:43:44 +0000 (05:43 +0200)
charset-unicode.inc.pl
charset.plp

index 2b709c287b9f716f50fc5bfd56712b44289c1b0b..94bbd67301e4745a8ee874891ca314347b4116b5 100644 (file)
@@ -178,6 +178,241 @@ my %uniblock = (
        0xFE7, '<td colspan="9" class="X Xd L Arabic">arabic presentation B',
        0xFF0, '<td colspan="15" class="X L Latin">halfwidth &amp; fullwidth forms',
        0xFFF, '<td colspan="1" class="X Cc">sp',
+
+       0x1000, '<td colspan="8" class="X L Syllabic">linear B syllabary',
+       0x1008, '<td colspan="8" class="X L Syllabic">linear B ideograms',
+       0x1010, '<td colspan="4" class="X No">aegean num',
+       0x1014, '<td colspan="5" class="X No">greek numbers',
+       0x1019, '<td colspan="4" class="X So">ancient sym',
+       0x101D, '<td colspan="3" class="X L Syllabic">phaistos',
+       0x1020, '<td colspan="8" class="">reserved',
+       0x1028, '<td colspan="2" class="X L Greek">lycian',
+       0x102A, '<td colspan="4" class="X L Greek">carian',
+       0x102E, '<td colspan="2" class="X L No">coptic',
+       0x1030, '<td colspan="3" class="X L Greek">italic',
+       0x1033, '<td colspan="2" class="X L Greek">gothic',
+       0x1035, '<td colspan="3" class="X L Cyrillic">permic',
+       0x1038, '<td colspan="2" class="X L Alpha">ugarit',
+       0x103A, '<td colspan="4" class="X L Alpha">old persian',
+       0x103E, '<td colspan="2" class="">res',
+       0x1040, '<td colspan="5" class="X L Alpha">deseret',
+       0x1045, '<td colspan="3" class="X L Alpha">shavian',
+       0x1048, '<td colspan="3" class="X L Alpha">osmanya',
+       0x104B, '<td colspan="5" class="X Xr L Alpha">osage',
+       0x1050, '<td colspan="3" class="X L Alpha">elbasan',
+       0x1053, '<td colspan="4" class="X L Alpha">c albanian',
+       0x1057, '<td colspan="1" class="X Xr L Alpha">qs',
+       0x1058, '<td colspan="5" class="X Xr L Alpha">vithkuqi',
+       0x105D, '<td colspan="1" class="">res',
+       0x105E, '<td colspan="2" class="X Xr L Syllabic">iber',
+       0x1060, '<td colspan="16" class="X L Syllabic">linear A',
+       0x1070, '<td colspan="8" class="X L Syllabic">linear A',
+       0x1078, '<td colspan="4" class="X L Alpha">todhri',
+       0x107C, '<td colspan="4" class="X L Syllabic">cyp minoan',
+       0x1080, '<td colspan="4" class="X L Syllabic">cypriot',
+       0x1084, '<td colspan="2" class="X L Aramaic">aram',
+       0x1086, '<td colspan="2" class="X L Aramaic">palmr',
+       0x1088, '<td colspan="3" class="X L Aramaic">nabataean',
+       0x108B, '<td colspan="1" class="">res', # nabataean (0x1088, colspan 3) runs through 0x108A
+       0x108C, '<td colspan="2" class="X Xr L Alpha">numid',
+       0x108E, '<td colspan="2" class="X Xr L Aramaic">hatr',
+       0x1090, '<td colspan="2" class="X L Aramaic">phoen',
+       0x1092, '<td colspan="2" class="X L Greek">lydian',
+       0x1094, '<td colspan="4" class="">reserved',
+       0x1098, '<td colspan="2" class="X L Alpha" title="meroitic hieroglyphs">mero h',
+       0x109A, '<td colspan="6" class="X L Alpha">meroitic cursive',
+       0x10A0, '<td colspan="6" class="X L Syllabic">kharoshthi',
+       0x10A6, '<td colspan="2" class="X L Aramaic">s arab',
+       0x10A8, '<td colspan="2" class="X L Aramaic">n arab',
+       0x10AA, '<td colspan="2" class="X Xr L Brahmic">balti',
+       0x10AC, '<td colspan="4" class="X L Aramaic">manichaean',
+       0x10B0, '<td colspan="4" class="X L Aramaic">avestan',
+       0x10B4, '<td colspan="2" class="X L Aramaic">parth',
+       0x10B6, '<td colspan="2" class="X L Aramaic" title="inscriptional pahlavi">pahlav',
+       0x10B8, '<td colspan="3" class="X L Aramaic" title="psalter pahlavi">psalt pahl',
+       0x10BB, '<td colspan="3" class="X Xr L Aramaic" title="book pahlavi">book pahl',
+       0x10BE, '<td colspan="2" class="X Xr L Alpha">babur',
+       0x10C0, '<td colspan="5" class="X L Aramaic">old turkic',
+       0x10C5, '<td colspan="3" class="">reserved',
+       0x10C8, '<td colspan="8" class="X Xr L Aramaic">old hungarian',
+       0x10D0, '<td colspan="4" class="X Xr L Alpha">rohingya',
+       0x10D4, '<td colspan="4" class="X Xr L Alpha">garay',
+       0x10D8, '<td colspan="8" class="">reserved',
+       0x10E0, '<td colspan="6" class="X Xr L Aramaic">sogdian',
+       0x10E6, '<td colspan="2" class="X No">rumi',
+       0x10E8, '<td colspan="6" class="X Xr L Aramaic">uyghur',
+       0x10EE, '<td colspan="2" class="X Xr L Aramaic">elym',
+       0x10F0, '<td colspan="16" class="">reserved',
+       0x1100, '<td colspan="8" class="X L Brahmic">brahmi',
+       0x1108, '<td colspan="5" class="X L Brahmic">kaithi',
+       0x110D, '<td colspan="3" class="X L Brahmic">sora som',
+       0x1110, '<td colspan="5" class="X L Brahmic">chakma',
+       0x1115, '<td colspan="3" class="X L Brahmic">mahajani',
+       0x1118, '<td colspan="6" class="X L Brahmic">sharada',
+       0x111E, '<td colspan="2" class="X No Brahmic">sinhal',
+       0x1120, '<td colspan="5" class="X L Brahmic">khojki',
+       0x1125, '<td colspan="3" class="X Xr L Brahmic">landa',
+       0x1128, '<td colspan="3" class="X Xr L Brahmic">multani',
+       0x112B, '<td colspan="5" class="X L Brahmic">khudabadi',
+       0x1130, '<td colspan="8" class="X L Brahmic">grantha',
+       0x1138, '<td colspan="6" class="X Xr L Brahmic">tulu',
+       0x113E, '<td colspan="2" class="X Xr L Brahmic" title="sharada extension">shar+',
+       0x1140, '<td colspan="8" class="X Xr L Brahmic">newar',
+       0x1148, '<td colspan="6" class="X L Brahmic">tirhuta',
+       0x114E, '<td colspan="2" class="X Xr L Alpha">tani',
+       0x1150, '<td colspan="6" class="X Xr L Brahmic">ranjana',
+       0x1156, '<td colspan="2" class="">res',
+       0x1158, '<td colspan="8" class="X L Brahmic">siddham',
+       0x1160, '<td colspan="6" class="X L Brahmic">modi',
+       0x1166, '<td colspan="2" class="X Xr L Aramaic" title="mongolian extension">mong',
+       0x1168, '<td colspan="5" class="X L Brahmic">takri',
+       0x116D, '<td colspan="3" class="X Xr L Brahmic">jenticha',
+       0x1170, '<td colspan="4" class="X Xr L Brahmic">ahom',
+       0x1174, '<td colspan="6" class="X Xr L Alpha">zou',
+       0x117A, '<td colspan="6" class="X Xr L Brahmic">pyu',
+       0x1180, '<td colspan="4" class="X Xr L Brahmic">khema',
+       0x1184, '<td colspan="4" class="X Xr L Brahmic">khe prih',
+       0x1188, '<td colspan="2" class="">reserved', #TODO
+       0x118A, '<td colspan="6" class="X L Syllabic">warang citi',
+       0x1190, '<td colspan="4" class="X Xr L Brahmic">tolong siki',
+       0x1194, '<td colspan="4" class="X Xr L Brahmic">tikamuli',
+       0x1198, '<td colspan="4" class="X Xr L Brahmic">khambu rai',
+       0x119C, '<td colspan="4" class="X Xr L Brahmic">kirat rai',
+       0x11A0, '<td colspan="5" class="X Xr L Brahmic">zanabazar square',
+       0x11A5, '<td colspan="6" class="X Xr L Brahmic">soyombo',
+       0x11AB, '<td colspan="1" class="">res',
+       0x11AC, '<td colspan="4" class="X L Alpha">pau cin hau',
+       0x11B0, '<td colspan="5" class="X Xr L Brahmic">dhives akuru',
+       0x11B5, '<td colspan="4" class="X Xr L Brahmic">leke',
+       0x11B9, '<td colspan="6" class="X Xr L Brahmic">gondi',
+       0x11BF, '<td colspan="1" class="">res',
+       0x11C0, '<td colspan="7" class="X Xr L Brahmic">bhaiksuki',
+       0x11C7, '<td colspan="5" class="X Xr L Brahmic">marchen',
+       0x11CC, '<td colspan="4" class="X Xr L Brahmic">balti B',
+       0x11D0, '<td colspan="5" class="X Xr L Brahmic">kawi',
+       0x11D5, '<td colspan="6" class="X Xr L Brahmic">nandinagari',
+       0x11DB, '<td colspan="5" class="">reserved',
+       0x11E0, '<td colspan="6" class="X Xr L Brahmic">chalukya',
+       0x11E6, '<td colspan="6" class="X Xr L Brahmic">chola',
+       0x11EC, '<td colspan="4" class="">reserved',
+       0x11F0, '<td colspan="6" class="X Xr Brahmic">satavahana',
+       0x11F6, '<td colspan="6" class="X Xr L Brahmic" title="Tocharian &amp; Khotanese">turkestani',
+       0x11FC, '<td colspan="4" class="X Xr L Brahmic">tamil+',
+       0x1200, '<td colspan="16" rowspan="4" class="X L Syllabic">cuneiform',
+       0x1240, '<td colspan="8" class="X No">cuneiform numbers',
+       0x1248, '<td colspan="8" class="X Xr L Syllabic">early dynastic cuneiform',
+       0x1250, '<td colspan="8" class="X Xr L Syllabic">early dynastic cuneiform',
+       0x1258, '<td colspan="8" class="">reserved',
+       0x1260, '<td colspan="16" rowspan="8" class="X Xr L Syllabic">proto-cuneiform',
+       0x12E0, '<td colspan="16" class="X Xr L Syllabic">indus',
+       0x12F0, '<td colspan="9" class="X Xr L Syllabic">indus',
+       0x12F9, '<td colspan="7" class="">reserved',
+       0x1300, '<td colspan="16" rowspan="4" class="X L Syllabic">egyptian hieroglyphs',
+       0x1340, '<td colspan="3" class="X L Syllabic">egyptian',
+       0x1343, '<td colspan="13" class="">reserved',
+       0x1350, '<td colspan="16" rowspan="12" class="X Xr L Syllabic">egyptian hieroglyphs extended',
+       0x1410, '<td colspan="16" rowspan="3" class="X Xr L Syllabic">pau cin hau syllabary',
+       0x1440, '<td colspan="16" rowspan="2" class="X Xr L Syllabic">anatolian hieroglyphs',
+       0x1460, '<td colspan="8" class="X Xr L Syllabic">anatolian hieroglyphs',
+       0x1468, '<td colspan="8" class="">reserved',
+       0x1470, '<td colspan="16" rowspan="4" class="X Xr L Syllabic">eskaya',
+       0x14B0, '<td colspan="6" class="X Xr L Syllabic">eskaya',
+       0x14B6, '<td colspan="10" class="">reserved',
+       0x14C0, '<td colspan="16" rowspan="8" class="">reserved',
+       0x1540, '<td colspan="16" rowspan="5" class="X Xr L Syllabic">maya hieroglyphs',
+       0x1590, '<td colspan="16" rowspan="3" class="">reserved',
+       0x15C0, '<td colspan="16" rowspan="4" class="X Xr L Syllabic">aztec pictograms',
+       0x1600, '<td colspan="8" class="X Xr L Alpha">cirth',
+       0x1608, '<td colspan="8" class="X Xr L Alpha">tengwar',
+       0x1610, '<td colspan="10" class="">reserved',
+       0x161A, '<td colspan="6" class="X Xr L Alpha">moon',
+       0x1620, '<td colspan="16" rowspan="5" class="X Xr L Syllabic">blissymbols',
+       0x1670, '<td colspan="11" class="X Xr L Syllabic">bagam',
+       0x167B, '<td colspan="5" class="">reserved',
+       0x1680, '<td colspan="16" rowspan="2" class="X L Syllabic">bamum supplement',
+       0x16A0, '<td colspan="4" class="X L Syllabic">bamum+',
+       0x16A4, '<td colspan="3" class="X L Alpha">mro',
+       0x16A7, '<td colspan="6" class="X Xr L Alpha">mossang tangsa',
+       0x16AD, '<td colspan="3" class="X L Alpha">bassa vah',
+       0x16B0, '<td colspan="9" class="X L Syllabic">pahawh hmong',
+       0x16B9, '<td colspan="7" class="X Xr L Syllabic">woleai',
+       0x16C0, '<td colspan="8" class="X Xr L Syllabic">kpelle',
+       0x16C8, '<td colspan="5" class="X Xr L Syllabic">afaka',
+       0x16CD, '<td colspan="3" class="X Xr L Syllabic" title="Latsam Khimhun Tangsa">lk tangsa',
+       0x16D0, '<td colspan="13" class="X Xr L Syllabic">loma',
+       0x16DD, '<td colspan="3" class="X Xr L Alpha">zaghawa',
+       0x16E0, '<td colspan="5" class="X Xr L Alpha">mwangwego',
+       0x16E5, '<td colspan="11" class="">reserved',
+       0x16F0, '<td colspan="10" class="X L Syllabic">miao',
+       0x16FA, '<td colspan="4" class="">reserved',
+       0x16FE, '<td colspan="2" class="X Xr So" title="Ideographic Symbols and Punctuation">ideo',
+       0x1700, '<td colspan="16" rowspan="24" class="X Xr L Syllabic">tangut ideographs',
+       0x1880, '<td colspan="16" class="">reserved',
+       0x1890, '<td colspan="16" rowspan="3" class="X Xr L Syllabic">tangut radicals',
+       0x18C0, '<td colspan="16" rowspan="4" class="">reserved',
+       0x1900, '<td colspan="16" rowspan="5" class="X Xr L Han">jurchen',
+       0x1950, '<td colspan="6" class="X Xr L Han">jurchen',
+       0x1956, '<td colspan="4" class="X Xr L Han">jurchen rad',
+       0x195A, '<td colspan="6" class="">reserved',
+       0x1960, '<td colspan="16" class="X Xr L Han">khitan small',
+       0x1970, '<td colspan="8" class="X Xr L Han">khitan small',
+       0x1978, '<td colspan="8" class="">reserved',
+       0x1980, '<td colspan="16" rowspan="9" class="X Xr L Han">khitan large',
+       0x1A10, '<td colspan="16" rowspan="7" class="">reserved',
+       0x1A80, '<td colspan="16" rowspan="2" class="X Xr L Syllabic">naxi geba',
+       0x1AA0, '<td colspan="11" class="X Xr L Syllabic">naxi geba',
+       0x1AAB, '<td colspan="1" class="">res',
+       0x1AAC, '<td colspan="4" class="X Xr L Syllabic">naxi dongba',
+       0x1AB0, '<td colspan="16" rowspan="5" class="X Xr L Syllabic">naxi dongba',
+       0x1B00, '<td colspan="16" class="X L Hiragana">kana supplement',
+       0x1B10, '<td colspan="16" class="X Xr L Han">nushu',
+       0x1B20, '<td colspan="9" class="X Xr L Han">nushu',
+       0x1B29, '<td colspan="7" class="">reserved',
+       0x1B30, '<td colspan="8" class="X Xr L Syllabic">kaida',
+       0x1B38, '<td colspan="8" class="">reserved',
+       0x1B40, '<td colspan="16" class="">reserved',
+       0x1B50, '<td colspan="16" rowspan="7" class="X Xr L Syllabic">proto-elamite',
+       0x1BC0, '<td colspan="10" class="X L Alpha">duployan',
+       0x1BCA, '<td colspan="1" class="X L Cc" title="Shorthand Formatting">sh',
+       0x1BCB, '<td colspan="5" class="X Xr L Alpha">pitman',
+       0x1BD0, '<td colspan="16" rowspan="19" class="">reserved', # no allocations through 0x1CFF
+       0x1D00, '<td colspan="16" class="X So">byzantine musical',
+       0x1D10, '<td colspan="16" class="X So">musical symbols',
+       0x1D20, '<td colspan="5" class="X So">anc greek music',
+       0x1D25, '<td colspan="11" class="">reserved',
+       0x1D30, '<td colspan="6" class="X So" title="tetragrams">tai xuan jing',
+       0x1D36, '<td colspan="2" class="X No">rod',
+       0x1D38, '<td colspan="8" class="">reserved',
+       0x1D40, '<td colspan="16" rowspan="4" class="X L Latin">mathematical alphanumeric', # Sm
+       0x1D80, '<td colspan="16" rowspan="3" class="X Xr L Alpha">sutton',
+       0x1DB0, '<td colspan="16" rowspan="5" class="">reserved',
+       0x1E00, '<td colspan="3" class="X Xr L Cyrillic">glagol+',
+       0x1E03, '<td colspan="13" class="">reserved',
+       0x1E10, '<td colspan="16" rowspan="7" class="">reserved',
+       0x1E80, '<td colspan="14" class="X L Syllabic">mende kikakui',
+       0x1E8E, '<td colspan="2" class="">res', # pads the mende kikakui row up to 0x1E90
+       0x1E90, '<td colspan="6" class="X Xr L Alpha">adlam',
+       0x1E96, '<td colspan="10" class="">reserved',
+       0x1EA0, '<td colspan="16" rowspan="2" class="">reserved',
+       0x1EC0, '<td colspan="7" class="X Xr No">persian siyaq',
+       0x1EC7, '<td colspan="5" class="X Xr No">indic siyaq',
+       0x1ECC, '<td colspan="4" class="X Xr No">diwani siyaq',
+       0x1ED0, '<td colspan="4" class="X Xr No">ottoman siyaq',
+       0x1ED4, '<td colspan="12" class="">reserved',
+       0x1EE0, '<td colspan="16" class="X L Arabic">arabic mathematical alphabetic', # Sm
+       0x1EF0, '<td colspan="16" class="">reserved',
+       0x1F00, '<td colspan="3" class="X So">mahjong',
+       0x1F03, '<td colspan="7" class="X So">domino tiles',
+       0x1F0A, '<td colspan="6" class="X So">playing cards',
+       0x1F10, '<td colspan="16" class="X L Latin">enclosed alphanumeric supplement', # So
+       0x1F20, '<td colspan="16" class="X L Han">enclosed ideographic supplement', # So
+       0x1F30, '<td colspan="16" rowspan="3" class="X So">miscellaneous symbols and pictographs',
+       0x1F60, '<td colspan="5" class="X So">emoticons',
+       0x1F65, '<td colspan="3" class="X So">ornament',
+       0x1F68, '<td colspan="8" class="X So">transport',
+       0x1F70, '<td colspan="8" class="X So">alchemical',
+       0x1F78, '<td colspan="8" class="X So">geometric shapes ext',
+       0x1F80, '<td colspan="16" class="X So">supplemental arrows-C',
+       0x1F90, '<td colspan="16" rowspan="7" class="">reserved',
 );
 
 sub {
index 26b58e4af9bbcf2baca42b180a89fcb734247c63..98a7345b28d072bf254a9ac37f82af7d85812c7a 100644 (file)
@@ -64,7 +64,7 @@ my @request = map {
                }
                elsif ($row{set} = resolve_alias($input)) {
                        if ($row{set} eq 'Internal') {
-                               $row{table} = ' ' x ($endpoint < 255 ? 640 : 4096);
+                               $row{table} = ' ' x ($endpoint < 255 ? 640 : 8192);
                                $row{set} = 'Unicode BMP';
                                $row{cell} = do 'charset-unicode.inc.pl';
                        }