From fc33639e320c49693604bf0e259a29a07f2076b4 Mon Sep 17 00:00:00 2001 From: Mischa POSLAWSKY Date: Fri, 13 Mar 2015 10:50:31 +0100 Subject: [PATCH] charset: unicode block allocations for plane 1 --- charset-unicode.inc.pl | 235 +++++++++++++++++++++++++++++++++++++++++ charset.plp | 2 +- 2 files changed, 236 insertions(+), 1 deletion(-) diff --git a/charset-unicode.inc.pl b/charset-unicode.inc.pl index 2b709c2..94bbd67 100644 --- a/charset-unicode.inc.pl +++ b/charset-unicode.inc.pl @@ -178,6 +178,241 @@ my %uniblock = ( 0xFE7, 'arabic presentation B', 0xFF0, 'halfwidth & fullwidth forms', 0xFFF, 'sp', + + 0x1000, 'linear B syllabary', + 0x1008, 'linear B ideograms', + 0x1010, 'aegean num', + 0x1014, 'greek numbers', + 0x1019, 'ancient sym', + 0x101D, 'phaistos', + 0x1020, 'reserved', + 0x1028, 'lycian', + 0x102A, 'carian', + 0x102E, 'coptic', + 0x1030, 'italic', + 0x1033, 'gothic', + 0x1035, 'permic', + 0x1038, 'ugarit', + 0x103A, 'old persian', + 0x103E, 'res', + 0x1040, 'deseret', + 0x1045, 'shavian', + 0x1048, 'osmanya', + 0x104B, 'osage', + 0x1050, 'elbasan', + 0x1053, 'c albanian', + 0x1057, 'qs', + 0x1058, 'vithkuqi', + 0x105D, 'res', + 0x105E, 'iber', + 0x1060, 'linear A', + 0x1070, 'linear A', + 0x1078, 'todhri', + 0x107C, 'cyp minoan', + 0x1080, 'cypriot', + 0x1084, 'aram', + 0x1086, 'palmr', + 0x1088, 'nabataean', + 0x108A, 'res', + 0x108C, 'numid', + 0x108E, 'hatr', + 0x1090, 'phoen', + 0x1092, 'lydian', + 0x1094, 'reserved', + 0x1098, 'mero h', + 0x109A, 'meroitic cursive', + 0x10A0, 'kharoshthi', + 0x10A6, 's arab', + 0x10A8, 'n arab', + 0x10AA, 'balti', + 0x10AC, 'manichaean', + 0x10B0, 'avestan', + 0x10B4, 'parth', + 0x10B6, 'pahlav', + 0x10B8, 'psalt pahl', + 0x10BB, 'book pahl', + 0x10BE, 'babur', + 0x10C0, 'old turkic', + 0x10C5, 'reserved', + 0x10C8, 'old hungarian', + 0x10D0, 'rohingya', + 0x10D4, 'garay', + 0x10D8, 'reserved', + 0x10E0, 'sogdian', + 0x10E6, 'rumi', + 0x10E8, 'uyghur', + 0x10EE, 'elym', + 0x10F0, 'reserved', + 0x1100, 'brahmi', + 0x1108, 'kaithi', + 0x110D, 'sora som', + 0x1110, 'chakma', + 0x1115, 'mahajani', + 0x1118, 'sharada', + 0x111E, 'sinhal', + 0x1120, 'khojki', + 0x1125, 'landa', + 0x1128, 'multani', + 0x112B, 'khudabadi', + 0x1130, 'grantha', + 0x1138, 'tulu', + 0x113E, 'shar+', + 0x1140, 'newar', + 0x1148, 'tirhuta', + 0x114E, 'tani', + 0x1150, 'ranjana', + 0x1156, 'res', + 0x1158, 'siddham', + 0x1160, 'modi', + 0x1166, 'mong', + 0x1168, 'takri', + 0x116D, 'jenticha', + 0x1170, 'ahom', + 0x1174, 'zou', + 0x117A, 'pyu', + 0x1180, 'khema', + 0x1184, 'khe prih', + 0x1188, 'reserved', #TODO + 0x118A, 'warang citi', + 0x1190, 'tolong siki', + 0x1194, 'tikamuli', + 0x1198, 'khambu rai', + 0x119C, 'kirat rai', + 0x11A0, 'zanabazar square', + 0x11A5, 'soyombo', + 0x11AB, 'res', + 0x11AC, 'pau cin hau', + 0x11B0, 'dhives akuru', + 0x11B5, 'leke', + 0x11B9, 'gondi', + 0x11BF, 'res', + 0x11C0, 'bhaiksuki', + 0x11C7, 'marchen', + 0x11CC, 'balti B', + 0x11D0, 'kawi', + 0x11D5, 'nandinagari', + 0x11DB, 'reserved', + 0x11E0, 'chalukya', + 0x11E6, 'chola', + 0x11EC, 'reserved', + 0x11F0, 'satavahana', + 0x11F6, 'turkestani', + 0x11FC, 'tamil+', + 0x1200, 'cuneiform', + 0x1240, 'cuneiform numbers', + 0x1248, 'early dynastic cuneiform', + 0x1250, 'early dynastic cuneiform', + 0x1258, 'reserved', + 0x1260, 'proto-cuneiform', + 0x12E0, 'indus', + 0x12F0, 'indus', + 0x12F9, 'reserved', + 0x1300, 'egyptian hieroglyphs', + 0x1340, 'egyptian', + 0x1343, 'reserved', + 0x1350, 'egyptian hieroglyphs extended', + 0x1410, 'pau cin hau syllabary', + 0x1440, 'anatolian hieroglyphs', + 0x1460, 'anatolian hieroglyphs', + 0x1468, 'reserved', + 0x1470, 'eskaya', + 0x14B0, 'eskaya', + 0x14B6, 'reserved', + 0x14C0, 'reserved', + 0x1540, 'maya hieroglyphs', + 0x1590, 'reserved', + 0x15C0, 'aztec pictograms', + 0x1600, 'cirth', + 0x1608, 'tengwar', + 0x1610, 'reserved', + 0x161A, 'moon', + 0x1620, 'blissymbols', + 0x1670, 'bagam', + 0x167B, 'reserved', + 0x1680, 'bamum supplement', + 0x16A0, 'bamum+', + 0x16A4, 'mro', + 0x16A7, 'mossang tangsa', + 0x16AD, 'bassa vah', + 0x16B0, 'pahawh hmong', + 0x16B9, 'woleai', + 0x16C0, 'kpelle', + 0x16C8, 'afaka', + 0x16CD, 'lk tangsa', + 0x16D0, 'loma', + 0x16DD, 'zaghawa', + 0x16E0, 'mwangwego', + 0x16E5, 'reserved', + 0x16F0, 'miao', + 0x16FA, 'reserved', + 0x16FE, 'ideo', + 0x1700, 'tangut ideographs', + 0x1880, 'reserved', + 0x1890, 'tangut radicals', + 0x18C0, 'reserved', + 0x1900, 'jurchen', + 0x1950, 'jurchen', + 0x1956, 'jurchen rad', + 0x195A, 'reserved', + 0x1960, 'khitan small', + 0x1970, 'khitan small', + 0x1978, 'reserved', + 0x1980, 'khitan large', + 0x1A10, 'reserved', + 0x1A80, 'naxi geba', + 0x1AA0, 'naxi geba', + 0x1AAB, 'res', + 0x1AAC, 'naxi dongba', + 0x1AB0, 'naxi dongba', + 0x1B00, 'kana supplement', + 0x1B10, 'nushu', + 0x1B20, 'nushu', + 0x1B29, 'reserved', + 0x1B30, 'kaida', + 0x1B38, 'reserved', + 0x1B40, 'reserved', + 0x1B50, 'proto-elamite', + 0x1BC0, 'duployan', + 0x1BCA, 'sh', + 0x1BCB, 'pitman', + 0x1D00, 'byzantine musical', + 0x1D10, 'musical symbols', + 0x1D20, 'anc greek music', + 0x1D25, 'reserved', + 0x1D30, 'tai xuan jing', + 0x1D36, 'rod', + 0x1D38, 'reserved', + 0x1D40, 'mathematical alphanumeric', # Sm + 0x1D80, 'sutton', + 0x1DB0, 'reserved', + 0x1E00, 'glagol+', + 0x1E03, 'reserved', + 0x1E10, 'reserved', + 0x1E80, 'mende kikakui', + 0x1E90, 'adlam', + 0x1E96, 'reserved', + 0x1EA0, 'reserved', + 0x1EC0, 'persian siyaq', + 0x1EC7, 'indic siyaq', + 0x1ECC, 'diwani siyaq', + 0x1ED0, 'ottoman siyaq', + 0x1ED4, 'reserved', + 0x1E8E, 'res', + 0x1EE0, 'arabic mathematical alphabetic', # Sm + 0x1EF0, 'reserved', + 0x1F00, 'mahjong', + 0x1F03, 'domino tiles', + 0x1F0A, 'playing cards', + 0x1F10, 'enclosed alphanumeric supplement', # So + 0x1F20, 'enclosed ideographic supplement', # So + 0x1F30, 'miscellaneous symbols and pictographs', + 0x1F60, 'emoticons', + 0x1F65, 'ornament', + 0x1F68, 'transport', + 0x1F70, 'alchemical', + 0x1F78, 'geometric shapes ext', + 0x1F80, 'supplemental arrows-C', + 0x1F90, 'reserved', ); sub { diff --git a/charset.plp b/charset.plp index 26b58e4..98a7345 100644 --- a/charset.plp +++ b/charset.plp @@ -64,7 +64,7 @@ my @request = map { } elsif ($row{set} = resolve_alias($input)) { if ($row{set} eq 'Internal') { - $row{table} = ' ' x ($endpoint < 255 ? 640 : 4096); + $row{table} = ' ' x ($endpoint < 255 ? 640 : 8192); $row{set} = 'Unicode BMP'; $row{cell} = do 'charset-unicode.inc.pl'; } -- 2.30.0