From 1a31f360dede26675fce9b4f36ed856eb7fbf70f Mon Sep 17 00:00:00 2001 From: Mischa POSLAWSKY Date: Mon, 27 Mar 2017 17:45:33 +0200 Subject: [PATCH] charset: update smp allocation to unicode v9.0 roadmap --- charset-unicode.inc.pl | 202 +++++++++++++++++++++++------------------ 1 file changed, 112 insertions(+), 90 deletions(-) diff --git a/charset-unicode.inc.pl b/charset-unicode.inc.pl index b96701e..f12c505 100644 --- a/charset-unicode.inc.pl +++ b/charset-unicode.inc.pl @@ -1,5 +1,6 @@ use utf8; my %uniblock = ( + # bmp 0x000, 'control', 0x002, 'comn', 0x004, 'basic latin', @@ -180,13 +181,15 @@ my %uniblock = ( 0xFF0, 'halfwidth & fullwidth forms', 0xFFF, 'sp', + # smp 0x1000, 'linear B syllabary', 0x1008, 'linear B ideograms', 0x1010, 'aegean num', 0x1014, 'greek numbers', 0x1019, 'ancient sym', 0x101D, 'phaistos', - 0x1020, 'reserved', + 0x1020, 'iberian', + 0x1024, 'reserved', 0x1028, 'lycian', 0x102A, 'carian', 0x102E, 'coptic', @@ -195,28 +198,25 @@ my %uniblock = ( 0x1035, 'permic', 0x1038, 'ugarit', 0x103A, 'old persian', - 0x103E, 'res', + 0x103E, 'sh.qs', 0x1040, 'deseret', 0x1045, 'shavian', 0x1048, 'osmanya', - 0x104B, 'osage', + 0x104B, 'osage', 0x1050, 'elbasan', 0x1053, 'c albanian', - 0x1057, 'qs', - 0x1058, 'vithkuqi', - 0x105D, 'res', - 0x105E, 'iber', + 0x1057, 'vithkuqi', + 0x105C, 'todhri', 0x1060, 'linear A', 0x1070, 'linear A', - 0x1078, 'todhri', - 0x107C, 'cyp minoan', + 0x1078, 'cypro-minoan', 0x1080, 'cypriot', 0x1084, 'aram', 0x1086, 'palmr', 0x1088, 'nabataean', 0x108A, 'res', 0x108C, 'numid', - 0x108E, 'hatr', + 0x108E, 'hatr', 0x1090, 'phoen', 0x1092, 'lydian', 0x1094, 'reserved', @@ -235,15 +235,18 @@ my %uniblock = ( 0x10BE, 'babur', 0x10C0, 'old turkic', 0x10C5, 'reserved', - 0x10C8, 'old hungarian', + 0x10C8, 'old hungarian', 0x10D0, 'rohingya', 0x10D4, 'garay', - 0x10D8, 'reserved', - 0x10E0, 'sogdian', + 0x10D8, 'byblos', + 0x10E0, 'reserved', 0x10E6, 'rumi', - 0x10E8, 'uyghur', + 0x10E8, 'reserved', 0x10EE, 'elym', - 0x10F0, 'reserved', + 0x10F0, 'old sog', + 0x10F3, 'sogdian', + 0x10F7, 'res', + 0x10F8, 'uyghur', 0x1100, 'brahmi', 0x1108, 'kaithi', 0x110D, 'sora som', @@ -253,27 +256,26 @@ my %uniblock = ( 0x111E, 'sinhal', 0x1120, 'khojki', 0x1125, 'landa', - 0x1128, 'multani', + 0x1128, 'multani', 0x112B, 'khudabadi', 0x1130, 'grantha', 0x1138, 'tulu', 0x113E, 'shar+', - 0x1140, 'newar', + 0x1140, 'newar', 0x1148, 'tirhuta', 0x114E, 'tani', - 0x1150, 'ranjana', - 0x1156, 'res', + 0x1150, 'ranjana', 0x1158, 'siddham', 0x1160, 'modi', - 0x1166, 'mong', + 0x1166, 'mong', 0x1168, 'takri', 0x116D, 'jenticha', 0x1170, 'ahom', 0x1174, 'zou', 0x117A, 'pyu', - 0x1180, 'khema', - 0x1184, 'khe prih', - 0x1188, 'reserved', #TODO + 0x1180, 'dogra', + 0x1185, 'sirmauri', + 0x1189, 'res', 0x118A, 'warang citi', 0x1190, 'tolong siki', 0x1194, 'tikamuli', @@ -285,51 +287,57 @@ my %uniblock = ( 0x11AC, 'pau cin hau', 0x11B0, 'dhives akuru', 0x11B5, 'leke', - 0x11B9, 'gondi', + 0x11B9, 'nandinagari', 0x11BF, 'res', - 0x11C0, 'bhaiksuki', - 0x11C7, 'marchen', + 0x11C0, 'bhaiksuki', + 0x11C7, 'marchen', 0x11CC, 'balti B', - 0x11D0, 'kawi', - 0x11D5, 'nandinagari', - 0x11DB, 'reserved', - 0x11E0, 'chalukya', - 0x11E6, 'chola', - 0x11EC, 'reserved', - 0x11F0, 'satavahana', - 0x11F6, 'turkestani', + 0x11D0, 'masaram gondi', + 0x11D6, 'gunjala gondi', + 0x11DB, 'kawi', + 0x11E0, 'tocharian', + 0x11E7, 'khotanese', + 0x11ED, 'res', + 0x11EE, 'makas', + 0x11F0, 'vatteluttu', + 0x11F4, 'res', + 0x11F6, 'chola', 0x11FC, 'tamil+', 0x1200, 'cuneiform', 0x1240, 'cuneiform numbers', - 0x1248, 'early dynastic cuneiform', - 0x1250, 'early dynastic cuneiform', - 0x1258, 'reserved', + 0x1248, 'early dynastic cuneiform', + 0x1250, 'e. dyn. cuneiform', + 0x1255, 'reserved', 0x1260, 'proto-cuneiform', 0x12E0, 'indus', 0x12F0, 'indus', 0x12F9, 'reserved', 0x1300, 'egyptian hieroglyphs', 0x1340, 'egyptian', - 0x1343, 'reserved', - 0x1350, 'egyptian hieroglyphs extended', - 0x1410, 'pau cin hau syllabary', - 0x1440, 'anatolian hieroglyphs', - 0x1460, 'anatolian hieroglyphs', - 0x1468, 'reserved', - 0x1470, 'eskaya', - 0x14B0, 'eskaya', - 0x14B6, 'reserved', - 0x14C0, 'reserved', - 0x1540, 'maya hieroglyphs', - 0x1590, 'reserved', + 0x1343, 'eg.c', + 0x1344, '', + 0x1350, 'egyptian hieroglyphs extended-A', + 0x1440, 'anatolian hieroglyphs', + 0x1460, 'anatolian', + 0x1468, '', + 0x1470, 'egyptian hieroglyphs extended-B', + 0x1500, 'lampung', + 0x1504, 'kerinci', + 0x1507, 'res', + 0x1508, '', + 0x1510, 'mandombe', + 0x1550, 'maya hieroglyphs', + 0x15A0, 'reserved', 0x15C0, 'aztec pictograms', 0x1600, 'cirth', 0x1608, 'tengwar', - 0x1610, 'reserved', + 0x1610, 'khema', + 0x1614, 'khe prih', + 0x1618, 'res', 0x161A, 'moon', 0x1620, 'blissymbols', 0x1670, 'bagam', - 0x167B, 'reserved', + 0x167B, 'iban', 0x1680, 'bamum supplement', 0x16A0, 'bamum+', 0x16A4, 'mro', @@ -340,65 +348,78 @@ my %uniblock = ( 0x16C0, 'kpelle', 0x16C8, 'afaka', 0x16CD, 'lk tangsa', - 0x16D0, 'loma', - 0x16DD, 'zaghawa', - 0x16E0, 'mwangwego', - 0x16E5, 'reserved', + 0x16D0, 'reserved', + 0x16DD, 'kulitan', + 0x16E0, 'mwangwego', + 0x16E4, 'medefaidrin', + 0x16EA, 'lontara+', 0x16F0, 'miao', - 0x16FA, 'reserved', - 0x16FE, 'ideo', - 0x1700, 'tangut ideographs', - 0x1880, 'reserved', - 0x1890, 'tangut radicals', - 0x18C0, 'reserved', - 0x1900, 'jurchen', - 0x1950, 'jurchen', - 0x1956, 'jurchen rad', - 0x195A, 'reserved', - 0x1960, 'khitan small', - 0x1970, 'khitan small', - 0x1978, 'reserved', - 0x1980, 'khitan large', - 0x1A10, 'reserved', + 0x16FA, 'lontara b-b', + 0x16FE, 'ideo', + 0x1700, 'tangut ideographs', + 0x1880, 'tangut components', + 0x18B0, 'khitan small', + 0x18D0, 'khitan ideographs', + 0x1960, 'jurchen', + 0x19B0, 'jurchen', + 0x19B6, 'jurchen rad', + 0x19BA, 'reserved', + 0x19C0, 'reserved', + 0x19E0, 'pau cin hau syllabary', + 0x1A30, 'eskaya', 0x1A80, 'naxi geba', 0x1AA0, 'naxi geba', 0x1AAB, 'res', - 0x1AAC, 'naxi dongba', - 0x1AB0, 'naxi dongba', + 0x1AAC, '', + 0x1AB0, 'naxi dongba', 0x1B00, 'kana supplement', - 0x1B10, 'nushu', - 0x1B20, 'nushu', - 0x1B29, 'reserved', - 0x1B30, 'kaida', - 0x1B38, 'reserved', - 0x1B40, 'reserved', + 0x1B10, 'kana+A', + 0x1B13, 'kaidā', + 0x1B17, '', + 0x1B20, 'nushu', + 0x1B30, 'shuishu', 0x1B50, 'proto-elamite', 0x1BC0, 'duployan', 0x1BCA, 'sh', 0x1BCB, 'pitman', + 0x1BD0, 'shorthands?', + 0x1C00, 'micmac hieroglyphs', + 0x1CB0, 'rongorongo', + 0x1CE0, 'reserved', 0x1D00, 'byzantine musical', 0x1D10, 'musical symbols', 0x1D20, 'anc greek music', - 0x1D25, 'reserved', + 0x1D25, 'reserved', + 0x1D2E, 'mayan', 0x1D30, 'tai xuan jing', 0x1D36, 'rod', - 0x1D38, 'reserved', - 0x1D40, 'mathematical alphanumeric', # Sm - 0x1D80, 'sutton', + 0x1D38, 'mathematical alphanumeric+', + 0x1D40, 'mathematical alphanumeric', + 0x1D80, 'sutton', + 0x1DA0, '', + 0x1DAB, 'reserved', 0x1DB0, 'reserved', - 0x1E00, 'glagol+', - 0x1E03, 'reserved', - 0x1E10, 'reserved', + 0x1E00, 'glagol+', + 0x1E03, 'pallava', + 0x1E08, 'chalukya', + 0x1E0E, 'res', + 0x1E10, 'eebee hmong', + 0x1E1B, 'cher vang hmong', + 0x1E20, 'western cham', + 0x1E27, 'beria', + 0x1E2A, 'reserved', + 0x1E30, 'loma', + 0x1E50, 'reserved', 0x1E80, 'mende kikakui', - 0x1E90, 'adlam', + 0x1E8E, 'res', + 0x1E90, 'adlam', 0x1E96, 'reserved', 0x1EA0, 'reserved', 0x1EC0, 'persian siyaq', 0x1EC7, 'indic siyaq', 0x1ECC, 'diwani siyaq', - 0x1ED0, 'ottoman siyaq', - 0x1ED4, 'reserved', - 0x1E8E, 'res', + 0x1ED0, 'ottoman siyaq', + 0x1ED5, 'reserved', 0x1EE0, 'arabic mathematical alphabetic', # Sm 0x1EF0, 'reserved', 0x1F00, 'mahjong', @@ -413,7 +434,8 @@ my %uniblock = ( 0x1F70, 'alchemical', 0x1F78, 'geometric shapes ext', 0x1F80, 'supplemental arrows-C', - 0x1F90, 'reserved', + 0x1F90, 'supplemental symbols and pictographs', + 0x1FA0, 'reserved', ); sub { -- 2.30.0