X-Git-Url: http://git.shiar.nl/sheet.git/blobdiff_plain/9e57a0c381c63dcd3ec4803da1616a5f34bf694c..1a31f360dede26675fce9b4f36ed856eb7fbf70f:/charset-unicode.inc.pl
diff --git a/charset-unicode.inc.pl b/charset-unicode.inc.pl
index b96701e..f12c505 100644
--- a/charset-unicode.inc.pl
+++ b/charset-unicode.inc.pl
@@ -1,5 +1,6 @@
use utf8;
my %uniblock = (
+ # bmp
0x000, 'control',
0x002, ' | comn',
0x004, ' | basic latin',
@@ -180,13 +181,15 @@ my %uniblock = (
0xFF0, ' | halfwidth & fullwidth forms',
0xFFF, ' | sp',
+ # smp
0x1000, ' | linear B syllabary',
0x1008, ' | linear B ideograms',
0x1010, ' | aegean num',
0x1014, ' | greek numbers',
0x1019, ' | ancient sym',
0x101D, ' | phaistos',
- 0x1020, ' | reserved',
+ 0x1020, ' | iberian',
+ 0x1024, ' | reserved',
0x1028, ' | lycian',
0x102A, ' | carian',
0x102E, ' | coptic',
@@ -195,28 +198,25 @@ my %uniblock = (
0x1035, ' | permic',
0x1038, ' | ugarit',
0x103A, ' | old persian',
- 0x103E, ' | res',
+ 0x103E, ' | sh.qs',
0x1040, ' | deseret',
0x1045, ' | shavian',
0x1048, ' | osmanya',
- 0x104B, ' | osage',
+ 0x104B, ' | osage',
0x1050, ' | elbasan',
0x1053, ' | c albanian',
- 0x1057, ' | qs',
- 0x1058, ' | vithkuqi',
- 0x105D, ' | res',
- 0x105E, ' | iber',
+ 0x1057, ' | vithkuqi',
+ 0x105C, ' | todhri',
0x1060, ' | linear A',
0x1070, ' | linear A',
- 0x1078, ' | todhri',
- 0x107C, ' | cyp minoan',
+ 0x1078, ' | cypro-minoan',
0x1080, ' | cypriot',
0x1084, ' | aram',
0x1086, ' | palmr',
0x1088, ' | nabataean',
0x108A, ' | res',
0x108C, ' | numid',
- 0x108E, ' | hatr',
+ 0x108E, ' | hatr',
0x1090, ' | phoen',
0x1092, ' | lydian',
0x1094, ' | reserved',
@@ -235,15 +235,18 @@ my %uniblock = (
0x10BE, ' | babur',
0x10C0, ' | old turkic',
0x10C5, ' | reserved',
- 0x10C8, ' | old hungarian',
+ 0x10C8, ' | old hungarian',
0x10D0, ' | rohingya',
0x10D4, ' | garay',
- 0x10D8, ' | reserved',
- 0x10E0, ' | sogdian',
+ 0x10D8, ' | byblos',
+ 0x10E0, ' | reserved',
0x10E6, ' | rumi',
- 0x10E8, ' | uyghur',
+ 0x10E8, ' | reserved',
0x10EE, ' | elym',
- 0x10F0, ' | reserved',
+ 0x10F0, ' | old sog',
+ 0x10F3, ' | sogdian',
+ 0x10F7, ' | res',
+ 0x10F8, ' | uyghur',
0x1100, ' | brahmi',
0x1108, ' | kaithi',
0x110D, ' | sora som',
@@ -253,27 +256,26 @@ my %uniblock = (
0x111E, ' | sinhal',
0x1120, ' | khojki',
0x1125, ' | landa',
- 0x1128, ' | multani',
+ 0x1128, ' | multani',
0x112B, ' | khudabadi',
0x1130, ' | grantha',
0x1138, ' | tulu',
0x113E, ' | shar+',
- 0x1140, ' | newar',
+ 0x1140, ' | newar',
0x1148, ' | tirhuta',
0x114E, ' | tani',
- 0x1150, ' | ranjana',
- 0x1156, ' | res',
+ 0x1150, ' | ranjana',
0x1158, ' | siddham',
0x1160, ' | modi',
- 0x1166, ' | mong',
+ 0x1166, ' | mong',
0x1168, ' | takri',
0x116D, ' | jenticha',
0x1170, ' | ahom',
0x1174, ' | zou',
0x117A, ' | pyu',
- 0x1180, ' | khema',
- 0x1184, ' | khe prih',
- 0x1188, ' | reserved', #TODO
+ 0x1180, ' | dogra',
+ 0x1185, ' | sirmauri',
+ 0x1189, ' | res',
0x118A, ' | warang citi',
0x1190, ' | tolong siki',
0x1194, ' | tikamuli',
@@ -285,51 +287,57 @@ my %uniblock = (
0x11AC, ' | pau cin hau',
0x11B0, ' | dhives akuru',
0x11B5, ' | leke',
- 0x11B9, ' | gondi',
+ 0x11B9, ' | nandinagari',
0x11BF, ' | res',
- 0x11C0, ' | bhaiksuki',
- 0x11C7, ' | marchen',
+ 0x11C0, ' | bhaiksuki',
+ 0x11C7, ' | marchen',
0x11CC, ' | balti B',
- 0x11D0, ' | kawi',
- 0x11D5, ' | nandinagari',
- 0x11DB, ' | reserved',
- 0x11E0, ' | chalukya',
- 0x11E6, ' | chola',
- 0x11EC, ' | reserved',
- 0x11F0, ' | satavahana',
- 0x11F6, ' | turkestani',
+ 0x11D0, ' | masaram gondi',
+ 0x11D6, ' | gunjala gondi',
+ 0x11DB, ' | kawi',
+ 0x11E0, ' | tocharian',
+ 0x11E7, ' | khotanese',
+ 0x11ED, ' | res',
+ 0x11EE, ' | makas',
+ 0x11F0, ' | vatteluttu',
+ 0x11F4, ' | res',
+ 0x11F6, ' | chola',
0x11FC, ' | tamil+',
0x1200, ' | cuneiform',
0x1240, ' | cuneiform numbers',
- 0x1248, ' | early dynastic cuneiform',
- 0x1250, ' | early dynastic cuneiform',
- 0x1258, ' | reserved',
+ 0x1248, ' | early dynastic cuneiform',
+ 0x1250, ' | e. dyn. cuneiform',
+ 0x1255, ' | reserved',
0x1260, ' | proto-cuneiform',
0x12E0, ' | indus',
0x12F0, ' | indus',
0x12F9, ' | reserved',
0x1300, ' | egyptian hieroglyphs',
0x1340, ' | egyptian',
- 0x1343, ' | reserved',
- 0x1350, ' | egyptian hieroglyphs extended',
- 0x1410, ' | pau cin hau syllabary',
- 0x1440, ' | anatolian hieroglyphs',
- 0x1460, ' | anatolian hieroglyphs',
- 0x1468, ' | reserved',
- 0x1470, ' | eskaya',
- 0x14B0, ' | eskaya',
- 0x14B6, ' | reserved',
- 0x14C0, ' | reserved',
- 0x1540, ' | maya hieroglyphs',
- 0x1590, ' | reserved',
+ 0x1343, ' | eg.c',
+ 0x1344, ' | ',
+ 0x1350, ' | egyptian hieroglyphs extended-A',
+ 0x1440, ' | anatolian hieroglyphs',
+ 0x1460, ' | anatolian',
+ 0x1468, ' | ',
+ 0x1470, ' | egyptian hieroglyphs extended-B',
+ 0x1500, ' | lampung',
+ 0x1504, ' | kerinci',
+ 0x1507, ' | res',
+ 0x1508, ' | ',
+ 0x1510, ' | mandombe',
+ 0x1550, ' | maya hieroglyphs',
+ 0x15A0, ' | reserved',
0x15C0, ' | aztec pictograms',
0x1600, ' | cirth',
0x1608, ' | tengwar',
- 0x1610, ' | reserved',
+ 0x1610, ' | khema',
+ 0x1614, ' | khe prih',
+ 0x1618, ' | res',
0x161A, ' | moon',
0x1620, ' | blissymbols',
0x1670, ' | bagam',
- 0x167B, ' | reserved',
+ 0x167B, ' | iban',
0x1680, ' | bamum supplement',
0x16A0, ' | bamum+',
0x16A4, ' | mro',
@@ -340,65 +348,78 @@ my %uniblock = (
0x16C0, ' | kpelle',
0x16C8, ' | afaka',
0x16CD, ' | lk tangsa',
- 0x16D0, ' | loma',
- 0x16DD, ' | zaghawa',
- 0x16E0, ' | mwangwego',
- 0x16E5, ' | reserved',
+ 0x16D0, ' | reserved',
+ 0x16DD, ' | kulitan',
+ 0x16E0, ' | mwangwego',
+ 0x16E4, ' | medefaidrin',
+ 0x16EA, ' | lontara+',
0x16F0, ' | miao',
- 0x16FA, ' | reserved',
- 0x16FE, ' | ideo',
- 0x1700, ' | tangut ideographs',
- 0x1880, ' | reserved',
- 0x1890, ' | tangut radicals',
- 0x18C0, ' | reserved',
- 0x1900, ' | jurchen',
- 0x1950, ' | jurchen',
- 0x1956, ' | jurchen rad',
- 0x195A, ' | reserved',
- 0x1960, ' | khitan small',
- 0x1970, ' | khitan small',
- 0x1978, ' | reserved',
- 0x1980, ' | khitan large',
- 0x1A10, ' | reserved',
+ 0x16FA, ' | lontara b-b',
+ 0x16FE, ' | ideo',
+ 0x1700, ' | tangut ideographs',
+ 0x1880, ' | tangut components',
+ 0x18B0, ' | khitan small',
+ 0x18D0, ' | khitan ideographs',
+ 0x1960, ' | jurchen',
+ 0x19B0, ' | jurchen',
+ 0x19B6, ' | jurchen rad',
+ 0x19BA, ' | reserved',
+ 0x19C0, ' | reserved',
+ 0x19E0, ' | pau cin hau syllabary',
+ 0x1A30, ' | eskaya',
0x1A80, ' | naxi geba',
0x1AA0, ' | naxi geba',
0x1AAB, ' | res',
- 0x1AAC, ' | naxi dongba',
- 0x1AB0, ' | naxi dongba',
+ 0x1AAC, ' | ',
+ 0x1AB0, ' | naxi dongba',
0x1B00, ' | kana supplement',
- 0x1B10, ' | nushu',
- 0x1B20, ' | nushu',
- 0x1B29, ' | reserved',
- 0x1B30, ' | kaida',
- 0x1B38, ' | reserved',
- 0x1B40, ' | reserved',
+ 0x1B10, ' | kana+A',
+ 0x1B13, ' | kaidā',
+ 0x1B17, ' | ',
+ 0x1B20, ' | nushu',
+ 0x1B30, ' | shuishu',
0x1B50, ' | proto-elamite',
0x1BC0, ' | duployan',
0x1BCA, ' | sh',
0x1BCB, ' | pitman',
+ 0x1BD0, ' | shorthands?',
+ 0x1C00, ' | micmac hieroglyphs',
+ 0x1CB0, ' | rongorongo',
+ 0x1CE0, ' | reserved',
0x1D00, ' | byzantine musical',
0x1D10, ' | musical symbols',
0x1D20, ' | anc greek music',
- 0x1D25, ' | reserved',
+ 0x1D25, ' | reserved',
+ 0x1D2E, ' | mayan',
0x1D30, ' | tai xuan jing',
0x1D36, ' | rod',
- 0x1D38, ' | reserved',
- 0x1D40, ' | mathematical alphanumeric', # Sm
- 0x1D80, ' | sutton',
+ 0x1D38, ' | mathematical alphanumeric+',
+ 0x1D40, ' | mathematical alphanumeric',
+ 0x1D80, ' | sutton',
+ 0x1DA0, ' | ',
+ 0x1DAB, ' | reserved',
0x1DB0, ' | reserved',
- 0x1E00, ' | glagol+',
- 0x1E03, ' | reserved',
- 0x1E10, ' | reserved',
+ 0x1E00, ' | glagol+',
+ 0x1E03, ' | pallava',
+ 0x1E08, ' | chalukya',
+ 0x1E0E, ' | res',
+ 0x1E10, ' | eebee hmong',
+ 0x1E1B, ' | cher vang hmong',
+ 0x1E20, ' | western cham',
+ 0x1E27, ' | beria',
+ 0x1E2A, ' | reserved',
+ 0x1E30, ' | loma',
+ 0x1E50, ' | reserved',
0x1E80, ' | mende kikakui',
- 0x1E90, ' | adlam',
+ 0x1E8E, ' | res',
+ 0x1E90, ' | adlam',
0x1E96, ' | reserved',
0x1EA0, ' | reserved',
0x1EC0, ' | persian siyaq',
0x1EC7, ' | indic siyaq',
0x1ECC, ' | diwani siyaq',
- 0x1ED0, ' | ottoman siyaq',
- 0x1ED4, ' | reserved',
- 0x1E8E, ' | res',
+ 0x1ED0, ' | ottoman siyaq',
+ 0x1ED5, ' | reserved',
0x1EE0, ' | arabic mathematical alphabetic', # Sm
0x1EF0, ' | reserved',
0x1F00, ' | mahjong',
@@ -413,7 +434,8 @@ my %uniblock = (
0x1F70, ' | alchemical',
0x1F78, ' | geometric shapes ext',
0x1F80, ' | supplemental arrows-C',
- 0x1F90, ' | reserved',
+ 0x1F90, ' | supplemental symbols and pictographs',
+ 0x1FA0, ' | reserved',
);
sub {
|