From 7d1044e5e4df51459cafb742090ce62b52d9e087 Mon Sep 17 00:00:00 2001 From: Mischa POSLAWSKY Date: Sat, 13 Sep 2008 03:11:33 +0000 Subject: [PATCH 1/1] digraphs: custom shiar digraphs Quite some personal addendums not in the official RFC-1345. Indicated as such, so should not be much of a hindrance (on the contrary, people looking for these missing characters will find and perhaps add them themselves). --- digraphs.inc.pl | 161 ++++++++++++++++++++++++++++++++++ rfc1345convert | 21 ++++- shiar.inc.txt | 228 ++++++++++++++++++++++++++++++++++++++++++++++++ 3 files changed, 409 insertions(+), 1 deletion(-) create mode 100644 shiar.inc.txt diff --git a/digraphs.inc.pl b/digraphs.inc.pl index 748134d..cfa65d2 100644 --- a/digraphs.inc.pl +++ b/digraphs.inc.pl @@ -2,12 +2,17 @@ q{!!}=>[124,'VERTICAL LINE','Sm Xa','Common'], q{!)}=>[125,'RIGHT CURLY BRACKET','Pe Xa','Common'], q{!*}=>[57382,'','Co','Common'], +q{!-}=>[450,'LATIN LETTER ALVEOLAR CLICK','Lo Xz','Latin'], q{!2}=>[8214,'DOUBLE VERTICAL LINE','Po','Common'], q{!:}=>[7942,'GREEK SMALL LETTER ALPHA WITH PSILI AND PERISPOMENI','Ll','Greek'], q{!<}=>[8814,'NOT LESS-THAN','Sm','Common'], q{!=}=>[8800,'NOT EQUAL TO','Sm','Common'], q{!>}=>[8815,'NOT GREATER-THAN','Sm','Common'], q{!I}=>[161,'INVERTED EXCLAMATION MARK','Po Xl','Common'], +q{!b}=>[664,'LATIN LETTER BILABIAL CLICK','Ll Xz','Latin'], +q{!c}=>[448,'LATIN LETTER DENTAL CLICK','Lo Xz','Latin'], +q{!q}=>[451,'LATIN LETTER RETROFLEX CLICK','Lo Xz','Latin'], +q{!x}=>[449,'LATIN LETTER LATERAL CLICK','Lo Xz','Latin'], q{"!}=>[57350,'','Co','Common'], q{""}=>[57359,'','Co','Common'], q{"'}=>[57351,'','Co','Common'], @@ -36,6 +41,9 @@ q{"p}=>[57368,'','Co','Common'], q{%"}=>[1068,'CYRILLIC CAPITAL LETTER SOFT SIGN','Lu','Cyrillic'], q{%'}=>[1100,'CYRILLIC SMALL LETTER SOFT SIGN','Ll','Cyrillic'], q{%0}=>[8240,'PER MILLE SIGN','Po','Common'], +q{%2}=>[423,'LATIN CAPITAL LETTER TONE TWO','Lu Xz','Latin'], +q{%5}=>[444,'LATIN CAPITAL LETTER TONE FIVE','Lu 
Xz','Latin'], +q{%6}=>[388,'LATIN CAPITAL LETTER TONE SIX','Lu Xz','Latin'], q{'!}=>[96,'GRAVE ACCENT','Sk Xa','Common'], q{'"}=>[733,'DOUBLE ACUTE ACCENT','Sk','Common'], q{'%}=>[1012,'GREEK CAPITAL THETA SYMBOL','Lu','Greek'], @@ -76,6 +84,7 @@ q{)S}=>[8318,'SUPERSCRIPT RIGHT PARENTHESIS','Pe','Common'], q{)U}=>[8746,'UNION','Sm','Common'], q{)_}=>[8839,'SUPERSET OF OR EQUAL TO','Sm','Common'], q{)s}=>[8334,'SUBSCRIPT RIGHT PARENTHESIS','Pe','Common'], +q{**}=>[8273,'TWO ASTERISKS ALIGNED VERTICALLY','Po Xz','Common'], q{*-}=>[8727,'ASTERISK OPERATOR','Sm','Common'], q{*1}=>[9734,'WHITE STAR','So','Common'], q{*2}=>[9733,'BLACK STAR','So','Common'], @@ -180,8 +189,10 @@ q{1j}=>[9286,'OCR BRANCH BANK IDENTIFICATION','So','Common'], q{1r}=>[8560,'SMALL ROMAN NUMERAL ONE','Nl','Common'], q{1s}=>[8321,'SUBSCRIPT ONE','No','Common'], q{2"}=>[8246,'REVERSED DOUBLE PRIME','Po','Common'], +q{2%}=>[424,'LATIN SMALL LETTER TONE TWO','Ll Xz','Latin'], q{2'}=>[8243,'DOUBLE PRIME','Po','Common'], q{2.}=>[9353,'DIGIT TWO FULL STOP','No','Common'], +q{2/}=>[443,'LATIN LETTER TWO WITH STROKE','Lo Xz','Latin'], q{23}=>[8532,'VULGAR FRACTION TWO THIRDS','No','Common'], q{25}=>[8534,'VULGAR FRACTION TWO FIFTHS','No','Common'], q{2R}=>[8545,'ROMAN NUMERAL TWO','Nl','Common'], @@ -195,6 +206,7 @@ q{2s}=>[8322,'SUBSCRIPT TWO','No','Common'], q{3!}=>[9478,'BOX DRAWINGS LIGHT TRIPLE DASH VERTICAL','So','Common'], q{3"}=>[8247,'REVERSED TRIPLE PRIME','Po','Common'], q{3'}=>[8244,'TRIPLE PRIME','Po','Common'], +q{3*}=>[8258,'ASTERISM','Po Xz','Common'], q{3+}=>[1617,'ARABIC SHADDA','Mn','Inherited'], q{3-}=>[9476,'BOX DRAWINGS LIGHT TRIPLE DASH HORIZONTAL','So','Common'], q{3.}=>[9354,'DIGIT THREE FULL STOP','No','Common'], @@ -227,6 +239,7 @@ q{4h}=>[9283,'OCR INVERTED FORK','So','Common'], q{4j}=>[9289,'OCR CUSTOMER ACCOUNT NUMBER','So','Common'], q{4r}=>[8563,'SMALL ROMAN NUMERAL FOUR','Nl','Common'], q{4s}=>[8324,'SUBSCRIPT FOUR','No','Common'], +q{5%}=>[445,'LATIN SMALL LETTER TONE 
FIVE','Ll Xz','Latin'], q{5.}=>[9356,'DIGIT FIVE FULL STOP','No','Common'], q{56}=>[8538,'VULGAR FRACTION FIVE SIXTHS','No','Common'], q{58}=>[8541,'VULGAR FRACTION FIVE EIGHTHS','No','Common'], @@ -236,6 +249,7 @@ q{5a}=>[1781,'EXTENDED ARABIC-INDIC DIGIT FIVE','Nd','Arabic'], q{5c}=>[12836,'PARENTHESIZED IDEOGRAPH FIVE','No','Common'], q{5r}=>[8564,'SMALL ROMAN NUMERAL FIVE','Nl','Common'], q{5s}=>[8325,'SUBSCRIPT FIVE','No','Common'], +q{6%}=>[389,'LATIN SMALL LETTER TONE SIX','Ll Xz','Latin'], q{6.}=>[9357,'DIGIT SIX FULL STOP','No','Common'], q{6M}=>[8198,'SIX-PER-EM SPACE','Zs','Common'], q{6R}=>[8549,'ROMAN NUMERAL SIX','Nl','Common'], @@ -270,6 +284,8 @@ q{9a}=>[1785,'EXTENDED ARABIC-INDIC DIGIT NINE','Nd','Arabic'], q{9c}=>[12840,'PARENTHESIZED IDEOGRAPH NINE','No','Common'], q{9r}=>[8568,'SMALL ROMAN NUMERAL NINE','Nl','Common'], q{9s}=>[8329,'SUBSCRIPT NINE','No','Common'], +q{:(}=>[9785,'WHITE FROWNING FACE','So Xz','Common'], +q{:)}=>[9786,'WHITE SMILING FACE','So Xz','Common'], q{:+}=>[1611,'ARABIC FATHATAN','Mn','Inherited'], q{:.}=>[8757,'BECAUSE','Sm','Common'], q{:3}=>[8942,'VERTICAL ELLIPSIS','Sm','Common'], @@ -292,6 +308,7 @@ q{<+}=>[12298,'LEFT DOUBLE ANGLE BRACKET','Ps','Common'], q{<-}=>[8592,'LEFTWARDS ARROW','Sm','Common'], q{[9001,'LEFT-POINTING ANGLE BRACKET','Ps','Common'], q{<1}=>[8249,'SINGLE LEFT-POINTING ANGLE QUOTATION MARK','Pi','Common'], +q{<3}=>[9829,'BLACK HEART SUIT','So Xz','Common'], q{<7}=>[8968,'LEFT CEILING','Sm','Common'], q{<<}=>[171,'LEFT-POINTING DOUBLE ANGLE QUOTATION MARK','Pi Xl','Common'], q{<=}=>[8656,'LEFTWARDS DOUBLE ARROW','So','Common'], @@ -309,6 +326,7 @@ q{=?}=>[8780,'ALL EQUAL TO','Sm','Common'], q{=S}=>[8316,'SUPERSCRIPT EQUALS SIGN','Sm','Common'], q{=T}=>[12306,'POSTAL MARK','So','Common'], q{=_}=>[12307,'GETA MARK','So','Common'], +q{=e}=>[8364,'EURO SIGN','Sc Xz','Common'], q{=s}=>[8332,'SUBSCRIPT EQUALS SIGN','Sm','Common'], q{>"}=>[12303,'RIGHT WHITE CORNER BRACKET','Pe','Common'], 
q{>'}=>[12301,'RIGHT CORNER BRACKET','Pe','Common'], @@ -319,10 +337,13 @@ q{>=}=>[8805,'GREATER-THAN OR EQUAL TO','Sm','Common'], q{>>}=>[187,'RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK','Pf Xl','Common'], q{>H}=>[9758,'WHITE RIGHT POINTING INDEX','So','Common'], q{>V}=>[57381,'','Co','Common'], +q{?!}=>[8253,'INTERROBANG','Po Xz','Common'], q{?*}=>[57383,'','Co','Common'], q{?+}=>[1567,'ARABIC QUESTION MARK','Po','Common'], q{?,}=>[7941,'GREEK SMALL LETTER ALPHA WITH DASIA AND OXIA','Ll','Greek'], q{?-}=>[8771,'ASYMPTOTICALLY EQUAL TO','Sm','Common'], +q{?.}=>[660,'LATIN LETTER GLOTTAL STOP','Ll Xz','Latin'], +q{?/}=>[673,'LATIN LETTER GLOTTAL STOP WITH STROKE','Ll Xz','Latin'], q{?1}=>[8764,'TILDE OPERATOR','Sm','Common'], q{?2}=>[8776,'ALMOST EQUAL TO','Sm','Common'], q{?:}=>[7943,'GREEK SMALL LETTER ALPHA WITH DASIA AND PERISPOMENI','Ll','Greek'], @@ -334,15 +355,19 @@ q{A!}=>[192,'LATIN CAPITAL LETTER A WITH GRAVE','Lu Xl','Latin'], q{A%}=>[902,'GREEK CAPITAL LETTER ALPHA WITH TONOS','Lu','Greek'], q{A'}=>[193,'LATIN CAPITAL LETTER A WITH ACUTE','Lu Xl','Latin'], q{A(}=>[258,'LATIN CAPITAL LETTER A WITH BREVE','Lu','Latin'], +q{A)}=>[514,'LATIN CAPITAL LETTER A WITH INVERTED BREVE','Lu Xz','Latin'], q{A*}=>[913,'GREEK CAPITAL LETTER ALPHA','Lu','Greek'], q{A+}=>[1488,'HEBREW LETTER ALEF','Lo','Hebrew'], q{A-}=>[256,'LATIN CAPITAL LETTER A WITH MACRON','Lu','Latin'], +q{A.}=>[550,'LATIN CAPITAL LETTER A WITH DOT ABOVE','Lu Xz','Latin'], +q{A0}=>[506,'LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE','Lu Xz','Latin'], q{A1}=>[478,'LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON','Lu','Latin'], q{A2}=>[7842,'LATIN CAPITAL LETTER A WITH HOOK ABOVE','Lu','Latin'], q{A3}=>[482,'LATIN CAPITAL LETTER AE WITH MACRON','Lu','Latin'], q{A5}=>[12353,'HIRAGANA LETTER SMALL A','Lo','Hiragana'], q{A6}=>[12450,'KATAKANA LETTER A','Lo','Katakana'], q{A7}=>[480,'LATIN CAPITAL LETTER A WITH DOT ABOVE AND MACRON','Lu','Latin'], +q{A8}=>[512,'LATIN CAPITAL LETTER A WITH DOUBLE 
GRAVE','Lu Xz','Latin'], q{A:}=>[196,'LATIN CAPITAL LETTER A WITH DIAERESIS','Lu Xl','Latin'], q{A;}=>[260,'LATIN CAPITAL LETTER A WITH OGONEK','Lu','Latin'], q{A<}=>[461,'LATIN CAPITAL LETTER A WITH CARON','Lu','Latin'], @@ -358,7 +383,10 @@ q{AO}=>[8491,'ANGSTROM SIGN','Lu','Latin'], q{At}=>[64,'COMMERCIAL AT','Po Xa','Common'], q{B*}=>[914,'GREEK CAPITAL LETTER BETA','Lu','Greek'], q{B+}=>[1489,'HEBREW LETTER BET','Lo','Hebrew'], +q{B-}=>[386,'LATIN CAPITAL LETTER B WITH TOPBAR','Lu Xz','Latin'], q{B.}=>[7682,'LATIN CAPITAL LETTER B WITH DOT ABOVE','Lu','Latin'], +q{B/}=>[579,'','Xn Xz',''], +q{B2}=>[385,'LATIN CAPITAL LETTER B WITH HOOK','Lu Xz','Latin'], q{B=}=>[1041,'CYRILLIC CAPITAL LETTER BE','Lu','Cyrillic'], q{BB}=>[166,'BROKEN BAR','So Xl','Common'], q{BD}=>[9586,'BOX DRAWINGS LIGHT DIAGONAL UPPER LEFT TO LOWER RIGHT','So','Common'], @@ -377,6 +405,7 @@ q{C'}=>[262,'LATIN CAPITAL LETTER C WITH ACUTE','Lu','Latin'], q{C*}=>[926,'GREEK CAPITAL LETTER XI','Lu','Greek'], q{C,}=>[199,'LATIN CAPITAL LETTER C WITH CEDILLA','Lu Xl','Latin'], q{C.}=>[266,'LATIN CAPITAL LETTER C WITH DOT ABOVE','Lu','Latin'], +q{C2}=>[391,'LATIN CAPITAL LETTER C WITH HOOK','Lu Xz','Latin'], q{C3}=>[1152,'CYRILLIC CAPITAL LETTER KOPPA','Lu','Cyrillic'], q{C<}=>[268,'LATIN CAPITAL LETTER C WITH CARON','Lu','Latin'], q{C=}=>[1062,'CYRILLIC CAPITAL LETTER TSE','Lu','Cyrillic'], @@ -402,6 +431,7 @@ q{D1}=>[17,'','Cc Xa','Common'], q{D2}=>[18,'','Cc Xa','Common'], q{D3}=>[19,'','Cc Xa','Common'], q{D4}=>[20,'','Cc Xa','Common'], +q{D;}=>[393,'LATIN CAPITAL LETTER AFRICAN D','Lu Xz','Latin'], q{D<}=>[270,'LATIN CAPITAL LETTER D WITH CARON','Lu','Latin'], q{D=}=>[1044,'CYRILLIC CAPITAL LETTER DE','Lu','Cyrillic'], q{DC}=>[144,'','Cc Xl','Common'], @@ -431,13 +461,17 @@ q{E!}=>[200,'LATIN CAPITAL LETTER E WITH GRAVE','Lu Xl','Latin'], q{E%}=>[904,'GREEK CAPITAL LETTER EPSILON WITH TONOS','Lu','Greek'], q{E'}=>[201,'LATIN CAPITAL LETTER E WITH ACUTE','Lu Xl','Latin'], q{E(}=>[276,'LATIN 
CAPITAL LETTER E WITH BREVE','Lu','Latin'], +q{E)}=>[518,'LATIN CAPITAL LETTER E WITH INVERTED BREVE','Lu Xz','Latin'], q{E*}=>[917,'GREEK CAPITAL LETTER EPSILON','Lu','Greek'], q{E+}=>[1506,'HEBREW LETTER AYIN','Lo','Hebrew'], +q{E,}=>[552,'LATIN CAPITAL LETTER E WITH CEDILLA','Lu Xz','Latin'], q{E-}=>[274,'LATIN CAPITAL LETTER E WITH MACRON','Lu','Latin'], q{E.}=>[278,'LATIN CAPITAL LETTER E WITH DOT ABOVE','Lu','Latin'], +q{E/}=>[582,'','Xn Xz',''], q{E2}=>[7866,'LATIN CAPITAL LETTER E WITH HOOK ABOVE','Lu','Latin'], q{E5}=>[12359,'HIRAGANA LETTER SMALL E','Lo','Hiragana'], q{E6}=>[12456,'KATAKANA LETTER E','Lo','Katakana'], +q{E8}=>[516,'LATIN CAPITAL LETTER E WITH DOUBLE GRAVE','Lu Xz','Latin'], q{E:}=>[203,'LATIN CAPITAL LETTER E WITH DIAERESIS','Lu Xl','Latin'], q{E;}=>[280,'LATIN CAPITAL LETTER E WITH OGONEK','Lu','Latin'], q{E<}=>[282,'LATIN CAPITAL LETTER E WITH CARON','Lu','Latin'], @@ -455,14 +489,17 @@ q{ET}=>[4,'','Cc Xa','Common'], q{EX}=>[3,'','Cc Xa','Common'], q{EZ}=>[494,'LATIN CAPITAL LETTER EZH WITH CARON','Lu','Latin'], q{Eh}=>[8962,'HOUSE','So','Common'], +q{Eu}=>[8364,'EURO SIGN','Sc Xz','Common'], q{F*}=>[934,'GREEK CAPITAL LETTER PHI','Lu','Greek'], q{F.}=>[7710,'LATIN CAPITAL LETTER F WITH DOT ABOVE','Lu','Latin'], +q{F2}=>[401,'LATIN CAPITAL LETTER F WITH HOOK','Lu Xz','Latin'], q{F3}=>[1138,'CYRILLIC CAPITAL LETTER FITA','Lu','Cyrillic'], q{F=}=>[1060,'CYRILLIC CAPITAL LETTER EF','Lu','Cyrillic'], q{FA}=>[8704,'FOR ALL','Sm','Common'], q{FB}=>[9608,'FULL BLOCK','So','Common'], q{FD}=>[9585,'BOX DRAWINGS LIGHT DIAGONAL UPPER RIGHT TO LOWER LEFT','So','Common'], q{FF}=>[12,'','Cc Xa','Common'], +q{FI}=>[8498,'TURNED CAPITAL F','So Xz','Common'], q{FS}=>[28,'','Cc Xa','Common'], q{Fd}=>[9698,'BLACK LOWER RIGHT TRIANGLE','So','Common'], q{Fl}=>[57379,'','Co','Common'], @@ -476,6 +513,7 @@ q{G,}=>[290,'LATIN CAPITAL LETTER G WITH CEDILLA','Lu','Latin'], q{G-}=>[7712,'LATIN CAPITAL LETTER G WITH MACRON','Lu','Latin'], q{G.}=>[288,'LATIN 
CAPITAL LETTER G WITH DOT ABOVE','Lu','Latin'], q{G/}=>[484,'LATIN CAPITAL LETTER G WITH STROKE','Lu','Latin'], +q{G2}=>[403,'LATIN CAPITAL LETTER G WITH HOOK','Lu Xz','Latin'], q{G3}=>[1168,'CYRILLIC CAPITAL LETTER GHE WITH UPTURN','Lu','Cyrillic'], q{G<}=>[486,'LATIN CAPITAL LETTER G WITH CARON','Lu','Latin'], q{G=}=>[1043,'CYRILLIC CAPITAL LETTER GHE','Lu','Cyrillic'], @@ -503,6 +541,7 @@ q{HJ}=>[137,'','Cc Xl','Common'], q{HO}=>[129,'','Cc Xl','Common'], q{HS}=>[136,'','Cc Xl','Common'], q{HT}=>[9,'','Cc Xa','Common'], +q{HW}=>[502,'LATIN CAPITAL LETTER HWAIR','Lu Xz','Latin'], q{Ha}=>[12495,'KATAKANA LETTER HA','Lo','Katakana'], q{He}=>[12504,'KATAKANA LETTER HE','Lo','Katakana'], q{Hi}=>[12498,'KATAKANA LETTER HI','Lo','Katakana'], @@ -512,12 +551,15 @@ q{I!}=>[204,'LATIN CAPITAL LETTER I WITH GRAVE','Lu Xl','Latin'], q{I%}=>[906,'GREEK CAPITAL LETTER IOTA WITH TONOS','Lu','Greek'], q{I'}=>[205,'LATIN CAPITAL LETTER I WITH ACUTE','Lu Xl','Latin'], q{I(}=>[300,'LATIN CAPITAL LETTER I WITH BREVE','Lu','Latin'], +q{I)}=>[522,'LATIN CAPITAL LETTER I WITH INVERTED BREVE','Lu Xz','Latin'], q{I*}=>[921,'GREEK CAPITAL LETTER IOTA','Lu','Greek'], q{I-}=>[298,'LATIN CAPITAL LETTER I WITH MACRON','Lu','Latin'], q{I.}=>[304,'LATIN CAPITAL LETTER I WITH DOT ABOVE','Lu','Latin'], +q{I/}=>[407,'LATIN CAPITAL LETTER I WITH STROKE','Lu Xz','Latin'], q{I2}=>[7880,'LATIN CAPITAL LETTER I WITH HOOK ABOVE','Lu','Latin'], q{I5}=>[12355,'HIRAGANA LETTER SMALL I','Lo','Hiragana'], q{I6}=>[12452,'KATAKANA LETTER I','Lo','Katakana'], +q{I8}=>[520,'LATIN CAPITAL LETTER I WITH DOUBLE GRAVE','Lu Xz','Latin'], q{I:}=>[207,'LATIN CAPITAL LETTER I WITH DIAERESIS','Lu Xl','Latin'], q{I;}=>[302,'LATIN CAPITAL LETTER I WITH OGONEK','Lu','Latin'], q{I<}=>[463,'LATIN CAPITAL LETTER I WITH CARON','Lu','Latin'], @@ -538,6 +580,7 @@ q{Iu}=>[8992,'TOP HALF INTEGRAL','Sm','Common'], q{J%}=>[1032,'CYRILLIC CAPITAL LETTER JE','Lu','Cyrillic'], q{J*}=>[938,'GREEK CAPITAL LETTER IOTA WITH 
DIALYTIKA','Lu','Greek'], q{J+}=>[1497,'HEBREW LETTER YOD','Lo','Hebrew'], +q{J/}=>[584,'','Xn Xz',''], q{J<}=>[57384,'','Co','Common'], q{J=}=>[1049,'CYRILLIC CAPITAL LETTER SHORT I','Lu','Cyrillic'], q{J>}=>[308,'LATIN CAPITAL LETTER J WITH CIRCUMFLEX','Lu','Latin'], @@ -549,6 +592,7 @@ q{K'}=>[7728,'LATIN CAPITAL LETTER K WITH ACUTE','Lu','Latin'], q{K*}=>[922,'GREEK CAPITAL LETTER KAPPA','Lu','Greek'], q{K+}=>[1499,'HEBREW LETTER KAF','Lo','Hebrew'], q{K,}=>[310,'LATIN CAPITAL LETTER K WITH CEDILLA','Lu','Latin'], +q{K2}=>[408,'LATIN CAPITAL LETTER K WITH HOOK','Lu Xz','Latin'], q{K3}=>[990,'GREEK LETTER KOPPA','Lu','Greek'], q{K<}=>[488,'LATIN CAPITAL LETTER K WITH CARON','Lu','Latin'], q{K=}=>[1050,'CYRILLIC CAPITAL LETTER KA','Lu','Cyrillic'], @@ -569,6 +613,7 @@ q{L.}=>[319,'LATIN CAPITAL LETTER L WITH MIDDLE DOT','Lu','Latin'], q{L/}=>[321,'LATIN CAPITAL LETTER L WITH STROKE','Lu','Latin'], q{L<}=>[317,'LATIN CAPITAL LETTER L WITH CARON','Lu','Latin'], q{L=}=>[1051,'CYRILLIC CAPITAL LETTER EL','Lu','Cyrillic'], +q{L?}=>[11362,'','Xn Xz',''], q{LB}=>[9604,'LOWER HALF BLOCK','So','Common'], q{LD}=>[9491,'BOX DRAWINGS HEAVY DOWN AND LEFT','So','Common'], q{LF}=>[10,'','Cc Xa','Common'], @@ -585,6 +630,7 @@ q{M2}=>[9835,'BEAMED EIGHTH NOTES','So','Common'], q{M3}=>[988,'GREEK LETTER DIGAMMA','Lu','Greek'], q{M8}=>[9834,'EIGHTH NOTE','So','Common'], q{M=}=>[1052,'CYRILLIC CAPITAL LETTER EM','Lu','Cyrillic'], +q{MI}=>[412,'LATIN CAPITAL LETTER TURNED M','Lu Xz','Latin'], q{MW}=>[149,'','Cc Xl','Common'], q{MX}=>[9839,'MUSIC SHARP SIGN','Sm','Common'], q{Ma}=>[12510,'KATAKANA LETTER MA','Lo','Katakana'], @@ -597,6 +643,7 @@ q{Mo}=>[12514,'KATAKANA LETTER MO','Lo','Katakana'], q{Mu}=>[12512,'KATAKANA LETTER MU','Lo','Katakana'], q{Mx}=>[9838,'MUSIC NATURAL SIGN','So','Common'], q{My}=>[181,'MICRO SIGN','Ll Xl','Common'], +q{N!}=>[504,'LATIN CAPITAL LETTER N WITH GRAVE','Lu Xz','Latin'], q{N%}=>[1503,'HEBREW LETTER FINAL NUN','Lo','Hebrew'], q{N'}=>[323,'LATIN 
CAPITAL LETTER N WITH ACUTE','Lu','Latin'], q{N*}=>[925,'GREEK CAPITAL LETTER NU','Lu','Greek'], @@ -604,6 +651,7 @@ q{N+}=>[1504,'HEBREW LETTER NUN','Lo','Hebrew'], q{N,}=>[325,'LATIN CAPITAL LETTER N WITH CEDILLA','Lu','Latin'], q{N.}=>[7748,'LATIN CAPITAL LETTER N WITH DOT ABOVE','Lu','Latin'], q{N0}=>[8470,'NUMERO SIGN','So','Common'], +q{N2}=>[413,'LATIN CAPITAL LETTER N WITH LEFT HOOK','Lu Xz','Latin'], q{N6}=>[12531,'KATAKANA LETTER N','Lo','Katakana'], q{N<}=>[327,'LATIN CAPITAL LETTER N WITH CARON','Lu','Latin'], q{N=}=>[1053,'CYRILLIC CAPITAL LETTER EN','Lu','Cyrillic'], @@ -630,14 +678,17 @@ q{O"}=>[336,'LATIN CAPITAL LETTER O WITH DOUBLE ACUTE','Lu','Latin'], q{O%}=>[908,'GREEK CAPITAL LETTER OMICRON WITH TONOS','Lu','Greek'], q{O'}=>[211,'LATIN CAPITAL LETTER O WITH ACUTE','Lu Xl','Latin'], q{O(}=>[334,'LATIN CAPITAL LETTER O WITH BREVE','Lu','Latin'], +q{O)}=>[526,'LATIN CAPITAL LETTER O WITH INVERTED BREVE','Lu Xz','Latin'], q{O*}=>[927,'GREEK CAPITAL LETTER OMICRON','Lu','Greek'], q{O-}=>[332,'LATIN CAPITAL LETTER O WITH MACRON','Lu','Latin'], +q{O.}=>[558,'LATIN CAPITAL LETTER O WITH DOT ABOVE','Lu Xz','Latin'], q{O/}=>[216,'LATIN CAPITAL LETTER O WITH STROKE','Lu Xl','Latin'], q{O1}=>[492,'LATIN CAPITAL LETTER O WITH OGONEK AND MACRON','Lu','Latin'], q{O2}=>[7886,'LATIN CAPITAL LETTER O WITH HOOK ABOVE','Lu','Latin'], q{O3}=>[1130,'CYRILLIC CAPITAL LETTER BIG YUS','Lu','Cyrillic'], q{O5}=>[12361,'HIRAGANA LETTER SMALL O','Lo','Hiragana'], q{O6}=>[12458,'KATAKANA LETTER O','Lo','Katakana'], +q{O8}=>[524,'LATIN CAPITAL LETTER O WITH DOUBLE GRAVE','Lu Xz','Latin'], q{O9}=>[416,'LATIN CAPITAL LETTER O WITH HORN','Lu','Latin'], q{O:}=>[214,'LATIN CAPITAL LETTER O WITH DIAERESIS','Lu Xl','Latin'], q{O;}=>[490,'LATIN CAPITAL LETTER O WITH OGONEK','Lu','Latin'], @@ -659,6 +710,7 @@ q{P'}=>[7764,'LATIN CAPITAL LETTER P WITH ACUTE','Lu','Latin'], q{P*}=>[928,'GREEK CAPITAL LETTER PI','Lu','Greek'], q{P+}=>[1508,'HEBREW LETTER PE','Lo','Hebrew'], 
q{P.}=>[7766,'LATIN CAPITAL LETTER P WITH DOT ABOVE','Lu','Latin'], +q{P/}=>[11363,'','Xn Xz',''], q{P1}=>[145,'','Cc Xl','Common'], q{P2}=>[146,'','Cc Xl','Common'], q{P3}=>[992,'GREEK LETTER SAMPI','Lu','Greek'], @@ -681,11 +733,16 @@ q{Pt}=>[8359,'PESETA SIGN','Sc','Common'], q{Pu}=>[12503,'KATAKANA LETTER PU','Lo','Katakana'], q{Q*}=>[936,'GREEK CAPITAL LETTER PSI','Lu','Greek'], q{Q+}=>[1511,'HEBREW LETTER QOF','Lo','Hebrew'], +q{Q;}=>[586,'','Xn Xz',''], q{R'}=>[340,'LATIN CAPITAL LETTER R WITH ACUTE','Lu','Latin'], +q{R)}=>[530,'LATIN CAPITAL LETTER R WITH INVERTED BREVE','Lu Xz','Latin'], q{R*}=>[929,'GREEK CAPITAL LETTER RHO','Lu','Greek'], q{R+}=>[1512,'HEBREW LETTER RESH','Lo','Hebrew'], q{R,}=>[342,'LATIN CAPITAL LETTER R WITH CEDILLA','Lu','Latin'], q{R.}=>[7768,'LATIN CAPITAL LETTER R WITH DOT ABOVE','Lu','Latin'], +q{R/}=>[588,'','Xn Xz',''], +q{R8}=>[528,'LATIN CAPITAL LETTER R WITH DOUBLE GRAVE','Lu Xz','Latin'], +q{R;}=>[11364,'','Xn Xz',''], q{R<}=>[344,'LATIN CAPITAL LETTER R WITH CARON','Lu','Latin'], q{R=}=>[1056,'CYRILLIC CAPITAL LETTER ER','Lu','Cyrillic'], q{RB}=>[9616,'RIGHT HALF BLOCK','So','Common'], @@ -748,7 +805,9 @@ q{T+}=>[1514,'HEBREW LETTER TAV','Lo','Hebrew'], q{T,}=>[354,'LATIN CAPITAL LETTER T WITH CEDILLA','Lu','Latin'], q{T.}=>[7786,'LATIN CAPITAL LETTER T WITH DOT ABOVE','Lu','Latin'], q{T/}=>[358,'LATIN CAPITAL LETTER T WITH STROKE','Lu','Latin'], +q{T2}=>[428,'LATIN CAPITAL LETTER T WITH HOOK','Lu Xz','Latin'], q{T3}=>[986,'GREEK LETTER STIGMA','Lu','Greek'], +q{T;}=>[430,'LATIN CAPITAL LETTER T WITH RETROFLEX HOOK','Lu Xz','Latin'], q{T<}=>[356,'LATIN CAPITAL LETTER T WITH CARON','Lu','Latin'], q{T=}=>[1058,'CYRILLIC CAPITAL LETTER TE','Lu','Cyrillic'], q{TB}=>[9600,'UPPER HALF BLOCK','So','Common'], @@ -773,12 +832,15 @@ q{U"}=>[368,'LATIN CAPITAL LETTER U WITH DOUBLE ACUTE','Lu','Latin'], q{U%}=>[910,'GREEK CAPITAL LETTER UPSILON WITH TONOS','Lu','Greek'], q{U'}=>[218,'LATIN CAPITAL LETTER U WITH ACUTE','Lu 
Xl','Latin'], q{U(}=>[364,'LATIN CAPITAL LETTER U WITH BREVE','Lu','Latin'], +q{U)}=>[534,'LATIN CAPITAL LETTER U WITH INVERTED BREVE','Lu Xz','Latin'], q{U*}=>[933,'GREEK CAPITAL LETTER UPSILON','Lu','Greek'], q{U-}=>[362,'LATIN CAPITAL LETTER U WITH MACRON','Lu','Latin'], +q{U/}=>[580,'','Xn Xz',''], q{U0}=>[366,'LATIN CAPITAL LETTER U WITH RING ABOVE','Lu','Latin'], q{U2}=>[7910,'LATIN CAPITAL LETTER U WITH HOOK ABOVE','Lu','Latin'], q{U5}=>[12357,'HIRAGANA LETTER SMALL U','Lo','Hiragana'], q{U6}=>[12454,'KATAKANA LETTER U','Lo','Katakana'], +q{U8}=>[532,'LATIN CAPITAL LETTER U WITH DOUBLE GRAVE','Lu Xz','Latin'], q{U9}=>[431,'LATIN CAPITAL LETTER U WITH HORN','Lu','Latin'], q{U:}=>[220,'LATIN CAPITAL LETTER U WITH DIAERESIS','Lu Xl','Latin'], q{U;}=>[370,'LATIN CAPITAL LETTER U WITH OGONEK','Lu','Latin'], @@ -799,10 +861,12 @@ q{Ul}=>[9498,'BOX DRAWINGS UP HEAVY AND LEFT LIGHT','So','Common'], q{Ur}=>[9494,'BOX DRAWINGS UP HEAVY AND RIGHT LIGHT','So','Common'], q{V%}=>[1038,'CYRILLIC CAPITAL LETTER SHORT U','Lu','Cyrillic'], q{V*}=>[939,'GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA','Lu','Greek'], +q{V2}=>[434,'LATIN CAPITAL LETTER V WITH HOOK','Lu Xz','Latin'], q{V3}=>[1140,'CYRILLIC CAPITAL LETTER IZHITSA','Lu','Cyrillic'], q{V=}=>[1042,'CYRILLIC CAPITAL LETTER VE','Lu','Cyrillic'], q{V?}=>[7804,'LATIN CAPITAL LETTER V WITH TILDE','Lu','Latin'], q{VH}=>[9547,'BOX DRAWINGS HEAVY VERTICAL AND HORIZONTAL','So','Common'], +q{VI}=>[581,'','Xn Xz',''], q{VL}=>[9515,'BOX DRAWINGS HEAVY VERTICAL AND LEFT','So','Common'], q{VR}=>[9507,'BOX DRAWINGS HEAVY VERTICAL AND RIGHT','So','Common'], q{VS}=>[138,'','Cc Xl','Common'], @@ -827,6 +891,7 @@ q{W:}=>[7812,'LATIN CAPITAL LETTER W WITH DIAERESIS','Lu','Latin'], q{W=}=>[8361,'WON SIGN','Sc','Common'], q{W>}=>[372,'LATIN CAPITAL LETTER W WITH CIRCUMFLEX','Lu','Latin'], q{WA}=>[12526,'KATAKANA LETTER SMALL WA','Lo','Katakana'], +q{WW}=>[503,'LATIN CAPITAL LETTER WYNN','Lu Xz','Latin'], q{Wa}=>[12527,'KATAKANA LETTER 
WA','Lo','Katakana'], q{We}=>[12529,'KATAKANA LETTER WE','Lo','Katakana'], q{Wi}=>[12528,'KATAKANA LETTER WI','Lo','Katakana'], @@ -840,10 +905,13 @@ q{Y!}=>[7922,'LATIN CAPITAL LETTER Y WITH GRAVE','Lu','Latin'], q{Y%}=>[905,'GREEK CAPITAL LETTER ETA WITH TONOS','Lu','Greek'], q{Y'}=>[221,'LATIN CAPITAL LETTER Y WITH ACUTE','Lu Xl','Latin'], q{Y*}=>[919,'GREEK CAPITAL LETTER ETA','Lu','Greek'], +q{Y-}=>[562,'LATIN CAPITAL LETTER Y WITH MACRON','Lu Xz','Latin'], q{Y.}=>[7822,'LATIN CAPITAL LETTER Y WITH DOT ABOVE','Lu','Latin'], +q{Y/}=>[590,'','Xn Xz',''], q{Y2}=>[7926,'LATIN CAPITAL LETTER Y WITH HOOK ABOVE','Lu','Latin'], q{Y3}=>[1122,'CYRILLIC CAPITAL LETTER YAT','Lu','Cyrillic'], q{Y:}=>[376,'LATIN CAPITAL LETTER Y WITH DIAERESIS','Lu','Latin'], +q{Y;}=>[435,'LATIN CAPITAL LETTER Y WITH HOOK','Lu Xz','Latin'], q{Y=}=>[1067,'CYRILLIC CAPITAL LETTER YERU','Lu','Cyrillic'], q{Y>}=>[374,'LATIN CAPITAL LETTER Y WITH CIRCUMFLEX','Lu','Latin'], q{Y?}=>[7928,'LATIN CAPITAL LETTER Y WITH TILDE','Lu','Latin'], @@ -851,6 +919,7 @@ q{YA}=>[12515,'KATAKANA LETTER SMALL YA','Lo','Katakana'], q{YI}=>[1031,'CYRILLIC CAPITAL LETTER YI','Lu','Cyrillic'], q{YO}=>[12519,'KATAKANA LETTER SMALL YO','Lo','Katakana'], q{YU}=>[12517,'KATAKANA LETTER SMALL YU','Lo','Katakana'], +q{YY}=>[540,'LATIN CAPITAL LETTER YOGH','Lu Xz','Latin'], q{Ya}=>[12516,'KATAKANA LETTER YA','Lo','Katakana'], q{Ye}=>[165,'YEN SIGN','Sc Xl','Common'], q{Yo}=>[12520,'KATAKANA LETTER YO','Lo','Katakana'], @@ -861,6 +930,7 @@ q{Z*}=>[918,'GREEK CAPITAL LETTER ZETA','Lu','Greek'], q{Z+}=>[1494,'HEBREW LETTER ZAYIN','Lo','Hebrew'], q{Z.}=>[379,'LATIN CAPITAL LETTER Z WITH DOT ABOVE','Lu','Latin'], q{Z/}=>[437,'LATIN CAPITAL LETTER Z WITH STROKE','Lu','Latin'], +q{Z2}=>[548,'LATIN CAPITAL LETTER Z WITH HOOK','Lu Xz','Latin'], q{Z<}=>[381,'LATIN CAPITAL LETTER Z WITH CARON','Lu','Latin'], q{Z=}=>[1047,'CYRILLIC CAPITAL LETTER ZE','Lu','Cyrillic'], q{Z>}=>[7824,'LATIN CAPITAL LETTER Z WITH CIRCUMFLEX','Lu','Latin'], 
@@ -876,9 +946,12 @@ q{a!}=>[224,'LATIN SMALL LETTER A WITH GRAVE','Ll Xl','Latin'], q{a%}=>[940,'GREEK SMALL LETTER ALPHA WITH TONOS','Ll','Greek'], q{a'}=>[225,'LATIN SMALL LETTER A WITH ACUTE','Ll Xl','Latin'], q{a(}=>[259,'LATIN SMALL LETTER A WITH BREVE','Ll','Latin'], +q{a)}=>[515,'LATIN SMALL LETTER A WITH INVERTED BREVE','Ll Xz','Latin'], q{a*}=>[945,'GREEK SMALL LETTER ALPHA','Ll','Greek'], q{a+}=>[1575,'ARABIC LETTER ALEF','Lo','Arabic'], q{a-}=>[257,'LATIN SMALL LETTER A WITH MACRON','Ll','Latin'], +q{a.}=>[551,'LATIN SMALL LETTER A WITH DOT ABOVE','Ll Xz','Latin'], +q{a0}=>[507,'LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE','Ll Xz','Latin'], q{a1}=>[479,'LATIN SMALL LETTER A WITH DIAERESIS AND MACRON','Ll','Latin'], q{a2}=>[7843,'LATIN SMALL LETTER A WITH HOOK ABOVE','Ll','Latin'], q{a3}=>[483,'LATIN SMALL LETTER AE WITH MACRON','Ll','Latin'], @@ -886,6 +959,7 @@ q{a4}=>[12570,'BOPOMOFO LETTER A','Lo','Bopomofo'], q{a5}=>[12354,'HIRAGANA LETTER A','Lo','Hiragana'], q{a6}=>[12449,'KATAKANA LETTER SMALL A','Lo','Katakana'], q{a7}=>[481,'LATIN SMALL LETTER A WITH DOT ABOVE AND MACRON','Ll','Latin'], +q{a8}=>[513,'LATIN SMALL LETTER A WITH DOUBLE GRAVE','Ll Xz','Latin'], q{a:}=>[228,'LATIN SMALL LETTER A WITH DIAERESIS','Ll Xl','Latin'], q{a;}=>[261,'LATIN SMALL LETTER A WITH OGONEK','Ll','Latin'], q{a<}=>[462,'LATIN SMALL LETTER A WITH CARON','Ll','Latin'], @@ -893,24 +967,31 @@ q{a=}=>[1072,'CYRILLIC SMALL LETTER A','Ll','Cyrillic'], q{a>}=>[226,'LATIN SMALL LETTER A WITH CIRCUMFLEX','Ll Xl','Latin'], q{a?}=>[227,'LATIN SMALL LETTER A WITH TILDE','Ll Xl','Latin'], q{aH}=>[1571,'ARABIC LETTER ALEF WITH HAMZA ABOVE','Lo','Arabic'], +q{aI}=>[592,'LATIN SMALL LETTER TURNED A','Ll Xz','Latin'], q{aM}=>[1570,'ARABIC LETTER ALEF WITH MADDA ABOVE','Lo','Arabic'], q{aN}=>[12580,'BOPOMOFO LETTER ANG','Lo','Bopomofo'], q{aR}=>[8553,'ROMAN NUMERAL TEN','Nl','Common'], q{aS}=>[1648,'ARABIC LETTER SUPERSCRIPT ALEF','Mn','Inherited'], q{aa}=>[229,'LATIN SMALL LETTER A 
WITH RING ABOVE','Ll Xl','Latin'], +q{ac}=>[8448,'ACCOUNT OF','So Xz','Common'], q{ae}=>[230,'LATIN SMALL LETTER AE','Ll Xl','Latin'], q{ah}=>[1573,'ARABIC LETTER ALEF WITH HAMZA BELOW','Lo','Arabic'], q{ai}=>[12574,'BOPOMOFO LETTER AI','Lo','Bopomofo'], q{am}=>[57375,'','Co','Common'], q{an}=>[12578,'BOPOMOFO LETTER AN','Lo','Bopomofo'], q{ar}=>[8569,'SMALL ROMAN NUMERAL TEN','Nl','Common'], +q{as}=>[8449,'ADDRESSED TO THE SUBJECT','So Xz','Common'], q{au}=>[12576,'BOPOMOFO LETTER AU','Lo','Bopomofo'], q{b*}=>[946,'GREEK SMALL LETTER BETA','Ll','Greek'], q{b+}=>[1576,'ARABIC LETTER BEH','Lo','Arabic'], +q{b-}=>[387,'LATIN SMALL LETTER B WITH TOPBAR','Ll Xz','Latin'], q{b.}=>[7683,'LATIN SMALL LETTER B WITH DOT ABOVE','Ll','Latin'], +q{b/}=>[384,'LATIN SMALL LETTER B WITH STROKE','Ll Xz','Latin'], +q{b2}=>[595,'LATIN SMALL LETTER B WITH HOOK','Ll Xz','Latin'], q{b3}=>[57371,'','Co','Common'], q{b4}=>[12549,'BOPOMOFO LETTER B','Lo','Bopomofo'], q{b=}=>[1073,'CYRILLIC SMALL LETTER BE','Ll','Cyrillic'], +q{b?}=>[7532,'LATIN SMALL LETTER B WITH MIDDLE TILDE','Ll Xz','Latin'], q{bR}=>[8554,'ROMAN NUMERAL ELEVEN','Nl','Common'], q{b_}=>[7687,'LATIN SMALL LETTER B WITH LINE BELOW','Ll','Latin'], q{ba}=>[12400,'HIRAGANA LETTER BA','Lo','Hiragana'], @@ -925,8 +1006,10 @@ q{c*}=>[958,'GREEK SMALL LETTER XI','Ll','Greek'], q{c+}=>[1589,'ARABIC LETTER SAD','Lo','Arabic'], q{c,}=>[231,'LATIN SMALL LETTER C WITH CEDILLA','Ll Xl','Latin'], q{c.}=>[267,'LATIN SMALL LETTER C WITH DOT ABOVE','Ll','Latin'], +q{c2}=>[392,'LATIN SMALL LETTER C WITH HOOK','Ll Xz','Latin'], q{c3}=>[1153,'CYRILLIC SMALL LETTER KOPPA','Ll','Cyrillic'], q{c4}=>[12568,'BOPOMOFO LETTER C','Lo','Bopomofo'], +q{c9}=>[597,'LATIN SMALL LETTER C WITH CURL','Ll Xz','Latin'], q{c<}=>[269,'LATIN SMALL LETTER C WITH CARON','Ll','Latin'], q{c=}=>[1094,'CYRILLIC SMALL LETTER TSE','Ll','Cyrillic'], q{c>}=>[265,'LATIN SMALL LETTER C WITH CIRCUMFLEX','Ll','Latin'], @@ -938,6 +1021,7 @@ q{cS}=>[9824,'BLACK SPADE 
SUIT','So','Common'], q{ch}=>[12564,'BOPOMOFO LETTER CH','Lo','Bopomofo'], q{co}=>[8453,'CARE OF','So','Common'], q{cr}=>[8571,'SMALL ROMAN NUMERAL TWELVE','Nl','Common'], +q{cu}=>[8454,'CADA UNA','So Xz','Common'], q{d%}=>[1106,'CYRILLIC SMALL LETTER DJE','Ll','Cyrillic'], q{d*}=>[948,'GREEK SMALL LETTER DELTA','Ll','Greek'], q{d+}=>[1583,'ARABIC LETTER DAL','Lo','Arabic'], @@ -945,9 +1029,13 @@ q{d,}=>[7697,'LATIN SMALL LETTER D WITH CEDILLA','Ll','Latin'], q{d-}=>[240,'LATIN SMALL LETTER ETH','Ll Xl','Latin'], q{d.}=>[7691,'LATIN SMALL LETTER D WITH DOT ABOVE','Ll','Latin'], q{d/}=>[273,'LATIN SMALL LETTER D WITH STROKE','Ll','Latin'], +q{d2}=>[599,'LATIN SMALL LETTER D WITH HOOK','Ll Xz','Latin'], q{d4}=>[12553,'BOPOMOFO LETTER D','Lo','Bopomofo'], +q{d9}=>[545,'LATIN SMALL LETTER D WITH CURL','Ll Xz','Latin'], +q{d;}=>[598,'LATIN SMALL LETTER D WITH TAIL','Ll Xz','Latin'], q{d<}=>[271,'LATIN SMALL LETTER D WITH CARON','Ll','Latin'], q{d=}=>[1076,'CYRILLIC SMALL LETTER DE','Ll','Cyrillic'], +q{d?}=>[7533,'LATIN SMALL LETTER D WITH MIDDLE TILDE','Ll Xz','Latin'], q{dH}=>[9519,'BOX DRAWINGS DOWN LIGHT AND HORIZONTAL HEAVY','So','Common'], q{dL}=>[9489,'BOX DRAWINGS DOWN LIGHT AND LEFT HEAVY','So','Common'], q{dP}=>[8706,'PARTIAL DIFFERENTIAL','Sm','Common'], @@ -955,6 +1043,7 @@ q{dR}=>[9485,'BOX DRAWINGS DOWN LIGHT AND RIGHT HEAVY','So','Common'], q{dT}=>[9661,'WHITE DOWN-POINTING TRIANGLE','So','Common'], q{d_}=>[7695,'LATIN SMALL LETTER D WITH LINE BELOW','Ll','Latin'], q{da}=>[12384,'HIRAGANA LETTER DA','Lo','Hiragana'], +q{db}=>[568,'LATIN SMALL LETTER DB DIGRAPH','Ll Xz','Latin'], q{dd}=>[1590,'ARABIC LETTER DAD','Lo','Arabic'], q{de}=>[12391,'HIRAGANA LETTER DE','Lo','Hiragana'], q{dh}=>[9516,'BOX DRAWINGS LIGHT DOWN AND HORIZONTAL','So','Common'], @@ -970,20 +1059,25 @@ q{e!}=>[232,'LATIN SMALL LETTER E WITH GRAVE','Ll Xl','Latin'], q{e%}=>[941,'GREEK SMALL LETTER EPSILON WITH TONOS','Ll','Greek'], q{e'}=>[233,'LATIN SMALL LETTER E WITH ACUTE','Ll 
Xl','Latin'], q{e(}=>[277,'LATIN SMALL LETTER E WITH BREVE','Ll','Latin'], +q{e)}=>[519,'LATIN SMALL LETTER E WITH INVERTED BREVE','Ll Xz','Latin'], q{e*}=>[949,'GREEK SMALL LETTER EPSILON','Ll','Greek'], q{e+}=>[1593,'ARABIC LETTER AIN','Lo','Arabic'], +q{e,}=>[553,'LATIN SMALL LETTER E WITH CEDILLA','Ll Xz','Latin'], q{e-}=>[275,'LATIN SMALL LETTER E WITH MACRON','Ll','Latin'], q{e.}=>[279,'LATIN SMALL LETTER E WITH DOT ABOVE','Ll','Latin'], +q{e/}=>[583,'','Xn Xz',''], q{e2}=>[7867,'LATIN SMALL LETTER E WITH HOOK ABOVE','Ll','Latin'], q{e4}=>[12572,'BOPOMOFO LETTER E','Lo','Bopomofo'], q{e5}=>[12360,'HIRAGANA LETTER E','Lo','Hiragana'], q{e6}=>[12455,'KATAKANA LETTER SMALL E','Lo','Katakana'], +q{e8}=>[517,'LATIN SMALL LETTER E WITH DOUBLE GRAVE','Ll Xz','Latin'], q{e:}=>[235,'LATIN SMALL LETTER E WITH DIAERESIS','Ll Xl','Latin'], q{e;}=>[281,'LATIN SMALL LETTER E WITH OGONEK','Ll','Latin'], q{e<}=>[283,'LATIN SMALL LETTER E WITH CARON','Ll','Latin'], q{e=}=>[1077,'CYRILLIC SMALL LETTER IE','Ll','Cyrillic'], q{e>}=>[234,'LATIN SMALL LETTER E WITH CIRCUMFLEX','Ll Xl','Latin'], q{e?}=>[7869,'LATIN SMALL LETTER E WITH TILDE','Ll','Latin'], +q{eI}=>[601,'LATIN SMALL LETTER SCHWA','Ll Xz','Latin'], q{eN}=>[12581,'BOPOMOFO LETTER ENG','Lo','Bopomofo'], q{ed}=>[57374,'','Co','Common'], q{ei}=>[12575,'BOPOMOFO LETTER EI','Lo','Bopomofo'], @@ -994,9 +1088,12 @@ q{f(}=>[57373,'','Co','Common'], q{f*}=>[966,'GREEK SMALL LETTER PHI','Ll','Greek'], q{f+}=>[1601,'ARABIC LETTER FEH','Lo','Arabic'], q{f.}=>[7711,'LATIN SMALL LETTER F WITH DOT ABOVE','Ll','Latin'], +q{f2}=>[402,'LATIN SMALL LETTER F WITH HOOK','Ll Xz','Latin'], q{f3}=>[1139,'CYRILLIC SMALL LETTER FITA','Ll','Cyrillic'], q{f4}=>[12552,'BOPOMOFO LETTER F','Lo','Bopomofo'], q{f=}=>[1092,'CYRILLIC SMALL LETTER EF','Ll','Cyrillic'], +q{f?}=>[7534,'LATIN SMALL LETTER F WITH MIDDLE TILDE','Ll Xz','Latin'], +q{fI}=>[8526,'','Xn Xz',''], q{fS}=>[9632,'BLACK SQUARE','So','Common'], q{ff}=>[64256,'LATIN SMALL LIGATURE 
FF','Ll','Latin'], q{fi}=>[64257,'LATIN SMALL LIGATURE FI','Ll','Latin'], @@ -1011,11 +1108,13 @@ q{g,}=>[291,'LATIN SMALL LETTER G WITH CEDILLA','Ll','Latin'], q{g-}=>[7713,'LATIN SMALL LETTER G WITH MACRON','Ll','Latin'], q{g.}=>[289,'LATIN SMALL LETTER G WITH DOT ABOVE','Ll','Latin'], q{g/}=>[485,'LATIN SMALL LETTER G WITH STROKE','Ll','Latin'], +q{g2}=>[608,'LATIN SMALL LETTER G WITH HOOK','Ll Xz','Latin'], q{g3}=>[1169,'CYRILLIC SMALL LETTER GHE WITH UPTURN','Ll','Cyrillic'], q{g4}=>[12557,'BOPOMOFO LETTER G','Lo','Bopomofo'], q{g<}=>[487,'LATIN SMALL LETTER G WITH CARON','Ll','Latin'], q{g=}=>[1075,'CYRILLIC SMALL LETTER GHE','Ll','Cyrillic'], q{g>}=>[285,'LATIN SMALL LETTER G WITH CIRCUMFLEX','Ll','Latin'], +q{gI}=>[7543,'LATIN SMALL LETTER TURNED G','Ll Xz','Latin'], q{ga}=>[12364,'HIRAGANA LETTER GA','Lo','Hiragana'], q{ge}=>[12370,'HIRAGANA LETTER GE','Lo','Hiragana'], q{gf}=>[1711,'ARABIC LETTER GAF','Lo','Arabic'], @@ -1028,10 +1127,12 @@ q{h+}=>[1607,'ARABIC LETTER HEH','Lo','Arabic'], q{h,}=>[7721,'LATIN SMALL LETTER H WITH CEDILLA','Ll','Latin'], q{h.}=>[7715,'LATIN SMALL LETTER H WITH DOT ABOVE','Ll','Latin'], q{h/}=>[295,'LATIN SMALL LETTER H WITH STROKE','Ll','Latin'], +q{h2}=>[614,'LATIN SMALL LETTER H WITH HOOK','Ll Xz','Latin'], q{h4}=>[12559,'BOPOMOFO LETTER H','Lo','Bopomofo'], q{h:}=>[7719,'LATIN SMALL LETTER H WITH DIAERESIS','Ll','Latin'], q{h=}=>[1093,'CYRILLIC SMALL LETTER HA','Ll','Cyrillic'], q{h>}=>[293,'LATIN SMALL LETTER H WITH CIRCUMFLEX','Ll','Latin'], +q{hI}=>[613,'LATIN SMALL LETTER TURNED H','Ll Xz','Latin'], q{h_}=>[7830,'LATIN SMALL LETTER H WITH LINE BELOW','Ll','Latin'], q{ha}=>[12399,'HIRAGANA LETTER HA','Lo','Hiragana'], q{he}=>[12408,'HIRAGANA LETTER HE','Lo','Hiragana'], @@ -1040,25 +1141,30 @@ q{hi}=>[12402,'HIRAGANA LETTER HI','Lo','Hiragana'], q{hk}=>[1581,'ARABIC LETTER HAH','Lo','Arabic'], q{ho}=>[12411,'HIRAGANA LETTER HO','Lo','Hiragana'], q{hu}=>[12405,'HIRAGANA LETTER HU','Lo','Hiragana'], +q{hw}=>[405,'LATIN 
SMALL LETTER HV','Ll Xz','Latin'], q{i!}=>[236,'LATIN SMALL LETTER I WITH GRAVE','Ll Xl','Latin'], q{i%}=>[943,'GREEK SMALL LETTER IOTA WITH TONOS','Ll','Greek'], q{i'}=>[237,'LATIN SMALL LETTER I WITH ACUTE','Ll Xl','Latin'], q{i(}=>[301,'LATIN SMALL LETTER I WITH BREVE','Ll','Latin'], +q{i)}=>[523,'LATIN SMALL LETTER I WITH INVERTED BREVE','Ll Xz','Latin'], q{i*}=>[953,'GREEK SMALL LETTER IOTA','Ll','Greek'], q{i+}=>[1594,'ARABIC LETTER GHAIN','Lo','Arabic'], q{i-}=>[299,'LATIN SMALL LETTER I WITH MACRON','Ll','Latin'], q{i.}=>[305,'LATIN SMALL LETTER DOTLESS I','Ll','Latin'], +q{i/}=>[616,'LATIN SMALL LETTER I WITH STROKE','Ll Xz','Latin'], q{i2}=>[7881,'LATIN SMALL LETTER I WITH HOOK ABOVE','Ll','Latin'], q{i3}=>[912,'GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS','Ll','Greek'], q{i4}=>[12583,'BOPOMOFO LETTER I','Lo','Bopomofo'], q{i5}=>[12356,'HIRAGANA LETTER I','Lo','Hiragana'], q{i6}=>[12451,'KATAKANA LETTER SMALL I','Lo','Katakana'], +q{i8}=>[521,'LATIN SMALL LETTER I WITH DOUBLE GRAVE','Ll Xz','Latin'], q{i:}=>[239,'LATIN SMALL LETTER I WITH DIAERESIS','Ll Xl','Latin'], q{i;}=>[303,'LATIN SMALL LETTER I WITH OGONEK','Ll','Latin'], q{i<}=>[464,'LATIN SMALL LETTER I WITH CARON','Ll','Latin'], q{i=}=>[1080,'CYRILLIC SMALL LETTER I','Ll','Cyrillic'], q{i>}=>[238,'LATIN SMALL LETTER I WITH CIRCUMFLEX','Ll Xl','Latin'], q{i?}=>[297,'LATIN SMALL LETTER I WITH TILDE','Ll','Latin'], +q{iI}=>[7433,'LATIN SMALL LETTER TURNED I','Ll Xz','Latin'], q{ie}=>[1108,'CYRILLIC SMALL LETTER UKRAINIAN IE','Ll','Cyrillic'], q{ii}=>[1110,'CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I','Ll','Cyrillic'], q{ij}=>[307,'LATIN SMALL LIGATURE IJ','Ll','Latin'], @@ -1067,6 +1173,8 @@ q{iu}=>[12585,'BOPOMOFO LETTER IU','Lo','Bopomofo'], q{j%}=>[1112,'CYRILLIC SMALL LETTER JE','Ll','Cyrillic'], q{j*}=>[970,'GREEK SMALL LETTER IOTA WITH DIALYTIKA','Ll','Greek'], q{j+}=>[1609,'ARABIC LETTER ALEF MAKSURA','Lo','Arabic'], +q{j.}=>[567,'LATIN SMALL LETTER DOTLESS J','Ll Xz','Latin'], 
+q{j/}=>[585,'','Xn Xz',''], q{j3}=>[1013,'GREEK LUNATE EPSILON SYMBOL','Ll','Greek'], q{j4}=>[12560,'BOPOMOFO LETTER J','Lo','Bopomofo'], q{j<}=>[496,'LATIN SMALL LETTER J WITH CARON','Ll','Latin'], @@ -1079,10 +1187,12 @@ q{k'}=>[7729,'LATIN SMALL LETTER K WITH ACUTE','Ll','Latin'], q{k*}=>[954,'GREEK SMALL LETTER KAPPA','Ll','Greek'], q{k+}=>[1603,'ARABIC LETTER KAF','Lo','Arabic'], q{k,}=>[311,'LATIN SMALL LETTER K WITH CEDILLA','Ll','Latin'], +q{k2}=>[409,'LATIN SMALL LETTER K WITH HOOK','Ll Xz','Latin'], q{k3}=>[991,'GREEK SMALL LETTER KOPPA','Ll','Greek'], q{k4}=>[12558,'BOPOMOFO LETTER K','Lo','Bopomofo'], q{k<}=>[489,'LATIN SMALL LETTER K WITH CARON','Ll','Latin'], q{k=}=>[1082,'CYRILLIC SMALL LETTER KA','Ll','Cyrillic'], +q{kI}=>[670,'LATIN SMALL LETTER TURNED K','Ll Xz','Latin'], q{k_}=>[7733,'LATIN SMALL LETTER K WITH LINE BELOW','Ll','Latin'], q{ka}=>[12363,'HIRAGANA LETTER KA','Lo','Hiragana'], q{ke}=>[12369,'HIRAGANA LETTER KE','Lo','Hiragana'], @@ -1095,11 +1205,15 @@ q{l'}=>[314,'LATIN SMALL LETTER L WITH ACUTE','Ll','Latin'], q{l*}=>[955,'GREEK SMALL LETTER LAMDA','Ll','Greek'], q{l+}=>[1604,'ARABIC LETTER LAM','Lo','Arabic'], q{l,}=>[316,'LATIN SMALL LETTER L WITH CEDILLA','Ll','Latin'], +q{l-}=>[410,'LATIN SMALL LETTER L WITH BAR','Ll Xz','Latin'], q{l.}=>[320,'LATIN SMALL LETTER L WITH MIDDLE DOT','Ll','Latin'], q{l/}=>[322,'LATIN SMALL LETTER L WITH STROKE','Ll','Latin'], q{l4}=>[12556,'BOPOMOFO LETTER L','Lo','Bopomofo'], +q{l9}=>[564,'LATIN SMALL LETTER L WITH CURL','Ll Xz','Latin'], +q{l;}=>[621,'LATIN SMALL LETTER L WITH RETROFLEX HOOK','Ll Xz','Latin'], q{l<}=>[318,'LATIN SMALL LETTER L WITH CARON','Ll','Latin'], q{l=}=>[1083,'CYRILLIC SMALL LETTER EL','Ll','Cyrillic'], +q{l?}=>[619,'LATIN SMALL LETTER L WITH MIDDLE TILDE','Ll Xz','Latin'], q{lB}=>[9612,'LEFT HALF BLOCK','So','Common'], q{l_}=>[7739,'LATIN SMALL LETTER L WITH LINE BELOW','Ll','Latin'], q{lj}=>[1113,'CYRILLIC SMALL LETTER LJE','Ll','Cyrillic'], @@ -1109,19 +1223,26 @@ 
q{m+}=>[1605,'ARABIC LETTER MEEM','Lo','Arabic'], q{m.}=>[7745,'LATIN SMALL LETTER M WITH DOT ABOVE','Ll','Latin'], q{m3}=>[989,'GREEK SMALL LETTER DIGAMMA','Ll','Greek'], q{m4}=>[12551,'BOPOMOFO LETTER M','Lo','Bopomofo'], +q{m;}=>[625,'LATIN SMALL LETTER M WITH HOOK','Ll Xz','Latin'], q{m=}=>[1084,'CYRILLIC SMALL LETTER EM','Ll','Cyrillic'], +q{m?}=>[7535,'LATIN SMALL LETTER M WITH MIDDLE TILDE','Ll Xz','Latin'], +q{mI}=>[623,'LATIN SMALL LETTER TURNED M','Ll Xz','Latin'], q{ma}=>[12414,'HIRAGANA LETTER MA','Lo','Hiragana'], q{me}=>[12417,'HIRAGANA LETTER ME','Lo','Hiragana'], q{mi}=>[12415,'HIRAGANA LETTER MI','Lo','Hiragana'], q{mo}=>[12418,'HIRAGANA LETTER MO','Lo','Hiragana'], q{mu}=>[12416,'HIRAGANA LETTER MU','Lo','Hiragana'], +q{n!}=>[505,'LATIN SMALL LETTER N WITH GRAVE','Ll Xz','Latin'], q{n'}=>[324,'LATIN SMALL LETTER N WITH ACUTE','Ll','Latin'], q{n*}=>[957,'GREEK SMALL LETTER NU','Ll','Greek'], q{n+}=>[1606,'ARABIC LETTER NOON','Lo','Arabic'], q{n,}=>[326,'LATIN SMALL LETTER N WITH CEDILLA','Ll','Latin'], q{n.}=>[7749,'LATIN SMALL LETTER N WITH DOT ABOVE','Ll','Latin'], +q{n2}=>[626,'LATIN SMALL LETTER N WITH LEFT HOOK','Ll Xz','Latin'], q{n4}=>[12555,'BOPOMOFO LETTER N','Lo','Bopomofo'], q{n5}=>[12435,'HIRAGANA LETTER N','Lo','Hiragana'], +q{n9}=>[565,'LATIN SMALL LETTER N WITH CURL','Ll Xz','Latin'], +q{n;}=>[627,'LATIN SMALL LETTER N WITH RETROFLEX HOOK','Ll Xz','Latin'], q{n<}=>[328,'LATIN SMALL LETTER N WITH CARON','Ll','Latin'], q{n=}=>[1085,'CYRILLIC SMALL LETTER EN','Ll','Cyrillic'], q{n?}=>[241,'LATIN SMALL LETTER N WITH TILDE','Ll Xl','Latin'], @@ -1140,8 +1261,10 @@ q{o"}=>[337,'LATIN SMALL LETTER O WITH DOUBLE ACUTE','Ll','Latin'], q{o%}=>[972,'GREEK SMALL LETTER OMICRON WITH TONOS','Ll','Greek'], q{o'}=>[243,'LATIN SMALL LETTER O WITH ACUTE','Ll Xl','Latin'], q{o(}=>[335,'LATIN SMALL LETTER O WITH BREVE','Ll','Latin'], +q{o)}=>[527,'LATIN SMALL LETTER O WITH INVERTED BREVE','Ll Xz','Latin'], q{o*}=>[959,'GREEK SMALL LETTER 
OMICRON','Ll','Greek'], q{o-}=>[333,'LATIN SMALL LETTER O WITH MACRON','Ll','Latin'], +q{o.}=>[559,'LATIN SMALL LETTER O WITH DOT ABOVE','Ll Xz','Latin'], q{o/}=>[248,'LATIN SMALL LETTER O WITH STROKE','Ll Xl','Latin'], q{o1}=>[493,'LATIN SMALL LETTER O WITH OGONEK AND MACRON','Ll','Latin'], q{o2}=>[7887,'LATIN SMALL LETTER O WITH HOOK ABOVE','Ll','Latin'], @@ -1149,6 +1272,7 @@ q{o3}=>[1131,'CYRILLIC SMALL LETTER BIG YUS','Ll','Cyrillic'], q{o4}=>[12571,'BOPOMOFO LETTER O','Lo','Bopomofo'], q{o5}=>[12362,'HIRAGANA LETTER O','Lo','Hiragana'], q{o6}=>[12457,'KATAKANA LETTER SMALL O','Lo','Katakana'], +q{o8}=>[525,'LATIN SMALL LETTER O WITH DOUBLE GRAVE','Ll Xz','Latin'], q{o9}=>[417,'LATIN SMALL LETTER O WITH HORN','Ll','Latin'], q{o:}=>[246,'LATIN SMALL LETTER O WITH DIAERESIS','Ll Xl','Latin'], q{o;}=>[491,'LATIN SMALL LETTER O WITH OGONEK','Ll','Latin'], @@ -1158,6 +1282,7 @@ q{o>}=>[244,'LATIN SMALL LETTER O WITH CIRCUMFLEX','Ll Xl','Latin'], q{o?}=>[245,'LATIN SMALL LETTER O WITH TILDE','Ll Xl','Latin'], q{oC}=>[8451,'DEGREE CELSIUS','So','Common'], q{oF}=>[8457,'DEGREE FAHRENHEIT','So','Common'], +q{oI}=>[596,'LATIN SMALL LETTER OPEN O','Ll Xz','Latin'], q{oe}=>[339,'LATIN SMALL LIGATURE OE','Ll','Latin'], q{oi}=>[419,'LATIN SMALL LETTER OI','Ll','Latin'], q{ou}=>[12577,'BOPOMOFO LETTER OU','Lo','Bopomofo'], @@ -1165,9 +1290,12 @@ q{p'}=>[7765,'LATIN SMALL LETTER P WITH ACUTE','Ll','Latin'], q{p*}=>[960,'GREEK SMALL LETTER PI','Ll','Greek'], q{p+}=>[1662,'ARABIC LETTER PEH','Lo','Arabic'], q{p.}=>[7767,'LATIN SMALL LETTER P WITH DOT ABOVE','Ll','Latin'], +q{p/}=>[7549,'LATIN SMALL LETTER P WITH STROKE','Ll Xz','Latin'], +q{p2}=>[421,'LATIN SMALL LETTER P WITH HOOK','Ll Xz','Latin'], q{p3}=>[993,'GREEK SMALL LETTER SAMPI','Ll','Greek'], q{p4}=>[12550,'BOPOMOFO LETTER P','Lo','Bopomofo'], q{p=}=>[1087,'CYRILLIC SMALL LETTER PE','Ll','Cyrillic'], +q{p?}=>[7537,'LATIN SMALL LETTER P WITH MIDDLE TILDE','Ll Xz','Latin'], q{pa}=>[12401,'HIRAGANA LETTER 
PA','Lo','Hiragana'], q{pe}=>[12410,'HIRAGANA LETTER PE','Lo','Hiragana'], q{pi}=>[12404,'HIRAGANA LETTER PI','Lo','Hiragana'], @@ -1176,15 +1304,24 @@ q{po}=>[12413,'HIRAGANA LETTER PO','Lo','Hiragana'], q{pu}=>[12407,'HIRAGANA LETTER PU','Lo','Hiragana'], q{q*}=>[968,'GREEK SMALL LETTER PSI','Ll','Greek'], q{q+}=>[1602,'ARABIC LETTER QAF','Lo','Arabic'], +q{q2}=>[672,'LATIN SMALL LETTER Q WITH HOOK','Ll Xz','Latin'], q{q4}=>[12561,'BOPOMOFO LETTER Q','Lo','Bopomofo'], +q{q;}=>[587,'','Xn Xz',''], +q{qp}=>[569,'LATIN SMALL LETTER QP DIGRAPH','Ll Xz','Latin'], q{r'}=>[341,'LATIN SMALL LETTER R WITH ACUTE','Ll','Latin'], +q{r)}=>[531,'LATIN SMALL LETTER R WITH INVERTED BREVE','Ll Xz','Latin'], q{r*}=>[961,'GREEK SMALL LETTER RHO','Ll','Greek'], q{r+}=>[1585,'ARABIC LETTER REH','Lo','Arabic'], q{r,}=>[343,'LATIN SMALL LETTER R WITH CEDILLA','Ll','Latin'], q{r.}=>[7769,'LATIN SMALL LETTER R WITH DOT ABOVE','Ll','Latin'], +q{r/}=>[589,'','Xn Xz',''], q{r4}=>[12566,'BOPOMOFO LETTER R','Lo','Bopomofo'], +q{r8}=>[529,'LATIN SMALL LETTER R WITH DOUBLE GRAVE','Ll Xz','Latin'], +q{r;}=>[637,'LATIN SMALL LETTER R WITH TAIL','Ll Xz','Latin'], q{r<}=>[345,'LATIN SMALL LETTER R WITH CARON','Ll','Latin'], q{r=}=>[1088,'CYRILLIC SMALL LETTER ER','Ll','Cyrillic'], +q{r?}=>[7538,'LATIN SMALL LETTER R WITH MIDDLE TILDE','Ll Xz','Latin'], +q{rI}=>[633,'LATIN SMALL LETTER TURNED R','Ll Xz','Latin'], q{r_}=>[7775,'LATIN SMALL LETTER R WITH LINE BELOW','Ll','Latin'], q{ra}=>[12425,'HIRAGANA LETTER RA','Lo','Hiragana'], q{re}=>[12428,'HIRAGANA LETTER RE','Lo','Hiragana'], @@ -1198,9 +1335,11 @@ q{s+}=>[1587,'ARABIC LETTER SEEN','Lo','Arabic'], q{s,}=>[351,'LATIN SMALL LETTER S WITH CEDILLA','Ll','Latin'], q{s.}=>[7777,'LATIN SMALL LETTER S WITH DOT ABOVE','Ll','Latin'], q{s4}=>[12569,'BOPOMOFO LETTER S','Lo','Bopomofo'], +q{s;}=>[642,'LATIN SMALL LETTER S WITH HOOK','Ll Xz','Latin'], q{s<}=>[353,'LATIN SMALL LETTER S WITH CARON','Ll','Latin'], q{s=}=>[1089,'CYRILLIC SMALL LETTER 
ES','Ll','Cyrillic'], q{s>}=>[349,'LATIN SMALL LETTER S WITH CIRCUMFLEX','Ll','Latin'], +q{s?}=>[7540,'LATIN SMALL LETTER S WITH MIDDLE TILDE','Ll Xz','Latin'], q{sB}=>[9642,'BLACK SMALL SQUARE','So','Common'], q{sa}=>[12373,'HIRAGANA LETTER SA','Lo','Hiragana'], q{sc}=>[1097,'CYRILLIC SMALL LETTER SHCHA','Ll','Cyrillic'], @@ -1217,11 +1356,16 @@ q{t+}=>[1578,'ARABIC LETTER TEH','Lo','Arabic'], q{t,}=>[355,'LATIN SMALL LETTER T WITH CEDILLA','Ll','Latin'], q{t.}=>[7787,'LATIN SMALL LETTER T WITH DOT ABOVE','Ll','Latin'], q{t/}=>[359,'LATIN SMALL LETTER T WITH STROKE','Ll','Latin'], +q{t2}=>[429,'LATIN SMALL LETTER T WITH HOOK','Ll Xz','Latin'], q{t3}=>[987,'GREEK SMALL LETTER STIGMA','Ll','Greek'], q{t4}=>[12554,'BOPOMOFO LETTER T','Lo','Bopomofo'], +q{t9}=>[566,'LATIN SMALL LETTER T WITH CURL','Ll Xz','Latin'], q{t:}=>[7831,'LATIN SMALL LETTER T WITH DIAERESIS','Ll','Latin'], +q{t;}=>[648,'LATIN SMALL LETTER T WITH RETROFLEX HOOK','Ll Xz','Latin'], q{t<}=>[357,'LATIN SMALL LETTER T WITH CARON','Ll','Latin'], q{t=}=>[1090,'CYRILLIC SMALL LETTER TE','Ll','Cyrillic'], +q{t?}=>[7541,'LATIN SMALL LETTER T WITH MIDDLE TILDE','Ll Xz','Latin'], +q{tI}=>[647,'LATIN SMALL LETTER TURNED T','Ll Xz','Latin'], q{tU}=>[12387,'HIRAGANA LETTER SMALL TU','Lo','Hiragana'], q{t_}=>[7791,'LATIN SMALL LETTER T WITH LINE BELOW','Ll','Latin'], q{ta}=>[12383,'HIRAGANA LETTER TA','Lo','Hiragana'], @@ -1239,14 +1383,17 @@ q{u"}=>[369,'LATIN SMALL LETTER U WITH DOUBLE ACUTE','Ll','Latin'], q{u%}=>[973,'GREEK SMALL LETTER UPSILON WITH TONOS','Ll','Greek'], q{u'}=>[250,'LATIN SMALL LETTER U WITH ACUTE','Ll Xl','Latin'], q{u(}=>[365,'LATIN SMALL LETTER U WITH BREVE','Ll','Latin'], +q{u)}=>[535,'LATIN SMALL LETTER U WITH INVERTED BREVE','Ll Xz','Latin'], q{u*}=>[965,'GREEK SMALL LETTER UPSILON','Ll','Greek'], q{u-}=>[363,'LATIN SMALL LETTER U WITH MACRON','Ll','Latin'], +q{u/}=>[649,'LATIN SMALL LETTER U BAR','Ll Xz','Latin'], q{u0}=>[367,'LATIN SMALL LETTER U WITH RING ABOVE','Ll','Latin'], 
q{u2}=>[7911,'LATIN SMALL LETTER U WITH HOOK ABOVE','Ll','Latin'], q{u3}=>[944,'GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS','Ll','Greek'], q{u4}=>[12584,'BOPOMOFO LETTER U','Lo','Bopomofo'], q{u5}=>[12358,'HIRAGANA LETTER U','Lo','Hiragana'], q{u6}=>[12453,'KATAKANA LETTER SMALL U','Lo','Katakana'], +q{u8}=>[533,'LATIN SMALL LETTER U WITH DOUBLE GRAVE','Ll Xz','Latin'], q{u9}=>[432,'LATIN SMALL LETTER U WITH HORN','Ll','Latin'], q{u:}=>[252,'LATIN SMALL LETTER U WITH DIAERESIS','Ll Xl','Latin'], q{u;}=>[371,'LATIN SMALL LETTER U WITH OGONEK','Ll','Latin'], @@ -1264,11 +1411,14 @@ q{ur}=>[9492,'BOX DRAWINGS LIGHT UP AND RIGHT','So','Common'], q{v%}=>[1118,'CYRILLIC SMALL LETTER SHORT U','Ll','Cyrillic'], q{v*}=>[971,'GREEK SMALL LETTER UPSILON WITH DIALYTIKA','Ll','Greek'], q{v+}=>[1700,'ARABIC LETTER VEH','Lo','Arabic'], +q{v2}=>[651,'LATIN SMALL LETTER V WITH HOOK','Ll Xz','Latin'], q{v3}=>[1141,'CYRILLIC SMALL LETTER IZHITSA','Ll','Cyrillic'], q{v4}=>[12586,'BOPOMOFO LETTER V','Lo','Bopomofo'], +q{v9}=>[11380,'','Xn Xz',''], q{v=}=>[1074,'CYRILLIC SMALL LETTER VE','Ll','Cyrillic'], q{v?}=>[7805,'LATIN SMALL LETTER V WITH TILDE','Ll','Latin'], q{vH}=>[9535,'BOX DRAWINGS VERTICAL LIGHT AND HORIZONTAL HEAVY','So','Common'], +q{vI}=>[652,'LATIN SMALL LETTER TURNED V','Ll Xz','Latin'], q{vL}=>[9509,'BOX DRAWINGS VERTICAL LIGHT AND LEFT HEAVY','So','Common'], q{vR}=>[9501,'BOX DRAWINGS VERTICAL LIGHT AND RIGHT HEAVY','So','Common'], q{vh}=>[9532,'BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL','So','Common'], @@ -1287,10 +1437,12 @@ q{w:}=>[7813,'LATIN SMALL LETTER W WITH DIAERESIS','Ll','Latin'], q{w>}=>[373,'LATIN SMALL LETTER W WITH CIRCUMFLEX','Ll','Latin'], q{wA}=>[12430,'HIRAGANA LETTER SMALL WA','Lo','Hiragana'], q{wH}=>[1572,'ARABIC LETTER WAW WITH HAMZA ABOVE','Lo','Arabic'], +q{wI}=>[653,'LATIN SMALL LETTER TURNED W','Ll Xz','Latin'], q{wa}=>[12431,'HIRAGANA LETTER WA','Lo','Hiragana'], q{we}=>[12433,'HIRAGANA LETTER WE','Lo','Hiragana'], 
q{wi}=>[12432,'HIRAGANA LETTER WI','Lo','Hiragana'], q{wo}=>[12434,'HIRAGANA LETTER WO','Lo','Hiragana'], +q{ww}=>[447,'LATIN LETTER WYNN','Ll Xz','Latin'], q{x*}=>[967,'GREEK SMALL LETTER CHI','Ll','Greek'], q{x+}=>[1582,'ARABIC LETTER KHAH','Lo','Arabic'], q{x.}=>[7819,'LATIN SMALL LETTER X WITH DOT ABOVE','Ll','Latin'], @@ -1301,16 +1453,20 @@ q{y%}=>[942,'GREEK SMALL LETTER ETA WITH TONOS','Ll','Greek'], q{y'}=>[253,'LATIN SMALL LETTER Y WITH ACUTE','Ll Xl','Latin'], q{y*}=>[951,'GREEK SMALL LETTER ETA','Ll','Greek'], q{y+}=>[1610,'ARABIC LETTER YEH','Lo','Arabic'], +q{y-}=>[563,'LATIN SMALL LETTER Y WITH MACRON','Ll Xz','Latin'], q{y.}=>[7823,'LATIN SMALL LETTER Y WITH DOT ABOVE','Ll','Latin'], +q{y/}=>[591,'','Xn Xz',''], q{y0}=>[7833,'LATIN SMALL LETTER Y WITH RING ABOVE','Ll','Latin'], q{y2}=>[7927,'LATIN SMALL LETTER Y WITH HOOK ABOVE','Ll','Latin'], q{y3}=>[1123,'CYRILLIC SMALL LETTER YAT','Ll','Cyrillic'], q{y:}=>[255,'LATIN SMALL LETTER Y WITH DIAERESIS','Ll Xl','Latin'], +q{y;}=>[436,'LATIN SMALL LETTER Y WITH HOOK','Ll Xz','Latin'], q{y=}=>[1099,'CYRILLIC SMALL LETTER YERU','Ll','Cyrillic'], q{y>}=>[375,'LATIN SMALL LETTER Y WITH CIRCUMFLEX','Ll','Latin'], q{y?}=>[7929,'LATIN SMALL LETTER Y WITH TILDE','Ll','Latin'], q{yA}=>[12419,'HIRAGANA LETTER SMALL YA','Lo','Hiragana'], q{yH}=>[1574,'ARABIC LETTER YEH WITH HAMZA ABOVE','Lo','Arabic'], +q{yI}=>[654,'LATIN SMALL LETTER TURNED Y','Ll Xz','Latin'], q{yO}=>[12423,'HIRAGANA LETTER SMALL YO','Lo','Hiragana'], q{yU}=>[12421,'HIRAGANA LETTER SMALL YU','Lo','Hiragana'], q{ya}=>[12420,'HIRAGANA LETTER YA','Lo','Hiragana'], @@ -1318,16 +1474,21 @@ q{yi}=>[1111,'CYRILLIC SMALL LETTER YI','Ll','Cyrillic'], q{yo}=>[12424,'HIRAGANA LETTER YO','Lo','Hiragana'], q{yr}=>[422,'LATIN LETTER YR','Lu','Latin'], q{yu}=>[12422,'HIRAGANA LETTER YU','Lo','Hiragana'], +q{yy}=>[541,'LATIN SMALL LETTER YOGH','Ll Xz','Latin'], q{z%}=>[1078,'CYRILLIC SMALL LETTER ZHE','Ll','Cyrillic'], q{z'}=>[378,'LATIN SMALL LETTER Z WITH 
ACUTE','Ll','Latin'], q{z*}=>[950,'GREEK SMALL LETTER ZETA','Ll','Greek'], q{z+}=>[1586,'ARABIC LETTER ZAIN','Lo','Arabic'], q{z.}=>[380,'LATIN SMALL LETTER Z WITH DOT ABOVE','Ll','Latin'], q{z/}=>[438,'LATIN SMALL LETTER Z WITH STROKE','Ll','Latin'], +q{z2}=>[549,'LATIN SMALL LETTER Z WITH HOOK','Ll Xz','Latin'], q{z4}=>[12567,'BOPOMOFO LETTER Z','Lo','Bopomofo'], +q{z9}=>[657,'LATIN SMALL LETTER Z WITH CURL','Ll Xz','Latin'], +q{z;}=>[656,'LATIN SMALL LETTER Z WITH RETROFLEX HOOK','Ll Xz','Latin'], q{z<}=>[382,'LATIN SMALL LETTER Z WITH CARON','Ll','Latin'], q{z=}=>[1079,'CYRILLIC SMALL LETTER ZE','Ll','Cyrillic'], q{z>}=>[7825,'LATIN SMALL LETTER Z WITH CIRCUMFLEX','Ll','Latin'], +q{z?}=>[7542,'LATIN SMALL LETTER Z WITH MIDDLE TILDE','Ll Xz','Latin'], q{zH}=>[1592,'ARABIC LETTER ZAH','Lo','Arabic'], q{z_}=>[7829,'LATIN SMALL LETTER Z WITH LINE BELOW','Ll','Latin'], q{za}=>[12374,'HIRAGANA LETTER ZA','Lo','Hiragana'], diff --git a/rfc1345convert b/rfc1345convert index 6edfa74..412bac1 100644 --- a/rfc1345convert +++ b/rfc1345convert @@ -46,10 +46,26 @@ for (@t) { $di{$mnem} = hex $char; } +# personal addendums: optional extra digraphs, one "<2-char mnemonic> <character>" per line of shiar.inc.txt (other lines are skipped) +my @extra; +if (-r 'shiar.inc.txt') { + open my $include, '<:utf8', 'shiar.inc.txt' + or warn "shiar.inc.txt: $!\n"; # open reports failure in $!, not $@ + for (readline $include) { + m{^([!"%'-Z_a-z]{2}) (.)} or next; + warn("$1 already defined"), next if defined $di{$1}; + $di{$1} = ord $2; + push @extra, $1; + } +} + # optionally get unicode character information my %info = eval { require Unicode::UCD; - map { $_ => Unicode::UCD::charinfo($di{$_}) } keys %di; + map { + $_ => Unicode::UCD::charinfo($di{$_}) + || { block => '?', category => 'Xn', name => '', script => '' } + } keys %di; }; # add custom categories for certain blocks @@ -58,6 +74,9 @@ for (values %info) { $_->{category} .= ' Xl' if $_->{block} eq 'Latin-1 Supplement'; } +# mark unofficial extras as such +$info{$_}->{category} .= ' Xz' for @extra; + # output perl code of hash # (assume no backslashes or curlies, so we can just q{} w/o
escaping) print "{\n"; diff --git a/shiar.inc.txt b/shiar.inc.txt new file mode 100644 index 0000000..661dc67 --- /dev/null +++ b/shiar.inc.txt @@ -0,0 +1,228 @@ +# vim +=e € + +# zsh +Eu € + +# useful characters +?! ‽ +<3 ♥ # easy alias to trigraph cH- +:) ☺ # easy alias to 0u +:( ☹ +** ⁑ #XXX: useful? +3* ⁂ #XXX: useful? + +# additional letters +HW Ƕ # HV conflicts with vh line drawing +hw ƕ +db ȸ +qp ȹ +ww ƿ +WW Ƿ +YY Ȝ #XXX +yy ȝ +?. ʔ +?/ ʡ +!c ǀ # corresponding zulu letter +!q ǃ # idem; !. would be much more intuitive +!x ǁ # idem; or !/ (previously ʖ) +!- ǂ +!b ʘ # bilabial +# ES ʃ/Ʃ #XXX + +# expected but missing +A. Ȧ +a. ȧ +A0 Ǻ # normal A-ring already provided by AA +a0 ǻ +j. ȷ +O. Ȯ +o. ȯ +N! Ǹ +n! ǹ +Y- Ȳ +y- ȳ +ac ℀ +as ℁ +cu ℆ # co ís present though + +# bars and strokes +B/ Ƀ +B- Ƃ +b- ƃ +b/ ƀ +E/ Ɇ +e/ ɇ +I/ Ɨ +i/ ɨ +J/ Ɉ +j/ ɉ +l- ƚ # not really a macron, but wouldn't really make sense anyway otherwise +l? ɫ # idem +L? Ɫ +P/ Ᵽ +p/ ᵽ +R/ Ɍ +r/ ɍ +U/ Ʉ +u/ ʉ +Y/ Ɏ +y/ ɏ + +# inverted breves +A) Ȃ +a) ȃ +E) Ȇ +e) ȇ +I) Ȋ # )I exists, but should not confuse +i) ȋ +O) Ȏ +o) ȏ +R) Ȓ +r) ȓ +U) Ȗ # )U exists +u) ȗ + +# double grave +A8 Ȁ +a8 ȁ +E8 Ȅ +e8 ȅ +I8 Ȉ +i8 ȉ +O8 Ȍ +o8 ȍ +R8 Ȑ +r8 ȑ +U8 Ȕ +u8 ȕ + +# hooks +B2 Ɓ +b2 ɓ +C2 Ƈ +c2 ƈ +# D2 Ɗ # in use by control char +d2 ɗ # hook +d; ɖ # R (tail) +D; Ɖ +E, Ȩ +e, ȩ +F2 Ƒ +f2 ƒ # looks like a cedilla +G2 Ɠ +g2 ɠ +h2 ɦ +K2 Ƙ +k2 ƙ +l; ɭ # R +m; ɱ +N2 Ɲ # left hook +n2 ɲ +n; ɳ # R +# P2 Ƥ # in use by control char +p2 ƥ +Q; Ɋ # hook tail +q; ɋ # hook tail +q2 ʠ # hook +R; Ɽ # R (tail) +r; ɽ +s; ʂ # R +T2 Ƭ # hook +t2 ƭ +T; Ʈ # R +t; ʈ +V2 Ʋ +v2 ʋ +Y; Ƴ # not a hook below, but Y2 hook above is already present +y; ƴ +Z2 Ȥ # looks like a cedilla +z2 ȥ +z; ʐ # R + +# curls +c9 ɕ +d9 ȡ +l9 ȴ +n9 ȵ +t9 ȶ +v9 ⱴ +z9 ʑ +# S9 ʆ +# Z9 ʓ + +# middle tilde #XXX: not tilde above +b? ᵬ +d? ᵭ +f? ᵮ +m? ᵯ +# n? ᵰ # already a tilde above +p? ᵱ +r? ᵲ +s? ᵴ +t? ᵵ +z? 
ᵶ + +# tone letters +2/ ƻ +%2 Ƨ +2% ƨ +%6 Ƅ +6% ƅ +%5 Ƽ +5% ƽ + +# turned/inverted (trailing I is uncommon for lowercase, and already used thusly for !I, ?I and NI) +aI ɐ +# EI Ǝ # could be confusing, as it's not uppercase schwa eI +eI ə # schwa, not turned E (latter is very uncommon) +FI Ⅎ # not a letter +fI ⅎ # idem +gI ᵷ +hI ɥ +iI ᴉ +kI ʞ +MI Ɯ +mI ɯ +# nI ᴎ # reversed capital N, but NI already in use +oI ɔ # can't invert O +rI ɹ +# RI ᴚ # conflicts with RI control char +tI ʇ +VI Ʌ +vI ʌ +wI ʍ +yI ʎ + +# note: common meaning + ! Grave + " Double acute accent + ' Acute accent + ( Breve + + ) Inverted Breve + , Cedilla + - Macron + . Dot Above + / Stroke + 0 Ring above + 2 Hook above + + 8 Double Grave + 9 Horn + + Curl + : Diaeresis + ; Ogonek + + Hook below right + < Caron + > Circumflex accent + ? tilde + _ Underline + + = Cyrillic + * Greek + % Greek/Cyrillic special + + smalls: Arabic, capitals: Hebrew + 3 some Latin/Greek/Cyrillic letters + 4 Bopomofo + 5 Hiragana + 6 Katakana + -- 2.30.0