Cover HTML4 entities.
eK ㅕ
EK ㅖ
+# common formatting control
+ZS # ZWSP; capitals like other Cc
+ZN # ZWNJ; less obvious alt: 'Z
+ZW # ZWJ; ZJ somewhy used for tsadi; less obvious alt: "Z
+LR # LRM
+RL # RLM; keep rl for ɼ
+
###
# under development or temporary
$yy ײ
$g1 ׳
$g2 ״
-$lr
-$rl
-$zw
# rfc (incorrectly?) maps double to heavy
$vL ╡
our $VERSION = '1.00';
# Per-character info table, keyed by the literal character.  The entries
# listed here only supply a 'string' value: the presentational string to
# use for a formatting character.
my %info = (
+ # prepare presentational string for some control(lish) entries
"\xAD" => {string => '-'}, # U+00AD SOFT HYPHEN
"\x{200E}" => {string => '→'}, # U+200E LEFT-TO-RIGHT MARK
"\x{200F}" => {string => '←'}, # U+200F RIGHT-TO-LEFT MARK
+ "\x{200B}" => {string => '␣'}, # U+200B ZERO WIDTH SPACE
+ "\x{200C}" => {string => '|'}, # U+200C ZERO WIDTH NON-JOINER; ISO-9995-7-081 lookalike (alt: ∣ ⊺ ⟙)
+ "\x{200D}" => {string => '⁀'}, # U+200D ZERO WIDTH JOINER; join (alt: ∤ |ͯ ⨝)
);
$info{chr $_} //= {} for 32 .. 126;
}
# presentational string for some control(lish) entries
# Each statement below picks the keys of %di whose value equals the given
# code point and sets the 'string' entry of the matching %info element
# (creating that element if it does not exist yet).
$info{$_}->{string} = '-' for grep { $di{$_} == 0x00AD } keys %di; # SOFT HYPHEN
+$info{$_}->{string} = '␣' for grep { $di{$_} == 0x200B } keys %di; # ZERO WIDTH SPACE
+$info{$_}->{string} = '|' for grep { $di{$_} == 0x200C } keys %di; # ZERO WIDTH NON-JOINER
+$info{$_}->{string} = '⁀' for grep { $di{$_} == 0x200D } keys %di; # ZERO WIDTH JOINER
$info{$_}->{string} = '→' for grep { $di{$_} == 0x200E } keys %di; # LEFT-TO-RIGHT MARK
$info{$_}->{string} = '←' for grep { $di{$_} == 0x200F } keys %di; # RIGHT-TO-LEFT MARK