Add notable characters that were missing for Latin-1 coverage:
superscripts ¹ and ³ (² was already present) and the fractions ¼ ½ ¾.
punctuation => {
quoting => [qw{. « » . ‹ › . ‘ ’ . “ ” . „ ‚ . ‟ ‛}],
- common => [qw{. † ‡ • . § ¶ # . © ® ™ . ° ′ ″ . − × ÷ . ± ² √ . 年 月 日}],
+ common => [qw{
+ . † ‡ • . § ¶ # . © ® ™
+ . ° ′ ″ . − × ÷ . ± ² √
+ . ¹ ⁿ ³ . ¼ ½ ¾ . 年 月 日
+ }],
marks => [qw{. ¿ … 〃 ‐ – . ‽ · ※ ‒ — }],
spacing => [split / /, join ' ',
". \x{2003} \x{2009} \x{2007} \x{A0} \x{200B}",
my @config = qw(
Popular
punctuation/quoting
- common=-5
+ common=-5?common
symbols/binary?symbols/binary=-5
latin/sample=-1
?sample=2-