From fa15370b8f30686099ea3cbb1c91ed140c9e70bc Mon Sep 17 00:00:00 2001 From: Mischa POSLAWSKY Date: Sat, 7 Feb 2015 07:53:43 +0100 Subject: [PATCH] writing: declare utf8 source of perl includes Apparently not noticeable in some environments, but normally encoding needs to be specified to avoid being interpreted as Latin1. --- tools/mkdigraphlist | 1 + writing-brah.inc.pl | 3 +++ writing-digits.inc.pl | 3 +++ writing-latn.inc.pl | 3 +++ writing-phnx.inc.pl | 3 +++ writing-script.inc.pl | 3 ++- 6 files changed, 15 insertions(+), 1 deletion(-) diff --git a/tools/mkdigraphlist b/tools/mkdigraphlist index fa67418..a1bfbcd 100755 --- a/tools/mkdigraphlist +++ b/tools/mkdigraphlist @@ -153,6 +153,7 @@ for my $row (values %info) { # output perl code of hash # (assume no backslashes or curlies, so we can just q{} w/o escaping) +print "use utf8;\n"; print "+{\n"; printf '(map {$_=>0} qw{%s}),'."\n", join(' ', map { substr($_, 1, 1).substr($_, 0, 1) } sort keys %di diff --git a/writing-brah.inc.pl b/writing-brah.inc.pl index 9025e13..ae28d2b 100644 --- a/writing-brah.inc.pl +++ b/writing-brah.inc.pl @@ -1,3 +1,5 @@ +use utf8; +( iso => [qw{ k kh g gh ṅ c ch j jh > ñ ṭ ṭh ḍ ḍh ṇ t th d dh n ṉ p ph b bh m y r ṟ l ḷ ḻ v ś ṣ s h }], ipa => [qw{ k kʰ ɡ ɡʱ ŋ c cʰ ɟ ɟʱ > ɲ ʈ ʈʰ ɖ ɖʱ ɳ t̪ t̪ʰ d̪ d̪ʱ n̪ n p pʰ b bʱ m j r ɾ l ɭ ɻ ʋ ʃ ʂ s ɦ }], orya => [qw{ କ ଖ ଗ ଘ ଙ ଚ ଛ ଜ ଝ > ଞ ଟ ଠ ଡ ଢ ଣ ତ ଥ ଦ ଧ > ନ ପ ଫ ବ ଭ ମ ଯ > ର ଲ > ଳ ଵ ଶ ଷ ସ ହ }], @@ -17,3 +19,4 @@ khmr => [qw{ ក ខ គ ឃ ង ច ឆ ជ ឈ > ញ ដ ឋ thai => [qw{ ก ข ค ฆ ง จ ฉ ช ฌ > ญ ฏ ฐ ฑ ฒ ณ ต ถ ท ธ > น ป ผ พ ภ ม ย > ร ล > - ว ศ ษ ส ห }], laoo => [qw{ ກ ຂ - ຄ ງ ຈ ສ ຊ - > ຍ - - - - - ຕ ຖ ທ - > ນ ປ ຜ ຟ ພ ມ ຢ > ຣ ລ > - ວ - - - ຫ }], tglg => [qw{ ᜃ - ᜄ - ᜅ - - - - > - - - - - - ᜆ - ᜇ - > ᜈ ᜉ - ᜊ - ᜋ ᜌ > ᜇ ᜎ > - - - - ᜐ ᜑ }], +); diff --git a/writing-digits.inc.pl b/writing-digits.inc.pl index e45bf5f..a7176c0 100644 --- a/writing-digits.inc.pl +++ b/writing-digits.inc.pl @@ -1,3 +1,5 @@ +use utf8; +( hant => [qw{ 壹 貳 參 肆 伍 陸 柒 捌 玖 零 }], hans => [qw{ 一 二 三 四 五 六 七 八 九 〇 }], suzhou => [qw{ 〡 〢 〣 〤 〥 〦 〧 〨 〩 }], @@ -37,3 +39,4 @@ teng => [qw{           }], tlh => [qw{           }], osma => [qw{ 𐒡 𐒢 𐒣 𐒤 𐒥 𐒦 𐒧 𐒨 𐒩 𐒠 }], brai => [qw{ ⠁ ⠃ ⠉ ⠙ ⠑ ⠋ ⠛ ⠓ ⠊ ⠚ }], +); diff --git a/writing-latn.inc.pl b/writing-latn.inc.pl index d20c5e4..d808e0d 100644 --- a/writing-latn.inc.pl +++ b/writing-latn.inc.pl @@ -1,6 +1,9 @@ +use utf8; +( latn => [qw{ a b c d e f g h i j k l m n o p q r s t u v w x y z }], latfsuet => [qw{ a b c d e f g h i j k l m n o p q r ſ s t u v w x y z }], ase => [qw{ a b c d e f g h i j k l m n o p q r s t u v w x y z }], brai => [qw{ ⠁ ⠃ ⠉ ⠙ ⠑ ⠋ ⠛ ⠓ ⠊ ⠚ ⠅ ⠇ ⠍ ⠝ ⠕ ⠏ ⠟ ⠗ ⠎ ⠞ ⠥ ⠧ ⠺ ⠭ ⠽ ⠵ }], morse => [qw{ ‧‑ ‑‧‧‧ ‑‧‑‧ ‑‧‧ ‧ ‧‧‐‧ ‐‐‧ ‧‧‧‧ ‧‧ ‧‐‐‐ ‐‧‐ ‧‐‧‧ ‐‐ ‐‧ ‐‐‐ ‧‐‐‧ ‐‐‧‐ ‧‐‧ ‧‧‧ ‐ ‧‧‐ ‧‧‧‐ ‧‐‐ ‐‧‧‐ ‐‧‐‐ ‐‐‧‧ }], +); diff --git a/writing-phnx.inc.pl b/writing-phnx.inc.pl index 5e0fc04..174b9aa 100644 --- a/writing-phnx.inc.pl +++ b/writing-phnx.inc.pl @@ -1,3 +1,5 @@ +use utf8; +( latn => [qw{ A > B C G D > E F Y U V W Z H > - I J K L M N > X O P > - Q R > S T }], #runr_ys => [qw{ ᚭ - ᛓ ᚴ ᛆ - > - ᚠ > > > - ᛧ ᚽ ᚦ - > ᛁ - ᛚ ᛙ ᚿ > - - - > - - ᚱ > ᛌ ᛐ }], # short-twig fuþark #runr_m => [qw{ ᚮ - ᛒ ᚲ ᛆ - > - ᚠ > > > - ᛧ ᚼ ᚦ - ᛁ ᛂ - ᛚ ᛘ ᚿ > - - - > - - ᚱ > ᛋ ᛐ }], # fuþork (medieval) @@ -17,3 +19,4 @@ syrc => [qw{ ܐ > ܒ > ܓ ܕ > ܗ > > > > ܘ ܙ ܚ > ܛ ܝ ҩ ܟ ܠ ܡ ܢ > ܣ ܥ ܦ > ܨ ܩ ܪ > ܫ ܬ }], arab => [qw{ ا > ب > ج د ه ـ > > > > و ز ح > ط > ي ك ل م ن > س ع ف > ص ق ر > ش ت }], #arab => [qw{ ^ ^ ^ ^ ^ ذ ^ ^ ^ ^ ^ > ^ ^ خ ^ ظ ^ ^ ^ ^ ^ ^ ^ س غ ^ ^ ض ^ ﺭ ^ ^ ث }], +); diff --git a/writing-script.inc.pl b/writing-script.inc.pl index 3fb6ca5..8850268 100644 --- a/writing-script.inc.pl +++ b/writing-script.inc.pl @@ -1,4 +1,5 @@ -{ +use utf8; ++{ arab => 'Arabic', armi => 'Aramaic', bali => 'Balinese', -- 2.30.0