From: Don Armstrong Date: Fri, 24 Jun 2011 17:55:44 +0000 (+0000) Subject: * add word_sanitize function X-Git-Url: https://git.donarmstrong.com/?a=commitdiff_plain;h=9b57d1ea29c26fcc70f4b399eb1caee78adae7aa;p=bin.git * add word_sanitize function --- diff --git a/anamang b/anamang index a2bedd7..e14f213 100755 --- a/anamang +++ b/anamang @@ -123,6 +123,9 @@ if (not @words) { my @l_o = ('a'..'z'); my %l_o; @l_o{@l_o} = (0 .. 25); +sub word_sanitize{ + return map {tr/A-Z/a-z/; tr/éüöáí/euoai/; $_ } @_ +} my $database = update_and_load_database($options{database_dir},$options{wordlist}); @@ -270,7 +273,7 @@ sub update_and_load_database { while (<$wordlist_fh>) { chomp; next unless length $_; - my $word = lc($_); + my $word = word_sanitize($_); $word =~ s/[^a-z]//; next unless length $_; next if exists $seen_words{$word};