#!/bin/bash
#
# make-fi-all.sh - collect the Finnish translations (msgstr) from every .po
# file in the current directory into fi_all.po, spell-check the result and
# write the sorted, de-duplicated list of rejected words to
# finnish_unkn_wl.txt.
#
# Provenance: po/fi/make-fi-all.sh, added in commit
# b8712cdc5c0013c4468d672460301a9a9f3ac5a3 by Tapio Lehtonen
# (Sat, 5 Sep 2009 14:34:13 +0000). Commit message: "I'm working on Finnish
# spellchecking using Voikko. This is still work in progress, but to not
# lose what I have already done I'm storing the scripts I have made."
#
# Usage: run from the directory that holds the Finnish .po files.
#
# Environment (all optional; defaults match the original hard-coded values):
#   BASEDIR       directory containing the d-i checkout
#                 (default: $HOME/Work/Debian/)
#   EXTRACT       path to extract_msg.pl
#   SPELLCHECKER  path to the spell checker (default: /usr/bin/enchant)

set -euo pipefail

BASEDIR=${BASEDIR:-${HOME}/Work/Debian/}
# The paths below are built by plain concatenation, so make sure BASEDIR ends
# with exactly one slash no matter how it was supplied.
BASEDIR=${BASEDIR%/}/
EXTRACT=${EXTRACT:-${BASEDIR}d-i/trunk/scripts/l10n/l10n-spellcheck/extract_msg.pl}
SPELLCHECKER=${SPELLCHECKER:-/usr/bin/enchant}
# NOTE(review): WORDLIST is assigned but not used anywhere in this script
# (the script is work in progress); kept for the follow-up work.
# shellcheck disable=SC2034
WORDLIST=${BASEDIR}d-i/trunk/scripts/l10n/l10n-spellcheck/cfg/wls/di_common_wl.txt

readonly ALL_MSGS=fi_all.po
readonly UNKNOWN_WORDS=finnish_unkn_wl.txt

# Print an error message to stderr and abort.
die() {
  printf '%s: %s\n' "${0##*/}" "$*" >&2
  exit 1
}

main() {
  [[ -x ${EXTRACT} ]] || die "extractor not found or not executable: ${EXTRACT}"
  [[ -x ${SPELLCHECKER} ]] \
    || die "spell checker not found or not executable: ${SPELLCHECKER}"

  # Collect the input files up front. The aggregate file itself matches
  # *.po, so it is excluded explicitly; nullglob keeps an unmatched pattern
  # from being handed to the extractor as a literal "*.po".
  shopt -s nullglob
  local -a po_files=()
  local f
  for f in *.po; do
    [[ ${f} == "${ALL_MSGS}" ]] || po_files+=("${f}")
  done
  (( ${#po_files[@]} > 0 )) || die "no .po files found in ${PWD}"

  # Start from a clean aggregate file on every run.
  rm -f -- "${ALL_MSGS}"

  for f in "${po_files[@]}"; do
    # Drop the first two lines of the extractor output, then keep the second
    # double-quote-delimited field of each line (the text between the first
    # pair of quotes). Lines without a quote are passed through unchanged by
    # cut.
    "${EXTRACT}" -msgstr "${f}" \
      | tail --lines=+3 \
      | cut --delimiter='"' --fields=2 >> "${ALL_MSGS}"
  done

  # List the words the spell checker does not accept for dictionary "suomi".
  # NOTE(review): the original comment named tmispell-voikko although the
  # command run is enchant; presumably enchant is backed by Voikko here.
  "${SPELLCHECKER}" -l -d suomi < "${ALL_MSGS}" \
    | sort \
    | uniq > "${UNKNOWN_WORDS}"

  # "Tuntemattomia sanoja" is Finnish for "unknown words". The double space
  # reproduces the original echo output exactly.
  printf 'Tuntemattomia sanoja  %s\n' "$(wc -l "${UNKNOWN_WORDS}")"
}

main "$@"