summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author Tapio Lehtonen <tale@debian.org> 2009-09-05 14:34:13 +0000
committer Tapio Lehtonen <tale@debian.org> 2009-09-05 14:34:13 +0000
commit b8712cdc5c0013c4468d672460301a9a9f3ac5a3 (patch)
tree fc4e9b09ca03f5eb907868db4c0ee643caf06b21
parent 53be289ba6da97defc15f2e0669402ea7d00ded8 (diff)
download installation-guide-b8712cdc5c0013c4468d672460301a9a9f3ac5a3.zip
I'm working on Finnish spellchecking using Voikko. This is still a
work in progress, but so as not to lose what I have already done, I'm storing the scripts I have made.
-rwxr-xr-x po/fi/make-fi-all.sh 24
1 files changed, 24 insertions, 0 deletions
diff --git a/po/fi/make-fi-all.sh b/po/fi/make-fi-all.sh
new file mode 100755
index 000000000..fea25f2f2
--- /dev/null
+++ b/po/fi/make-fi-all.sh
@@ -0,0 +1,24 @@
+#! /bin/bash
+BASEDIR=~/Work/Debian/
+EXTRACT=${BASEDIR}d-i/trunk/scripts/l10n/l10n-spellcheck/extract_msg.pl
+SPELLCHECKER=/usr/bin/enchant
+WORDLIST=${BASEDIR}d-i/trunk/scripts/l10n/l10n-spellcheck/cfg/wls/di_common_wl.txt
+
+if [ -f fi_all.po ] ; then
+ rm fi_all.po
+fi
+
+# no fi_all.po at *.po time
+for f in *.po ; do
+ ${EXTRACT} -msgstr ${f} > $$.temp1
+ tail --lines=+3 $$.temp1 > $$.temp2
+ cut --delimiter=\" --fields=2 < $$.temp2 >> fi_all.po
+done
+
+rm $$.temp1 $$.temp2
+
+# Make list of words tmispell-voikko does not accept
+${SPELLCHECKER} -l -d suomi < fi_all.po > $$.temp3
+sort $$.temp3 | uniq > finnish_unkn_wl.txt
+rm $$.temp3
+echo "Tuntemattomia sanoja " `wc -l finnish_unkn_wl.txt`