From f73bc969da1b56b315b7de9660a1f5e0ee5fddcc Mon Sep 17 00:00:00 2001 From: =?utf8?q?Reimar=20D=C3=B6ffinger?= Date: Wed, 26 Aug 2015 22:34:44 +0200 Subject: [PATCH] Script additions/improvements for dictionary generation. --- WiktionarySplitter.sh | 3 +++ data/downloadInputs.sh | 2 +- 2 files changed, 4 insertions(+), 1 deletion(-) create mode 100755 WiktionarySplitter.sh diff --git a/WiktionarySplitter.sh b/WiktionarySplitter.sh new file mode 100755 index 0000000..5c4a752 --- /dev/null +++ b/WiktionarySplitter.sh @@ -0,0 +1,3 @@ +# Run after downloading (data/downloadInputs.sh) to generate +# per-language data files from enwiktionary. +/usr/lib/jvm/java-8-openjdk-amd64/jre/bin/java -classpath src:../Util/src/:../Dictionary/src/:/usr/share/java/com.ibm.icu.jar:/usr/share/java/xercesImpl.jar com.hughes.android.dictionary.engine.WiktionarySplitter "$@" diff --git a/data/downloadInputs.sh b/data/downloadInputs.sh index 8d58801..3135eb0 100755 --- a/data/downloadInputs.sh +++ b/data/downloadInputs.sh @@ -47,6 +47,6 @@ curl --remote-name http://dumps.wikimedia.org/${L}wiktionary/latest/${WIKI}.bz2 bunzip2 ${WIKI}.bz2 mv ${WIKI} inputs/${L}wiktionary-pages-articles.xml -echo "Done. Now run WiktionarySplitter to spit apart enwiktionary." +echo "Done. Now run WiktionarySplitter to split apart enwiktionary." cd $OLD_DIR -- 2.43.0