X-Git-Url: http://gitweb.fperrin.net/?a=blobdiff_plain;f=src%2Fcom%2Fhughes%2Fandroid%2Fdictionary%2Fparser%2Fwiktionary%2FWiktionaryLangs.java;h=c4935341d999e13b687b9c0878f4ff9bcdfaa743;hb=5a1b9f8a37d03dc675e1d895817422e9743a5b5b;hp=804925796377bb3dc78a08c3b410e56d3ef87c87;hpb=761f748ec034b093581535f7a4befa8e6e3c6873;p=DictionaryPC.git diff --git a/src/com/hughes/android/dictionary/parser/wiktionary/WiktionaryLangs.java b/src/com/hughes/android/dictionary/parser/wiktionary/WiktionaryLangs.java index 8049257..c493534 100644 --- a/src/com/hughes/android/dictionary/parser/wiktionary/WiktionaryLangs.java +++ b/src/com/hughes/android/dictionary/parser/wiktionary/WiktionaryLangs.java @@ -14,12 +14,8 @@ package com.hughes.android.dictionary.parser.wiktionary; -import com.hughes.android.dictionary.engine.Language; - import java.util.LinkedHashMap; -import java.util.LinkedHashSet; import java.util.Map; -import java.util.Set; import java.util.regex.Pattern; public class WiktionaryLangs { @@ -46,6 +42,10 @@ public class WiktionaryLangs { isoCodeToEnWikiName.put("ET", "Estonian"); isoCodeToEnWikiName.put("FI", "Finnish"); isoCodeToEnWikiName.put("FR", "French"); + // Note: must be before German since matcher + // simply takes first match instead of best. + isoCodeToEnWikiName.put("nds", "Low German"); + isoCodeToEnWikiName.put("pdc", "Pennsylvania German"); isoCodeToEnWikiName.put("DE", "German"); isoCodeToEnWikiName.put("grc", "Ancient Greek"); isoCodeToEnWikiName.put("EL", "Greek"); @@ -108,6 +108,9 @@ public class WiktionaryLangs { isoCodeToEnWikiName.put("LB", "Luxembourgish"); isoCodeToEnWikiName.put("MK", "Macedonian"); isoCodeToEnWikiName.put("GV", "Manx"); + isoCodeToEnWikiName.put("scn", "Sicilian"); + isoCodeToEnWikiName.put("cu", "Old Church Slavonic"); + isoCodeToEnWikiName.put("rom", "Romani"); // No longer exists in EN: // isoCodeToEnWikiName.put("BS", "Bosnian"); @@ -128,14 +131,15 @@ public class WiktionaryLangs { public static final Map> wikiCodeToIsoCodeToWikiName = new LinkedHashMap>(); static { + Map isoCodeToWikiName; + // en wikiCodeToIsoCodeToWikiName.put("en", isoCodeToEnWikiName); - Map isoCodeToWikiName; - // egrep -o '\{\{Wortart[^}]+\}\}' dewiktionary-pages-articles.xml | cut -d \| -f3 | sort | uniq -c | sort -nr isoCodeToWikiName = new LinkedHashMap(); wikiCodeToIsoCodeToWikiName.put("de", isoCodeToWikiName); + isoCodeToWikiName.put("nds", "Niederdeutsch"); isoCodeToWikiName.put("DE", "Deutsch"); isoCodeToWikiName.put("EN", "Englisch"); isoCodeToWikiName.put("IT", "Italienisch"); @@ -148,6 +152,7 @@ public class WiktionaryLangs { isoCodeToWikiName.put("HU", "Ungarisch"); isoCodeToWikiName.put("SV", "Schwedisch"); isoCodeToWikiName.put("ES", "Spanisch"); + isoCodeToWikiName.put("RO", "Rumänisch"); // egrep -o '== *\{\{langue\|[a-zA-Z]+\}\} *==' frwiktionary-pages-articles.xml | sort | uniq -c | sort -nr isoCodeToWikiName = new LinkedHashMap(); @@ -156,6 +161,7 @@ public class WiktionaryLangs { isoCodeToWikiName.put("RU", Pattern.quote("{{langue|ru}}")); isoCodeToWikiName.put("AR", Pattern.quote("{{langue|ar}}")); // Arabic isoCodeToWikiName.put("BG", Pattern.quote("{{langue|bg}}")); // Bulgarian + isoCodeToWikiName.put("EL", Pattern.quote("{{langue|el}}")); isoCodeToWikiName.put("EN", Pattern.quote("{{langue|en}}")); //isoCodeToWikiName.put("", Pattern.quote("{{langue|sl}}")); isoCodeToWikiName.put("LA", Pattern.quote("{{langue|la}}")); @@ -196,6 +202,7 @@ public class WiktionaryLangs { // egrep -o '== *\{\{lengua\|[a-zA-Z]+\}\} *==' frwiktionary-pages-articles.xml | sort | uniq -c | sort -nr isoCodeToWikiName = new LinkedHashMap(); wikiCodeToIsoCodeToWikiName.put("es", isoCodeToWikiName); + isoCodeToWikiName.put("AR", Pattern.quote("{{lengua|ar}}")); isoCodeToWikiName.put("ES", Pattern.quote("{{lengua|es}}")); isoCodeToWikiName.put("EN", Pattern.quote("{{lengua|en}}")); isoCodeToWikiName.put("FR", Pattern.quote("{{lengua|fr}}"));