X-Git-Url: http://gitweb.fperrin.net/?a=blobdiff_plain;f=src%2Fcom%2Fhughes%2Fandroid%2Fdictionary%2Fparser%2Fwiktionary%2FWiktionaryLangs.java;h=86206a060bbbc68f09c4314c16ba1eeae6f245e9;hb=cb48e386855b695b54c6e9682ef7bffaf1d2ba38;hp=30472fb434643ea956c03737ebfe38d8f73ee9ec;hpb=7262a5fd59deba0fed05958b0eee06f806fac09a;p=DictionaryPC.git diff --git a/src/com/hughes/android/dictionary/parser/wiktionary/WiktionaryLangs.java b/src/com/hughes/android/dictionary/parser/wiktionary/WiktionaryLangs.java index 30472fb..86206a0 100644 --- a/src/com/hughes/android/dictionary/parser/wiktionary/WiktionaryLangs.java +++ b/src/com/hughes/android/dictionary/parser/wiktionary/WiktionaryLangs.java @@ -46,6 +46,10 @@ public class WiktionaryLangs { isoCodeToEnWikiName.put("ET", "Estonian"); isoCodeToEnWikiName.put("FI", "Finnish"); isoCodeToEnWikiName.put("FR", "French"); + // Note: must be before German since matcher + // simply takes first match instead of best. + isoCodeToEnWikiName.put("nds", "Low German"); + isoCodeToEnWikiName.put("pdc", "Pennsylvania German"); isoCodeToEnWikiName.put("DE", "German"); isoCodeToEnWikiName.put("grc", "Ancient Greek"); isoCodeToEnWikiName.put("EL", "Greek"); @@ -109,6 +113,8 @@ public class WiktionaryLangs { isoCodeToEnWikiName.put("MK", "Macedonian"); isoCodeToEnWikiName.put("GV", "Manx"); isoCodeToEnWikiName.put("scn", "Sicilian"); + isoCodeToEnWikiName.put("cu", "Old Church Slavonic"); + isoCodeToEnWikiName.put("rom", "Romani"); // No longer exists in EN: // isoCodeToEnWikiName.put("BS", "Bosnian"); @@ -129,14 +135,15 @@ public class WiktionaryLangs { public static final Map> wikiCodeToIsoCodeToWikiName = new LinkedHashMap>(); static { + Map isoCodeToWikiName; + // en wikiCodeToIsoCodeToWikiName.put("en", isoCodeToEnWikiName); - Map isoCodeToWikiName; - // egrep -o '\{\{Wortart[^}]+\}\}' dewiktionary-pages-articles.xml | cut -d \| -f3 | sort | uniq -c | sort -nr isoCodeToWikiName = new LinkedHashMap(); wikiCodeToIsoCodeToWikiName.put("de", isoCodeToWikiName); + isoCodeToWikiName.put("nds", "Niederdeutsch"); isoCodeToWikiName.put("DE", "Deutsch"); isoCodeToWikiName.put("EN", "Englisch"); isoCodeToWikiName.put("IT", "Italienisch"); @@ -149,6 +156,7 @@ public class WiktionaryLangs { isoCodeToWikiName.put("HU", "Ungarisch"); isoCodeToWikiName.put("SV", "Schwedisch"); isoCodeToWikiName.put("ES", "Spanisch"); + isoCodeToWikiName.put("RO", "Rumänisch"); // egrep -o '== *\{\{langue\|[a-zA-Z]+\}\} *==' frwiktionary-pages-articles.xml | sort | uniq -c | sort -nr isoCodeToWikiName = new LinkedHashMap(); @@ -157,6 +165,7 @@ public class WiktionaryLangs { isoCodeToWikiName.put("RU", Pattern.quote("{{langue|ru}}")); isoCodeToWikiName.put("AR", Pattern.quote("{{langue|ar}}")); // Arabic isoCodeToWikiName.put("BG", Pattern.quote("{{langue|bg}}")); // Bulgarian + isoCodeToWikiName.put("EL", Pattern.quote("{{langue|el}}")); isoCodeToWikiName.put("EN", Pattern.quote("{{langue|en}}")); //isoCodeToWikiName.put("", Pattern.quote("{{langue|sl}}")); isoCodeToWikiName.put("LA", Pattern.quote("{{langue|la}}")); @@ -175,6 +184,7 @@ public class WiktionaryLangs { isoCodeToWikiName.put("ES", Pattern.quote("{{langue|es}}")); isoCodeToWikiName.put("UK", Pattern.quote("{{langue|uk}}")); isoCodeToWikiName.put("PT", Pattern.quote("{{langue|pt}}")); + isoCodeToWikiName.put("SV", Pattern.quote("{{langue|sv}}")); // egrep -o '= *\{\{-[a-z]+-\}\} *=' itwiktionary-pages-articles.xml | sort | uniq -c | sort -n isoCodeToWikiName = new LinkedHashMap(); @@ -197,6 +207,7 @@ public class WiktionaryLangs { // egrep -o '== *\{\{lengua\|[a-zA-Z]+\}\} *==' frwiktionary-pages-articles.xml | sort | uniq -c | sort -nr isoCodeToWikiName = new LinkedHashMap(); wikiCodeToIsoCodeToWikiName.put("es", isoCodeToWikiName); + isoCodeToWikiName.put("AR", Pattern.quote("{{lengua|ar}}")); isoCodeToWikiName.put("ES", Pattern.quote("{{lengua|es}}")); isoCodeToWikiName.put("EN", Pattern.quote("{{lengua|en}}")); isoCodeToWikiName.put("FR", Pattern.quote("{{lengua|fr}}"));