gitweb.fperrin.net Git - DictionaryPC.git/commitdiff
Support pt and es wiktionary in splitter.
author Reimar Döffinger <Reimar.Doeffinger@gmx.de>
Sat, 11 Feb 2017 16:32:56 +0000 (17:32 +0100)
committer Reimar Döffinger <Reimar.Doeffinger@gmx.de>
Sat, 11 Feb 2017 16:32:56 +0000 (17:32 +0100)
The ES format seems to have changed so we can
now actually use it.

src/com/hughes/android/dictionary/parser/wiktionary/WiktionaryLangs.java

index 3efc67695c6f841a1e998fd0d35155a6066074df..804925796377bb3dc78a08c3b410e56d3ef87c87 100644 (file)
@@ -193,10 +193,20 @@ public class WiktionaryLangs {
         isoCodeToWikiName.put("SV", Pattern.quote("{{-sv-}}"));
         isoCodeToWikiName.put("RU", Pattern.quote("{{-ru-}}"));
 
-        // There seems to be no consistent pattern and few foreign language entries anyway
+        // egrep -o '== *\{\{lengua\|[a-zA-Z]+\}\} *==' eswiktionary-pages-articles.xml | sort | uniq -c | sort -nr
         isoCodeToWikiName = new LinkedHashMap<String, String>();
         wikiCodeToIsoCodeToWikiName.put("es", isoCodeToWikiName);
-        isoCodeToWikiName.put("ES", Pattern.quote("{{ES"));
+        isoCodeToWikiName.put("ES", Pattern.quote("{{lengua|es}}"));
+        isoCodeToWikiName.put("EN", Pattern.quote("{{lengua|en}}"));
+        isoCodeToWikiName.put("FR", Pattern.quote("{{lengua|fr}}"));
+        isoCodeToWikiName.put("IT", Pattern.quote("{{lengua|it}}"));
+
+        // Pattern seems to match Italian one
+        isoCodeToWikiName = new LinkedHashMap<String, String>();
+        wikiCodeToIsoCodeToWikiName.put("pt", isoCodeToWikiName);
+        isoCodeToWikiName.put("PT", Pattern.quote("{{-pt-}}"));
+        isoCodeToWikiName.put("EN", Pattern.quote("{{-en-}}"));
+        isoCodeToWikiName.put("ES", Pattern.quote("{{-es-}}"));
     }
     public static String getEnglishName(String langCode) {
         String name = isoCodeToEnWikiName.get(langCode);