static {
isoCodeToEnWikiName.put("AF", "Afrikaans");
isoCodeToEnWikiName.put("SQ", "Albanian");
static {
isoCodeToEnWikiName.put("AF", "Afrikaans");
isoCodeToEnWikiName.put("SQ", "Albanian");
isoCodeToEnWikiName.put("ET", "Estonian");
isoCodeToEnWikiName.put("FI", "Finnish");
isoCodeToEnWikiName.put("FR", "French");
isoCodeToEnWikiName.put("ET", "Estonian");
isoCodeToEnWikiName.put("FI", "Finnish");
isoCodeToEnWikiName.put("FR", "French");
+ // Note: these entries must come before German because the matcher
+ // simply takes the first match instead of the best one.
+ isoCodeToEnWikiName.put("nds", "Low German");
+ isoCodeToEnWikiName.put("pdc", "Pennsylvania German");
isoCodeToEnWikiName.put("DE", "German");
isoCodeToEnWikiName.put("grc", "Ancient Greek");
isoCodeToEnWikiName.put("EL", "Greek");
isoCodeToEnWikiName.put("DE", "German");
isoCodeToEnWikiName.put("grc", "Ancient Greek");
isoCodeToEnWikiName.put("EL", "Greek");
isoCodeToEnWikiName.put("HT", "Haitian Creole");
isoCodeToEnWikiName.put("LB", "Luxembourgish");
isoCodeToEnWikiName.put("MK", "Macedonian");
isoCodeToEnWikiName.put("HT", "Haitian Creole");
isoCodeToEnWikiName.put("LB", "Luxembourgish");
isoCodeToEnWikiName.put("MK", "Macedonian");
- isoCodeToEnWikiName.put("GV", "Manx");
+ isoCodeToEnWikiName.put("scn", "Sicilian");
+ isoCodeToEnWikiName.put("cu", "Old Church Slavonic");
+ isoCodeToEnWikiName.put("rom", "Romani");
// No longer exists in EN:
// isoCodeToEnWikiName.put("BS", "Bosnian");
// No longer exists in EN:
// isoCodeToEnWikiName.put("BS", "Bosnian");
- public static final Map<String,Map<String,String>> wikiCodeToIsoCodeToWikiName = new LinkedHashMap<String, Map<String,String>>();
+ public static final Map<String,Map<String,String>> wikiCodeToIsoCodeToWikiName = new LinkedHashMap<>();
isoCodeToWikiName.put("DE", "Deutsch");
isoCodeToWikiName.put("EN", "Englisch");
isoCodeToWikiName.put("IT", "Italienisch");
isoCodeToWikiName.put("DE", "Deutsch");
isoCodeToWikiName.put("EN", "Englisch");
isoCodeToWikiName.put("IT", "Italienisch");
isoCodeToWikiName.put("HU", "Ungarisch");
isoCodeToWikiName.put("SV", "Schwedisch");
isoCodeToWikiName.put("ES", "Spanisch");
isoCodeToWikiName.put("HU", "Ungarisch");
isoCodeToWikiName.put("SV", "Schwedisch");
isoCodeToWikiName.put("ES", "Spanisch");
wikiCodeToIsoCodeToWikiName.put("fr", isoCodeToWikiName);
isoCodeToWikiName.put("FR", Pattern.quote("{{langue|fr}}"));
isoCodeToWikiName.put("RU", Pattern.quote("{{langue|ru}}"));
isoCodeToWikiName.put("AR", Pattern.quote("{{langue|ar}}")); // Arabic
isoCodeToWikiName.put("BG", Pattern.quote("{{langue|bg}}")); // Bulgarian
wikiCodeToIsoCodeToWikiName.put("fr", isoCodeToWikiName);
isoCodeToWikiName.put("FR", Pattern.quote("{{langue|fr}}"));
isoCodeToWikiName.put("RU", Pattern.quote("{{langue|ru}}"));
isoCodeToWikiName.put("AR", Pattern.quote("{{langue|ar}}")); // Arabic
isoCodeToWikiName.put("BG", Pattern.quote("{{langue|bg}}")); // Bulgarian
isoCodeToWikiName.put("EN", Pattern.quote("{{langue|en}}"));
//isoCodeToWikiName.put("", Pattern.quote("{{langue|sl}}"));
isoCodeToWikiName.put("LA", Pattern.quote("{{langue|la}}"));
isoCodeToWikiName.put("EN", Pattern.quote("{{langue|en}}"));
//isoCodeToWikiName.put("", Pattern.quote("{{langue|sl}}"));
isoCodeToWikiName.put("LA", Pattern.quote("{{langue|la}}"));
isoCodeToWikiName.put("PT", Pattern.quote("{{langue|pt}}"));
// egrep -o '= *\{\{-[a-z]+-\}\} *=' itwiktionary-pages-articles.xml | sort | uniq -c | sort -n
isoCodeToWikiName.put("PT", Pattern.quote("{{langue|pt}}"));
// egrep -o '= *\{\{-[a-z]+-\}\} *=' itwiktionary-pages-articles.xml | sort | uniq -c | sort -n
wikiCodeToIsoCodeToWikiName.put("it", isoCodeToWikiName);
isoCodeToWikiName.put("IT", "\\{\\{-(it|scn|nap|cal|lmo)-\\}\\}"); // scn, nap, cal, lmo
isoCodeToWikiName.put("EN", Pattern.quote("{{-en-}}"));
wikiCodeToIsoCodeToWikiName.put("it", isoCodeToWikiName);
isoCodeToWikiName.put("IT", "\\{\\{-(it|scn|nap|cal|lmo)-\\}\\}"); // scn, nap, cal, lmo
isoCodeToWikiName.put("EN", Pattern.quote("{{-en-}}"));
isoCodeToWikiName.put("RU", Pattern.quote("{{-ru-}}"));
// egrep -o '== *\{\{lengua\|[a-zA-Z]+\}\} *==' eswiktionary-pages-articles.xml | sort | uniq -c | sort -nr
isoCodeToWikiName.put("RU", Pattern.quote("{{-ru-}}"));
// egrep -o '== *\{\{lengua\|[a-zA-Z]+\}\} *==' eswiktionary-pages-articles.xml | sort | uniq -c | sort -nr
isoCodeToWikiName.put("ES", Pattern.quote("{{lengua|es}}"));
isoCodeToWikiName.put("EN", Pattern.quote("{{lengua|en}}"));
isoCodeToWikiName.put("FR", Pattern.quote("{{lengua|fr}}"));
isoCodeToWikiName.put("IT", Pattern.quote("{{lengua|it}}"));
// Pattern seems to match Italian one
isoCodeToWikiName.put("ES", Pattern.quote("{{lengua|es}}"));
isoCodeToWikiName.put("EN", Pattern.quote("{{lengua|en}}"));
isoCodeToWikiName.put("FR", Pattern.quote("{{lengua|fr}}"));
isoCodeToWikiName.put("IT", Pattern.quote("{{lengua|it}}"));
// Pattern seems to match Italian one
wikiCodeToIsoCodeToWikiName.put("pt", isoCodeToWikiName);
isoCodeToWikiName.put("PT", Pattern.quote("{{-pt-}}"));
isoCodeToWikiName.put("EN", Pattern.quote("{{-en-}}"));
wikiCodeToIsoCodeToWikiName.put("pt", isoCodeToWikiName);
isoCodeToWikiName.put("PT", Pattern.quote("{{-pt-}}"));
isoCodeToWikiName.put("EN", Pattern.quote("{{-en-}}"));