import com.hughes.android.dictionary.parser.wiktionary.AbstractWiktionaryParser.NameAndArgs;
import com.hughes.util.ListUtil;
import com.hughes.util.MapUtil;
+import com.hughes.util.StringUtil;
+import java.util.ArrayList;
import java.util.Arrays;
import java.util.LinkedHashMap;
import java.util.LinkedHashSet;
callbacks.put("p", callback);
callbacks.put("g", callback);
+ callbacks.put("etyl", new etyl<T>());
+ callbacks.put("term", new term<T>());
+
callback = new EncodingCallback<T>();
Set<String> encodings = new LinkedHashSet<String>(Arrays.asList(
"IPA", "IPAchar", // Not really encodings, but it works.
callbacks.put("rfquote", callback);
callbacks.put("attention", callback);
callbacks.put("zh-attention", callback);
+ callbacks.put("top2", callback);
+ callbacks.put("mid2", callback);
+ callbacks.put("top3", callback);
+ callbacks.put("mid3", callback);
+ callbacks.put("bottom", callback);
+ callbacks.put("rel-mid", callback);
+ callbacks.put("rel-mid3", callback);
+ callbacks.put("rel-mid4", callback);
+ callbacks.put("rel-bottom", callback);
+ callbacks.put("der-top", callback);
+ callbacks.put("der-mid", callback);
+ callbacks.put("der-mid3", callback);
+ callbacks.put("der-bottom", callback);
callback = new AppendName<T>();
callbacks.put("...", callback);
final Map<String, String> namedArgs,
final T parser,
final AppendAndIndexWikiCallback<T> appendAndIndexWikiCallback) {
- if (args.size() != 1 || !namedArgs.isEmpty()) {
- EnParser.LOG.warning("weird qualifier: ");
+ namedArgs.remove("lang");
+ if (!namedArgs.isEmpty()) {
+ EnParser.LOG.warning("weird qualifier: " + wikiTokenizer.token());
return false;
}
- String qualifier = args.get(0);
appendAndIndexWikiCallback.builder.append("(");
- appendAndIndexWikiCallback.dispatch(qualifier, null);
+ for (int i = 0; i < args.size(); ++i) {
+ appendAndIndexWikiCallback.dispatch(args.get(i), null);
+ if (i > 0) {
+ appendAndIndexWikiCallback.builder.append(", ");
+ }
+ }
appendAndIndexWikiCallback.builder.append(")");
return true;
}
final Map<String, String> namedArgs,
final T parser,
final AppendAndIndexWikiCallback<T> appendAndIndexWikiCallback) {
+ namedArgs.remove("lang");
if (!namedArgs.isEmpty()) {
EnParser.LOG.warning("weird encoding: " + wikiTokenizer.token());
return false;
}
}
+ static final class etyl<T extends AbstractWiktionaryParser> implements FunctionCallback<T> {
+ @Override
+ public boolean onWikiFunction(final WikiTokenizer wikiTokenizer, final String name, final List<String> args,
+ final Map<String, String> namedArgs,
+ final T parser,
+ final AppendAndIndexWikiCallback<T> appendAndIndexWikiCallback) {
+ final String langCode = ListUtil.get(args, 0);
+ if (langCode == null) {
+ return false;
+ }
+ String langName = WiktionaryLangs.getEnglishName(langCode);
+ if (langName != null) {
+ appendAndIndexWikiCallback.dispatch(langName, null);
+ } else {
+ appendAndIndexWikiCallback.dispatch("lang:" + langCode, null);
+ }
+ return true;
+ }
+ }
+
+ static final class term<T extends AbstractWiktionaryParser> implements FunctionCallback<T> {
+ @Override
+ public boolean onWikiFunction(final WikiTokenizer wikiTokenizer, final String name, final List<String> args,
+ final Map<String, String> namedArgs,
+ final T parser,
+ final AppendAndIndexWikiCallback<T> appendAndIndexWikiCallback) {
+ namedArgs.remove("sc");
+
+ // Main text.
+ final String lang = namedArgs.remove("lang");
+ String head = ListUtil.get(args, 0);
+ String display = ListUtil.get(args, 1);
+ if (StringUtil.isNullOrEmpty(head) && StringUtil.isNullOrEmpty(display)) {
+ head = display = parser.title;
+ }
+ if (StringUtil.isNullOrEmpty(head)) {
+ // Dispatches formatted wiki text.
+ appendAndIndexWikiCallback.dispatch(display, null);
+ } else {
+ if (StringUtil.isNullOrEmpty(display)) {
+ display = head;
+ }
+ appendAndIndexWikiCallback.dispatch(String.format("[[%s|%s]]", display, head), null);
+ }
+
+ // Stuff in ()s.
+ final String tr = namedArgs.remove("tr");
+ final String pos = namedArgs.remove("pos");
+ String gloss = ListUtil.get(args, 2);
+ String literally = namedArgs.remove("lit");
+ if (!StringUtil.isNullOrEmpty(gloss)) {
+ gloss = String.format("\"%s\"", gloss);
+ }
+ if (!StringUtil.isNullOrEmpty(literally)) {
+ literally = String.format("literally %s", literally);
+ }
+ final List<String> inParens = new ArrayList<String>(Arrays.asList(tr, pos, gloss, literally));
+ cleanList(inParens);
+ appendCommaSeparatedList(appendAndIndexWikiCallback, inParens);
+
+ if (tr != null) {
+ parser.addLinkToCurrentEntry(tr, lang, EntryTypeName.WIKTIONARY_MENTIONED);
+ }
+ return namedArgs.isEmpty();
+ }
+
+ private void appendCommaSeparatedList(
+ final AppendAndIndexWikiCallback<T> appendAndIndexWikiCallback,
+ final List<String> inParens) {
+ if (!inParens.isEmpty()) {
+ appendAndIndexWikiCallback.dispatch(" (", null);
+ for (int i = 0; i < inParens.size(); ++i) {
+ if (i > 0) {
+ appendAndIndexWikiCallback.dispatch(", ", null);
+ }
+ appendAndIndexWikiCallback.dispatch(inParens.get(i), null);
+ }
+ appendAndIndexWikiCallback.dispatch(")", null);
+ }
+ }
+
+ }
+
+ private static void cleanList(List<String> asList) {
+ int pos;
+ while ((pos = asList.indexOf("")) != -1) {
+ asList.remove(pos);
+ }
+ while ((pos = asList.indexOf(null)) != -1) {
+ asList.remove(pos);
+ }
+ }
+
static {
DEFAULT.put("it-noun", new it_noun());
final EnParser parser,
final AppendAndIndexWikiCallback<EnParser> appendAndIndexWikiCallback) {
parser.titleAppended = true;
- final String base = ListUtil.get(args, 0);
- final String gender = ListUtil.get(args, 1);
- final String singular = base + ListUtil.get(args, 2, null);
- final String plural = base + ListUtil.get(args, 3, null);
+ final String gender = ListUtil.get(args, 0);
+ final String singular = parser.title;
+ final String plural = ListUtil.get(args, 1, null);
appendAndIndexWikiCallback.builder.append(" ");
appendAndIndexWikiCallback.dispatch(singular, null, null);
appendAndIndexWikiCallback.builder.append(" {").append(gender).append("}, ");
- appendAndIndexWikiCallback.dispatch(plural, null, null);
- appendAndIndexWikiCallback.builder.append(" {pl}");
+ if (plural != null) {
+ appendAndIndexWikiCallback.dispatch(plural, null, null);
+ appendAndIndexWikiCallback.builder.append(" {pl}");
+ parser.wordForms.add(plural);
+ }
+ final String f = namedArgs.remove("f");
+ if (f != null) {
+ appendAndIndexWikiCallback.builder.append(", ");
+ appendAndIndexWikiCallback.dispatch(f, null, null);
+ appendAndIndexWikiCallback.builder.append(" {f}");
+ }
+ final String m = namedArgs.remove("m");
+ if (m != null) {
+ appendAndIndexWikiCallback.builder.append(", ");
+ appendAndIndexWikiCallback.dispatch(m, null, null);
+ appendAndIndexWikiCallback.builder.append(" {m}");
+ }
parser.wordForms.add(singular);
- parser.wordForms.add(plural);
if (!namedArgs.isEmpty() || args.size() > 4) {
EnParser.LOG.warning("Invalid it-noun: " + wikiTokenizer.token());
}
// Italian stuff
// -----------------------------------------------------------------------
- static void passThroughOrFillIn(final Map<String,String> namedArgs, final String key, final String fillIn, final boolean quoteToEmpty) {
- final String value = namedArgs.get(key);
- if (quoteToEmpty && "''".equals(value)) {
- namedArgs.put(key, "");
- return;
- }
- if (value == null || value.equals("")) {
- namedArgs.put(key, fillIn);
- }
- }
-
- static final List<String> it_number_s_p = Arrays.asList("s", "p");
- static final List<String> it_person_1_2_3 = Arrays.asList("1", "2", "3");
- static final List<String> it_reflexive_pronouns = Arrays.asList("mi ", "ti ", "si ", "ci ", "vi ", "si ");
- static final List<String> it_empty = Arrays.asList("", "", "", "", "", "");
- static void it_conj_passMood(final Map<String,String> namedArgs, final String moodName, final boolean quoteToEmpty, final String root, final List<String> suffixes) {
- assert suffixes.size() == 6;
- int i = 0;
- for (final String number : it_number_s_p) {
- for (final String person : it_person_1_2_3) {
- passThroughOrFillIn(namedArgs, String.format("%s%s%s", moodName, person, number), root + suffixes.get(i), quoteToEmpty);
- ++i;
- }
- }
- }
-
- private static <T extends AbstractWiktionaryParser> void outputKeyVariations(AppendAndIndexWikiCallback<T> appendAndIndexWikiCallback,
- final StringBuilder builder, final String keyBase, Map<String, String> namedArgs) {
- for (int suffix = 0; suffix <= 4; ++suffix) {
- final String key = suffix == 0 ? keyBase : keyBase + suffix;
- final String val = namedArgs.remove(key);
- if (val != null) {
- if (suffix > 0) {
- builder.append(", ");
- }
- appendAndIndexWikiCallback.dispatch(val, null);
- appendAndIndexWikiCallback.parser.addLinkToCurrentEntry(val, EntryTypeName.WIKTIONARY_IS_FORM_OF_SOMETHING_ELSE);
- }
- }
- }
-
static final class it_conj_are<T extends AbstractWiktionaryParser> implements FunctionCallback<T> {
final it_conj<T> dest;
it_conj_are(it_conj<T> dest) {
builder.append("</td>");
builder.append("<th colspan=\"1\" style=\"background:#e2e4c0\">gerundio</th>");
builder.append("<td colspan=\"1\">");
- outputKeyVariations(appendAndIndexWikiCallback, builder, "ger", namedArgs);
+ outputKeyVariations(appendAndIndexWikiCallback, builder, "ger", namedArgs, true);
builder.append("</td>");
builder.append("</tr>\n");
builder.append("<tr>");
builder.append("<th colspan=\"1\" style=\"background:#e2e4c0\">participio presente</th>");
builder.append("<td colspan=\"1\">");
- outputKeyVariations(appendAndIndexWikiCallback, builder, "presp", namedArgs);
+ outputKeyVariations(appendAndIndexWikiCallback, builder, "presp", namedArgs, true);
builder.append("</td>");
builder.append("<th colspan=\"1\" style=\"background:#e2e4c0\">participio passato</th>");
builder.append("<td colspan=\"1\">");
- outputKeyVariations(appendAndIndexWikiCallback, builder, "pastp", namedArgs);
+ outputKeyVariations(appendAndIndexWikiCallback, builder, "pastp", namedArgs, true);
builder.append("</td>");
builder.append("</tr>\n");
final List<String> prefixes = (inf != null && inf.endsWith("si")) ? it_reflexive_pronouns : it_empty;
String style = " style=\"background:#c0cfe4\"";
- outputDataRow(appendAndIndexWikiCallback, style, "indicativo", style, "th", "", new LinkedHashMap<String, String>(it_indicativePronouns), it_empty);
- outputDataRow(appendAndIndexWikiCallback, style, "presente", "", "td", "pres", namedArgs, prefixes);
- outputDataRow(appendAndIndexWikiCallback, style, "imperfetto", "", "td", "imperf", namedArgs, prefixes);
- outputDataRow(appendAndIndexWikiCallback, style, "passato remoto", "", "td", "prem", namedArgs, prefixes);
- outputDataRow(appendAndIndexWikiCallback, style, "futuro", "", "td", "fut", namedArgs, prefixes);
+ outputDataRow(appendAndIndexWikiCallback, style, "indicativo", style, "th", "", new LinkedHashMap<String, String>(it_indicativePronouns), it_empty, false);
+ outputDataRow(appendAndIndexWikiCallback, style, "presente", "", "td", "pres", namedArgs, prefixes, true);
+ outputDataRow(appendAndIndexWikiCallback, style, "imperfetto", "", "td", "imperf", namedArgs, prefixes, true);
+ outputDataRow(appendAndIndexWikiCallback, style, "passato remoto", "", "td", "prem", namedArgs, prefixes, true);
+ outputDataRow(appendAndIndexWikiCallback, style, "futuro", "", "td", "fut", namedArgs, prefixes, true);
style = " style=\"background:#c0d8e4\"";
- outputDataRow(appendAndIndexWikiCallback, style, "condizionale", style, "th", "", new LinkedHashMap<String, String>(it_indicativePronouns), it_empty);
- outputDataRow(appendAndIndexWikiCallback, style, "presente", "", "td", "cond", namedArgs, prefixes);
+ outputDataRow(appendAndIndexWikiCallback, style, "condizionale", style, "th", "", new LinkedHashMap<String, String>(it_indicativePronouns), it_empty, false);
+ outputDataRow(appendAndIndexWikiCallback, style, "presente", "", "td", "cond", namedArgs, prefixes, true);
style = " style=\"background:#c0e4c0\"";
- outputDataRow(appendAndIndexWikiCallback, style, "congiuntivo", style, "th", "", new LinkedHashMap<String, String>(it_subjunctivePronouns), it_empty);
+ outputDataRow(appendAndIndexWikiCallback, style, "congiuntivo", style, "th", "", new LinkedHashMap<String, String>(it_subjunctivePronouns), it_empty, false);
namedArgs.put("sub3s2", namedArgs.remove("sub3s"));
namedArgs.put("sub1s", namedArgs.get("sub123s"));
namedArgs.put("sub2s", namedArgs.get("sub123s"));
namedArgs.put("sub1s2", namedArgs.get("sub123s2"));
namedArgs.put("sub2s2", namedArgs.get("sub123s2"));
namedArgs.put("sub3s2", namedArgs.remove("sub123s2"));
- outputDataRow(appendAndIndexWikiCallback, style, "presente", "", "td", "sub", namedArgs, prefixes);
+ outputDataRow(appendAndIndexWikiCallback, style, "presente", "", "td", "sub", namedArgs, prefixes, true);
namedArgs.put("impsub1s", namedArgs.get("impsub12s"));
namedArgs.put("impsub2s", namedArgs.remove("impsub12s"));
namedArgs.put("impsub1s2", namedArgs.get("impsub12s2"));
namedArgs.put("impsub2s2", namedArgs.remove("impsub12s2"));
- outputDataRow(appendAndIndexWikiCallback, style, "imperfetto", "", "td", "impsub", namedArgs, prefixes);
+ outputDataRow(appendAndIndexWikiCallback, style, "imperfetto", "", "td", "impsub", namedArgs, prefixes, true);
style = " style=\"background:#e4d4c0\"";
- outputDataRow(appendAndIndexWikiCallback, style, "imperativo", style, "th", "", new LinkedHashMap<String, String>(it_imperativePronouns), it_empty);
- outputDataRow(appendAndIndexWikiCallback, style, "", "", "td", "imp", namedArgs, it_empty); // these are attached to the stem.
+ outputDataRow(appendAndIndexWikiCallback, style, "imperativo", style, "th", "", new LinkedHashMap<String, String>(it_imperativePronouns), it_empty, false);
+ outputDataRow(appendAndIndexWikiCallback, style, "", "", "td", "imp", namedArgs, it_empty, false); // these are attached to the stem.
builder.append("</table>\n");
if (!namedArgs.isEmpty()) {
System.err.println("NON-EMPTY namedArgs: " + namedArgs);
- assert false;
+ if ("muovesse".equals(namedArgs.get("impsib3s2"))) {
+ return false;
+ }
+ if ("percuotesse".equals(namedArgs.get("impsib3s2"))) {
+ return false;
+ }
+ // Too many to deal with:
+ //assert false;
return false;
}
private void outputDataRow(AppendAndIndexWikiCallback<T> appendAndIndexWikiCallback,
String col1Style, String headerName,
String col2Style, final String type2,
- String moodName, Map<String, String> namedArgs, final List<String> prefixes) {
+ String moodName, Map<String, String> namedArgs, final List<String> prefixes, final boolean isForm) {
final StringBuilder builder = appendAndIndexWikiCallback.builder;
builder.append("<tr>");
builder.append("<th colspan=\"1\"").append(col1Style).append(">").append(headerName).append("</th>");
builder.append("<").append(type2).append("").append(col2Style).append(">");
final String keyBase = String.format("%s%s%s", moodName, person, number);
appendAndIndexWikiCallback.dispatch(prefixes.get(i++), null);
- outputKeyVariations(appendAndIndexWikiCallback, builder, keyBase, namedArgs);
+ outputKeyVariations(appendAndIndexWikiCallback, builder, keyBase, namedArgs, isForm);
// Output <td> or <th>
builder.append("</").append(type2).append(">");
}
builder.append("</tr>\n");
}
}
-}
\ No newline at end of file
+
+ static void passThroughOrFillIn(final Map<String,String> namedArgs, final String key, final String fillIn, final boolean quoteToEmpty) {
+ final String value = namedArgs.get(key);
+ if (quoteToEmpty && "''".equals(value)) {
+ namedArgs.put(key, "");
+ return;
+ }
+ if (value == null || value.equals("")) {
+ namedArgs.put(key, fillIn);
+ }
+ }
+
+ static final List<String> it_number_s_p = Arrays.asList("s", "p");
+ static final List<String> it_person_1_2_3 = Arrays.asList("1", "2", "3");
+ static final List<String> it_reflexive_pronouns = Arrays.asList("mi ", "ti ", "si ", "ci ", "vi ", "si ");
+ static final List<String> it_empty = Arrays.asList("", "", "", "", "", "");
+ static void it_conj_passMood(final Map<String,String> namedArgs, final String moodName, final boolean quoteToEmpty, final String root, final List<String> suffixes) {
+ assert suffixes.size() == 6;
+ int i = 0;
+ for (final String number : it_number_s_p) {
+ for (final String person : it_person_1_2_3) {
+ passThroughOrFillIn(namedArgs, String.format("%s%s%s", moodName, person, number), root + suffixes.get(i), quoteToEmpty);
+ ++i;
+ }
+ }
+ }
+
+ private static <T extends AbstractWiktionaryParser> void outputKeyVariations(AppendAndIndexWikiCallback<T> appendAndIndexWikiCallback,
+ final StringBuilder builder, final String keyBase, Map<String, String> namedArgs, boolean isForm) {
+ for (int suffix = 0; suffix <= 4; ++suffix) {
+ final String key = suffix == 0 ? keyBase : keyBase + suffix;
+ final String val = namedArgs.remove(key);
+ if (val != null && !val.trim().equals("")) {
+ if (suffix > 0) {
+ builder.append(", ");
+ }
+ appendAndIndexWikiCallback.dispatch(val, null);
+ if (isForm) {
+ appendAndIndexWikiCallback.parser.addLinkToCurrentEntry(val, null, EntryTypeName.WIKTIONARY_INFLECTED_FORM_MULTI);
+ }
+ }
+ }
+ }
+
+
+}