import java.util.logging.Logger;
import java.util.regex.Pattern;
+import com.hughes.android.dictionary.engine.EntrySource;
import com.hughes.android.dictionary.engine.EntryTypeName;
import com.hughes.android.dictionary.engine.IndexBuilder;
import com.hughes.android.dictionary.engine.IndexedEntry;
"Particle|Interjection|Pronominal adverb" +
"Han character|Hanzi|Hanja|Kanji|Katakana character|Syllable");
// Source attribution for the entries being built. Not final: it is (re)assigned at the
// start of every parse(...) call and then passed to each new PairEntry this parser creates.
+ EntrySource entrySource;
// NOTE(review): presumably the index builders for the English side and the foreign-language
// side of each entry pair; their initialization and use are not visible here — confirm.
final IndexBuilder enIndexBuilder;
final IndexBuilder foreignIndexBuilder;
// NOTE(review): presumably selects which language headings/codes this parser accepts;
// the place where it is matched is not visible here — confirm.
final Pattern langPattern;
}
/**
 * Reads {@code file} through a buffered {@link DataInputStream} and processes it in a loop
 * until the page limit is reached (other exit conditions are not visible in this excerpt).
 *
 * <p>Before reading starts, {@code entrySource} is stored on this instance so that entries
 * created while parsing can be constructed with it.
 *
 * <p>On every exit path (normal return or exception) the {@code finally} block prints the
 * per-language-code counts collected by {@code appendAndIndexWikiCallback}, removes every
 * code that is a key of {@code EnWiktionaryLangs.isoCodeToWikiName}, and prints what is left.
 * Note that this mutates {@code langCodeToTCount} in place.
 *
 * @param file        input file to read
 * @param entrySource source attribution stored in {@code this.entrySource} for the duration
 *                    of (and after) this call
 * @param pageLimit   when non-negative, parsing returns as soon as {@code pageCount} reaches
 *                    this value; a negative value disables the limit check
 * @throws IOException declared by this method; at minimum, opening {@code file} can fail
 */
- public void parse(final File file, final int pageLimit) throws IOException {
+ public void parse(final File file, final EntrySource entrySource, final int pageLimit) throws IOException {
+ this.entrySource = entrySource;
int pageCount = 0;
// NOTE(review): the visible finally block below does not close this stream, so the
// early return on pageLimit appears to leave it open — confirm against the full method.
final DataInputStream dis = new DataInputStream(new BufferedInputStream(new FileInputStream(file)));
+ try {
while (true) {
// Stop once the optional page limit has been hit (negative pageLimit means "no limit").
if (pageLimit >= 0 && pageCount >= pageLimit) {
return;
// NOTE(review): the per-page reading logic between the return above and this progress
// log is not shown in this excerpt — consult the full file before editing here.
LOG.info("pageCount=" + pageCount);
}
}
+ } finally {
// Diagnostics: dump all per-language-code counts, then drop the codes that
// EnWiktionaryLangs knows about so the second dump shows only the unrecognized ones.
+ System.out.println("lang Counts: " + appendAndIndexWikiCallback.langCodeToTCount);
+ appendAndIndexWikiCallback.langCodeToTCount.keySet().removeAll(EnWiktionaryLangs.isoCodeToWikiName.keySet());
+ System.out.println("unused Counts: " + appendAndIndexWikiCallback.langCodeToTCount);
+ }
}
private void parseSection(String heading, final String text) {
private void doTranslationLine(final String line, final String lang, final String pos, final String sense, final String rest) {
state = State.TRANSLATION_LINE;
// Good chance we'll actually file this one...
- final PairEntry pairEntry = new PairEntry();
+ final PairEntry pairEntry = new PairEntry(entrySource);
final IndexedEntry indexedEntry = new IndexedEntry(pairEntry);
final StringBuilder foreignText = new StringBuilder();
return;
}
- final PairEntry pairEntry = new PairEntry();
+ final PairEntry pairEntry = new PairEntry(entrySource);
final IndexedEntry indexedEntry = new IndexedEntry(pairEntry);
entryIsFormOfSomething = false;