if (isIgnorableTitle(title)) {
return;
}
- final String lang = heading.replaceAll("=", "").trim();
+ final String lang = heading.replace("=", "").trim();
if (!langPattern.matcher(lang).find()){
return;
}
} else if (wikiTokenizer.isPlainText()) {
// Unindexed!
foreignBuilder.append(wikiTokenizer.token());
-
- } else if (wikiTokenizer.isMarkup() || wikiTokenizer.isNewline() || wikiTokenizer.isComment()) {
+ } else if (wikiTokenizer.isHtml()) {
+ if (!wikiTokenizer.token().startsWith("<ref>")) {
+ foreignBuilder.append(wikiTokenizer.token());
+ }
+ } else if (wikiTokenizer.isMarkup() ||
+ wikiTokenizer.isNewline() ||
+ wikiTokenizer.isComment()) {
// Do nothing.
} else {
LOG.warning("Unexpected token: " + wikiTokenizer.token());
}
- } // ForeignParser
\ No newline at end of file
+ } // ForeignParser