gitweb.fperrin.net Git - DictionaryPC.git/commitdiff
Escape only unicode chars
author Frédéric Perrin <fred@fperrin.net>
Sun, 7 Feb 2021 00:35:19 +0000 (00:35 +0000)
committer Frédéric Perrin <fred@fperrin.net>
Sun, 7 Feb 2021 00:35:19 +0000 (00:35 +0000)
src/com/hughes/android/dictionary/parser/DictFileParser.java

index 1f08428761d42911a99a29c3c07a71f6c7f271cc..ef71a689c88dbd6c881d48bedbb434845cb27f24 100644 (file)
@@ -157,8 +157,8 @@ public class DictFileParser implements Parser {
 
         if (singleLang) {
             HtmlEntry htmlEntry = new HtmlEntry(entrySource, fields[0]);
-            htmlEntry.html = StringUtil.escapeUnicodeToPureHtml(fields[1]);
-            
+            htmlEntry.html = StringUtil.escapeUnicodeToPureHtml(fields[1], false);
+
             final IndexBuilder titleIndexBuilder = dictBuilder.indexBuilders.get(0);
             htmlEntry.addToDictionary(titleIndexBuilder.index.dict);
 
@@ -170,6 +170,9 @@ public class DictFileParser implements Parser {
             if (tokens.length > 1) {
                 for (final String token : tokens) {
                     assert token.length() >= 1;
+                   if (token.length() <= 2) {
+                       continue;
+                   }
                     assert token.indexOf("-") == -1;
                     if (/*!alreadyDone.contains(token) && */!token.isEmpty()) {
                         tokenData = titleIndexBuilder.getOrCreateTokenData(token);