X-Git-Url: http://gitweb.fperrin.net/?a=blobdiff_plain;f=src%2Fcom%2Fhughes%2Fandroid%2Fdictionary%2Fengine%2FHtmlEntry.java;h=8dcf905175f5f5e01b983a7fd288f2a80a998ae1;hb=a6dcf86c19971cea1e7585a43bc65f12f189636c;hp=ae1f9f8755864a693e9c52b0652e8aa6ba039c26;hpb=4dfbd0851b5f462644cd200c627e4ab377f297d2;p=Dictionary.git diff --git a/src/com/hughes/android/dictionary/engine/HtmlEntry.java b/src/com/hughes/android/dictionary/engine/HtmlEntry.java index ae1f9f8..8dcf905 100644 --- a/src/com/hughes/android/dictionary/engine/HtmlEntry.java +++ b/src/com/hughes/android/dictionary/engine/HtmlEntry.java @@ -3,22 +3,25 @@ package com.hughes.android.dictionary.engine; import com.hughes.util.StringUtil; import com.hughes.util.raf.RAFListSerializer; -import com.hughes.util.raf.RAFSerializable; +import com.hughes.util.raf.RAFListSerializerSkippable; import com.ibm.icu.text.Transliterator; +import java.io.DataInput; +import java.io.DataOutput; import java.io.IOException; import java.io.PrintStream; -import java.io.RandomAccessFile; +import java.io.UnsupportedEncodingException; import java.lang.ref.SoftReference; +import java.nio.channels.FileChannel; import java.util.List; import java.util.regex.Pattern; -public class HtmlEntry extends AbstractEntry implements RAFSerializable, - Comparable { +public class HtmlEntry extends AbstractEntry implements Comparable { // Title is not HTML escaped. public final String title; - public final LazyHtmlLoader lazyHtmlLoader; + private final LazyHtmlLoader lazyHtmlLoader; + @SuppressWarnings("WeakerAccess") public String html; public HtmlEntry(final EntrySource entrySource, String title) { @@ -27,24 +30,30 @@ public class HtmlEntry extends AbstractEntry implements RAFSerializable { + static final class Serializer implements RAFListSerializerSkippable { final Dictionary dictionary; + final FileChannel ch; - Serializer(Dictionary dictionary) { + Serializer(Dictionary dictionary, FileChannel ch) { this.dictionary = dictionary; + this.ch = ch; } @Override - public HtmlEntry read(RandomAccessFile raf, final int index) throws IOException { - return new HtmlEntry(dictionary, raf, index); + public HtmlEntry read(DataInput raf, final int index) throws IOException { + return new HtmlEntry(dictionary, ch, raf, index); + } + + @Override + public void skip(DataInput raf, final int index) throws IOException { + if (dictionary.dictFileVersion >= 7) + { + StringUtil.readVarInt(raf); + } + else + { + raf.skipBytes(2); + } + int l = raf.readUnsignedShort(); + raf.skipBytes(l); + } + + @Override + public void write(DataOutput raf, HtmlEntry t) throws IOException { + t.writeBase(raf); + } + } + + static final class DataSerializer implements RAFListSerializer { + @Override + public HtmlEntry read(DataInput raf, final int index) { + assert false; + return null; } @Override - public void write(RandomAccessFile raf, HtmlEntry t) throws IOException { - t.write(raf); + public void write(DataOutput raf, HtmlEntry t) throws IOException { + t.writeData(raf); } } - public String getRawText(final boolean compact) { + static final class DataDeserializer implements RAFListSerializer { + @Override + public byte[] read(DataInput raf, final int index) throws IOException { + return HtmlEntry.readData(raf); + } + + @Override + public void write(DataOutput raf, byte[] t) { + assert false; + } + } + + private String getRawText(final boolean compact) { return title + ":\n" + getHtml(); } @Override - public int compareTo(HtmlEntry another) { + public int compareTo(/*@NonNull*/ HtmlEntry another) { if (title.compareTo(another.title) != 0) { return title.compareTo(another.title); } @@ -103,15 +153,13 @@ public class HtmlEntry extends AbstractEntry implements RAFSerializable searchTokens, - final Pattern orderedMatchPattern, final Transliterator normalizer, - final boolean swapPairEntries) { + final Pattern orderedMatchPattern, final Transliterator normalizer, + final boolean swapPairEntries) { final String text = normalizer.transform(getRawText(false)); if (orderedMatchPattern.matcher(text).find()) { return RowMatchType.ORDERED_MATCH; @@ -159,12 +207,13 @@ public class HtmlEntry extends AbstractEntry implements RAFSerializable%s\n

%s\n", - formatQuickdicUrl(indexShortName, htmlEntry.title), titleEscaped, - htmlEntry.getHtml())); + formatQuickdicUrl(indexShortName, htmlEntry.title), titleEscaped, + htmlEntry.getHtml())); } return result.toString(); } + @SuppressWarnings("WeakerAccess") public static String formatQuickdicUrl(final String indexShortName, final String text) { assert !indexShortName.contains(":"); assert text.length() > 0; @@ -177,47 +226,70 @@ public class HtmlEntry extends AbstractEntry implements RAFSerializable data; + final int index; // Not sure this volatile is right, but oh well. - volatile SoftReference htmlRef = new SoftReference(null); - - private LazyHtmlLoader(final RandomAccessFile raf) throws IOException { - this.raf = raf; - numBytes = raf.readInt(); - numZipBytes = raf.readInt(); - offset = raf.getFilePointer(); + volatile SoftReference htmlRef = new SoftReference<>(null); + + private LazyHtmlLoader(FileChannel ch, final DataInput inp, List data, int index) throws IOException { + this.data = data; + this.index = index; + if (data != null) { + this.raf = null; + this.ch = null; + this.offset = 0; + this.numBytes = -1; + this.numZipBytes = -1; + return; + } + raf = inp; + this.ch = ch; + numBytes = Math.min(raf.readInt(), 20 * 1024 * 1024); + numZipBytes = Math.min(raf.readInt(), 20 * 1024 * 1024); + offset = ch.position(); raf.skipBytes(numZipBytes); } - public String getHtml() { + String getHtml() { String html = htmlRef.get(); if (html != null) { return html; } + if (data != null) { + try { + html = new String(data.get(index), "UTF-8"); + } catch (UnsupportedEncodingException e) { + throw new RuntimeException("Dictionary HTML data corrupted", e); + } + htmlRef = new SoftReference<>(html); + return html; + } System.out.println("Loading Html: numBytes=" + numBytes + ", numZipBytes=" - + numZipBytes); - final byte[] bytes = new byte[numBytes]; + + numZipBytes); final byte[] zipBytes = new byte[numZipBytes]; - synchronized (raf) { + synchronized (ch) { try { - raf.seek(offset); - raf.read(zipBytes); + ch.position(offset); + raf.readFully(zipBytes); } catch (IOException e) { - throw new RuntimeException(e); + throw new RuntimeException("Failed to read HTML data from dictionary", e); } } try { - StringUtil.unzipFully(zipBytes, bytes); + final byte[] bytes = StringUtil.unzipFully(zipBytes, numBytes); html = new String(bytes, "UTF-8"); } catch (IOException e) { - throw new RuntimeException(e); + throw new RuntimeException("Dictionary HTML data corrupted", e); } - htmlRef = new SoftReference(html); + htmlRef = new SoftReference<>(html); return html; } }