1 package com.hughes.android.dictionary;
\r
3 import java.io.IOException;
\r
4 import java.io.RandomAccessFile;
\r
5 import java.util.ArrayList;
\r
6 import java.util.List;
\r
7 import java.util.concurrent.atomic.AtomicBoolean;
\r
9 import com.hughes.util.CachingList;
\r
10 import com.hughes.util.raf.FileList;
\r
11 import com.hughes.util.raf.RAFFactory;
\r
12 import com.hughes.util.raf.RAFSerializable;
\r
13 import com.hughes.util.raf.RAFSerializableSerializer;
\r
14 import com.hughes.util.raf.RAFSerializer;
\r
15 import com.hughes.util.raf.UniformFileList;
\r
17 public final class Dictionary implements RAFSerializable<Dictionary> {
\r
// Serializers for the three record types this class stores in
// RandomAccessFile-backed lists (they are passed to FileList / UniformFileList
// create() and write() calls elsewhere in this class).
// NOTE(review): the constructor arguments of ENTRY_SERIALIZER and
// ROW_SERIALIZER are not visible in this excerpt; presumably Entry.RAF_FACTORY
// and Row.RAF_FACTORY, mirroring INDEX_ENTRY_SERIALIZER - confirm.
19 static final RAFSerializer<Entry> ENTRY_SERIALIZER = new RAFSerializableSerializer<Entry>(
\r
21 static final RAFSerializer<Row> ROW_SERIALIZER = new RAFSerializableSerializer<Row>(
\r
23 static final RAFSerializer<IndexEntry> INDEX_ENTRY_SERIALIZER = new RAFSerializableSerializer<IndexEntry>(
\r
24 IndexEntry.RAF_FACTORY);
\r
// All entries of the dictionary. An ArrayList when the dictionary is built in
// memory, a CachingList over a FileList when it is loaded from a file.
26 final List<Entry> entries;
\r
// One LanguageData per language: slot 0 is created with Entry.LANG1,
// slot 1 with Entry.LANG2.
27 final LanguageData[] languageDatas = new LanguageData[2];
\r
/**
 * Creates an empty, in-memory dictionary for a pair of languages.
 *
 * @param language0 language stored in slot 0 (paired with Entry.LANG1)
 * @param language1 language stored in slot 1 (paired with Entry.LANG2)
 */
29 public Dictionary(final Language language0, final Language language1) {
\r
30 languageDatas[0] = new LanguageData(language0, Entry.LANG1);
\r
31 languageDatas[1] = new LanguageData(language1, Entry.LANG2);
\r
32 entries = new ArrayList<Entry>();
\r
/**
 * Loads a dictionary from a file, starting at the file's current position.
 * The entry list is read first, then the two LanguageData sections, which is
 * the same order in which write(RandomAccessFile) emits them.
 *
 * @param raf file to read from; its current file pointer marks the start of
 *            the entry list
 * @throws IOException if reading from raf fails
 */
35 public Dictionary(final RandomAccessFile raf) throws IOException {
\r
// NOTE(review): 10000 is presumably the CachingList cache capacity - confirm.
// NOTE(review): the LanguageData reads below rely on FileList.create leaving
// the file pointer just past the entry list - confirm.
36 entries = CachingList.create(FileList.create(raf, ENTRY_SERIALIZER, raf
\r
37 .getFilePointer()), 10000);
\r
38 languageDatas[0] = new LanguageData(raf, Entry.LANG1);
\r
39 languageDatas[1] = new LanguageData(raf, Entry.LANG2);
\r
/**
 * Writes the dictionary to a file: the entry list first, followed by the
 * LanguageData of slot 0 and then slot 1.
 *
 * @param raf file to write to
 * @throws IOException if writing to raf fails
 */
42 public void write(RandomAccessFile raf) throws IOException {
\r
43 FileList.write(raf, entries, ENTRY_SERIALIZER);
\r
44 languageDatas[0].write(raf);
\r
45 languageDatas[1].write(raf);
\r
48 final class LanguageData implements RAFSerializable<LanguageData> {
\r
// Language this data belongs to; its symbol is what write() stores and what
// the file-reading constructor resolves through Language.lookup.
49 final Language language;
\r
// Rows for this language; each Row is either a token row or refers to an
// entry (see rowToString).
51 final List<Row> rows;
\r
// Index entries searched by lookup() with a binary search.
// NOTE(review): lookup() assumes this list is ordered consistently with
// language.tokenComparator applied to lower-cased words - confirm at build time.
52 final List<IndexEntry> sortedIndex;
\r
/**
 * Creates empty, in-memory language data with no rows and no index entries.
 *
 * @param language the language this data describes
 * @param lang     byte identifying the language slot (callers pass
 *                 Entry.LANG1 or Entry.LANG2); its use is not visible in this
 *                 excerpt
 */
54 LanguageData(final Language language, final byte lang) {
\r
55 this.language = language;
\r
57 rows = new ArrayList<Row>();
\r
58 sortedIndex = new ArrayList<IndexEntry>();
\r
/**
 * Loads language data from a file at its current position. Reads, in order:
 * the language symbol (UTF string), the row list, and the sorted index - the
 * same order in which write(RandomAccessFile) emits them.
 *
 * @param raf  file to read from
 * @param lang byte identifying the language slot (callers pass Entry.LANG1 or
 *             Entry.LANG2); its use is not visible in this excerpt
 * @throws IOException      if reading from raf fails
 * @throws RuntimeException if the stored symbol does not resolve to a known
 *                          Language
 */
61 LanguageData(final RandomAccessFile raf, final byte lang) throws IOException {
\r
62 language = Language.lookup(raf.readUTF());
\r
63 if (language == null) {
\r
64 throw new RuntimeException("Unknown language.");
\r
// NOTE(review): 10000 is presumably the CachingList cache capacity - confirm.
67 rows = CachingList.create(UniformFileList.create(raf, ROW_SERIALIZER, raf
\r
68 .getFilePointer()), 10000);
\r
// NOTE(review): relies on UniformFileList.create leaving the file pointer
// just past the row list so the index starts at the right offset - confirm.
69 sortedIndex = CachingList.create(FileList.create(raf,
\r
70 INDEX_ENTRY_SERIALIZER, raf.getFilePointer()), 10000);
\r
/**
 * Writes this language data: the language symbol as a UTF string, then the
 * row list, then the sorted index.
 *
 * @param raf file to write to
 * @throws IOException if writing to raf fails
 */
73 public void write(final RandomAccessFile raf) throws IOException {
\r
74 raf.writeUTF(language.symbol);
\r
// NOTE(review): the 4 is presumably the fixed size in bytes of one serialized
// Row (Row.write emits a single int) - confirm against UniformFileList.write.
75 UniformFileList.write(raf, rows, ROW_SERIALIZER, 4);
\r
76 FileList.write(raf, sortedIndex, INDEX_ENTRY_SERIALIZER);
\r
/**
 * Returns the display text for a row. For a token row this is the word of the
 * index entry at row.getIndex() in sortedIndex; otherwise it is the toString()
 * of the entry at row.getIndex() in the enclosing Dictionary's entries list.
 *
 * @param row the row to render
 * @return the word or the entry text for the row
 */
79 String rowToString(final Row row) {
\r
80 return row.isToken() ? sortedIndex.get(row.getIndex()).word : entries
\r
81 .get(row.getIndex()).toString();
\r
/**
 * Binary-searches sortedIndex for a word, comparing lower-cased words with
 * language.tokenComparator, and returns an index into sortedIndex.
 *
 * NOTE(review): several statements of this method (the declaration of start,
 * the bodies of the interrupted checks and of the comparison branches) are not
 * visible in this excerpt; the comments below describe only the visible lines.
 *
 * @param word        the word to look up; lower-cased before comparing
 * @param interrupted flag polled during the search so a caller can abort it
 * @return an index into sortedIndex; when no exact match ends the search
 *         early, the value is clamped to at most sortedIndex.size() - 1
 */
84 int lookup(String word, final AtomicBoolean interrupted) {
\r
// NOTE(review): toLowerCase() without a Locale uses the default locale, so
// results can differ between devices (e.g. Turkish dotless i) - consider
// passing an explicit Locale here and in the comparisons below.
85 word = word.toLowerCase();
\r
88 int end = sortedIndex.size();
\r
89 while (start < end) {
\r
// NOTE(review): (start + end) / 2 overflows int once start + end exceeds
// Integer.MAX_VALUE; (start + end) >>> 1 avoids that.
90 final int mid = (start + end) / 2;
\r
// Polled once per bisection step so a long search can be abandoned.
91 if (interrupted.get()) {
\r
94 final IndexEntry midEntry = sortedIndex.get(mid);
\r
96 final int comp = language.tokenComparator.compare(word, midEntry.word.toLowerCase());
\r
// Walks back over preceding entries that also compare equal to word, i.e.
// towards the first of a run of equal entries.
99 while (result > 0 && language.tokenComparator.compare(word, sortedIndex.get(result - 1).word.toLowerCase()) == 0) {
\r
101 if (interrupted.get()) {
\r
106 } else if (comp < 0) {
\r
// Clamp so the result never exceeds the last valid index.
// NOTE(review): with an empty sortedIndex, size() - 1 is -1, so this returns
// a negative value - confirm callers handle that.
112 return Math.min(sortedIndex.size() - 1, start);
\r
/**
 * Finds the token row associated with the row at rowIndex and caches the
 * answer in the tokenRow field of the rows it passed over.
 *
 * NOTE(review): the declarations of r and row, the scan loop header and the
 * return statement are not visible in this excerpt; presumably the scan moves
 * backwards from rowIndex and the method returns result - confirm.
 *
 * @param rowIndex index into rows
 * @return presumably the index of the token row for rowIndex - confirm
 */
115 public int getTokenRow(final int rowIndex) {
\r
119 row = rows.get(r);
\r
// The scan can stop at a row that is itself a token, or at one whose
// tokenRow has already been filled in (-1 marks "not yet known").
120 if (row.isToken() || row.tokenRow != -1) {
\r
125 final int result = row.isToken() ? r : row.tokenRow;
\r
// Record the answer on every row from the stopping point up to rowIndex so
// later calls for those rows can stop immediately.
126 for (; r <= rowIndex; ++r) {
\r
127 rows.get(r).tokenRow = result;
\r
129 assert rows.get(result).isToken();
\r
/**
 * One row of a language's row list. A row is serialized as a single int
 * (its index); it is either a token row or a row that refers to an entry.
 *
 * NOTE(review): the field declarations and the bodies of isToken() and
 * getIndex() are not visible in this excerpt. Other code in this file reads
 * and writes a tokenRow field on Row and treats -1 as "unset"; the visible
 * write() does not store it.
 */
134 public static final class Row implements RAFSerializable<Row> {
\r
139 public Row(final int index) {
\r
140 this.index = index;
\r
// Factory that reads a Row back from a file: one int, passed to the constructor.
143 static final RAFFactory<Row> RAF_FACTORY = new RAFFactory<Row>() {
\r
144 public Row create(RandomAccessFile raf) throws IOException {
\r
145 return new Row(raf.readInt());
\r
// Writes the raw index value as one int, the counterpart of RAF_FACTORY.create.
149 public void write(RandomAccessFile raf) throws IOException {
\r
150 raf.writeInt(index);
\r
// True when this row is a token row rather than an entry row (body not visible).
153 boolean isToken() {
\r
// Index used to look this row up in sortedIndex (token rows) or in entries
// (other rows); see the callers in this file. Body not visible.
157 public int getIndex() {
\r
/**
 * An entry of a language's sorted index: a word plus a row number.
 * Serialized as the word (UTF string) followed by startRow (int).
 *
 * NOTE(review): the declaration and assignment of the word field are not
 * visible in this excerpt.
 */
165 public static final class IndexEntry implements RAFSerializable<IndexEntry> {
\r
// NOTE(review): presumably the index in the row list of the first row for
// this word - confirm against the index builder.
167 final int startRow;
\r
169 public IndexEntry(final String word, final int startRow) {
\r
171 this.startRow = startRow;
\r
// Factory that reads an IndexEntry back from a file, in the same field order
// that write() uses: word first, then startRow.
174 static final RAFFactory<IndexEntry> RAF_FACTORY = new RAFFactory<IndexEntry>() {
\r
175 public IndexEntry create(RandomAccessFile raf) throws IOException {
\r
176 final String word = raf.readUTF();
\r
177 final int startRow = raf.readInt();
\r
178 return new IndexEntry(word, startRow);
\r
// Writes word then startRow; must stay in step with RAF_FACTORY.create.
182 public void write(final RandomAccessFile raf) throws IOException {
\r
183 raf.writeUTF(word);
\r
184 raf.writeInt(startRow);
\r
// Debug-friendly form: the word, an '@', then the start row.
188 public String toString() {
\r
189 return word + "@" + startRow;
\r