1 /*
2  * Copyright (C) 2013 The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *      http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 package com.android.inputmethod.latin.makedict;
18 
19 import com.android.inputmethod.annotations.UsedForTesting;
20 import com.android.inputmethod.latin.BinaryDictionary;
21 import com.android.inputmethod.latin.common.FileUtils;
22 
23 import java.io.File;
24 import java.io.FileNotFoundException;
25 import java.io.IOException;
26 import java.util.ArrayList;
27 
28 /**
29  * An implementation of binary dictionary decoder for version 4 binary dictionary.
30  */
31 @UsedForTesting
32 public class Ver4DictDecoder extends AbstractDictDecoder {
33     final File mDictDirectory;
34 
35     @UsedForTesting
Ver4DictDecoder(final File dictDirectory)36     /* package */ Ver4DictDecoder(final File dictDirectory) {
37         mDictDirectory = dictDirectory;
38 
39     }
40 
41     @Override
readHeader()42     public DictionaryHeader readHeader() throws IOException, UnsupportedFormatException {
43         // dictType is not being used in dicttool. Passing an empty string.
44         final BinaryDictionary binaryDictionary= new BinaryDictionary(
45               mDictDirectory.getAbsolutePath(), 0 /* offset */, 0 /* length */,
46               true /* useFullEditDistance */, null /* locale */,
47               "" /* dictType */, true /* isUpdatable */);
48         final DictionaryHeader header = binaryDictionary.getHeader();
49         binaryDictionary.close();
50         if (header == null) {
51             throw new IOException("Cannot read the dictionary header.");
52         }
53         return header;
54     }
55 
56     @Override
readDictionaryBinary(final boolean deleteDictIfBroken)57     public FusionDictionary readDictionaryBinary(final boolean deleteDictIfBroken)
58             throws FileNotFoundException, IOException, UnsupportedFormatException {
59         // dictType is not being used in dicttool. Passing an empty string.
60         final BinaryDictionary binaryDictionary = new BinaryDictionary(
61               mDictDirectory.getAbsolutePath(), 0 /* offset */, 0 /* length */,
62               true /* useFullEditDistance */, null /* locale */,
63               "" /* dictType */, true /* isUpdatable */);
64         final DictionaryHeader header = readHeader();
65         final FusionDictionary fusionDict =
66                 new FusionDictionary(new FusionDictionary.PtNodeArray(), header.mDictionaryOptions);
67         int token = 0;
68         final ArrayList<WordProperty> wordProperties = new ArrayList<>();
69         do {
70             final BinaryDictionary.GetNextWordPropertyResult result =
71                     binaryDictionary.getNextWordProperty(token);
72             final WordProperty wordProperty = result.mWordProperty;
73             if (wordProperty == null) {
74                 binaryDictionary.close();
75                 if (deleteDictIfBroken) {
76                     FileUtils.deleteRecursively(mDictDirectory);
77                 }
78                 return null;
79             }
80             wordProperties.add(wordProperty);
81             token = result.mNextToken;
82         } while (token != 0);
83 
84         // Insert unigrams into the fusion dictionary.
85         for (final WordProperty wordProperty : wordProperties) {
86             fusionDict.add(wordProperty.mWord, wordProperty.mProbabilityInfo,
87                     wordProperty.mIsNotAWord,
88                     wordProperty.mIsPossiblyOffensive);
89         }
90         // Insert bigrams into the fusion dictionary.
91         // TODO: Support ngrams.
92         for (final WordProperty wordProperty : wordProperties) {
93             if (!wordProperty.mHasNgrams) {
94                 continue;
95             }
96             final String word0 = wordProperty.mWord;
97             for (final WeightedString bigram : wordProperty.getBigrams()) {
98                 fusionDict.setBigram(word0, bigram.mWord, bigram.mProbabilityInfo);
99             }
100         }
101         binaryDictionary.close();
102         return fusionDict;
103     }
104 }
105