1 /* 2 * Copyright (C) 2011 The Android Open Source Project 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 */ 16 17 package com.android.inputmethod.latin; 18 19 import android.content.Context; 20 import android.content.SharedPreferences; 21 import android.content.res.AssetFileDescriptor; 22 import android.util.Log; 23 24 import com.android.inputmethod.latin.common.LocaleUtils; 25 import com.android.inputmethod.latin.define.DecoderSpecificConstants; 26 import com.android.inputmethod.latin.makedict.DictionaryHeader; 27 import com.android.inputmethod.latin.makedict.UnsupportedFormatException; 28 import com.android.inputmethod.latin.utils.BinaryDictionaryUtils; 29 import com.android.inputmethod.latin.utils.DictionaryInfoUtils; 30 31 import java.io.File; 32 import java.io.IOException; 33 import java.nio.BufferUnderflowException; 34 import java.util.ArrayList; 35 import java.util.HashMap; 36 import java.util.Locale; 37 38 /** 39 * Helper class to get the address of a mmap'able dictionary file. 40 */ 41 final public class BinaryDictionaryGetter { 42 43 /** 44 * Used for Log actions from this class 45 */ 46 private static final String TAG = BinaryDictionaryGetter.class.getSimpleName(); 47 48 /** 49 * Used to return empty lists 50 */ 51 private static final File[] EMPTY_FILE_ARRAY = new File[0]; 52 53 /** 54 * Name of the common preferences name to know which word list are on and which are off. 55 */ 56 private static final String COMMON_PREFERENCES_NAME = "LatinImeDictPrefs"; 57 58 private static final boolean SHOULD_USE_DICT_VERSION = 59 DecoderSpecificConstants.SHOULD_USE_DICT_VERSION; 60 61 // Name of the category for the main dictionary 62 public static final String MAIN_DICTIONARY_CATEGORY = "main"; 63 public static final String ID_CATEGORY_SEPARATOR = ":"; 64 65 // The key considered to read the version attribute in a dictionary file. 66 private static String VERSION_KEY = "version"; 67 68 // Prevents this from being instantiated BinaryDictionaryGetter()69 private BinaryDictionaryGetter() {} 70 71 /** 72 * Generates a unique temporary file name in the app cache directory. 73 */ getTempFileName(final String id, final Context context)74 public static String getTempFileName(final String id, final Context context) 75 throws IOException { 76 final String safeId = DictionaryInfoUtils.replaceFileNameDangerousCharacters(id); 77 final File directory = new File(DictionaryInfoUtils.getWordListTempDirectory(context)); 78 if (!directory.exists()) { 79 if (!directory.mkdirs()) { 80 Log.e(TAG, "Could not create the temporary directory"); 81 } 82 } 83 // If the first argument is less than three chars, createTempFile throws a 84 // RuntimeException. We don't really care about what name we get, so just 85 // put a three-chars prefix makes us safe. 86 return File.createTempFile("xxx" + safeId, null, directory).getAbsolutePath(); 87 } 88 89 /** 90 * Returns a file address from a resource, or null if it cannot be opened. 91 */ loadFallbackResource(final Context context, final int fallbackResId)92 public static AssetFileAddress loadFallbackResource(final Context context, 93 final int fallbackResId) { 94 AssetFileDescriptor afd = null; 95 try { 96 afd = context.getResources().openRawResourceFd(fallbackResId); 97 } catch (RuntimeException e) { 98 Log.e(TAG, "Resource not found: " + fallbackResId); 99 return null; 100 } 101 if (afd == null) { 102 Log.e(TAG, "Resource cannot be opened: " + fallbackResId); 103 return null; 104 } 105 try { 106 return AssetFileAddress.makeFromFileNameAndOffset( 107 context.getApplicationInfo().sourceDir, afd.getStartOffset(), afd.getLength()); 108 } finally { 109 try { 110 afd.close(); 111 } catch (IOException ignored) { 112 } 113 } 114 } 115 116 private static final class DictPackSettings { 117 final SharedPreferences mDictPreferences; DictPackSettings(final Context context)118 public DictPackSettings(final Context context) { 119 mDictPreferences = null == context ? null 120 : context.getSharedPreferences(COMMON_PREFERENCES_NAME, 121 Context.MODE_MULTI_PROCESS); 122 } isWordListActive(final String dictId)123 public boolean isWordListActive(final String dictId) { 124 if (null == mDictPreferences) { 125 // If we don't have preferences it basically means we can't find the dictionary 126 // pack - either it's not installed, or it's disabled, or there is some strange 127 // bug. Either way, a word list with no settings should be on by default: default 128 // dictionaries in LatinIME are on if there is no settings at all, and if for some 129 // reason some dictionaries have been installed BUT the dictionary pack can't be 130 // found anymore it's safer to actually supply installed dictionaries. 131 return true; 132 } 133 // The default is true here for the same reasons as above. We got the dictionary 134 // pack but if we don't have any settings for it it means the user has never been 135 // to the settings yet. So by default, the main dictionaries should be on. 136 return mDictPreferences.getBoolean(dictId, true); 137 } 138 } 139 140 /** 141 * Utility class for the {@link #getCachedWordLists} method 142 */ 143 private static final class FileAndMatchLevel { 144 final File mFile; 145 final int mMatchLevel; FileAndMatchLevel(final File file, final int matchLevel)146 public FileAndMatchLevel(final File file, final int matchLevel) { 147 mFile = file; 148 mMatchLevel = matchLevel; 149 } 150 } 151 152 /** 153 * Returns the list of cached files for a specific locale, one for each category. 154 * 155 * This will return exactly one file for each word list category that matches 156 * the passed locale. If several files match the locale for any given category, 157 * this returns the file with the closest match to the locale. For example, if 158 * the passed word list is en_US, and for a category we have an en and an en_US 159 * word list available, we'll return only the en_US one. 160 * Thus, the list will contain as many files as there are categories. 161 * 162 * @param locale the locale to find the dictionary files for, as a string. 163 * @param context the context on which to open the files upon. 164 * @return an array of binary dictionary files, which may be empty but may not be null. 165 */ getCachedWordLists(final String locale, final Context context)166 public static File[] getCachedWordLists(final String locale, final Context context) { 167 final File[] directoryList = DictionaryInfoUtils.getCachedDirectoryList(context); 168 if (null == directoryList) return EMPTY_FILE_ARRAY; 169 final HashMap<String, FileAndMatchLevel> cacheFiles = new HashMap<>(); 170 for (File directory : directoryList) { 171 if (!directory.isDirectory()) continue; 172 final String dirLocale = 173 DictionaryInfoUtils.getWordListIdFromFileName(directory.getName()); 174 final int matchLevel = LocaleUtils.getMatchLevel(dirLocale, locale); 175 if (LocaleUtils.isMatch(matchLevel)) { 176 final File[] wordLists = directory.listFiles(); 177 if (null != wordLists) { 178 for (File wordList : wordLists) { 179 final String category = 180 DictionaryInfoUtils.getCategoryFromFileName(wordList.getName()); 181 final FileAndMatchLevel currentBestMatch = cacheFiles.get(category); 182 if (null == currentBestMatch || currentBestMatch.mMatchLevel < matchLevel) { 183 cacheFiles.put(category, new FileAndMatchLevel(wordList, matchLevel)); 184 } 185 } 186 } 187 } 188 } 189 if (cacheFiles.isEmpty()) return EMPTY_FILE_ARRAY; 190 final File[] result = new File[cacheFiles.size()]; 191 int index = 0; 192 for (final FileAndMatchLevel entry : cacheFiles.values()) { 193 result[index++] = entry.mFile; 194 } 195 return result; 196 } 197 198 // ## HACK ## we prevent usage of a dictionary before version 18. The reason for this is, since 199 // those do not include allowlist entries, the new code with an old version of the dictionary 200 // would lose allowlist functionality. hackCanUseDictionaryFile(final File file)201 private static boolean hackCanUseDictionaryFile(final File file) { 202 if (!SHOULD_USE_DICT_VERSION) { 203 return true; 204 } 205 206 try { 207 // Read the version of the file 208 final DictionaryHeader header = BinaryDictionaryUtils.getHeader(file); 209 final String version = header.mDictionaryOptions.mAttributes.get(VERSION_KEY); 210 if (null == version) { 211 // No version in the options : the format is unexpected 212 return false; 213 } 214 // Version 18 is the first one to include the allowlist. 215 // Obviously this is a big ## HACK ## 216 return Integer.parseInt(version) >= 18; 217 } catch (java.io.FileNotFoundException e) { 218 return false; 219 } catch (java.io.IOException e) { 220 return false; 221 } catch (NumberFormatException e) { 222 return false; 223 } catch (BufferUnderflowException e) { 224 return false; 225 } catch (UnsupportedFormatException e) { 226 return false; 227 } 228 } 229 230 /** 231 * Returns a list of file addresses for a given locale, trying relevant methods in order. 232 * 233 * Tries to get binary dictionaries from various sources, in order: 234 * - Uses a content provider to get a public dictionary set, as per the protocol described 235 * in BinaryDictionaryFileDumper. 236 * If that fails: 237 * - Gets a file name from the built-in dictionary for this locale, if any. 238 * If that fails: 239 * - Returns null. 240 * @return The list of addresses of valid dictionary files, or null. 241 */ getDictionaryFiles(final Locale locale, final Context context, boolean notifyDictionaryPackForUpdates)242 public static ArrayList<AssetFileAddress> getDictionaryFiles(final Locale locale, 243 final Context context, boolean notifyDictionaryPackForUpdates) { 244 if (notifyDictionaryPackForUpdates) { 245 final boolean hasDefaultWordList = DictionaryInfoUtils.isDictionaryAvailable( 246 context, locale); 247 // It makes sure that the first time keyboard comes up and the dictionaries are reset, 248 // the DB is populated with the appropriate values for each locale. Helps in downloading 249 // the dictionaries when the user enables and switches new languages before the 250 // DictionaryService runs. 251 BinaryDictionaryFileDumper.downloadDictIfNeverRequested( 252 locale, context, hasDefaultWordList); 253 254 // Move a staging files to the cache ddirectories if any. 255 DictionaryInfoUtils.moveStagingFilesIfExists(context); 256 } 257 final File[] cachedWordLists = getCachedWordLists(locale.toString(), context); 258 final String mainDictId = DictionaryInfoUtils.getMainDictId(locale); 259 final DictPackSettings dictPackSettings = new DictPackSettings(context); 260 261 boolean foundMainDict = false; 262 final ArrayList<AssetFileAddress> fileList = new ArrayList<>(); 263 // cachedWordLists may not be null, see doc for getCachedDictionaryList 264 for (final File f : cachedWordLists) { 265 final String wordListId = DictionaryInfoUtils.getWordListIdFromFileName(f.getName()); 266 final boolean canUse = f.canRead() && hackCanUseDictionaryFile(f); 267 if (canUse && DictionaryInfoUtils.isMainWordListId(wordListId)) { 268 foundMainDict = true; 269 } 270 if (!dictPackSettings.isWordListActive(wordListId)) continue; 271 if (canUse) { 272 final AssetFileAddress afa = AssetFileAddress.makeFromFileName(f.getPath()); 273 if (null != afa) fileList.add(afa); 274 } else { 275 Log.e(TAG, "Found a cached dictionary file for " + locale.toString() 276 + " but cannot read or use it"); 277 } 278 } 279 280 if (!foundMainDict && dictPackSettings.isWordListActive(mainDictId)) { 281 final int fallbackResId = 282 DictionaryInfoUtils.getMainDictionaryResourceId(context.getResources(), locale); 283 final AssetFileAddress fallbackAsset = loadFallbackResource(context, fallbackResId); 284 if (null != fallbackAsset) { 285 fileList.add(fallbackAsset); 286 } 287 } 288 289 return fileList; 290 } 291 } 292