1 /* 2 * Copyright (C) 2012 The Android Open Source Project 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 */ 16 17 package com.android.inputmethod.latin; 18 19 import android.content.ContentResolver; 20 import android.content.Context; 21 import android.database.ContentObserver; 22 import android.database.Cursor; 23 import android.database.sqlite.SQLiteException; 24 import android.net.Uri; 25 import android.provider.UserDictionary.Words; 26 import android.text.TextUtils; 27 import android.util.Log; 28 29 import com.android.inputmethod.annotations.ExternallyReferenced; 30 import com.android.inputmethod.latin.utils.SubtypeLocaleUtils; 31 32 import java.io.File; 33 import java.util.Arrays; 34 import java.util.Locale; 35 36 import javax.annotation.Nullable; 37 38 /** 39 * An expandable dictionary that stores the words in the user dictionary provider into a binary 40 * dictionary file to use it from native code. 41 */ 42 public class UserBinaryDictionary extends ExpandableBinaryDictionary { 43 private static final String TAG = ExpandableBinaryDictionary.class.getSimpleName(); 44 45 // The user dictionary provider uses an empty string to mean "all languages". 46 private static final String USER_DICTIONARY_ALL_LANGUAGES = ""; 47 private static final int HISTORICAL_DEFAULT_USER_DICTIONARY_FREQUENCY = 250; 48 private static final int LATINIME_DEFAULT_USER_DICTIONARY_FREQUENCY = 160; 49 50 private static final String[] PROJECTION_QUERY = new String[] {Words.WORD, Words.FREQUENCY}; 51 52 private static final String NAME = "userunigram"; 53 54 private ContentObserver mObserver; 55 final private String mLocaleString; 56 final private boolean mAlsoUseMoreRestrictiveLocales; 57 58 protected UserBinaryDictionary(final Context context, final Locale locale, 59 final boolean alsoUseMoreRestrictiveLocales, 60 final File dictFile, final String name) { 61 super(context, getDictName(name, locale, dictFile), locale, Dictionary.TYPE_USER, dictFile); 62 if (null == locale) throw new NullPointerException(); // Catch the error earlier 63 final String localeStr = locale.toString(); 64 if (SubtypeLocaleUtils.NO_LANGUAGE.equals(localeStr)) { 65 // If we don't have a locale, insert into the "all locales" user dictionary. 66 mLocaleString = USER_DICTIONARY_ALL_LANGUAGES; 67 } else { 68 mLocaleString = localeStr; 69 } 70 mAlsoUseMoreRestrictiveLocales = alsoUseMoreRestrictiveLocales; 71 ContentResolver cres = context.getContentResolver(); 72 73 mObserver = new ContentObserver(null) { 74 @Override 75 public void onChange(final boolean self) { 76 // This hook is deprecated as of API level 16 (Build.VERSION_CODES.JELLY_BEAN), 77 // but should still be supported for cases where the IME is running on an older 78 // version of the platform. 79 onChange(self, null); 80 } 81 // The following hook is only available as of API level 16 82 // (Build.VERSION_CODES.JELLY_BEAN), and as such it will only work on JellyBean+ 83 // devices. On older versions of the platform, the hook above will be called instead. 84 @Override 85 public void onChange(final boolean self, final Uri uri) { 86 setNeedsToRecreate(); 87 } 88 }; 89 cres.registerContentObserver(Words.CONTENT_URI, true, mObserver); 90 reloadDictionaryIfRequired(); 91 } 92 93 // Note: This method is called by {@link DictionaryFacilitator} using Java reflection. 94 @ExternallyReferenced 95 public static UserBinaryDictionary getDictionary( 96 final Context context, final Locale locale, final File dictFile, 97 final String dictNamePrefix, @Nullable final String account) { 98 return new UserBinaryDictionary( 99 context, locale, false /* alsoUseMoreRestrictiveLocales */, 100 dictFile, dictNamePrefix + NAME); 101 } 102 103 @Override 104 public synchronized void close() { 105 if (mObserver != null) { 106 mContext.getContentResolver().unregisterContentObserver(mObserver); 107 mObserver = null; 108 } 109 super.close(); 110 } 111 112 @Override 113 public void loadInitialContentsLocked() { 114 // Split the locale. For example "en" => ["en"], "de_DE" => ["de", "DE"], 115 // "en_US_foo_bar_qux" => ["en", "US", "foo_bar_qux"] because of the limit of 3. 116 // This is correct for locale processing. 117 // For this example, we'll look at the "en_US_POSIX" case. 118 final String[] localeElements = 119 TextUtils.isEmpty(mLocaleString) ? new String[] {} : mLocaleString.split("_", 3); 120 final int length = localeElements.length; 121 122 final StringBuilder request = new StringBuilder("(locale is NULL)"); 123 String localeSoFar = ""; 124 // At start, localeElements = ["en", "US", "POSIX"] ; localeSoFar = "" ; 125 // and request = "(locale is NULL)" 126 for (int i = 0; i < length; ++i) { 127 // i | localeSoFar | localeElements 128 // 0 | "" | ["en", "US", "POSIX"] 129 // 1 | "en_" | ["en", "US", "POSIX"] 130 // 2 | "en_US_" | ["en", "en_US", "POSIX"] 131 localeElements[i] = localeSoFar + localeElements[i]; 132 localeSoFar = localeElements[i] + "_"; 133 // i | request 134 // 0 | "(locale is NULL)" 135 // 1 | "(locale is NULL) or (locale=?)" 136 // 2 | "(locale is NULL) or (locale=?) or (locale=?)" 137 request.append(" or (locale=?)"); 138 } 139 // At the end, localeElements = ["en", "en_US", "en_US_POSIX"]; localeSoFar = en_US_POSIX_" 140 // and request = "(locale is NULL) or (locale=?) or (locale=?) or (locale=?)" 141 142 final String[] requestArguments; 143 // If length == 3, we already have all the arguments we need (common prefix is meaningless 144 // inside variants 145 if (mAlsoUseMoreRestrictiveLocales && length < 3) { 146 request.append(" or (locale like ?)"); 147 // The following creates an array with one more (null) position 148 final String[] localeElementsWithMoreRestrictiveLocalesIncluded = 149 Arrays.copyOf(localeElements, length + 1); 150 localeElementsWithMoreRestrictiveLocalesIncluded[length] = 151 localeElements[length - 1] + "_%"; 152 requestArguments = localeElementsWithMoreRestrictiveLocalesIncluded; 153 // If for example localeElements = ["en"] 154 // then requestArguments = ["en", "en_%"] 155 // and request = (locale is NULL) or (locale=?) or (locale like ?) 156 // If localeElements = ["en", "en_US"] 157 // then requestArguments = ["en", "en_US", "en_US_%"] 158 } else { 159 requestArguments = localeElements; 160 } 161 final String requestString = request.toString(); 162 addWordsFromProjectionLocked(PROJECTION_QUERY, requestString, requestArguments); 163 } 164 165 private void addWordsFromProjectionLocked(final String[] query, String request, 166 final String[] requestArguments) 167 throws IllegalArgumentException { 168 Cursor cursor = null; 169 try { 170 cursor = mContext.getContentResolver().query( 171 Words.CONTENT_URI, query, request, requestArguments, null); 172 addWordsLocked(cursor); 173 } catch (final SQLiteException e) { 174 Log.e(TAG, "SQLiteException in the remote User dictionary process.", e); 175 } finally { 176 try { 177 if (null != cursor) cursor.close(); 178 } catch (final SQLiteException e) { 179 Log.e(TAG, "SQLiteException in the remote User dictionary process.", e); 180 } 181 } 182 } 183 184 private static int scaleFrequencyFromDefaultToLatinIme(final int defaultFrequency) { 185 // The default frequency for the user dictionary is 250 for historical reasons. 186 // Latin IME considers a good value for the default user dictionary frequency 187 // is about 160 considering the scale we use. So we are scaling down the values. 188 if (defaultFrequency > Integer.MAX_VALUE / LATINIME_DEFAULT_USER_DICTIONARY_FREQUENCY) { 189 return (defaultFrequency / HISTORICAL_DEFAULT_USER_DICTIONARY_FREQUENCY) 190 * LATINIME_DEFAULT_USER_DICTIONARY_FREQUENCY; 191 } 192 return (defaultFrequency * LATINIME_DEFAULT_USER_DICTIONARY_FREQUENCY) 193 / HISTORICAL_DEFAULT_USER_DICTIONARY_FREQUENCY; 194 } 195 196 private void addWordsLocked(final Cursor cursor) { 197 if (cursor == null) return; 198 if (cursor.moveToFirst()) { 199 final int indexWord = cursor.getColumnIndex(Words.WORD); 200 final int indexFrequency = cursor.getColumnIndex(Words.FREQUENCY); 201 while (!cursor.isAfterLast()) { 202 final String word = cursor.getString(indexWord); 203 final int frequency = cursor.getInt(indexFrequency); 204 final int adjustedFrequency = scaleFrequencyFromDefaultToLatinIme(frequency); 205 // Safeguard against adding really long words. 206 if (word.length() <= MAX_WORD_LENGTH) { 207 runGCIfRequiredLocked(true /* mindsBlockByGC */); 208 addUnigramLocked(word, adjustedFrequency, false /* isNotAWord */, 209 false /* isPossiblyOffensive */, 210 BinaryDictionary.NOT_A_VALID_TIMESTAMP); 211 } 212 cursor.moveToNext(); 213 } 214 } 215 } 216 } 217