Home | History | Annotate | Download | only in latin
      1 /*
      2  * Copyright (C) 2011 The Android Open Source Project
      3  *
      4  * Licensed under the Apache License, Version 2.0 (the "License");
      5  * you may not use this file except in compliance with the License.
      6  * You may obtain a copy of the License at
      7  *
      8  *      http://www.apache.org/licenses/LICENSE-2.0
      9  *
     10  * Unless required by applicable law or agreed to in writing, software
     11  * distributed under the License is distributed on an "AS IS" BASIS,
     12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
     13  * See the License for the specific language governing permissions and
     14  * limitations under the License.
     15  */
     16 
     17 package com.android.inputmethod.latin;
     18 
     19 import android.content.ContentProviderClient;
     20 import android.content.ContentResolver;
     21 import android.content.ContentValues;
     22 import android.content.Context;
     23 import android.content.res.AssetFileDescriptor;
     24 import android.database.Cursor;
     25 import android.net.Uri;
     26 import android.os.RemoteException;
     27 import android.text.TextUtils;
     28 import android.util.Log;
     29 
     30 import com.android.inputmethod.dictionarypack.DictionaryPackConstants;
     31 import com.android.inputmethod.latin.utils.CollectionUtils;
     32 import com.android.inputmethod.latin.utils.DictionaryInfoUtils;
     33 import com.android.inputmethod.latin.utils.DictionaryInfoUtils.DictionaryInfo;
     34 import com.android.inputmethod.latin.utils.FileTransforms;
     35 import com.android.inputmethod.latin.utils.MetadataFileUriGetter;
     36 
     37 import java.io.BufferedInputStream;
     38 import java.io.BufferedOutputStream;
     39 import java.io.Closeable;
     40 import java.io.File;
     41 import java.io.FileNotFoundException;
     42 import java.io.FileOutputStream;
     43 import java.io.IOException;
     44 import java.io.InputStream;
     45 import java.util.Arrays;
     46 import java.util.ArrayList;
     47 import java.util.Collections;
     48 import java.util.List;
     49 import java.util.Locale;
     50 
     51 /**
     52  * Group class for static methods to help with creation and getting of the binary dictionary
     53  * file from the dictionary provider
     54  */
     55 public final class BinaryDictionaryFileDumper {
     56     private static final String TAG = BinaryDictionaryFileDumper.class.getSimpleName();
     57     private static final boolean DEBUG = false;
     58 
     59     /**
     60      * The size of the temporary buffer to copy files.
     61      */
     62     private static final int FILE_READ_BUFFER_SIZE = 8192;
     63     // TODO: make the following data common with the native code
     64     private static final byte[] MAGIC_NUMBER_VERSION_1 =
     65             new byte[] { (byte)0x78, (byte)0xB1, (byte)0x00, (byte)0x00 };
     66     private static final byte[] MAGIC_NUMBER_VERSION_2 =
     67             new byte[] { (byte)0x9B, (byte)0xC1, (byte)0x3A, (byte)0xFE };
     68 
     69     private static final String DICTIONARY_PROJECTION[] = { "id" };
     70 
     71     private static final String QUERY_PARAMETER_MAY_PROMPT_USER = "mayPrompt";
     72     private static final String QUERY_PARAMETER_TRUE = "true";
     73     private static final String QUERY_PARAMETER_DELETE_RESULT = "result";
     74     private static final String QUERY_PARAMETER_SUCCESS = "success";
     75     private static final String QUERY_PARAMETER_FAILURE = "failure";
     76 
     77     // Using protocol version 2 to communicate with the dictionary pack
     78     private static final String QUERY_PARAMETER_PROTOCOL = "protocol";
     79     private static final String QUERY_PARAMETER_PROTOCOL_VALUE = "2";
     80 
     81     // The path fragment to append after the client ID for dictionary info requests.
     82     private static final String QUERY_PATH_DICT_INFO = "dict";
     83     // The path fragment to append after the client ID for dictionary datafile requests.
     84     private static final String QUERY_PATH_DATAFILE = "datafile";
     85     // The path fragment to append after the client ID for updating the metadata URI.
     86     private static final String QUERY_PATH_METADATA = "metadata";
     87     private static final String INSERT_METADATA_CLIENT_ID_COLUMN = "clientid";
     88     private static final String INSERT_METADATA_METADATA_URI_COLUMN = "uri";
     89     private static final String INSERT_METADATA_METADATA_ADDITIONAL_ID_COLUMN = "additionalid";
     90 
     91     // Prevents this class to be accidentally instantiated.
     92     private BinaryDictionaryFileDumper() {
     93     }
     94 
     95     /**
     96      * Returns a URI builder pointing to the dictionary pack.
     97      *
     98      * This creates a URI builder able to build a URI pointing to the dictionary
     99      * pack content provider for a specific dictionary id.
    100      */
    101     private static Uri.Builder getProviderUriBuilder(final String path) {
    102         return new Uri.Builder().scheme(ContentResolver.SCHEME_CONTENT)
    103                 .authority(DictionaryPackConstants.AUTHORITY).appendPath(path);
    104     }
    105 
    106     /**
    107      * Gets the content URI builder for a specified type.
    108      *
    109      * Supported types include QUERY_PATH_DICT_INFO, which takes the locale as
    110      * the extraPath argument, and QUERY_PATH_DATAFILE, which needs a wordlist ID
    111      * as the extraPath argument.
    112      *
    113      * @param clientId the clientId to use
    114      * @param contentProviderClient the instance of content provider client
    115      * @param queryPathType the path element encoding the type
    116      * @param extraPath optional extra argument for this type (typically word list id)
    117      * @return a builder that can build the URI for the best supported protocol version
    118      * @throws RemoteException if the client can't be contacted
    119      */
    120     private static Uri.Builder getContentUriBuilderForType(final String clientId,
    121             final ContentProviderClient contentProviderClient, final String queryPathType,
    122             final String extraPath) throws RemoteException {
    123         // Check whether protocol v2 is supported by building a v2 URI and calling getType()
    124         // on it. If this returns null, v2 is not supported.
    125         final Uri.Builder uriV2Builder = getProviderUriBuilder(clientId);
    126         uriV2Builder.appendPath(queryPathType);
    127         uriV2Builder.appendPath(extraPath);
    128         uriV2Builder.appendQueryParameter(QUERY_PARAMETER_PROTOCOL,
    129                 QUERY_PARAMETER_PROTOCOL_VALUE);
    130         if (null != contentProviderClient.getType(uriV2Builder.build())) return uriV2Builder;
    131         // Protocol v2 is not supported, so create and return the protocol v1 uri.
    132         return getProviderUriBuilder(extraPath);
    133     }
    134 
    135     /**
    136      * Queries a content provider for the list of word lists for a specific locale
    137      * available to copy into Latin IME.
    138      */
    139     private static List<WordListInfo> getWordListWordListInfos(final Locale locale,
    140             final Context context, final boolean hasDefaultWordList) {
    141         final String clientId = context.getString(R.string.dictionary_pack_client_id);
    142         final ContentProviderClient client = context.getContentResolver().
    143                 acquireContentProviderClient(getProviderUriBuilder("").build());
    144         if (null == client) return Collections.<WordListInfo>emptyList();
    145 
    146         try {
    147             final Uri.Builder builder = getContentUriBuilderForType(clientId, client,
    148                     QUERY_PATH_DICT_INFO, locale.toString());
    149             if (!hasDefaultWordList) {
    150                 builder.appendQueryParameter(QUERY_PARAMETER_MAY_PROMPT_USER,
    151                         QUERY_PARAMETER_TRUE);
    152             }
    153             final Uri queryUri = builder.build();
    154             final boolean isProtocolV2 = (QUERY_PARAMETER_PROTOCOL_VALUE.equals(
    155                     queryUri.getQueryParameter(QUERY_PARAMETER_PROTOCOL)));
    156 
    157             Cursor c = client.query(queryUri, DICTIONARY_PROJECTION, null, null, null);
    158             if (isProtocolV2 && null == c) {
    159                 reinitializeClientRecordInDictionaryContentProvider(context, client, clientId);
    160                 c = client.query(queryUri, DICTIONARY_PROJECTION, null, null, null);
    161             }
    162             if (null == c) return Collections.<WordListInfo>emptyList();
    163             if (c.getCount() <= 0 || !c.moveToFirst()) {
    164                 c.close();
    165                 return Collections.<WordListInfo>emptyList();
    166             }
    167             final ArrayList<WordListInfo> list = CollectionUtils.newArrayList();
    168             do {
    169                 final String wordListId = c.getString(0);
    170                 final String wordListLocale = c.getString(1);
    171                 if (TextUtils.isEmpty(wordListId)) continue;
    172                 list.add(new WordListInfo(wordListId, wordListLocale));
    173             } while (c.moveToNext());
    174             c.close();
    175             return list;
    176         } catch (RemoteException e) {
    177             // The documentation is unclear as to in which cases this may happen, but it probably
    178             // happens when the content provider got suddenly killed because it crashed or because
    179             // the user disabled it through Settings.
    180             Log.e(TAG, "RemoteException: communication with the dictionary pack cut", e);
    181             return Collections.<WordListInfo>emptyList();
    182         } catch (Exception e) {
    183             // A crash here is dangerous because crashing here would brick any encrypted device -
    184             // we need the keyboard to be up and working to enter the password, so we don't want
    185             // to die no matter what. So let's be as safe as possible.
    186             Log.e(TAG, "Unexpected exception communicating with the dictionary pack", e);
    187             return Collections.<WordListInfo>emptyList();
    188         } finally {
    189             client.release();
    190         }
    191     }
    192 
    193 
    194     /**
    195      * Helper method to encapsulate exception handling.
    196      */
    197     private static AssetFileDescriptor openAssetFileDescriptor(
    198             final ContentProviderClient providerClient, final Uri uri) {
    199         try {
    200             return providerClient.openAssetFile(uri, "r");
    201         } catch (FileNotFoundException e) {
    202             // I don't want to log the word list URI here for security concerns. The exception
    203             // contains the name of the file, so let's not pass it to Log.e here.
    204             Log.e(TAG, "Could not find a word list from the dictionary provider."
    205                     /* intentionally don't pass the exception (see comment above) */);
    206             return null;
    207         } catch (RemoteException e) {
    208             Log.e(TAG, "Can't communicate with the dictionary pack", e);
    209             return null;
    210         }
    211     }
    212 
    213     /**
    214      * Caches a word list the id of which is passed as an argument. This will write the file
    215      * to the cache file name designated by its id and locale, overwriting it if already present
    216      * and creating it (and its containing directory) if necessary.
    217      */
    218     private static void cacheWordList(final String wordlistId, final String locale,
    219             final ContentProviderClient providerClient, final Context context) {
    220         final int COMPRESSED_CRYPTED_COMPRESSED = 0;
    221         final int CRYPTED_COMPRESSED = 1;
    222         final int COMPRESSED_CRYPTED = 2;
    223         final int COMPRESSED_ONLY = 3;
    224         final int CRYPTED_ONLY = 4;
    225         final int NONE = 5;
    226         final int MODE_MIN = COMPRESSED_CRYPTED_COMPRESSED;
    227         final int MODE_MAX = NONE;
    228 
    229         final String clientId = context.getString(R.string.dictionary_pack_client_id);
    230         final Uri.Builder wordListUriBuilder;
    231         try {
    232             wordListUriBuilder = getContentUriBuilderForType(clientId,
    233                     providerClient, QUERY_PATH_DATAFILE, wordlistId /* extraPath */);
    234         } catch (RemoteException e) {
    235             Log.e(TAG, "Can't communicate with the dictionary pack", e);
    236             return;
    237         }
    238         final String finalFileName =
    239                 DictionaryInfoUtils.getCacheFileName(wordlistId, locale, context);
    240         String tempFileName;
    241         try {
    242             tempFileName = BinaryDictionaryGetter.getTempFileName(wordlistId, context);
    243         } catch (IOException e) {
    244             Log.e(TAG, "Can't open the temporary file", e);
    245             return;
    246         }
    247 
    248         for (int mode = MODE_MIN; mode <= MODE_MAX; ++mode) {
    249             final InputStream originalSourceStream;
    250             InputStream inputStream = null;
    251             InputStream uncompressedStream = null;
    252             InputStream decryptedStream = null;
    253             BufferedInputStream bufferedInputStream = null;
    254             File outputFile = null;
    255             BufferedOutputStream bufferedOutputStream = null;
    256             AssetFileDescriptor afd = null;
    257             final Uri wordListUri = wordListUriBuilder.build();
    258             try {
    259                 // Open input.
    260                 afd = openAssetFileDescriptor(providerClient, wordListUri);
    261                 // If we can't open it at all, don't even try a number of times.
    262                 if (null == afd) return;
    263                 originalSourceStream = afd.createInputStream();
    264                 // Open output.
    265                 outputFile = new File(tempFileName);
    266                 // Just to be sure, delete the file. This may fail silently, and return false: this
    267                 // is the right thing to do, as we just want to continue anyway.
    268                 outputFile.delete();
    269                 // Get the appropriate decryption method for this try
    270                 switch (mode) {
    271                     case COMPRESSED_CRYPTED_COMPRESSED:
    272                         uncompressedStream =
    273                                 FileTransforms.getUncompressedStream(originalSourceStream);
    274                         decryptedStream = FileTransforms.getDecryptedStream(uncompressedStream);
    275                         inputStream = FileTransforms.getUncompressedStream(decryptedStream);
    276                         break;
    277                     case CRYPTED_COMPRESSED:
    278                         decryptedStream = FileTransforms.getDecryptedStream(originalSourceStream);
    279                         inputStream = FileTransforms.getUncompressedStream(decryptedStream);
    280                         break;
    281                     case COMPRESSED_CRYPTED:
    282                         uncompressedStream =
    283                                 FileTransforms.getUncompressedStream(originalSourceStream);
    284                         inputStream = FileTransforms.getDecryptedStream(uncompressedStream);
    285                         break;
    286                     case COMPRESSED_ONLY:
    287                         inputStream = FileTransforms.getUncompressedStream(originalSourceStream);
    288                         break;
    289                     case CRYPTED_ONLY:
    290                         inputStream = FileTransforms.getDecryptedStream(originalSourceStream);
    291                         break;
    292                     case NONE:
    293                         inputStream = originalSourceStream;
    294                         break;
    295                 }
    296                 bufferedInputStream = new BufferedInputStream(inputStream);
    297                 bufferedOutputStream = new BufferedOutputStream(new FileOutputStream(outputFile));
    298                 checkMagicAndCopyFileTo(bufferedInputStream, bufferedOutputStream);
    299                 bufferedOutputStream.flush();
    300                 bufferedOutputStream.close();
    301                 final File finalFile = new File(finalFileName);
    302                 finalFile.delete();
    303                 if (!outputFile.renameTo(finalFile)) {
    304                     throw new IOException("Can't move the file to its final name");
    305                 }
    306                 wordListUriBuilder.appendQueryParameter(QUERY_PARAMETER_DELETE_RESULT,
    307                         QUERY_PARAMETER_SUCCESS);
    308                 if (0 >= providerClient.delete(wordListUriBuilder.build(), null, null)) {
    309                     Log.e(TAG, "Could not have the dictionary pack delete a word list");
    310                 }
    311                 BinaryDictionaryGetter.removeFilesWithIdExcept(context, wordlistId, finalFile);
    312                 Log.e(TAG, "Successfully copied file for wordlist ID " + wordlistId);
    313                 // Success! Close files (through the finally{} clause) and return.
    314                 return;
    315             } catch (Exception e) {
    316                 if (DEBUG) {
    317                     Log.i(TAG, "Can't open word list in mode " + mode, e);
    318                 }
    319                 if (null != outputFile) {
    320                     // This may or may not fail. The file may not have been created if the
    321                     // exception was thrown before it could be. Hence, both failure and
    322                     // success are expected outcomes, so we don't check the return value.
    323                     outputFile.delete();
    324                 }
    325                 // Try the next method.
    326             } finally {
    327                 // Ignore exceptions while closing files.
    328                 closeAssetFileDescriptorAndReportAnyException(afd);
    329                 closeCloseableAndReportAnyException(inputStream);
    330                 closeCloseableAndReportAnyException(uncompressedStream);
    331                 closeCloseableAndReportAnyException(decryptedStream);
    332                 closeCloseableAndReportAnyException(bufferedInputStream);
    333                 closeCloseableAndReportAnyException(bufferedOutputStream);
    334             }
    335         }
    336 
    337         // We could not copy the file at all. This is very unexpected.
    338         // I'd rather not print the word list ID to the log out of security concerns
    339         Log.e(TAG, "Could not copy a word list. Will not be able to use it.");
    340         // If we can't copy it we should warn the dictionary provider so that it can mark it
    341         // as invalid.
    342         wordListUriBuilder.appendQueryParameter(QUERY_PARAMETER_DELETE_RESULT,
    343                 QUERY_PARAMETER_FAILURE);
    344         try {
    345             if (0 >= providerClient.delete(wordListUriBuilder.build(), null, null)) {
    346                 Log.e(TAG, "In addition, we were unable to delete it.");
    347             }
    348         } catch (RemoteException e) {
    349             Log.e(TAG, "In addition, communication with the dictionary provider was cut", e);
    350         }
    351     }
    352 
    353     // Ideally the two following methods should be merged, but AssetFileDescriptor does not
    354     // implement Closeable although it does implement #close(), and Java does not have
    355     // structural typing.
    356     private static void closeAssetFileDescriptorAndReportAnyException(
    357             final AssetFileDescriptor file) {
    358         try {
    359             if (null != file) file.close();
    360         } catch (Exception e) {
    361             Log.e(TAG, "Exception while closing a file", e);
    362         }
    363     }
    364 
    365     private static void closeCloseableAndReportAnyException(final Closeable file) {
    366         try {
    367             if (null != file) file.close();
    368         } catch (Exception e) {
    369             Log.e(TAG, "Exception while closing a file", e);
    370         }
    371     }
    372 
    373     /**
    374      * Queries a content provider for word list data for some locale and cache the returned files
    375      *
    376      * This will query a content provider for word list data for a given locale, and copy the
    377      * files locally so that they can be mmap'ed. This may overwrite previously cached word lists
    378      * with newer versions if a newer version is made available by the content provider.
    379      * @throw FileNotFoundException if the provider returns non-existent data.
    380      * @throw IOException if the provider-returned data could not be read.
    381      */
    382     public static void cacheWordListsFromContentProvider(final Locale locale,
    383             final Context context, final boolean hasDefaultWordList) {
    384         final ContentProviderClient providerClient;
    385         try {
    386             providerClient = context.getContentResolver().
    387                 acquireContentProviderClient(getProviderUriBuilder("").build());
    388         } catch (final SecurityException e) {
    389             Log.e(TAG, "No permission to communicate with the dictionary provider", e);
    390             return;
    391         }
    392         if (null == providerClient) {
    393             Log.e(TAG, "Can't establish communication with the dictionary provider");
    394             return;
    395         }
    396         try {
    397             final List<WordListInfo> idList = getWordListWordListInfos(locale, context,
    398                     hasDefaultWordList);
    399             for (WordListInfo id : idList) {
    400                 cacheWordList(id.mId, id.mLocale, providerClient, context);
    401             }
    402         } finally {
    403             providerClient.release();
    404         }
    405     }
    406 
    407     /**
    408      * Copies the data in an input stream to a target file if the magic number matches.
    409      *
    410      * If the magic number does not match the expected value, this method throws an
    411      * IOException. Other usual conditions for IOException or FileNotFoundException
    412      * also apply.
    413      *
    414      * @param input the stream to be copied.
    415      * @param output an output stream to copy the data to.
    416      */
    417     public static void checkMagicAndCopyFileTo(final BufferedInputStream input,
    418             final BufferedOutputStream output) throws FileNotFoundException, IOException {
    419         // Check the magic number
    420         final int length = MAGIC_NUMBER_VERSION_2.length;
    421         final byte[] magicNumberBuffer = new byte[length];
    422         final int readMagicNumberSize = input.read(magicNumberBuffer, 0, length);
    423         if (readMagicNumberSize < length) {
    424             throw new IOException("Less bytes to read than the magic number length");
    425         }
    426         if (!Arrays.equals(MAGIC_NUMBER_VERSION_2, magicNumberBuffer)) {
    427             if (!Arrays.equals(MAGIC_NUMBER_VERSION_1, magicNumberBuffer)) {
    428                 throw new IOException("Wrong magic number for downloaded file");
    429             }
    430         }
    431         output.write(magicNumberBuffer);
    432 
    433         // Actually copy the file
    434         final byte[] buffer = new byte[FILE_READ_BUFFER_SIZE];
    435         for (int readBytes = input.read(buffer); readBytes >= 0; readBytes = input.read(buffer))
    436             output.write(buffer, 0, readBytes);
    437         input.close();
    438     }
    439 
    440     private static void reinitializeClientRecordInDictionaryContentProvider(final Context context,
    441             final ContentProviderClient client, final String clientId) throws RemoteException {
    442         final String metadataFileUri = MetadataFileUriGetter.getMetadataUri(context);
    443         final String metadataAdditionalId = MetadataFileUriGetter.getMetadataAdditionalId(context);
    444         // Tell the content provider to reset all information about this client id
    445         final Uri metadataContentUri = getProviderUriBuilder(clientId)
    446                 .appendPath(QUERY_PATH_METADATA)
    447                 .appendQueryParameter(QUERY_PARAMETER_PROTOCOL, QUERY_PARAMETER_PROTOCOL_VALUE)
    448                 .build();
    449         client.delete(metadataContentUri, null, null);
    450         // Update the metadata URI
    451         final ContentValues metadataValues = new ContentValues();
    452         metadataValues.put(INSERT_METADATA_CLIENT_ID_COLUMN, clientId);
    453         metadataValues.put(INSERT_METADATA_METADATA_URI_COLUMN, metadataFileUri);
    454         metadataValues.put(INSERT_METADATA_METADATA_ADDITIONAL_ID_COLUMN, metadataAdditionalId);
    455         client.insert(metadataContentUri, metadataValues);
    456 
    457         // Update the dictionary list.
    458         final Uri dictionaryContentUriBase = getProviderUriBuilder(clientId)
    459                 .appendPath(QUERY_PATH_DICT_INFO)
    460                 .appendQueryParameter(QUERY_PARAMETER_PROTOCOL, QUERY_PARAMETER_PROTOCOL_VALUE)
    461                 .build();
    462         final ArrayList<DictionaryInfo> dictionaryList =
    463                 DictionaryInfoUtils.getCurrentDictionaryFileNameAndVersionInfo(context);
    464         final int length = dictionaryList.size();
    465         for (int i = 0; i < length; ++i) {
    466             final DictionaryInfo info = dictionaryList.get(i);
    467             client.insert(Uri.withAppendedPath(dictionaryContentUriBase, info.mId),
    468                     info.toContentValues());
    469         }
    470     }
    471 
    472     /**
    473      * Initialize a client record with the dictionary content provider.
    474      *
    475      * This merely acquires the content provider and calls
    476      * #reinitializeClientRecordInDictionaryContentProvider.
    477      *
    478      * @param context the context for resources and providers.
    479      * @param clientId the client ID to use.
    480      */
    481     public static void initializeClientRecordHelper(final Context context,
    482             final String clientId) {
    483         try {
    484             final ContentProviderClient client = context.getContentResolver().
    485                     acquireContentProviderClient(getProviderUriBuilder("").build());
    486             if (null == client) return;
    487             reinitializeClientRecordInDictionaryContentProvider(context, client, clientId);
    488         } catch (RemoteException e) {
    489             Log.e(TAG, "Cannot contact the dictionary content provider", e);
    490         }
    491     }
    492 }
    493