2012-03-26 13:31:20 +00:00
|
|
|
/*
|
|
|
|
* Copyright (C) 2012 The Android Open Source Project
|
|
|
|
*
|
2013-01-21 12:52:57 +00:00
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
2012-03-26 13:31:20 +00:00
|
|
|
*
|
2013-01-21 12:52:57 +00:00
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
2012-03-26 13:31:20 +00:00
|
|
|
*
|
2013-01-21 12:52:57 +00:00
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
2012-03-26 13:31:20 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
package com.android.inputmethod.latin;
|
|
|
|
|
|
|
|
import android.content.ContentResolver;
|
|
|
|
import android.content.Context;
|
|
|
|
import android.database.ContentObserver;
|
|
|
|
import android.database.Cursor;
|
2013-09-20 10:31:39 +00:00
|
|
|
import android.database.sqlite.SQLiteException;
|
2013-05-08 04:00:37 +00:00
|
|
|
import android.net.Uri;
|
2012-04-27 06:50:21 +00:00
|
|
|
import android.os.SystemClock;
|
2012-03-26 13:31:20 +00:00
|
|
|
import android.provider.BaseColumns;
|
2013-05-08 04:00:37 +00:00
|
|
|
import android.provider.ContactsContract;
|
2012-03-26 13:31:20 +00:00
|
|
|
import android.provider.ContactsContract.Contacts;
|
|
|
|
import android.util.Log;
|
|
|
|
|
2014-05-01 09:44:57 +00:00
|
|
|
import com.android.inputmethod.annotations.UsedForTesting;
|
2013-12-26 09:26:28 +00:00
|
|
|
import com.android.inputmethod.latin.personalization.AccountUtils;
|
2014-05-08 03:25:32 +00:00
|
|
|
import com.android.inputmethod.latin.utils.ExecutorUtils;
|
2013-06-23 16:11:32 +00:00
|
|
|
import com.android.inputmethod.latin.utils.StringUtils;
|
|
|
|
|
2013-12-13 05:48:43 +00:00
|
|
|
import java.io.File;
|
2014-05-08 03:25:32 +00:00
|
|
|
import java.util.ArrayList;
|
2013-05-08 07:08:56 +00:00
|
|
|
import java.util.List;
|
2012-03-26 13:31:20 +00:00
|
|
|
import java.util.Locale;
|
|
|
|
|
|
|
|
public class ContactsBinaryDictionary extends ExpandableBinaryDictionary {
|
|
|
|
|
2013-05-08 04:00:37 +00:00
|
|
|
private static final String[] PROJECTION = {BaseColumns._ID, Contacts.DISPLAY_NAME};
|
2012-04-27 06:50:21 +00:00
|
|
|
private static final String[] PROJECTION_ID_ONLY = {BaseColumns._ID};
|
2012-03-26 13:31:20 +00:00
|
|
|
|
|
|
|
private static final String TAG = ContactsBinaryDictionary.class.getSimpleName();
|
|
|
|
private static final String NAME = "contacts";
|
|
|
|
|
2013-11-20 05:07:44 +00:00
|
|
|
private static final boolean DEBUG = false;
|
|
|
|
private static final boolean DEBUG_DUMP = false;
|
2012-04-27 06:50:21 +00:00
|
|
|
|
2012-03-26 13:31:20 +00:00
|
|
|
/**
|
|
|
|
* Frequency for contacts information into the dictionary
|
|
|
|
*/
|
|
|
|
private static final int FREQUENCY_FOR_CONTACTS = 40;
|
|
|
|
private static final int FREQUENCY_FOR_CONTACTS_BIGRAM = 90;
|
|
|
|
|
2012-04-27 06:50:21 +00:00
|
|
|
/** The maximum number of contacts that this dictionary supports. */
|
|
|
|
private static final int MAX_CONTACT_COUNT = 10000;
|
|
|
|
|
2012-03-26 13:31:20 +00:00
|
|
|
private static final int INDEX_NAME = 1;
|
|
|
|
|
2012-04-27 06:50:21 +00:00
|
|
|
/** The number of contacts in the most recent dictionary rebuild. */
|
2014-05-08 03:25:32 +00:00
|
|
|
private int mContactCountAtLastRebuild = 0;
|
|
|
|
|
|
|
|
/** The hash code of ArrayList of contacts names in the most recent dictionary rebuild. */
|
|
|
|
private int mHashCodeAtLastRebuild = 0;
|
2012-04-27 06:50:21 +00:00
|
|
|
|
2012-03-26 13:31:20 +00:00
|
|
|
private ContentObserver mObserver;
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Whether to use "firstname lastname" in bigram predictions.
|
|
|
|
*/
|
|
|
|
private final boolean mUseFirstLastBigrams;
|
|
|
|
|
2014-04-28 03:29:48 +00:00
|
|
|
protected ContactsBinaryDictionary(final Context context, final Locale locale,
|
|
|
|
final File dictFile, final String name) {
|
|
|
|
super(context, getDictName(name, locale, dictFile), locale, Dictionary.TYPE_CONTACTS,
|
2014-02-27 14:21:09 +00:00
|
|
|
dictFile);
|
2012-03-26 13:31:20 +00:00
|
|
|
mUseFirstLastBigrams = useFirstLastBigramsForLocale(locale);
|
|
|
|
registerObserver(context);
|
2014-04-28 07:58:27 +00:00
|
|
|
reloadDictionaryIfRequired();
|
2012-03-26 13:31:20 +00:00
|
|
|
}
|
|
|
|
|
2014-05-01 09:44:57 +00:00
|
|
|
@UsedForTesting
|
2014-05-01 08:22:23 +00:00
|
|
|
public static ContactsBinaryDictionary getDictionary(final Context context, final Locale locale,
|
2014-06-10 09:05:10 +00:00
|
|
|
final File dictFile, final String dictNamePrefix) {
|
|
|
|
return new ContactsBinaryDictionary(context, locale, dictFile, dictNamePrefix + NAME);
|
2014-05-01 08:22:23 +00:00
|
|
|
}
|
|
|
|
|
2012-03-26 13:31:20 +00:00
|
|
|
private synchronized void registerObserver(final Context context) {
|
|
|
|
if (mObserver != null) return;
|
|
|
|
ContentResolver cres = context.getContentResolver();
|
|
|
|
cres.registerContentObserver(Contacts.CONTENT_URI, true, mObserver =
|
|
|
|
new ContentObserver(null) {
|
|
|
|
@Override
|
|
|
|
public void onChange(boolean self) {
|
2014-05-08 03:25:32 +00:00
|
|
|
ExecutorUtils.getExecutor("Check Contacts").execute(new Runnable() {
|
|
|
|
@Override
|
|
|
|
public void run() {
|
|
|
|
if (haveContentsChanged()) {
|
|
|
|
setNeedsToRecreate();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
});
|
2012-03-26 13:31:20 +00:00
|
|
|
}
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
|
|
|
public synchronized void close() {
|
|
|
|
if (mObserver != null) {
|
|
|
|
mContext.getContentResolver().unregisterContentObserver(mObserver);
|
|
|
|
mObserver = null;
|
|
|
|
}
|
|
|
|
super.close();
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
2014-02-27 14:21:09 +00:00
|
|
|
public void loadInitialContentsLocked() {
|
|
|
|
loadDeviceAccountsEmailAddressesLocked();
|
|
|
|
loadDictionaryForUriLocked(ContactsContract.Profile.CONTENT_URI);
|
2013-05-08 04:00:37 +00:00
|
|
|
// TODO: Switch this URL to the newer ContactsContract too
|
2014-02-27 14:21:09 +00:00
|
|
|
loadDictionaryForUriLocked(Contacts.CONTENT_URI);
|
2013-05-08 04:00:37 +00:00
|
|
|
}
|
|
|
|
|
2014-02-27 14:21:09 +00:00
|
|
|
private void loadDeviceAccountsEmailAddressesLocked() {
|
2013-05-08 07:08:56 +00:00
|
|
|
final List<String> accountVocabulary =
|
|
|
|
AccountUtils.getDeviceAccountsEmailAddresses(mContext);
|
|
|
|
if (accountVocabulary == null || accountVocabulary.isEmpty()) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
for (String word : accountVocabulary) {
|
|
|
|
if (DEBUG) {
|
|
|
|
Log.d(TAG, "loadAccountVocabulary: " + word);
|
|
|
|
}
|
2014-02-27 14:21:09 +00:00
|
|
|
runGCIfRequiredLocked(true /* mindsBlockByGC */);
|
2014-05-21 02:15:38 +00:00
|
|
|
addUnigramLocked(word, FREQUENCY_FOR_CONTACTS, null /* shortcut */,
|
2014-10-14 03:13:11 +00:00
|
|
|
0 /* shortcutFreq */, false /* isNotAWord */, false /* isPossiblyOffensive */,
|
2014-02-27 14:21:09 +00:00
|
|
|
BinaryDictionary.NOT_A_VALID_TIMESTAMP);
|
2013-05-08 07:08:56 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-02-27 14:21:09 +00:00
|
|
|
private void loadDictionaryForUriLocked(final Uri uri) {
|
2014-02-18 07:02:51 +00:00
|
|
|
Cursor cursor = null;
|
2012-03-26 13:31:20 +00:00
|
|
|
try {
|
2014-02-18 07:02:51 +00:00
|
|
|
cursor = mContext.getContentResolver().query(uri, PROJECTION, null, null, null);
|
|
|
|
if (null == cursor) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (cursor.moveToFirst()) {
|
2014-05-08 03:25:32 +00:00
|
|
|
mContactCountAtLastRebuild = getContactCount();
|
2014-02-27 14:21:09 +00:00
|
|
|
addWordsLocked(cursor);
|
2012-03-26 13:31:20 +00:00
|
|
|
}
|
2013-09-20 10:31:39 +00:00
|
|
|
} catch (final SQLiteException e) {
|
|
|
|
Log.e(TAG, "SQLiteException in the remote Contacts process.", e);
|
|
|
|
} catch (final IllegalStateException e) {
|
|
|
|
Log.e(TAG, "Contacts DB is having problems", e);
|
2014-02-18 07:02:51 +00:00
|
|
|
} finally {
|
|
|
|
if (null != cursor) {
|
|
|
|
cursor.close();
|
|
|
|
}
|
2012-03-26 13:31:20 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-10-20 05:48:56 +00:00
|
|
|
private static boolean useFirstLastBigramsForLocale(final Locale locale) {
|
2012-03-26 13:31:20 +00:00
|
|
|
// TODO: Add firstname/lastname bigram rules for other languages.
|
|
|
|
if (locale != null && locale.getLanguage().equals(Locale.ENGLISH.getLanguage())) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2014-02-27 14:21:09 +00:00
|
|
|
private void addWordsLocked(final Cursor cursor) {
|
2012-04-27 06:50:21 +00:00
|
|
|
int count = 0;
|
2014-05-23 11:18:17 +00:00
|
|
|
final ArrayList<String> names = new ArrayList<>();
|
2012-04-27 06:50:21 +00:00
|
|
|
while (!cursor.isAfterLast() && count < MAX_CONTACT_COUNT) {
|
2012-03-26 13:31:20 +00:00
|
|
|
String name = cursor.getString(INDEX_NAME);
|
2012-04-27 06:50:21 +00:00
|
|
|
if (isValidName(name)) {
|
2014-05-08 03:25:32 +00:00
|
|
|
names.add(name);
|
2014-02-27 14:21:09 +00:00
|
|
|
addNameLocked(name);
|
2012-04-27 06:50:21 +00:00
|
|
|
++count;
|
2013-11-20 05:07:44 +00:00
|
|
|
} else {
|
|
|
|
if (DEBUG_DUMP) {
|
|
|
|
Log.d(TAG, "Invalid name: " + name);
|
|
|
|
}
|
2012-03-26 13:31:20 +00:00
|
|
|
}
|
|
|
|
cursor.moveToNext();
|
|
|
|
}
|
2014-05-08 03:25:32 +00:00
|
|
|
mHashCodeAtLastRebuild = names.hashCode();
|
2012-03-26 13:31:20 +00:00
|
|
|
}
|
|
|
|
|
2012-04-27 06:50:21 +00:00
|
|
|
private int getContactCount() {
|
|
|
|
// TODO: consider switching to a rawQuery("select count(*)...") on the database if
|
|
|
|
// performance is a bottleneck.
|
2014-02-18 07:02:51 +00:00
|
|
|
Cursor cursor = null;
|
2013-09-20 10:31:39 +00:00
|
|
|
try {
|
2014-02-18 07:02:51 +00:00
|
|
|
cursor = mContext.getContentResolver().query(Contacts.CONTENT_URI, PROJECTION_ID_ONLY,
|
|
|
|
null, null, null);
|
|
|
|
if (null == cursor) {
|
|
|
|
return 0;
|
2012-05-21 23:50:26 +00:00
|
|
|
}
|
2014-02-18 07:02:51 +00:00
|
|
|
return cursor.getCount();
|
2013-09-20 10:31:39 +00:00
|
|
|
} catch (final SQLiteException e) {
|
|
|
|
Log.e(TAG, "SQLiteException in the remote Contacts process.", e);
|
2014-02-18 07:02:51 +00:00
|
|
|
} finally {
|
|
|
|
if (null != cursor) {
|
|
|
|
cursor.close();
|
|
|
|
}
|
2012-04-27 06:50:21 +00:00
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2012-03-26 13:31:20 +00:00
|
|
|
/**
|
|
|
|
* Adds the words in a name (e.g., firstname/lastname) to the binary dictionary along with their
|
|
|
|
* bigrams depending on locale.
|
|
|
|
*/
|
2014-02-27 14:21:09 +00:00
|
|
|
private void addNameLocked(final String name) {
|
2012-06-27 05:35:24 +00:00
|
|
|
int len = StringUtils.codePointCount(name);
|
2014-09-29 01:52:18 +00:00
|
|
|
NgramContext ngramContext = NgramContext.EMPTY_PREV_WORDS_INFO;
|
2012-03-26 13:31:20 +00:00
|
|
|
// TODO: Better tokenization for non-Latin writing systems
|
|
|
|
for (int i = 0; i < len; i++) {
|
|
|
|
if (Character.isLetter(name.codePointAt(i))) {
|
2012-04-27 06:50:21 +00:00
|
|
|
int end = getWordEndPosition(name, len, i);
|
|
|
|
String word = name.substring(i, end);
|
2013-11-20 05:07:44 +00:00
|
|
|
if (DEBUG_DUMP) {
|
|
|
|
Log.d(TAG, "addName word = " + word);
|
|
|
|
}
|
2012-04-27 06:50:21 +00:00
|
|
|
i = end - 1;
|
2012-03-26 13:31:20 +00:00
|
|
|
// Don't add single letter words, possibly confuses
|
|
|
|
// capitalization of i.
|
2012-06-27 05:35:24 +00:00
|
|
|
final int wordLen = StringUtils.codePointCount(word);
|
2014-07-28 10:18:04 +00:00
|
|
|
if (wordLen <= MAX_WORD_LENGTH && wordLen > 1) {
|
2013-05-08 04:00:37 +00:00
|
|
|
if (DEBUG) {
|
2014-09-29 01:52:18 +00:00
|
|
|
Log.d(TAG, "addName " + name + ", " + word + ", " + ngramContext);
|
2013-05-08 04:00:37 +00:00
|
|
|
}
|
2014-02-27 14:21:09 +00:00
|
|
|
runGCIfRequiredLocked(true /* mindsBlockByGC */);
|
2014-05-21 02:15:38 +00:00
|
|
|
addUnigramLocked(word, FREQUENCY_FOR_CONTACTS,
|
2014-02-27 14:21:09 +00:00
|
|
|
null /* shortcut */, 0 /* shortcutFreq */, false /* isNotAWord */,
|
2014-10-14 03:13:11 +00:00
|
|
|
false /* isPossiblyOffensive */,
|
|
|
|
BinaryDictionary.NOT_A_VALID_TIMESTAMP);
|
2014-09-29 01:52:18 +00:00
|
|
|
if (!ngramContext.isValid() && mUseFirstLastBigrams) {
|
2014-02-27 14:21:09 +00:00
|
|
|
runGCIfRequiredLocked(true /* mindsBlockByGC */);
|
2014-09-29 01:52:18 +00:00
|
|
|
addNgramEntryLocked(ngramContext, word, FREQUENCY_FOR_CONTACTS_BIGRAM,
|
2014-02-27 14:21:09 +00:00
|
|
|
BinaryDictionary.NOT_A_VALID_TIMESTAMP);
|
2012-03-26 13:31:20 +00:00
|
|
|
}
|
2014-09-29 01:52:18 +00:00
|
|
|
ngramContext = ngramContext.getNextNgramContext(
|
|
|
|
new NgramContext.WordInfo(word));
|
2012-03-26 13:31:20 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2012-04-27 06:50:21 +00:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Returns the index of the last letter in the word, starting from position startIndex.
|
|
|
|
*/
|
2012-10-03 06:19:43 +00:00
|
|
|
private static int getWordEndPosition(final String string, final int len,
|
|
|
|
final int startIndex) {
|
2012-04-27 06:50:21 +00:00
|
|
|
int end;
|
|
|
|
int cp = 0;
|
|
|
|
for (end = startIndex + 1; end < len; end += Character.charCount(cp)) {
|
|
|
|
cp = string.codePointAt(end);
|
2012-10-29 05:46:34 +00:00
|
|
|
if (!(cp == Constants.CODE_DASH || cp == Constants.CODE_SINGLE_QUOTE
|
2012-04-27 06:50:21 +00:00
|
|
|
|| Character.isLetter(cp))) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return end;
|
|
|
|
}
|
|
|
|
|
2014-10-20 05:48:56 +00:00
|
|
|
boolean haveContentsChanged() {
|
2012-04-27 06:50:21 +00:00
|
|
|
final long startTime = SystemClock.uptimeMillis();
|
|
|
|
final int contactCount = getContactCount();
|
|
|
|
if (contactCount > MAX_CONTACT_COUNT) {
|
|
|
|
// If there are too many contacts then return false. In this rare case it is impossible
|
|
|
|
// to include all of them anyways and the cost of rebuilding the dictionary is too high.
|
|
|
|
// TODO: Sort and check only the MAX_CONTACT_COUNT most recent contacts?
|
|
|
|
return false;
|
|
|
|
}
|
2014-05-08 03:25:32 +00:00
|
|
|
if (contactCount != mContactCountAtLastRebuild) {
|
2012-05-25 18:16:30 +00:00
|
|
|
if (DEBUG) {
|
2014-05-08 03:25:32 +00:00
|
|
|
Log.d(TAG, "Contact count changed: " + mContactCountAtLastRebuild + " to "
|
2012-05-25 18:16:30 +00:00
|
|
|
+ contactCount);
|
|
|
|
}
|
2012-04-27 06:50:21 +00:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
// Check all contacts since it's not possible to find out which names have changed.
|
|
|
|
// This is needed because it's possible to receive extraneous onChange events even when no
|
|
|
|
// name has changed.
|
2014-02-18 07:02:51 +00:00
|
|
|
final Cursor cursor = mContext.getContentResolver().query(Contacts.CONTENT_URI, PROJECTION,
|
|
|
|
null, null, null);
|
|
|
|
if (null == cursor) {
|
|
|
|
return false;
|
|
|
|
}
|
2014-05-23 11:18:17 +00:00
|
|
|
final ArrayList<String> names = new ArrayList<>();
|
2014-02-18 07:02:51 +00:00
|
|
|
try {
|
|
|
|
if (cursor.moveToFirst()) {
|
|
|
|
while (!cursor.isAfterLast()) {
|
|
|
|
String name = cursor.getString(INDEX_NAME);
|
2014-05-08 03:25:32 +00:00
|
|
|
if (isValidName(name)) {
|
|
|
|
names.add(name);
|
2012-04-27 06:50:21 +00:00
|
|
|
}
|
2014-02-18 07:02:51 +00:00
|
|
|
cursor.moveToNext();
|
2012-04-27 06:50:21 +00:00
|
|
|
}
|
|
|
|
}
|
2014-05-08 03:25:32 +00:00
|
|
|
if (names.hashCode() != mHashCodeAtLastRebuild) {
|
|
|
|
return true;
|
|
|
|
}
|
2014-02-18 07:02:51 +00:00
|
|
|
} finally {
|
|
|
|
cursor.close();
|
2012-04-27 06:50:21 +00:00
|
|
|
}
|
|
|
|
if (DEBUG) {
|
|
|
|
Log.d(TAG, "No contacts changed. (runtime = " + (SystemClock.uptimeMillis() - startTime)
|
|
|
|
+ " ms)");
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2012-10-03 06:19:43 +00:00
|
|
|
private static boolean isValidName(final String name) {
|
2013-04-15 08:33:48 +00:00
|
|
|
if (name != null && -1 == name.indexOf(Constants.CODE_COMMERCIAL_AT)) {
|
2012-04-27 06:50:21 +00:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
2012-03-26 13:31:20 +00:00
|
|
|
}
|