2009-03-13 22:11:42 +00:00
|
|
|
/*
|
2010-03-26 22:07:10 +00:00
|
|
|
* Copyright (C) 2008 The Android Open Source Project
|
2009-03-13 22:11:42 +00:00
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License"); you may not
|
|
|
|
* use this file except in compliance with the License. You may obtain a copy of
|
|
|
|
* the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
|
|
|
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
|
|
|
* License for the specific language governing permissions and limitations under
|
|
|
|
* the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
package com.android.inputmethod.latin;
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Abstract base class for a dictionary that can do a fuzzy search for words based on a set of key
|
|
|
|
* strokes.
|
|
|
|
*/
|
|
|
|
abstract public class Dictionary {
|
2010-07-01 03:28:04 +00:00
|
|
|
|
|
|
|
protected static final int MAX_WORD_LENGTH = 48;
|
|
|
|
|
2009-03-13 22:11:42 +00:00
|
|
|
/**
|
|
|
|
* Whether or not to replicate the typed word in the suggested list, even if it's valid.
|
|
|
|
*/
|
|
|
|
protected static final boolean INCLUDE_TYPED_WORD_IF_VALID = false;
|
|
|
|
|
|
|
|
/**
|
|
|
|
* The weight to give to a word if it's length is the same as the number of typed characters.
|
|
|
|
*/
|
|
|
|
protected static final int FULL_WORD_FREQ_MULTIPLIER = 2;
|
2010-07-01 03:28:04 +00:00
|
|
|
|
|
|
|
public static enum DataType {
|
|
|
|
UNIGRAM, BIGRAM
|
|
|
|
}
|
|
|
|
|
2009-03-13 22:11:42 +00:00
|
|
|
/**
|
|
|
|
* Interface to be implemented by classes requesting words to be fetched from the dictionary.
|
|
|
|
* @see #getWords(WordComposer, WordCallback)
|
|
|
|
*/
|
|
|
|
public interface WordCallback {
|
|
|
|
/**
|
|
|
|
* Adds a word to a list of suggestions. The word is expected to be ordered based on
|
|
|
|
* the provided frequency.
|
|
|
|
* @param word the character array containing the word
|
|
|
|
* @param wordOffset starting offset of the word in the character array
|
|
|
|
* @param wordLength length of valid characters in the character array
|
|
|
|
* @param frequency the frequency of occurence. This is normalized between 1 and 255, but
|
|
|
|
* can exceed those limits
|
2010-06-02 09:30:27 +00:00
|
|
|
* @param dicTypeId of the dictionary where word was from
|
2010-07-01 03:28:04 +00:00
|
|
|
* @param dataType tells type of this data
|
2009-03-13 22:11:42 +00:00
|
|
|
* @return true if the word was added, false if no more words are required
|
|
|
|
*/
|
2010-07-16 04:02:45 +00:00
|
|
|
boolean addWord(char[] word, int wordOffset, int wordLength, int frequency, int dicTypeId,
|
2010-07-01 03:28:04 +00:00
|
|
|
DataType dataType);
|
2009-03-13 22:11:42 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Searches for words in the dictionary that match the characters in the composer. Matched
|
|
|
|
* words are added through the callback object.
|
|
|
|
* @param composer the key sequence to match
|
|
|
|
* @param callback the callback object to send matched words to as possible candidates
|
2010-02-05 22:07:04 +00:00
|
|
|
* @param nextLettersFrequencies array of frequencies of next letters that could follow the
|
|
|
|
* word so far. For instance, "bracke" can be followed by "t", so array['t'] will have
|
|
|
|
* a non-zero value on returning from this method.
|
|
|
|
* Pass in null if you don't want the dictionary to look up next letters.
|
2009-03-13 22:11:42 +00:00
|
|
|
* @see WordCallback#addWord(char[], int, int)
|
|
|
|
*/
|
2010-02-05 22:07:04 +00:00
|
|
|
abstract public void getWords(final WordComposer composer, final WordCallback callback,
|
|
|
|
int[] nextLettersFrequencies);
|
2009-03-13 22:11:42 +00:00
|
|
|
|
2010-07-01 03:28:04 +00:00
|
|
|
/**
|
|
|
|
* Searches for pairs in the bigram dictionary that matches the previous word and all the
|
|
|
|
* possible words following are added through the callback object.
|
|
|
|
* @param composer the key sequence to match
|
|
|
|
* @param callback the callback object to send possible word following previous word
|
|
|
|
* @param nextLettersFrequencies array of frequencies of next letters that could follow the
|
|
|
|
* word so far. For instance, "bracke" can be followed by "t", so array['t'] will have
|
|
|
|
* a non-zero value on returning from this method.
|
|
|
|
* Pass in null if you don't want the dictionary to look up next letters.
|
|
|
|
*/
|
|
|
|
public void getBigrams(final WordComposer composer, final CharSequence previousWord,
|
|
|
|
final WordCallback callback, int[] nextLettersFrequencies) {
|
|
|
|
// empty base implementation
|
|
|
|
}
|
|
|
|
|
2009-03-13 22:11:42 +00:00
|
|
|
/**
|
|
|
|
* Checks if the given word occurs in the dictionary
|
|
|
|
* @param word the word to search for. The search should be case-insensitive.
|
|
|
|
* @return true if the word exists, false otherwise
|
|
|
|
*/
|
|
|
|
abstract public boolean isValidWord(CharSequence word);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Compares the contents of the character array with the typed word and returns true if they
|
|
|
|
* are the same.
|
|
|
|
* @param word the array of characters that make up the word
|
|
|
|
* @param length the number of valid characters in the character array
|
|
|
|
* @param typedWord the word to compare with
|
|
|
|
* @return true if they are the same, false otherwise.
|
|
|
|
*/
|
|
|
|
protected boolean same(final char[] word, final int length, final CharSequence typedWord) {
|
|
|
|
if (typedWord.length() != length) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
for (int i = 0; i < length; i++) {
|
|
|
|
if (word[i] != typedWord.charAt(i)) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2009-10-12 20:48:35 +00:00
|
|
|
/**
|
|
|
|
* Override to clean up any resources.
|
|
|
|
*/
|
|
|
|
public void close() {
|
|
|
|
}
|
2009-03-13 22:11:42 +00:00
|
|
|
}
|