Merge "Limit the suggestions with an excessive character by filtering proximity characters"
commit
3f7eac0d2c
|
@ -58,10 +58,12 @@ int UnigramDictionary::getSuggestions(int *codes, int codesSize, unsigned short
|
||||||
// Suggestion with excessive character
|
// Suggestion with excessive character
|
||||||
if (SUGGEST_WORDS_WITH_EXCESSIVE_CHARACTER) {
|
if (SUGGEST_WORDS_WITH_EXCESSIVE_CHARACTER) {
|
||||||
for (int i = 0; i < codesSize; ++i) {
|
for (int i = 0; i < codesSize; ++i) {
|
||||||
|
if (existsAdjacentProximityChars(i, codesSize)) {
|
||||||
if (DEBUG_DICT) LOGI("--- Suggest excessive characters %d", i);
|
if (DEBUG_DICT) LOGI("--- Suggest excessive characters %d", i);
|
||||||
getSuggestionCandidates(codesSize, -1, i, NULL, 0);
|
getSuggestionCandidates(codesSize, -1, i, NULL, 0);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
// Suggestions with missing space
|
// Suggestions with missing space
|
||||||
if (SUGGEST_WORDS_WITH_MISSING_SPACE_CHARACTER && mInputLength > MIN_SUGGEST_DEPTH) {
|
if (SUGGEST_WORDS_WITH_MISSING_SPACE_CHARACTER && mInputLength > MIN_SUGGEST_DEPTH) {
|
||||||
|
@ -331,11 +333,34 @@ inline bool UnigramDictionary::needsToSkipCurrentNode(const unsigned short c,
|
||||||
return (c == QUOTE && userTypedChar != QUOTE) || skipPos == depth;
|
return (c == QUOTE && userTypedChar != QUOTE) || skipPos == depth;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
inline bool UnigramDictionary::existsAdjacentProximityChars(const int inputIndex,
|
||||||
|
const int inputLength) {
|
||||||
|
if (inputIndex < 0 || inputIndex >= inputLength) return false;
|
||||||
|
const int currentChar = *getInputCharsAt(inputIndex);
|
||||||
|
const int leftIndex = inputIndex - 1;
|
||||||
|
if (leftIndex >= 0) {
|
||||||
|
int *leftChars = getInputCharsAt(leftIndex);
|
||||||
|
int i = 0;
|
||||||
|
while (leftChars[i] > 0 && i < MAX_PROXIMITY_CHARS) {
|
||||||
|
if (leftChars[i++] == currentChar) return true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
const int rightIndex = inputIndex + 1;
|
||||||
|
if (rightIndex < inputLength) {
|
||||||
|
int *rightChars = getInputCharsAt(rightIndex);
|
||||||
|
int i = 0;
|
||||||
|
while (rightChars[i] > 0 && i < MAX_PROXIMITY_CHARS) {
|
||||||
|
if (rightChars[i++] == currentChar) return true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
inline int UnigramDictionary::getMatchedProximityId(const int *currentChars,
|
inline int UnigramDictionary::getMatchedProximityId(const int *currentChars,
|
||||||
const unsigned short c, const int skipPos) {
|
const unsigned short c, const int skipPos) {
|
||||||
const unsigned short lowerC = toLowerCase(c);
|
const unsigned short lowerC = toLowerCase(c);
|
||||||
int j = 0;
|
int j = 0;
|
||||||
while (currentChars[j] > 0) {
|
while (currentChars[j] > 0 && j < MAX_PROXIMITY_CHARS) {
|
||||||
const bool matched = (currentChars[j] == lowerC || currentChars[j] == c);
|
const bool matched = (currentChars[j] == lowerC || currentChars[j] == c);
|
||||||
// If skipPos is defined, not to search proximity collections.
|
// If skipPos is defined, not to search proximity collections.
|
||||||
// First char is what user typed.
|
// First char is what user typed.
|
||||||
|
|
|
@ -69,7 +69,8 @@ private:
|
||||||
bool processCurrentNodeForExactMatch(const int firstChildPos,
|
bool processCurrentNodeForExactMatch(const int firstChildPos,
|
||||||
const int startInputIndex, const int depth, unsigned short *word,
|
const int startInputIndex, const int depth, unsigned short *word,
|
||||||
int *newChildPosition, int *newCount, bool *newTerminal, int *newFreq, int *siblingPos);
|
int *newChildPosition, int *newCount, bool *newTerminal, int *newFreq, int *siblingPos);
|
||||||
|
bool existsAdjacentProximityChars(const int inputIndex, const int inputLength);
|
||||||
|
int* getInputCharsAt(const int index) {return mInputCodes + (index * MAX_PROXIMITY_CHARS);}
|
||||||
const unsigned char *DICT;
|
const unsigned char *DICT;
|
||||||
const int MAX_WORDS;
|
const int MAX_WORDS;
|
||||||
const int MAX_WORD_LENGTH;
|
const int MAX_WORD_LENGTH;
|
||||||
|
|
Loading…
Reference in New Issue