2009-03-13 22:11:42 +00:00
|
|
|
/*
 * Copyright (C) 2009, The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
|
2009-03-13 22:11:42 +00:00
|
|
|
|
2010-12-02 05:53:24 +00:00
|
|
|
#define LOG_TAG "LatinIME: dictionary.cpp"
|
|
|
|
|
2012-08-02 10:48:08 +00:00
|
|
|
#include <stdint.h>
|
|
|
|
|
|
|
|
#include "bigram_dictionary.h"
|
2012-02-27 10:48:47 +00:00
|
|
|
#include "binary_format.h"
|
2012-05-16 14:05:32 +00:00
|
|
|
#include "defines.h"
|
2009-03-13 22:11:42 +00:00
|
|
|
#include "dictionary.h"
|
2012-08-09 14:23:08 +00:00
|
|
|
#include "dic_traverse_wrapper.h"
|
2012-07-03 08:45:50 +00:00
|
|
|
#include "gesture_decoder_wrapper.h"
|
2012-08-02 10:48:08 +00:00
|
|
|
#include "unigram_dictionary.h"
|
2010-12-01 10:09:29 +00:00
|
|
|
|
2009-03-13 22:11:42 +00:00
|
|
|
namespace latinime {
|
|
|
|
|
2011-02-22 08:28:55 +00:00
|
|
|
// TODO: Change the type of all keyCodes to uint32_t
|
2011-01-07 06:01:51 +00:00
|
|
|
// Constructs a Dictionary on top of the buffer pointed to by dict.
//
// dict                   start of the dictionary buffer; the header size and the flags are
//                        read from it through BinaryFormat.
// dictSize, mmapFd,
// dictBufAdjust          stored as-is in mDictSize, mMmapFd and mDictBufAdjust.
// typedLetterMultiplier,
// fullWordMultiplier     forwarded to the UnigramDictionary.
// maxWordLength          forwarded to the unigram and bigram dictionaries and to the
//                        gesture decoder.
// maxWords               forwarded to the UnigramDictionary and to the gesture decoder.
// maxPredictions         forwarded to the BigramDictionary.
Dictionary::Dictionary(void *dict, int dictSize, int mmapFd, int dictBufAdjust,
        int typedLetterMultiplier, int fullWordMultiplier,
        int maxWordLength, int maxWords, int maxPredictions)
    : mDict(static_cast<unsigned char *>(dict)),
      // The offset is computed from the constructor argument, not from mDict: members are
      // initialized in declaration order, so reading mDict here would only be valid if it
      // happens to be declared before mOffsetDict.
      mOffsetDict(static_cast<unsigned char *>(dict)
              + BinaryFormat::getHeaderSize(static_cast<unsigned char *>(dict))),
      mDictSize(dictSize), mMmapFd(mmapFd), mDictBufAdjust(dictBufAdjust) {
    if (DEBUG_DICT) {
        if (MAX_WORD_LENGTH_INTERNAL < maxWordLength) {
            AKLOGI("Max word length (%d) is greater than %d",
                    maxWordLength, MAX_WORD_LENGTH_INTERNAL);
            // NOTE(review): this log is only emitted together with the warning above;
            // confirm whether it was meant to be unconditional under DEBUG_DICT.
            AKLOGI("IN NATIVE SUGGEST Version: %d", (mDict[0] & 0xFF));
        }
    }
    const unsigned int options = BinaryFormat::getFlags(mDict);
    // Both sub-dictionaries work on the buffer past the header.
    mUnigramDictionary = new UnigramDictionary(mOffsetDict, typedLetterMultiplier,
            fullWordMultiplier, maxWordLength, maxWords, options);
    mBigramDictionary = new BigramDictionary(mOffsetDict, maxWordLength, maxPredictions);
    // The gesture decoder is handed the two dictionaries created above.
    mGestureDecoder = new GestureDecoderWrapper(maxWordLength, maxWords);
    mGestureDecoder->setDict(mUnigramDictionary, mBigramDictionary,
            mOffsetDict /* dict root */, 0 /* root pos */);
}
|
|
|
|
|
2010-12-08 08:05:39 +00:00
|
|
|
// Releases the three helper objects allocated with new in the constructor.
Dictionary::~Dictionary() {
    // Deletion order is kept: unigram dictionary, bigram dictionary, gesture decoder.
    delete mUnigramDictionary;
    delete mBigramDictionary;
    delete mGestureDecoder;
}
|
2010-12-02 05:53:24 +00:00
|
|
|
|
2012-08-08 12:23:25 +00:00
|
|
|
// Computes suggestions for the current input and returns the value reported by the
// underlying decoder.
//
// When isGesture is false, the request goes to the unigram dictionary, helped by a bigram
// map and filter built from the previous word (prevWordChars / prevWordLength). In that
// path traverseSession, times, pointerIds, commitPoint and spaceIndices are not used.
//
// When isGesture is true, the traverse session is initialized for this dictionary and the
// previous word, and the request goes to the gesture decoder. In that path
// useFullEditDistance is not used.
int Dictionary::getSuggestions(ProximityInfo *proximityInfo, void *traverseSession,
        int *xcoordinates, int *ycoordinates, int *times, int *pointerIds,
        int *codes, int codesSize, int *prevWordChars,
        int prevWordLength, int commitPoint, bool isGesture,
        bool useFullEditDistance, unsigned short *outWords,
        int *frequencies, int *spaceIndices, int *outputTypes) {
    if (!isGesture) {
        // Typed input: collect bigram information for the previous word first.
        std::map<int, int> bigramMap;
        uint8_t bigramFilter[BIGRAM_FILTER_BYTE_SIZE];
        mBigramDictionary->fillBigramAddressToFrequencyMapAndFilter(prevWordChars,
                prevWordLength, &bigramMap, bigramFilter);
        return mUnigramDictionary->getSuggestions(proximityInfo, xcoordinates,
                ycoordinates, codes, codesSize, &bigramMap, bigramFilter,
                useFullEditDistance, outWords, frequencies, outputTypes);
    }

    // Gesture input: set up the traverse session, then run the gesture decoder.
    DicTraverseWrapper::initDicTraverseSession(
            traverseSession, this, prevWordChars, prevWordLength);
    const int gestureResult = mGestureDecoder->getSuggestions(proximityInfo, traverseSession,
            xcoordinates, ycoordinates, times, pointerIds, codes, codesSize, commitPoint,
            outWords, frequencies, spaceIndices, outputTypes);
    if (DEBUG_DICT) {
        DUMP_RESULT(outWords, frequencies, 18 /* MAX_WORDS */, MAX_WORD_LENGTH_INTERNAL);
    }
    return gestureResult;
}
|
|
|
|
|
|
|
|
int Dictionary::getBigrams(const int32_t *word, int length, int *codes, int codesSize,
|
|
|
|
unsigned short *outWords, int *frequencies, int *outputTypes) const {
|
|
|
|
if (length <= 0) return 0;
|
|
|
|
return mBigramDictionary->getBigrams(word, length, codes, codesSize, outWords, frequencies,
|
|
|
|
outputTypes);
|
|
|
|
}
|
|
|
|
|
2012-06-14 23:35:23 +00:00
|
|
|
int Dictionary::getFrequency(const int32_t *word, int length) const {
|
2012-05-29 06:58:13 +00:00
|
|
|
return mUnigramDictionary->getFrequency(word, length);
|
2010-12-02 05:53:24 +00:00
|
|
|
}
|
|
|
|
|
2012-04-27 06:50:21 +00:00
|
|
|
bool Dictionary::isValidBigram(const int32_t *word1, int length1, const int32_t *word2,
|
2012-06-14 23:35:23 +00:00
|
|
|
int length2) const {
|
2012-04-27 06:50:21 +00:00
|
|
|
return mBigramDictionary->isValidBigram(word1, length1, word2, length2);
|
|
|
|
}
|
2009-03-13 22:11:42 +00:00
|
|
|
} // namespace latinime
|