2009-03-13 22:11:42 +00:00
|
|
|
/*
|
|
|
|
**
|
|
|
|
** Copyright 2009, The Android Open Source Project
|
|
|
|
**
|
|
|
|
** Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
** you may not use this file except in compliance with the License.
|
|
|
|
** You may obtain a copy of the License at
|
|
|
|
**
|
|
|
|
** http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
**
|
|
|
|
** Unless required by applicable law or agreed to in writing, software
|
|
|
|
** distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
** See the License for the specific language governing permissions and
|
|
|
|
** limitations under the License.
|
|
|
|
*/
|
|
|
|
|
2011-02-22 08:28:55 +00:00
|
|
|
#define LOG_TAG "LatinIME: jni: BinaryDictionary"
|
2011-01-07 06:01:51 +00:00
|
|
|
|
2011-07-20 09:42:32 +00:00
|
|
|
#include "binary_format.h"
|
2012-01-12 09:44:40 +00:00
|
|
|
#include "correction.h"
|
2011-02-22 08:28:55 +00:00
|
|
|
#include "com_android_inputmethod_latin_BinaryDictionary.h"
|
2009-03-13 22:11:42 +00:00
|
|
|
#include "dictionary.h"
|
2010-12-03 07:51:14 +00:00
|
|
|
#include "jni.h"
|
2011-06-18 04:09:55 +00:00
|
|
|
#include "jni_common.h"
|
2011-02-22 08:28:55 +00:00
|
|
|
#include "proximity_info.h"
|
2010-12-03 07:51:14 +00:00
|
|
|
|
|
|
|
#include <assert.h>
|
2011-01-07 06:01:51 +00:00
|
|
|
#include <errno.h>
|
2010-12-03 07:51:14 +00:00
|
|
|
#include <stdio.h>
|
2009-03-13 22:11:42 +00:00
|
|
|
|
2011-01-07 06:01:51 +00:00
|
|
|
#ifdef USE_MMAP_FOR_DICTIONARY
|
|
|
|
#include <sys/mman.h>
|
|
|
|
#include <sys/types.h>
|
|
|
|
#include <sys/stat.h>
|
|
|
|
#include <fcntl.h>
|
2011-10-28 07:24:31 +00:00
|
|
|
#include <unistd.h>
|
2011-01-07 06:01:51 +00:00
|
|
|
#else // USE_MMAP_FOR_DICTIONARY
|
|
|
|
#include <stdlib.h>
|
|
|
|
#endif // USE_MMAP_FOR_DICTIONARY
|
|
|
|
|
2011-02-22 08:28:55 +00:00
|
|
|
namespace latinime {
|
2009-03-13 22:11:42 +00:00
|
|
|
|
2011-07-20 09:42:32 +00:00
|
|
|
// Forward declaration; the definition appears later in this file. Releases a dictionary
// buffer: munmap(dictBuf, length) followed by close(fd) when USE_MMAP_FOR_DICTIONARY is
// defined, free(dictBuf) otherwise (length and fd are then unused).
void releaseDictBuf(void* dictBuf, const size_t length, int fd);
|
|
|
|
|
2011-10-31 11:44:01 +00:00
|
|
|
/**
 * Opens a binary dictionary stored inside the file named by sourceDir and wraps it in a
 * Dictionary object.
 *
 * The dictionary occupies dictSize bytes starting at byte dictOffset of the file. With
 * USE_MMAP_FOR_DICTIONARY the region is mapped read-only (the mapping starts on the page
 * boundary at or before dictOffset, and "adjust" is the distance from that boundary to
 * the dictionary); otherwise the region is read into a malloc'ed buffer.
 *
 * @return the Dictionary pointer cast to jlong, or 0 if the arguments are invalid, the
 *         file cannot be opened/mapped/read, or the dictionary format is not recognized.
 *
 * Every failure path releases what was acquired before it (UTF chars, file descriptor or
 * FILE handle, heap buffer) so that a failed open does not leak resources.
 */
static jlong latinime_BinaryDictionary_open(JNIEnv *env, jobject object,
        jstring sourceDir, jlong dictOffset, jlong dictSize,
        jint typedLetterMultiplier, jint fullWordMultiplier, jint maxWordLength, jint maxWords) {
    PROF_OPEN;
    PROF_START(66);
    // A negative offset or a non-positive size can never describe a readable dictionary;
    // reject it before acquiring any resource.
    if (dictOffset < 0 || dictSize <= 0) {
        AKLOGE("DICT: Invalid dictionary offset or size");
        return 0;
    }
    const char *sourceDirChars = env->GetStringUTFChars(sourceDir, 0);
    if (sourceDirChars == 0) {
        AKLOGE("DICT: Can't get sourceDir string");
        return 0;
    }
    int fd = 0;
    void *dictBuf = 0;
    int adjust = 0;
#ifdef USE_MMAP_FOR_DICTIONARY
    /* mmap version */
    fd = open(sourceDirChars, O_RDONLY);
    if (fd < 0) {
        AKLOGE("DICT: Can't open sourceDir. sourceDirChars=%s errno=%d", sourceDirChars, errno);
        env->ReleaseStringUTFChars(sourceDir, sourceDirChars);
        return 0;
    }
    // mmap offsets must be page aligned: map from the enclosing page boundary and skip
    // the first "adjust" bytes afterwards.
    int pagesize = getpagesize();
    adjust = dictOffset % pagesize;
    // Keep the offset in off_t (the type mmap takes) instead of narrowing it to int.
    const off_t adjDictOffset = static_cast<off_t>(dictOffset - adjust);
    int adjDictSize = dictSize + adjust;
    dictBuf = mmap(0, sizeof(char) * adjDictSize, PROT_READ, MAP_PRIVATE, fd, adjDictOffset);
    if (dictBuf == MAP_FAILED) {
        // Log first: close() below may overwrite errno.
        AKLOGE("DICT: Can't mmap dictionary. errno=%d", errno);
        close(fd);
        env->ReleaseStringUTFChars(sourceDir, sourceDirChars);
        return 0;
    }
    dictBuf = (void *)((char *)dictBuf + adjust);
#else // USE_MMAP_FOR_DICTIONARY
    /* malloc version */
    FILE *file = fopen(sourceDirChars, "rb");
    if (file == 0) {
        AKLOGE("DICT: Can't fopen sourceDir. sourceDirChars=%s errno=%d", sourceDirChars, errno);
        env->ReleaseStringUTFChars(sourceDir, sourceDirChars);
        return 0;
    }
    dictBuf = malloc(sizeof(char) * dictSize);
    if (!dictBuf) {
        AKLOGE("DICT: Can't allocate memory region for dictionary. errno=%d", errno);
        fclose(file);
        env->ReleaseStringUTFChars(sourceDir, sourceDirChars);
        return 0;
    }
    int ret = fseek(file, (long)dictOffset, SEEK_SET);
    if (ret != 0) {
        AKLOGE("DICT: Failure in fseek. ret=%d errno=%d", ret, errno);
        free(dictBuf);
        fclose(file);
        env->ReleaseStringUTFChars(sourceDir, sourceDirChars);
        return 0;
    }
    // Read the whole dictionary as a single item so that a short read counts as failure.
    ret = fread(dictBuf, sizeof(char) * dictSize, 1, file);
    if (ret != 1) {
        AKLOGE("DICT: Failure in fread. ret=%d errno=%d", ret, errno);
        free(dictBuf);
        fclose(file);
        env->ReleaseStringUTFChars(sourceDir, sourceDirChars);
        return 0;
    }
    ret = fclose(file);
    if (ret != 0) {
        AKLOGE("DICT: Failure in fclose. ret=%d errno=%d", ret, errno);
        // The stream is gone after fclose() regardless of its result; only the buffer
        // and the UTF chars remain to be released.
        free(dictBuf);
        env->ReleaseStringUTFChars(sourceDir, sourceDirChars);
        return 0;
    }
#endif // USE_MMAP_FOR_DICTIONARY
    env->ReleaseStringUTFChars(sourceDir, sourceDirChars);

    if (!dictBuf) {
        AKLOGE("DICT: dictBuf is null");
        return 0;
    }
    Dictionary *dictionary = 0;
    if (BinaryFormat::UNKNOWN_FORMAT == BinaryFormat::detectFormat((uint8_t*)dictBuf)) {
        AKLOGE("DICT: dictionary format is unknown, bad magic number");
        // Not a dictionary we understand: give the buffer back and return 0 below.
#ifdef USE_MMAP_FOR_DICTIONARY
        releaseDictBuf(((char*)dictBuf) - adjust, adjDictSize, fd);
#else // USE_MMAP_FOR_DICTIONARY
        releaseDictBuf(dictBuf, 0, 0);
#endif // USE_MMAP_FOR_DICTIONARY
    } else {
        dictionary = new Dictionary(dictBuf, dictSize, fd, adjust, typedLetterMultiplier,
                fullWordMultiplier, maxWordLength, maxWords);
    }
    PROF_END(66);
    PROF_CLOSE;
    return (jlong)dictionary;
}
|
|
|
|
|
2011-10-31 11:44:01 +00:00
|
|
|
/**
 * JNI bridge to Dictionary::getSuggestions().
 *
 * Obtains native views of the Java arrays, forwards them together with the ProximityInfo
 * handle to the dictionary, then releases the arrays. inputArray is released with
 * JNI_ABORT (no copy-back); the coordinate, output and frequency arrays are released with
 * mode 0.
 *
 * @return the value returned by Dictionary::getSuggestions(), or 0 when dict is 0.
 */
static int latinime_BinaryDictionary_getSuggestions(JNIEnv *env, jobject object, jlong dict,
        jlong proximityInfo, jintArray xCoordinatesArray, jintArray yCoordinatesArray,
        jintArray inputArray, jint arraySize, jint flags,
        jcharArray outputArray, jintArray frequencyArray) {
    Dictionary *const dictHandle = reinterpret_cast<Dictionary *>(dict);
    if (dictHandle == 0) {
        return 0;
    }
    ProximityInfo *const proximity = reinterpret_cast<ProximityInfo *>(proximityInfo);

    // Acquire the native element pointers for every array argument.
    int *xs = env->GetIntArrayElements(xCoordinatesArray, 0);
    int *ys = env->GetIntArrayElements(yCoordinatesArray, 0);
    int *freqs = env->GetIntArrayElements(frequencyArray, 0);
    int *codes = env->GetIntArrayElements(inputArray, 0);
    jchar *words = env->GetCharArrayElements(outputArray, 0);

    const int suggestionCount = dictHandle->getSuggestions(proximity, xs, ys, codes,
            arraySize, flags, reinterpret_cast<unsigned short *>(words), freqs);

    // Hand the arrays back to the VM.
    env->ReleaseIntArrayElements(frequencyArray, freqs, 0);
    env->ReleaseIntArrayElements(inputArray, codes, JNI_ABORT);
    env->ReleaseIntArrayElements(xCoordinatesArray, xs, 0);
    env->ReleaseIntArrayElements(yCoordinatesArray, ys, 0);
    env->ReleaseCharArrayElements(outputArray, words, 0);

    return suggestionCount;
}
|
|
|
|
|
2011-10-31 11:44:01 +00:00
|
|
|
static int latinime_BinaryDictionary_getBigrams(JNIEnv *env, jobject object, jlong dict,
|
2010-12-03 07:51:14 +00:00
|
|
|
jcharArray prevWordArray, jint prevWordLength, jintArray inputArray, jint inputArraySize,
|
2012-03-28 09:21:04 +00:00
|
|
|
jcharArray outputArray, jintArray frequencyArray, jint maxWordLength, jint maxBigrams) {
|
2011-01-07 06:01:51 +00:00
|
|
|
Dictionary *dictionary = (Dictionary*)dict;
|
|
|
|
if (!dictionary) return 0;
|
2010-07-01 03:28:04 +00:00
|
|
|
|
2011-10-28 08:06:58 +00:00
|
|
|
jchar *prevWord = env->GetCharArrayElements(prevWordArray, 0);
|
|
|
|
int *inputCodes = env->GetIntArrayElements(inputArray, 0);
|
|
|
|
jchar *outputChars = env->GetCharArrayElements(outputArray, 0);
|
|
|
|
int *frequencies = env->GetIntArrayElements(frequencyArray, 0);
|
2010-07-01 03:28:04 +00:00
|
|
|
|
2010-07-26 18:43:29 +00:00
|
|
|
int count = dictionary->getBigrams((unsigned short*) prevWord, prevWordLength, inputCodes,
|
2012-03-28 09:21:04 +00:00
|
|
|
inputArraySize, (unsigned short*) outputChars, frequencies, maxWordLength, maxBigrams);
|
2010-07-01 03:28:04 +00:00
|
|
|
|
2010-07-26 18:43:29 +00:00
|
|
|
env->ReleaseCharArrayElements(prevWordArray, prevWord, JNI_ABORT);
|
|
|
|
env->ReleaseIntArrayElements(inputArray, inputCodes, JNI_ABORT);
|
2010-07-01 03:28:04 +00:00
|
|
|
env->ReleaseCharArrayElements(outputArray, outputChars, 0);
|
|
|
|
env->ReleaseIntArrayElements(frequencyArray, frequencies, 0);
|
|
|
|
|
|
|
|
return count;
|
|
|
|
}
|
|
|
|
|
2011-10-31 11:44:01 +00:00
|
|
|
/**
 * JNI bridge to Dictionary::isValidWord().
 *
 * The word array is only passed to the dictionary and released with JNI_ABORT, so no
 * contents are copied back to the Java array.
 *
 * @return the dictionary's answer for the first wordLength characters of wordArray, or
 *         false when dict is 0.
 */
static jboolean latinime_BinaryDictionary_isValidWord(JNIEnv *env, jobject object, jlong dict,
        jcharArray wordArray, jint wordLength) {
    Dictionary *const dictHandle = reinterpret_cast<Dictionary *>(dict);
    if (dictHandle == 0) {
        return JNI_FALSE;
    }

    jchar *chars = env->GetCharArrayElements(wordArray, 0);
    const jboolean isValid =
            dictHandle->isValidWord(reinterpret_cast<unsigned short *>(chars), wordLength);
    env->ReleaseCharArrayElements(wordArray, chars, JNI_ABORT);

    return isValid;
}
|
|
|
|
|
2012-01-12 09:44:40 +00:00
|
|
|
/**
 * JNI bridge to Correction::RankingAlgorithm::calcNormalizedScore().
 *
 * Both character arrays are inputs only; they are released with JNI_ABORT so nothing is
 * copied back to the Java side.
 *
 * @return the value computed by calcNormalizedScore() for the given "before"/"after"
 *         strings and score.
 */
static jdouble latinime_BinaryDictionary_calcNormalizedScore(JNIEnv *env, jobject object,
        jcharArray before, jint beforeLength, jcharArray after, jint afterLength, jint score) {
    jchar *beforeBuf = env->GetCharArrayElements(before, 0);
    jchar *afterBuf = env->GetCharArrayElements(after, 0);

    const jdouble normalized = Correction::RankingAlgorithm::calcNormalizedScore(
            reinterpret_cast<unsigned short *>(beforeBuf), beforeLength,
            reinterpret_cast<unsigned short *>(afterBuf), afterLength, score);

    env->ReleaseCharArrayElements(before, beforeBuf, JNI_ABORT);
    env->ReleaseCharArrayElements(after, afterBuf, JNI_ABORT);

    return normalized;
}
|
|
|
|
|
|
|
|
/**
 * JNI bridge to Correction::RankingAlgorithm::editDistance().
 *
 * Both character arrays are inputs only; they are released with JNI_ABORT so nothing is
 * copied back to the Java side.
 *
 * @return the value computed by editDistance() for the given "before"/"after" strings.
 */
static jint latinime_BinaryDictionary_editDistance(JNIEnv *env, jobject object,
        jcharArray before, jint beforeLength, jcharArray after, jint afterLength) {
    jchar *beforeBuf = env->GetCharArrayElements(before, 0);
    jchar *afterBuf = env->GetCharArrayElements(after, 0);

    const jint distance = Correction::RankingAlgorithm::editDistance(
            reinterpret_cast<unsigned short *>(beforeBuf), beforeLength,
            reinterpret_cast<unsigned short *>(afterBuf), afterLength);

    env->ReleaseCharArrayElements(before, beforeBuf, JNI_ABORT);
    env->ReleaseCharArrayElements(after, afterBuf, JNI_ABORT);

    return distance;
}
|
|
|
|
|
2011-10-31 11:44:01 +00:00
|
|
|
/**
 * Releases a dictionary previously returned by latinime_BinaryDictionary_open().
 *
 * The dictionary buffer (if the Dictionary reports one) is released through
 * releaseDictBuf() first, because the buffer address, size, adjustment and descriptor are
 * read from the Dictionary object; the object itself is deleted afterwards. The object is
 * deleted even when it reports no buffer, so it is never leaked.
 *
 * Does nothing when dict is 0.
 */
static void latinime_BinaryDictionary_close(JNIEnv *env, jobject object, jlong dict) {
    Dictionary *dictionary = (Dictionary*)dict;
    if (!dictionary) return;
    void *dictBuf = dictionary->getDict();
    if (dictBuf) {
#ifdef USE_MMAP_FOR_DICTIONARY
        // Undo the page-alignment adjustment to recover the address and length that were
        // actually mapped.
        releaseDictBuf((void *)((char *)dictBuf - dictionary->getDictBufAdjust()),
                dictionary->getDictSize() + dictionary->getDictBufAdjust(),
                dictionary->getMmapFd());
#else // USE_MMAP_FOR_DICTIONARY
        releaseDictBuf(dictBuf, 0, 0);
#endif // USE_MMAP_FOR_DICTIONARY
    }
    delete dictionary;
}
|
|
|
|
|
|
|
|
/**
 * Gives back a dictionary buffer.
 *
 * With USE_MMAP_FOR_DICTIONARY: unmaps length bytes at dictBuf and then closes fd; a
 * failure of either call is logged and otherwise ignored.
 * Without it: dictBuf is passed to free(); length and fd are not used.
 */
void releaseDictBuf(void* dictBuf, const size_t length, int fd) {
#ifdef USE_MMAP_FOR_DICTIONARY
    int status = munmap(dictBuf, length);
    if (0 != status) {
        AKLOGE("DICT: Failure in munmap. ret=%d errno=%d", status, errno);
    }
    // The descriptor is closed even if unmapping failed.
    status = close(fd);
    if (0 != status) {
        AKLOGE("DICT: Failure in close. ret=%d errno=%d", status, errno);
    }
#else // USE_MMAP_FOR_DICTIONARY
    free(dictBuf);
#endif // USE_MMAP_FOR_DICTIONARY
}
|
|
|
|
|
2011-02-22 08:28:55 +00:00
|
|
|
// Native method table handed to registerNativeMethods(). Each entry gives the Java-side
// method name, its JNI type signature, and the native function implementing it.
static JNINativeMethod sMethods[] = {
    {"openNative",
            "(Ljava/lang/String;JJIIII)J",
            reinterpret_cast<void *>(latinime_BinaryDictionary_open)},
    {"closeNative",
            "(J)V",
            reinterpret_cast<void *>(latinime_BinaryDictionary_close)},
    {"getSuggestionsNative",
            "(JJ[I[I[III[C[I)I",
            reinterpret_cast<void *>(latinime_BinaryDictionary_getSuggestions)},
    {"isValidWordNative",
            "(J[CI)Z",
            reinterpret_cast<void *>(latinime_BinaryDictionary_isValidWord)},
    {"getBigramsNative",
            "(J[CI[II[C[III)I",
            reinterpret_cast<void *>(latinime_BinaryDictionary_getBigrams)},
    {"calcNormalizedScoreNative",
            "([CI[CII)D",
            reinterpret_cast<void *>(latinime_BinaryDictionary_calcNormalizedScore)},
    {"editDistanceNative",
            "([CI[CI)I",
            reinterpret_cast<void *>(latinime_BinaryDictionary_editDistance)}
};
|
|
|
|
|
2011-02-22 08:28:55 +00:00
|
|
|
/**
 * Registers every entry of sMethods as a native method of the Java class
 * com.android.inputmethod.latin.BinaryDictionary.
 *
 * @return whatever registerNativeMethods() returns.
 */
int register_BinaryDictionary(JNIEnv *env) {
    static const char *const javaClassName = "com/android/inputmethod/latin/BinaryDictionary";
    // Element count of the method table, derived from the array itself.
    const size_t methodCount = sizeof(sMethods) / sizeof(sMethods[0]);
    return registerNativeMethods(env, javaClassName, sMethods, methodCount);
}
|
|
|
|
|
2011-06-18 04:09:55 +00:00
|
|
|
} // namespace latinime
|