2014-02-06 07:09:25 +00:00
|
|
|
/*
|
|
|
|
* Copyright (C) 2014 The Android Open Source Project
|
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License"); you may not
|
|
|
|
* use this file except in compliance with the License. You may obtain a copy of
|
|
|
|
* the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
|
|
|
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
|
|
|
* License for the specific language governing permissions and limitations under
|
|
|
|
* the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
package com.android.inputmethod.latin.utils;
|
|
|
|
|
|
|
|
import com.android.inputmethod.latin.makedict.DictionaryHeader;
|
2014-10-22 09:15:53 +00:00
|
|
|
import com.android.inputmethod.latin.makedict.NgramProperty;
|
2014-02-06 07:09:25 +00:00
|
|
|
import com.android.inputmethod.latin.makedict.ProbabilityInfo;
|
|
|
|
import com.android.inputmethod.latin.makedict.WordProperty;
|
|
|
|
|
|
|
|
import java.util.HashMap;
|
|
|
|
|
|
|
|
public class CombinedFormatUtils {
|
|
|
|
public static final String DICTIONARY_TAG = "dictionary";
|
|
|
|
public static final String BIGRAM_TAG = "bigram";
|
2014-10-22 09:15:53 +00:00
|
|
|
public static final String NGRAM_TAG = "ngram";
|
|
|
|
public static final String NGRAM_PREV_WORD_TAG = "prev_word";
|
2014-02-06 07:09:25 +00:00
|
|
|
public static final String PROBABILITY_TAG = "f";
|
|
|
|
public static final String HISTORICAL_INFO_TAG = "historicalInfo";
|
|
|
|
public static final String HISTORICAL_INFO_SEPARATOR = ":";
|
|
|
|
public static final String WORD_TAG = "word";
|
2014-06-24 03:37:07 +00:00
|
|
|
public static final String BEGINNING_OF_SENTENCE_TAG = "beginning_of_sentence";
|
2014-02-06 07:09:25 +00:00
|
|
|
public static final String NOT_A_WORD_TAG = "not_a_word";
|
2014-10-14 03:13:11 +00:00
|
|
|
public static final String POSSIBLY_OFFENSIVE_TAG = "possibly_offensive";
|
|
|
|
public static final String TRUE_VALUE = "true";
|
2014-02-06 07:09:25 +00:00
|
|
|
|
|
|
|
public static String formatAttributeMap(final HashMap<String, String> attributeMap) {
|
|
|
|
final StringBuilder builder = new StringBuilder();
|
|
|
|
builder.append(DICTIONARY_TAG + "=");
|
2014-02-06 08:55:45 +00:00
|
|
|
if (attributeMap.containsKey(DictionaryHeader.DICTIONARY_ID_KEY)) {
|
|
|
|
builder.append(attributeMap.get(DictionaryHeader.DICTIONARY_ID_KEY));
|
2014-02-06 07:09:25 +00:00
|
|
|
}
|
|
|
|
for (final String key : attributeMap.keySet()) {
|
2014-02-06 08:55:45 +00:00
|
|
|
if (key.equals(DictionaryHeader.DICTIONARY_ID_KEY)) {
|
2014-02-06 07:09:25 +00:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
final String value = attributeMap.get(key);
|
|
|
|
builder.append("," + key + "=" + value);
|
|
|
|
}
|
|
|
|
builder.append("\n");
|
|
|
|
return builder.toString();
|
|
|
|
}
|
|
|
|
|
|
|
|
public static String formatWordProperty(final WordProperty wordProperty) {
|
|
|
|
final StringBuilder builder = new StringBuilder();
|
|
|
|
builder.append(" " + WORD_TAG + "=" + wordProperty.mWord);
|
|
|
|
builder.append(",");
|
|
|
|
builder.append(formatProbabilityInfo(wordProperty.mProbabilityInfo));
|
2014-06-24 03:37:07 +00:00
|
|
|
if (wordProperty.mIsBeginningOfSentence) {
|
2014-10-14 03:13:11 +00:00
|
|
|
builder.append("," + BEGINNING_OF_SENTENCE_TAG + "=" + TRUE_VALUE);
|
2014-06-24 03:37:07 +00:00
|
|
|
}
|
2014-02-06 07:09:25 +00:00
|
|
|
if (wordProperty.mIsNotAWord) {
|
2014-10-14 03:13:11 +00:00
|
|
|
builder.append("," + NOT_A_WORD_TAG + "=" + TRUE_VALUE);
|
2014-02-06 07:09:25 +00:00
|
|
|
}
|
2014-10-14 03:13:11 +00:00
|
|
|
if (wordProperty.mIsPossiblyOffensive) {
|
2014-10-14 03:13:11 +00:00
|
|
|
builder.append("," + POSSIBLY_OFFENSIVE_TAG + "=" + TRUE_VALUE);
|
2014-02-06 07:09:25 +00:00
|
|
|
}
|
|
|
|
builder.append("\n");
|
2014-10-01 02:21:08 +00:00
|
|
|
if (wordProperty.mHasNgrams) {
|
2014-10-22 09:15:53 +00:00
|
|
|
for (final NgramProperty ngramProperty : wordProperty.mNgrams) {
|
|
|
|
builder.append(" " + NGRAM_TAG + "=" + ngramProperty.mTargetWord.mWord);
|
2014-02-06 07:09:25 +00:00
|
|
|
builder.append(",");
|
2014-10-22 09:15:53 +00:00
|
|
|
builder.append(formatProbabilityInfo(ngramProperty.mTargetWord.mProbabilityInfo));
|
2014-02-06 07:09:25 +00:00
|
|
|
builder.append("\n");
|
2014-10-22 09:15:53 +00:00
|
|
|
for (int i = 0; i < ngramProperty.mNgramContext.getPrevWordCount(); i++) {
|
|
|
|
builder.append(" " + NGRAM_PREV_WORD_TAG + "[" + i + "]="
|
|
|
|
+ ngramProperty.mNgramContext.getNthPrevWord(i + 1));
|
2014-12-02 03:53:56 +00:00
|
|
|
if (ngramProperty.mNgramContext.isNthPrevWordBeginningOfSentence(i + 1)) {
|
2014-10-22 09:15:53 +00:00
|
|
|
builder.append("," + BEGINNING_OF_SENTENCE_TAG + "=true");
|
|
|
|
}
|
|
|
|
builder.append("\n");
|
|
|
|
}
|
2014-02-06 07:09:25 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return builder.toString();
|
|
|
|
}
|
|
|
|
|
|
|
|
public static String formatProbabilityInfo(final ProbabilityInfo probabilityInfo) {
|
|
|
|
final StringBuilder builder = new StringBuilder();
|
|
|
|
builder.append(PROBABILITY_TAG + "=" + probabilityInfo.mProbability);
|
|
|
|
if (probabilityInfo.hasHistoricalInfo()) {
|
|
|
|
builder.append(",");
|
|
|
|
builder.append(HISTORICAL_INFO_TAG + "=");
|
|
|
|
builder.append(probabilityInfo.mTimestamp);
|
|
|
|
builder.append(HISTORICAL_INFO_SEPARATOR);
|
|
|
|
builder.append(probabilityInfo.mLevel);
|
|
|
|
builder.append(HISTORICAL_INFO_SEPARATOR);
|
|
|
|
builder.append(probabilityInfo.mCount);
|
|
|
|
}
|
|
|
|
return builder.toString();
|
|
|
|
}
|
2014-10-14 03:13:11 +00:00
|
|
|
|
|
|
|
public static boolean isLiteralTrue(final String value) {
|
|
|
|
return TRUE_VALUE.equalsIgnoreCase(value);
|
|
|
|
}
|
2014-02-06 07:09:25 +00:00
|
|
|
}
|