9a933a742d
This has no impact on performance. Before: (0) 9.61 (0.01%) (1) 57514.58 (56.70%) (2) 10.55 (0.01%) (3) 10.79 (0.01%) (4) 133.20 (0.13%) (5) 43553.87 (42.94%) (6) 10.03 (0.01%) (20) 47.20 (0.05%) Total 101431.47 (sum of others 101289.84) After: (0) 10.52 (0.01%) (1) 56311.16 (56.66%) (2) 13.40 (0.01%) (3) 10.98 (0.01%) (4) 136.72 (0.14%) (5) 42707.92 (42.97%) (6) 9.79 (0.01%) (20) 51.35 (0.05%) Total 99390.76 (sum of others 99251.84) The difference is not significant given the measurement imprecision. Change-Id: I2e4f1ef7a5e99082e67dd27f56cf4fc432bb48fa
82 lines
3 KiB
C++
82 lines
3 KiB
C++
/*
|
|
* Copyright (C) 2012 The Android Open Source Project
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#ifndef LATINIME_TERMINAL_ATTRIBUTES_H
|
|
#define LATINIME_TERMINAL_ATTRIBUTES_H
|
|
|
|
#include "unigram_dictionary.h"
|
|
|
|
namespace latinime {
|
|
|
|
/**
|
|
* This class encapsulates information about a terminal that allows to
|
|
* retrieve local node attributes like the list of shortcuts without
|
|
* exposing the format structure to the client.
|
|
*/
|
|
class TerminalAttributes {
|
|
public:
|
|
class ShortcutIterator {
|
|
const uint8_t* const mDict;
|
|
bool mHasNextShortcutTarget;
|
|
int mPos;
|
|
|
|
public:
|
|
ShortcutIterator(const uint8_t* dict, const int pos, const uint8_t flags) : mDict(dict),
|
|
mPos(pos) {
|
|
mHasNextShortcutTarget = (0 != (flags & UnigramDictionary::FLAG_HAS_SHORTCUT_TARGETS));
|
|
}
|
|
|
|
inline bool hasNextShortcutTarget() const {
|
|
return mHasNextShortcutTarget;
|
|
}
|
|
|
|
// Gets the shortcut target itself as a uint16_t string. For parameters and return value
|
|
// see BinaryFormat::getWordAtAddress.
|
|
// TODO: make the output an uint32_t* to handle the whole unicode range.
|
|
inline int getNextShortcutTarget(const int maxDepth, uint16_t* outWord) {
|
|
const int shortcutFlags = BinaryFormat::getFlagsAndForwardPointer(mDict, &mPos);
|
|
mHasNextShortcutTarget =
|
|
0 != (shortcutFlags & UnigramDictionary::FLAG_ATTRIBUTE_HAS_NEXT);
|
|
unsigned int i;
|
|
for (i = 0; i < MAX_WORD_LENGTH_INTERNAL; ++i) {
|
|
const int charCode = BinaryFormat::getCharCodeAndForwardPointer(mDict, &mPos);
|
|
if (NOT_A_CHARACTER == charCode) break;
|
|
outWord[i] = (uint16_t)charCode;
|
|
}
|
|
mPos += BinaryFormat::CHARACTER_ARRAY_TERMINATOR_SIZE;
|
|
return i;
|
|
}
|
|
};
|
|
|
|
private:
|
|
const uint8_t* const mDict;
|
|
const uint8_t mFlags;
|
|
const int mStartPos;
|
|
|
|
public:
|
|
TerminalAttributes(const uint8_t* const dict, const uint8_t flags, const int pos) :
|
|
mDict(dict), mFlags(flags), mStartPos(pos) {
|
|
}
|
|
|
|
inline ShortcutIterator getShortcutIterator() const {
|
|
// The size of the shortcuts is stored here so that the whole shortcut chunk can be
|
|
// skipped quickly, so we ignore it.
|
|
return ShortcutIterator(mDict, mStartPos + BinaryFormat::SHORTCUT_LIST_SIZE_SIZE, mFlags);
|
|
}
|
|
};
|
|
} // namespace latinime
|
|
|
|
#endif // LATINIME_TERMINAL_ATTRIBUTES_H
|