Merge "Fix bugs of GC."
commit
2520e14ced
|
@ -127,8 +127,7 @@ bool DynamicPatriciaTrieGcEventListeners::TraversePolicyToPlaceAndWriteValidPtNo
|
||||||
ptNodeParams->getHeadPos(), writingPos));
|
ptNodeParams->getHeadPos(), writingPos));
|
||||||
mValidPtNodeCount++;
|
mValidPtNodeCount++;
|
||||||
// Writes current PtNode.
|
// Writes current PtNode.
|
||||||
return mPtNodeWriter->writeNewTerminalPtNodeAndAdvancePosition(ptNodeParams,
|
return mPtNodeWriter->writePtNodeAndAdvancePosition(ptNodeParams, &writingPos);
|
||||||
0 /* timestamp */, &writingPos);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
bool DynamicPatriciaTrieGcEventListeners::TraversePolicyToUpdateAllPositionFields
|
bool DynamicPatriciaTrieGcEventListeners::TraversePolicyToUpdateAllPositionFields
|
||||||
|
|
|
@ -174,8 +174,7 @@ bool DynamicPatriciaTrieNodeWriter::addNewBigramEntry(
|
||||||
// Then, Mark as the PtNode having bigram list in the flags.
|
// Then, Mark as the PtNode having bigram list in the flags.
|
||||||
const PatriciaTrieReadingUtils::NodeFlags updatedFlags =
|
const PatriciaTrieReadingUtils::NodeFlags updatedFlags =
|
||||||
PatriciaTrieReadingUtils::createAndGetFlags(newPtNodeParams.isBlacklisted(),
|
PatriciaTrieReadingUtils::createAndGetFlags(newPtNodeParams.isBlacklisted(),
|
||||||
newPtNodeParams.isNotAWord(),
|
newPtNodeParams.isNotAWord(), newPtNodeParams.isTerminal(),
|
||||||
newPtNodeParams.getProbability() != NOT_A_PROBABILITY,
|
|
||||||
newPtNodeParams.getShortcutPos() != NOT_A_DICT_POS, true /* hasBigrams */,
|
newPtNodeParams.getShortcutPos() != NOT_A_DICT_POS, true /* hasBigrams */,
|
||||||
newPtNodeParams.getCodePointCount() > 1, CHILDREN_POSITION_FIELD_SIZE);
|
newPtNodeParams.getCodePointCount() > 1, CHILDREN_POSITION_FIELD_SIZE);
|
||||||
writingPos = newNodePos;
|
writingPos = newNodePos;
|
||||||
|
|
|
@ -26,9 +26,8 @@ namespace latinime {
|
||||||
void ProbabilityDictContent::getProbabilityEntry(const int terminalId,
|
void ProbabilityDictContent::getProbabilityEntry(const int terminalId,
|
||||||
ProbabilityEntry *const outProbabilityEntry) const {
|
ProbabilityEntry *const outProbabilityEntry) const {
|
||||||
if (terminalId < 0 || terminalId >= mSize) {
|
if (terminalId < 0 || terminalId >= mSize) {
|
||||||
|
// This method can be called with invalid terminal id during GC.
|
||||||
outProbabilityEntry->setProbability(0 /* flags */, NOT_A_PROBABILITY);
|
outProbabilityEntry->setProbability(0 /* flags */, NOT_A_PROBABILITY);
|
||||||
AKLOGE("Terminal id (%d) is not in the probability dict content. mSize: %d", terminalId,
|
|
||||||
mSize);
|
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
const BufferWithExtendableBuffer *const buffer = getBuffer();
|
const BufferWithExtendableBuffer *const buffer = getBuffer();
|
||||||
|
|
|
@ -44,9 +44,6 @@ bool TerminalPositionLookupTable::setTerminalPtNodePosition(
|
||||||
}
|
}
|
||||||
mSize++;
|
mSize++;
|
||||||
}
|
}
|
||||||
if (terminalPtNodePos == NOT_A_DICT_POS) {
|
|
||||||
return true;
|
|
||||||
}
|
|
||||||
const int terminalPos = (terminalPtNodePos != NOT_A_DICT_POS) ?
|
const int terminalPos = (terminalPtNodePos != NOT_A_DICT_POS) ?
|
||||||
terminalPtNodePos + mHeaderRegionSize : Ver4DictConstants::NOT_A_TERMINAL_ADDRESS;
|
terminalPtNodePos + mHeaderRegionSize : Ver4DictConstants::NOT_A_TERMINAL_ADDRESS;
|
||||||
return getWritableBuffer()->writeUint(terminalPos,
|
return getWritableBuffer()->writeUint(terminalPos,
|
||||||
|
|
|
@ -51,7 +51,7 @@ bool Ver4PatriciaTrieNodeWriter::markPtNodeAsDeleted(
|
||||||
&writingPos)) {
|
&writingPos)) {
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
if (toBeUpdatedPtNodeParams->getTerminalId() != NOT_A_DICT_POS) {
|
if (toBeUpdatedPtNodeParams->isTerminal()) {
|
||||||
// The PtNode is a terminal. Delete entry from the terminal position lookup table.
|
// The PtNode is a terminal. Delete entry from the terminal position lookup table.
|
||||||
return mBuffers->getUpdatableTerminalPositionLookupTable()->setTerminalPtNodePosition(
|
return mBuffers->getUpdatableTerminalPositionLookupTable()->setTerminalPtNodePosition(
|
||||||
toBeUpdatedPtNodeParams->getTerminalId(), NOT_A_DICT_POS /* ptNodePos */);
|
toBeUpdatedPtNodeParams->getTerminalId(), NOT_A_DICT_POS /* ptNodePos */);
|
||||||
|
|
|
@ -143,29 +143,12 @@ bool Ver4PatriciaTrieWritingHelper::runGC(const int rootPtNodeArrayPos,
|
||||||
Ver4PatriciaTrieNodeWriter newPtNodeWriter(buffersToWrite->getWritableTrieBuffer(),
|
Ver4PatriciaTrieNodeWriter newPtNodeWriter(buffersToWrite->getWritableTrieBuffer(),
|
||||||
buffersToWrite, &newPtNodeReader, &newBigramPolicy, &newShortcutPolicy,
|
buffersToWrite, &newPtNodeReader, &newBigramPolicy, &newShortcutPolicy,
|
||||||
false /* needsToDecayWhenUpdating */);
|
false /* needsToDecayWhenUpdating */);
|
||||||
|
|
||||||
DynamicPatriciaTrieReadingHelper newDictReadingHelper(buffersToWrite->getTrieBuffer(),
|
|
||||||
&newPtNodeReader);
|
|
||||||
newDictReadingHelper.initWithPtNodeArrayPos(rootPtNodeArrayPos);
|
|
||||||
DynamicPatriciaTrieGcEventListeners::TraversePolicyToUpdateAllPositionFields
|
|
||||||
traversePolicyToUpdateAllPositionFields(&newPtNodeWriter, &dictPositionRelocationMap);
|
|
||||||
if (!newDictReadingHelper.traverseAllPtNodesInPtNodeArrayLevelPreorderDepthFirstManner(
|
|
||||||
&traversePolicyToUpdateAllPositionFields)) {
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
// Re-assign terminal IDs for valid terminal PtNodes.
|
// Re-assign terminal IDs for valid terminal PtNodes.
|
||||||
TerminalPositionLookupTable::TerminalIdMap terminalIdMap;
|
TerminalPositionLookupTable::TerminalIdMap terminalIdMap;
|
||||||
if(!buffersToWrite->getUpdatableTerminalPositionLookupTable()->runGCTerminalIds(
|
if(!buffersToWrite->getUpdatableTerminalPositionLookupTable()->runGCTerminalIds(
|
||||||
&terminalIdMap)) {
|
&terminalIdMap)) {
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
TraversePolicyToUpdateAllTerminalIds traversePolicyToUpdateAllTerminalIds(&newPtNodeWriter,
|
|
||||||
&terminalIdMap);
|
|
||||||
if (!newDictReadingHelper.traverseAllPtNodesInPostorderDepthFirstManner(
|
|
||||||
&traversePolicyToUpdateAllTerminalIds)) {
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
// Run GC for probability dict content.
|
// Run GC for probability dict content.
|
||||||
if (!buffersToWrite->getUpdatableProbabilityDictContent()->runGC(&terminalIdMap,
|
if (!buffersToWrite->getUpdatableProbabilityDictContent()->runGC(&terminalIdMap,
|
||||||
mBuffers->getProbabilityDictContent())) {
|
mBuffers->getProbabilityDictContent())) {
|
||||||
|
@ -181,6 +164,22 @@ bool Ver4PatriciaTrieWritingHelper::runGC(const int rootPtNodeArrayPos,
|
||||||
mBuffers->getShortcutDictContent())) {
|
mBuffers->getShortcutDictContent())) {
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
DynamicPatriciaTrieReadingHelper newDictReadingHelper(buffersToWrite->getTrieBuffer(),
|
||||||
|
&newPtNodeReader);
|
||||||
|
newDictReadingHelper.initWithPtNodeArrayPos(rootPtNodeArrayPos);
|
||||||
|
DynamicPatriciaTrieGcEventListeners::TraversePolicyToUpdateAllPositionFields
|
||||||
|
traversePolicyToUpdateAllPositionFields(&newPtNodeWriter, &dictPositionRelocationMap);
|
||||||
|
if (!newDictReadingHelper.traverseAllPtNodesInPtNodeArrayLevelPreorderDepthFirstManner(
|
||||||
|
&traversePolicyToUpdateAllPositionFields)) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
newDictReadingHelper.initWithPtNodeArrayPos(rootPtNodeArrayPos);
|
||||||
|
TraversePolicyToUpdateAllTerminalIds traversePolicyToUpdateAllTerminalIds(&newPtNodeWriter,
|
||||||
|
&terminalIdMap);
|
||||||
|
if (!newDictReadingHelper.traverseAllPtNodesInPostorderDepthFirstManner(
|
||||||
|
&traversePolicyToUpdateAllTerminalIds)) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
*outUnigramCount = traversePolicyToUpdateAllPositionFields.getUnigramCount();
|
*outUnigramCount = traversePolicyToUpdateAllPositionFields.getUnigramCount();
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue