* commit 'eb501f26c1615b4e0572767f85faa3ec0636a21b': Fix a bug with surrogate characters
This commit is contained in:
commit
23af2a47bd
1 changed files with 4 additions and 3 deletions
|
@ -556,6 +556,7 @@ public class FusionDictionary implements Iterable<Word> {
|
|||
final StringBuilder checker = DBG ? new StringBuilder() : null;
|
||||
|
||||
CharGroup currentGroup;
|
||||
final int codePointCountInS = s.codePointCount(0, s.length());
|
||||
do {
|
||||
int indexOfGroup = findIndexOfChar(node, s.codePointAt(index));
|
||||
if (CHARACTER_NOT_FOUND == indexOfGroup) return null;
|
||||
|
@ -570,12 +571,12 @@ public class FusionDictionary implements Iterable<Word> {
|
|||
index = newIndex;
|
||||
|
||||
if (DBG) checker.append(new String(currentGroup.mChars, 0, currentGroup.mChars.length));
|
||||
if (index < s.length()) {
|
||||
if (index < codePointCountInS) {
|
||||
node = currentGroup.mChildren;
|
||||
}
|
||||
} while (null != node && index < s.length());
|
||||
} while (null != node && index < codePointCountInS);
|
||||
|
||||
if (index < s.length()) return null;
|
||||
if (index < codePointCountInS) return null;
|
||||
if (!currentGroup.isTerminal()) return null;
|
||||
if (DBG && !s.equals(checker.toString())) return null;
|
||||
return currentGroup;
|
||||
|
|
Loading…
Reference in a new issue