ICU-4157 Word Break, fix problem with CR <combining> sequences

X-SVN-Rev: 17427
This commit is contained in:
Andy Heninger 2005-03-31 01:45:27 +00:00
parent 3fdcb27040
commit 2b714f2bce
2 changed files with 5 additions and 2 deletions

View File

@@ -52,7 +52,7 @@ $ExtendNumLetEx = $ExtendNumLet $Extend*;
# see character breaks.
$CR $LF;
-[^$Control] $Extend+;
+[^$Control $CR $LF] $Extend+;
$NumericEx $Extend* {100};
$ALetterEx $Extend* {200};
@@ -114,7 +114,7 @@ $LF $CR;
# see character breaks
-$Extend* [^$Control];
+$Extend* [^$Control $CR $LF];
# rule 5

View File

@@ -2139,6 +2139,8 @@ RBBIWordMonkey::RBBIWordMonkey() : fGCFMatcher(0),
fOtherSet->removeAll(*fMidNumSet);
fOtherSet->removeAll(*fNumericSet);
fOtherSet->removeAll(*fExtendNumLetSet);
fOtherSet->removeAll(*fFormatSet);
fOtherSet->removeAll(*fExtendSet);
fSets->addElement(fALetterSet, status);
fSets->addElement(fKatakanaSet, status);
@@ -2146,6 +2148,7 @@ RBBIWordMonkey::RBBIWordMonkey() : fGCFMatcher(0),
fSets->addElement(fMidNumSet, status);
fSets->addElement(fNumericSet, status);
fSets->addElement(fFormatSet, status);
fSets->addElement(fExtendSet, status);
fSets->addElement(fOtherSet, status);
fSets->addElement(fExtendNumLetSet, status);