mirror of
https://github.com/unicode-org/icu.git
synced 2025-04-05 05:25:34 +00:00
ICU-22580 Address infinity loop in RBBI
ICU-22580 Fix tests
This commit is contained in:
parent
73f972f7ff
commit
4da7ffaa36
5 changed files with 69 additions and 1 deletions
|
@ -934,6 +934,9 @@ void RBBIRuleScanner::nextChar(RBBIRuleChar &c) {
|
|||
}
|
||||
}
|
||||
|
||||
if (c.fChar == (UChar32)-1) {
|
||||
return;
|
||||
}
|
||||
if (fQuoteMode) {
|
||||
c.fEscaped = true;
|
||||
}
|
||||
|
|
|
@ -881,6 +881,35 @@ void RBBIAPITest::TestBug2190() {
|
|||
delete bi;
|
||||
}
|
||||
|
||||
void RBBIAPITest::TestBug22580() {
|
||||
UParseError parseError;
|
||||
// Test single ' will not cause infinity loop
|
||||
{
|
||||
UnicodeString rulesString = u"'";
|
||||
UErrorCode status=U_ZERO_ERROR;
|
||||
RuleBasedBreakIterator(rulesString, parseError, status);
|
||||
}
|
||||
if (quick) {
|
||||
return;
|
||||
}
|
||||
// Test any 1 or 2 ASCII chars as rule will not cause infinity loop.
|
||||
// only in exhaust mode
|
||||
for (char16_t u1 = u' '; u1 <= u'~'; u1++) {
|
||||
{
|
||||
UnicodeString rule = u1;
|
||||
UErrorCode status=U_ZERO_ERROR;
|
||||
RuleBasedBreakIterator bi (rule, parseError, status);
|
||||
}
|
||||
for (char16_t u2 = u' '; u2 <= u'~'; u2++) {
|
||||
{
|
||||
UnicodeString rule;
|
||||
rule.append(u1).append(u2);
|
||||
UErrorCode status=U_ZERO_ERROR;
|
||||
RuleBasedBreakIterator bi (rule, parseError, status);
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
void RBBIAPITest::TestRegistration() {
|
||||
#if !UCONFIG_NO_SERVICE
|
||||
|
@ -1428,6 +1457,7 @@ void RBBIAPITest::runIndexedTest( int32_t index, UBool exec, const char* &name,
|
|||
TESTCASE_AUTO(TestQuoteGrouping);
|
||||
TESTCASE_AUTO(TestRuleStatusVec);
|
||||
TESTCASE_AUTO(TestBug2190);
|
||||
TESTCASE_AUTO(TestBug22580);
|
||||
#if !UCONFIG_NO_FILE_IO
|
||||
TESTCASE_AUTO(TestRegistration);
|
||||
TESTCASE_AUTO(TestBoilerPlate);
|
||||
|
|
|
@ -83,6 +83,7 @@ public:
|
|||
void TestRuleStatusVec();
|
||||
|
||||
void TestBug2190();
|
||||
void TestBug22580();
|
||||
|
||||
void TestBoilerPlate();
|
||||
|
||||
|
|
|
@ -770,7 +770,7 @@ class RBBIRuleScanner {
|
|||
// These are recognized in all contexts, whether in quoted text or not.
|
||||
//
|
||||
if (c.fChar == '\'') {
|
||||
if (UTF16.charAt(fRB.fRules, fNextIndex) == '\'') {
|
||||
if (fNextIndex < fRB.fRules.length() && UTF16.charAt(fRB.fRules, fNextIndex) == '\'') {
|
||||
c.fChar = nextCharLL(); // get nextChar officially so character counts
|
||||
c.fEscaped = true; // stay correct.
|
||||
} else {
|
||||
|
@ -787,6 +787,9 @@ class RBBIRuleScanner {
|
|||
return;
|
||||
}
|
||||
}
|
||||
if (c.fChar == -1) {
|
||||
return;
|
||||
}
|
||||
|
||||
if (fQuoteMode) {
|
||||
c.fEscaped = true;
|
||||
|
|
|
@ -485,4 +485,35 @@ public class RBBIAPITest extends CoreTestFmwk {
|
|||
bi.setText("Here is some Text");
|
||||
TestFmwk.assertEquals("Title instance break iterator not correctly instantiated", bi.first(), 0);
|
||||
}
|
||||
|
||||
@Test
|
||||
public void TestBug22580() {
|
||||
try {
|
||||
RuleBasedBreakIterator bi = new RuleBasedBreakIterator("'");
|
||||
} catch(IllegalArgumentException e) {
|
||||
// nothing.
|
||||
}
|
||||
boolean quick = TestFmwk.getExhaustiveness() <= 5;
|
||||
if (quick) {
|
||||
return;
|
||||
}
|
||||
// Test any 1 or 2 ASCII chars as rule will not cause infinity loop.
|
||||
// only in exhaust mode
|
||||
for (char u1 = ' '; u1 < '~'; u1++) {
|
||||
try {
|
||||
char array[] = {u1};
|
||||
RuleBasedBreakIterator bi = new RuleBasedBreakIterator(new String(array));
|
||||
} catch(IllegalArgumentException e) {
|
||||
// nothing.
|
||||
}
|
||||
for (char u2 = ' '; u2 < '~'; u2++) {
|
||||
try {
|
||||
char array[] = {u1, u2};
|
||||
RuleBasedBreakIterator bi = new RuleBasedBreakIterator(new String(array));
|
||||
} catch(IllegalArgumentException e) {
|
||||
// nothing.
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
|
Loading…
Add table
Reference in a new issue