ICU-22580 Address infinity loop in RBBI

ICU-22580 Fix tests
This commit is contained in:
Frank Tang 2023-12-08 12:41:52 -08:00 committed by Frank Yung-Fong Tang
parent 73f972f7ff
commit 4da7ffaa36
5 changed files with 69 additions and 1 deletions

View file

@ -934,6 +934,9 @@ void RBBIRuleScanner::nextChar(RBBIRuleChar &c) {
}
}
if (c.fChar == (UChar32)-1) {
return;
}
if (fQuoteMode) {
c.fEscaped = true;
}

View file

@ -881,6 +881,35 @@ void RBBIAPITest::TestBug2190() {
delete bi;
}
void RBBIAPITest::TestBug22580() {
UParseError parseError;
// Test single ' will not cause infinity loop
{
UnicodeString rulesString = u"'";
UErrorCode status=U_ZERO_ERROR;
RuleBasedBreakIterator(rulesString, parseError, status);
}
if (quick) {
return;
}
// Test any 1 or 2 ASCII chars as rule will not cause infinity loop.
// only in exhaust mode
for (char16_t u1 = u' '; u1 <= u'~'; u1++) {
{
UnicodeString rule = u1;
UErrorCode status=U_ZERO_ERROR;
RuleBasedBreakIterator bi (rule, parseError, status);
}
for (char16_t u2 = u' '; u2 <= u'~'; u2++) {
{
UnicodeString rule;
rule.append(u1).append(u2);
UErrorCode status=U_ZERO_ERROR;
RuleBasedBreakIterator bi (rule, parseError, status);
}
}
}
}
void RBBIAPITest::TestRegistration() {
#if !UCONFIG_NO_SERVICE
@ -1428,6 +1457,7 @@ void RBBIAPITest::runIndexedTest( int32_t index, UBool exec, const char* &name,
TESTCASE_AUTO(TestQuoteGrouping);
TESTCASE_AUTO(TestRuleStatusVec);
TESTCASE_AUTO(TestBug2190);
TESTCASE_AUTO(TestBug22580);
#if !UCONFIG_NO_FILE_IO
TESTCASE_AUTO(TestRegistration);
TESTCASE_AUTO(TestBoilerPlate);

View file

@ -83,6 +83,7 @@ public:
void TestRuleStatusVec();
void TestBug2190();
void TestBug22580();
void TestBoilerPlate();

View file

@ -770,7 +770,7 @@ class RBBIRuleScanner {
// These are recognized in all contexts, whether in quoted text or not.
//
if (c.fChar == '\'') {
if (UTF16.charAt(fRB.fRules, fNextIndex) == '\'') {
if (fNextIndex < fRB.fRules.length() && UTF16.charAt(fRB.fRules, fNextIndex) == '\'') {
c.fChar = nextCharLL(); // get nextChar officially so character counts
c.fEscaped = true; // stay correct.
} else {
@ -787,6 +787,9 @@ class RBBIRuleScanner {
return;
}
}
if (c.fChar == -1) {
return;
}
if (fQuoteMode) {
c.fEscaped = true;

View file

@ -485,4 +485,35 @@ public class RBBIAPITest extends CoreTestFmwk {
bi.setText("Here is some Text");
TestFmwk.assertEquals("Title instance break iterator not correctly instantiated", bi.first(), 0);
}
@Test
public void TestBug22580() {
try {
RuleBasedBreakIterator bi = new RuleBasedBreakIterator("'");
} catch(IllegalArgumentException e) {
// nothing.
}
boolean quick = TestFmwk.getExhaustiveness() <= 5;
if (quick) {
return;
}
// Test any 1 or 2 ASCII chars as rule will not cause infinity loop.
// only in exhaust mode
for (char u1 = ' '; u1 < '~'; u1++) {
try {
char array[] = {u1};
RuleBasedBreakIterator bi = new RuleBasedBreakIterator(new String(array));
} catch(IllegalArgumentException e) {
// nothing.
}
for (char u2 = ' '; u2 < '~'; u2++) {
try {
char array[] = {u1, u2};
RuleBasedBreakIterator bi = new RuleBasedBreakIterator(new String(array));
} catch(IllegalArgumentException e) {
// nothing.
}
}
}
}
}