Home | History | Annotate | Download | only in intltest
      1 /********************************************************************
      2  * Copyright (c) 1999-2012, International Business Machines
      3  * Corporation and others. All Rights Reserved.
      4  ********************************************************************
      5  *   Date        Name        Description
      6  *   12/14/99    Madhu        Creation.
      7  *   01/12/2000  Madhu        updated for changed API
      8  ********************************************************************/
      9 
     10 #include "unicode/utypes.h"
     11 
     12 #if !UCONFIG_NO_BREAK_ITERATION
     13 
     14 #include "unicode/uchar.h"
     15 #include "intltest.h"
     16 #include "unicode/rbbi.h"
     17 #include "unicode/schriter.h"
     18 #include "rbbiapts.h"
     19 #include "rbbidata.h"
     20 #include "cstring.h"
     21 #include "ubrkimpl.h"
     22 #include "unicode/locid.h"
     23 #include "unicode/ustring.h"
     24 #include "unicode/utext.h"
     25 #include "cmemory.h"
     26 
     27 /**
     28  * API Test the RuleBasedBreakIterator class
     29  */
     30 
     31 
     32 #define TEST_ASSERT_SUCCESS(status) {if (U_FAILURE(status)) {\
     33 dataerrln("Failure at file %s, line %d, error = %s", __FILE__, __LINE__, u_errorName(status));}}
     34 
     35 #define TEST_ASSERT(expr) {if ((expr) == FALSE) { \
     36     errln("Test Failure at file %s, line %d: \"%s\" is false.\n", __FILE__, __LINE__, #expr);};}
     37 
     38 void RBBIAPITest::TestCloneEquals()
     39 {
     40 
     41     UErrorCode status=U_ZERO_ERROR;
     42     RuleBasedBreakIterator* bi1     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
     43     RuleBasedBreakIterator* biequal = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
     44     RuleBasedBreakIterator* bi3     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
     45     RuleBasedBreakIterator* bi2     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createWordInstance(Locale::getDefault(), status);
     46     if(U_FAILURE(status)){
     47         errcheckln(status, "Fail : in construction - %s", u_errorName(status));
     48         return;
     49     }
     50 
     51 
     52     UnicodeString testString="Testing word break iterators's clone() and equals()";
     53     bi1->setText(testString);
     54     bi2->setText(testString);
     55     biequal->setText(testString);
     56 
     57     bi3->setText("hello");
     58 
     59     logln((UnicodeString)"Testing equals()");
     60 
     61     logln((UnicodeString)"Testing == and !=");
     62     UBool b = (*bi1 != *biequal);
     63     b |= *bi1 == *bi2;
     64     b |= *bi1 == *bi3;
     65     if (b) {
     66         errln((UnicodeString)"ERROR:1 RBBI's == and != operator failed.");
     67     }
     68 
     69     if(*bi2 == *biequal || *bi2 == *bi1  || *biequal == *bi3)
     70         errln((UnicodeString)"ERROR:2 RBBI's == and != operator  failed.");
     71 
     72 
     73     // Quick test of RulesBasedBreakIterator assignment -
     74     // Check that
     75     //    two different iterators are !=
     76     //    they are == after assignment
     77     //    source and dest iterator produce the same next() after assignment.
     78     //    deleting one doesn't disable the other.
     79     logln("Testing assignment");
     80     RuleBasedBreakIterator *bix = (RuleBasedBreakIterator *)BreakIterator::createLineInstance(Locale::getDefault(), status);
     81     if(U_FAILURE(status)){
     82         errcheckln(status, "Fail : in construction - %s", u_errorName(status));
     83         return;
     84     }
     85 
     86     RuleBasedBreakIterator biDefault, biDefault2;
     87     if(U_FAILURE(status)){
     88         errln((UnicodeString)"FAIL : in construction of default iterator");
     89         return;
     90     }
     91     if (biDefault == *bix) {
     92         errln((UnicodeString)"ERROR: iterators should not compare ==");
     93         return;
     94     }
     95     if (biDefault != biDefault2) {
     96         errln((UnicodeString)"ERROR: iterators should compare ==");
     97         return;
     98     }
     99 
    100 
    101     UnicodeString   HelloString("Hello Kitty");
    102     bix->setText(HelloString);
    103     if (*bix == *bi2) {
    104         errln(UnicodeString("ERROR: strings should not be equal before assignment."));
    105     }
    106     *bix = *bi2;
    107     if (*bix != *bi2) {
    108         errln(UnicodeString("ERROR: strings should be equal before assignment."));
    109     }
    110 
    111     int bixnext = bix->next();
    112     int bi2next = bi2->next();
    113     if (! (bixnext == bi2next && bixnext == 7)) {
    114         errln(UnicodeString("ERROR: iterators behaved differently after assignment."));
    115     }
    116     delete bix;
    117     if (bi2->next() != 8) {
    118         errln(UnicodeString("ERROR: iterator.next() failed after deleting copy."));
    119     }
    120 
    121 
    122 
    123     logln((UnicodeString)"Testing clone()");
    124     RuleBasedBreakIterator* bi1clone=(RuleBasedBreakIterator*)bi1->clone();
    125     RuleBasedBreakIterator* bi2clone=(RuleBasedBreakIterator*)bi2->clone();
    126 
    127     if(*bi1clone != *bi1 || *bi1clone  != *biequal  ||
    128       *bi1clone == *bi3 || *bi1clone == *bi2)
    129         errln((UnicodeString)"ERROR:1 RBBI's clone() method failed");
    130 
    131     if(*bi2clone == *bi1 || *bi2clone == *biequal ||
    132        *bi2clone == *bi3 || *bi2clone != *bi2)
    133         errln((UnicodeString)"ERROR:2 RBBI's clone() method failed");
    134 
    135     if(bi1->getText() != bi1clone->getText()   ||
    136        bi2clone->getText() != bi2->getText()   ||
    137        *bi2clone == *bi1clone )
    138         errln((UnicodeString)"ERROR: RBBI's clone() method failed");
    139 
    140     delete bi1clone;
    141     delete bi2clone;
    142     delete bi1;
    143     delete bi3;
    144     delete bi2;
    145     delete biequal;
    146 }
    147 
    148 void RBBIAPITest::TestBoilerPlate()
    149 {
    150     UErrorCode status = U_ZERO_ERROR;
    151     BreakIterator* a = BreakIterator::createWordInstance(Locale("hi"), status);
    152     BreakIterator* b = BreakIterator::createWordInstance(Locale("hi_IN"),status);
    153     if (U_FAILURE(status)) {
    154         errcheckln(status, "Creation of break iterator failed %s", u_errorName(status));
    155         return;
    156     }
    157     if(*a!=*b){
    158         errln("Failed: boilerplate method operator!= does not return correct results");
    159     }
    160     // Japanese word break iterators are identical to root with
    161     // a dictionary-based break iterator
    162     BreakIterator* c = BreakIterator::createCharacterInstance(Locale("ja"),status);
    163     BreakIterator* d = BreakIterator::createCharacterInstance(Locale("root"),status);
    164     if(c && d){
    165         if(*c!=*d){
    166             errln("Failed: boilerplate method operator== does not return correct results");
    167         }
    168     }else{
    169         errln("creation of break iterator failed");
    170     }
    171     delete a;
    172     delete b;
    173     delete c;
    174     delete d;
    175 }
    176 
    177 void RBBIAPITest::TestgetRules()
    178 {
    179     UErrorCode status=U_ZERO_ERROR;
    180 
    181     RuleBasedBreakIterator* bi1=(RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
    182     RuleBasedBreakIterator* bi2=(RuleBasedBreakIterator*)RuleBasedBreakIterator::createWordInstance(Locale::getDefault(), status);
    183     if(U_FAILURE(status)){
    184         errcheckln(status, "FAIL: in construction - %s", u_errorName(status));
    185         delete bi1;
    186         delete bi2;
    187         return;
    188     }
    189 
    190 
    191 
    192     logln((UnicodeString)"Testing toString()");
    193 
    194     bi1->setText((UnicodeString)"Hello there");
    195 
    196     RuleBasedBreakIterator* bi3 =(RuleBasedBreakIterator*)bi1->clone();
    197 
    198     UnicodeString temp=bi1->getRules();
    199     UnicodeString temp2=bi2->getRules();
    200     UnicodeString temp3=bi3->getRules();
    201     if( temp2.compare(temp3) ==0 || temp.compare(temp2) == 0 || temp.compare(temp3) != 0)
    202         errln((UnicodeString)"ERROR: error in getRules() method");
    203 
    204     delete bi1;
    205     delete bi2;
    206     delete bi3;
    207 }
    208 void RBBIAPITest::TestHashCode()
    209 {
    210     UErrorCode status=U_ZERO_ERROR;
    211     RuleBasedBreakIterator* bi1     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
    212     RuleBasedBreakIterator* bi3     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
    213     RuleBasedBreakIterator* bi2     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createWordInstance(Locale::getDefault(), status);
    214     if(U_FAILURE(status)){
    215         errcheckln(status, "Fail : in construction - %s", u_errorName(status));
    216         delete bi1;
    217         delete bi2;
    218         delete bi3;
    219         return;
    220     }
    221 
    222 
    223     logln((UnicodeString)"Testing hashCode()");
    224 
    225     bi1->setText((UnicodeString)"Hash code");
    226     bi2->setText((UnicodeString)"Hash code");
    227     bi3->setText((UnicodeString)"Hash code");
    228 
    229     RuleBasedBreakIterator* bi1clone= (RuleBasedBreakIterator*)bi1->clone();
    230     RuleBasedBreakIterator* bi2clone= (RuleBasedBreakIterator*)bi2->clone();
    231 
    232     if(bi1->hashCode() != bi1clone->hashCode() ||  bi1->hashCode() != bi3->hashCode() ||
    233         bi1clone->hashCode() != bi3->hashCode() || bi2->hashCode() != bi2clone->hashCode())
    234         errln((UnicodeString)"ERROR: identical objects have different hashcodes");
    235 
    236     if(bi1->hashCode() == bi2->hashCode() ||  bi2->hashCode() == bi3->hashCode() ||
    237         bi1clone->hashCode() == bi2clone->hashCode() || bi1clone->hashCode() == bi2->hashCode())
    238         errln((UnicodeString)"ERROR: different objects have same hashcodes");
    239 
    240     delete bi1clone;
    241     delete bi2clone;
    242     delete bi1;
    243     delete bi2;
    244     delete bi3;
    245 
    246 }
    247 void RBBIAPITest::TestGetSetAdoptText()
    248 {
    249     logln((UnicodeString)"Testing getText setText ");
    250     IcuTestErrorCode status(*this, "TestGetSetAdoptText");
    251     UnicodeString str1="first string.";
    252     UnicodeString str2="Second string.";
    253     LocalPointer<RuleBasedBreakIterator> charIter1((RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status));
    254     LocalPointer<RuleBasedBreakIterator> wordIter1((RuleBasedBreakIterator*)RuleBasedBreakIterator::createWordInstance(Locale::getDefault(), status));
    255     if(status.isFailure()){
    256         errcheckln(status, "Fail : in construction - %s", status.errorName());
    257             return;
    258     }
    259 
    260 
    261     CharacterIterator* text1= new StringCharacterIterator(str1);
    262     CharacterIterator* text1Clone = text1->clone();
    263     CharacterIterator* text2= new StringCharacterIterator(str2);
    264     CharacterIterator* text3= new StringCharacterIterator(str2, 3, 10, 3); //  "ond str"
    265 
    266     wordIter1->setText(str1);
    267     CharacterIterator *tci = &wordIter1->getText();
    268     UnicodeString      tstr;
    269     tci->getText(tstr);
    270     TEST_ASSERT(tstr == str1);
    271     if(wordIter1->current() != 0)
    272         errln((UnicodeString)"ERROR:1 setText did not set the iteration position to the beginning of the text, it is" + wordIter1->current() + (UnicodeString)"\n");
    273 
    274     wordIter1->next(2);
    275 
    276     wordIter1->setText(str2);
    277     if(wordIter1->current() != 0)
    278         errln((UnicodeString)"ERROR:2 setText did not reset the iteration position to the beginning of the text, it is" + wordIter1->current() + (UnicodeString)"\n");
    279 
    280 
    281     charIter1->adoptText(text1Clone);
    282     TEST_ASSERT(wordIter1->getText() != charIter1->getText());
    283     tci = &wordIter1->getText();
    284     tci->getText(tstr);
    285     TEST_ASSERT(tstr == str2);
    286     tci = &charIter1->getText();
    287     tci->getText(tstr);
    288     TEST_ASSERT(tstr == str1);
    289 
    290 
    291     LocalPointer<RuleBasedBreakIterator> rb((RuleBasedBreakIterator*)wordIter1->clone());
    292     rb->adoptText(text1);
    293     if(rb->getText() != *text1)
    294         errln((UnicodeString)"ERROR:1 error in adoptText ");
    295     rb->adoptText(text2);
    296     if(rb->getText() != *text2)
    297         errln((UnicodeString)"ERROR:2 error in adoptText ");
    298 
    299     // Adopt where iterator range is less than the entire orignal source string.
    300     //   (With the change of the break engine to working with UText internally,
    301     //    CharacterIterators starting at positions other than zero are not supported)
    302     rb->adoptText(text3);
    303     TEST_ASSERT(rb->preceding(2) == 0);
    304     TEST_ASSERT(rb->following(11) == BreakIterator::DONE);
    305     //if(rb->preceding(2) != 3) {
    306     //    errln((UnicodeString)"ERROR:3 error in adoptText ");
    307     //}
    308     //if(rb->following(11) != BreakIterator::DONE) {
    309     //    errln((UnicodeString)"ERROR:4 error in adoptText ");
    310     //}
    311 
    312     // UText API
    313     //
    314     //   Quick test to see if UText is working at all.
    315     //
    316     const char *s1 = "\x68\x65\x6C\x6C\x6F\x20\x77\x6F\x72\x6C\x64"; /* "hello world" in UTF-8 */
    317     const char *s2 = "\x73\x65\x65\x20\x79\x61"; /* "see ya" in UTF-8 */
    318     //                012345678901
    319 
    320     status.reset();
    321     LocalUTextPointer ut(utext_openUTF8(NULL, s1, -1, status));
    322     wordIter1->setText(ut.getAlias(), status);
    323     TEST_ASSERT_SUCCESS(status);
    324 
    325     int32_t pos;
    326     pos = wordIter1->first();
    327     TEST_ASSERT(pos==0);
    328     pos = wordIter1->next();
    329     TEST_ASSERT(pos==5);
    330     pos = wordIter1->next();
    331     TEST_ASSERT(pos==6);
    332     pos = wordIter1->next();
    333     TEST_ASSERT(pos==11);
    334     pos = wordIter1->next();
    335     TEST_ASSERT(pos==UBRK_DONE);
    336 
    337     status.reset();
    338     LocalUTextPointer ut2(utext_openUTF8(NULL, s2, -1, status));
    339     TEST_ASSERT_SUCCESS(status);
    340     wordIter1->setText(ut2.getAlias(), status);
    341     TEST_ASSERT_SUCCESS(status);
    342 
    343     pos = wordIter1->first();
    344     TEST_ASSERT(pos==0);
    345     pos = wordIter1->next();
    346     TEST_ASSERT(pos==3);
    347     pos = wordIter1->next();
    348     TEST_ASSERT(pos==4);
    349 
    350     pos = wordIter1->last();
    351     TEST_ASSERT(pos==6);
    352     pos = wordIter1->previous();
    353     TEST_ASSERT(pos==4);
    354     pos = wordIter1->previous();
    355     TEST_ASSERT(pos==3);
    356     pos = wordIter1->previous();
    357     TEST_ASSERT(pos==0);
    358     pos = wordIter1->previous();
    359     TEST_ASSERT(pos==UBRK_DONE);
    360 
    361     status.reset();
    362     UnicodeString sEmpty;
    363     LocalUTextPointer gut2(utext_openUnicodeString(NULL, &sEmpty, status));
    364     wordIter1->getUText(gut2.getAlias(), status);
    365     TEST_ASSERT_SUCCESS(status);
    366     status.reset();
    367 }
    368 
    369 
    370 void RBBIAPITest::TestIteration()
    371 {
    372     // This test just verifies that the API is present.
    373     // Testing for correct operation of the break rules happens elsewhere.
    374 
    375     UErrorCode status=U_ZERO_ERROR;
    376     RuleBasedBreakIterator* bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
    377     if (U_FAILURE(status) || bi == NULL)  {
    378         errcheckln(status, "Failure creating character break iterator.  Status = %s", u_errorName(status));
    379     }
    380     delete bi;
    381 
    382     status=U_ZERO_ERROR;
    383     bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createWordInstance(Locale::getDefault(), status);
    384     if (U_FAILURE(status) || bi == NULL)  {
    385         errcheckln(status, "Failure creating Word break iterator.  Status = %s", u_errorName(status));
    386     }
    387     delete bi;
    388 
    389     status=U_ZERO_ERROR;
    390     bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createLineInstance(Locale::getDefault(), status);
    391     if (U_FAILURE(status) || bi == NULL)  {
    392         errcheckln(status, "Failure creating Line break iterator.  Status = %s", u_errorName(status));
    393     }
    394     delete bi;
    395 
    396     status=U_ZERO_ERROR;
    397     bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createSentenceInstance(Locale::getDefault(), status);
    398     if (U_FAILURE(status) || bi == NULL)  {
    399         errcheckln(status, "Failure creating Sentence break iterator.  Status = %s", u_errorName(status));
    400     }
    401     delete bi;
    402 
    403     status=U_ZERO_ERROR;
    404     bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createTitleInstance(Locale::getDefault(), status);
    405     if (U_FAILURE(status) || bi == NULL)  {
    406         errcheckln(status, "Failure creating Title break iterator.  Status = %s", u_errorName(status));
    407     }
    408     delete bi;
    409 
    410     status=U_ZERO_ERROR;
    411     bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
    412     if (U_FAILURE(status) || bi == NULL)  {
    413         errcheckln(status, "Failure creating character break iterator.  Status = %s", u_errorName(status));
    414         return;   // Skip the rest of these tests.
    415     }
    416 
    417 
    418     UnicodeString testString="0123456789";
    419     bi->setText(testString);
    420 
    421     int32_t i;
    422     i = bi->first();
    423     if (i != 0) {
    424         errln("Incorrect value from bi->first().  Expected 0, got %d.", i);
    425     }
    426 
    427     i = bi->last();
    428     if (i != 10) {
    429         errln("Incorrect value from bi->last().  Expected 10, got %d", i);
    430     }
    431 
    432     //
    433     // Previous
    434     //
    435     bi->last();
    436     i = bi->previous();
    437     if (i != 9) {
    438         errln("Incorrect value from bi->last() at line %d.  Expected 9, got %d", __LINE__, i);
    439     }
    440 
    441 
    442     bi->first();
    443     i = bi->previous();
    444     if (i != BreakIterator::DONE) {
    445         errln("Incorrect value from bi->previous() at line %d.  Expected DONE, got %d", __LINE__, i);
    446     }
    447 
    448     //
    449     // next()
    450     //
    451     bi->first();
    452     i = bi->next();
    453     if (i != 1) {
    454         errln("Incorrect value from bi->next() at line %d.  Expected 1, got %d", __LINE__, i);
    455     }
    456 
    457     bi->last();
    458     i = bi->next();
    459     if (i != BreakIterator::DONE) {
    460         errln("Incorrect value from bi->next() at line %d.  Expected DONE, got %d", __LINE__, i);
    461     }
    462 
    463 
    464     //
    465     //  current()
    466     //
    467     bi->first();
    468     i = bi->current();
    469     if (i != 0) {
    470         errln("Incorrect value from bi->previous() at line %d.  Expected 0, got %d", __LINE__, i);
    471     }
    472 
    473     bi->next();
    474     i = bi->current();
    475     if (i != 1) {
    476         errln("Incorrect value from bi->previous() at line %d.  Expected 1, got %d", __LINE__, i);
    477     }
    478 
    479     bi->last();
    480     bi->next();
    481     i = bi->current();
    482     if (i != 10) {
    483         errln("Incorrect value from bi->previous() at line %d.  Expected 10, got %d", __LINE__, i);
    484     }
    485 
    486     bi->first();
    487     bi->previous();
    488     i = bi->current();
    489     if (i != 0) {
    490         errln("Incorrect value from bi->previous() at line %d.  Expected 0, got %d", __LINE__, i);
    491     }
    492 
    493 
    494     //
    495     // Following()
    496     //
    497     i = bi->following(4);
    498     if (i != 5) {
    499         errln("Incorrect value from bi->following() at line %d.  Expected 5, got %d", __LINE__, i);
    500     }
    501 
    502     i = bi->following(9);
    503     if (i != 10) {
    504         errln("Incorrect value from bi->following() at line %d.  Expected 10, got %d", __LINE__, i);
    505     }
    506 
    507     i = bi->following(10);
    508     if (i != BreakIterator::DONE) {
    509         errln("Incorrect value from bi->following() at line %d.  Expected DONE, got %d", __LINE__, i);
    510     }
    511 
    512 
    513     //
    514     // Preceding
    515     //
    516     i = bi->preceding(4);
    517     if (i != 3) {
    518         errln("Incorrect value from bi->preceding() at line %d.  Expected 3, got %d", __LINE__, i);
    519     }
    520 
    521     i = bi->preceding(10);
    522     if (i != 9) {
    523         errln("Incorrect value from bi->preceding() at line %d.  Expected 9, got %d", __LINE__, i);
    524     }
    525 
    526     i = bi->preceding(1);
    527     if (i != 0) {
    528         errln("Incorrect value from bi->preceding() at line %d.  Expected 0, got %d", __LINE__, i);
    529     }
    530 
    531     i = bi->preceding(0);
    532     if (i != BreakIterator::DONE) {
    533         errln("Incorrect value from bi->preceding() at line %d.  Expected DONE, got %d", __LINE__, i);
    534     }
    535 
    536 
    537     //
    538     // isBoundary()
    539     //
    540     bi->first();
    541     if (bi->isBoundary(3) != TRUE) {
    542         errln("Incorrect value from bi->isBoudary() at line %d.  Expected TRUE, got FALSE", __LINE__, i);
    543     }
    544     i = bi->current();
    545     if (i != 3) {
    546         errln("Incorrect value from bi->current() at line %d.  Expected 3, got %d", __LINE__, i);
    547     }
    548 
    549 
    550     if (bi->isBoundary(11) != FALSE) {
    551         errln("Incorrect value from bi->isBoudary() at line %d.  Expected FALSE, got TRUE", __LINE__, i);
    552     }
    553     i = bi->current();
    554     if (i != 10) {
    555         errln("Incorrect value from bi->current() at line %d.  Expected 10, got %d", __LINE__, i);
    556     }
    557 
    558     //
    559     // next(n)
    560     //
    561     bi->first();
    562     i = bi->next(4);
    563     if (i != 4) {
    564         errln("Incorrect value from bi->next() at line %d.  Expected 4, got %d", __LINE__, i);
    565     }
    566 
    567     i = bi->next(6);
    568     if (i != 10) {
    569         errln("Incorrect value from bi->next() at line %d.  Expected 10, got %d", __LINE__, i);
    570     }
    571 
    572     bi->first();
    573     i = bi->next(11);
    574     if (i != BreakIterator::DONE) {
    575         errln("Incorrect value from bi->next() at line %d.  Expected BreakIterator::DONE, got %d", __LINE__, i);
    576     }
    577 
    578     delete bi;
    579 
    580 }
    581 
    582 
    583 
    584 
    585 
    586 
    587 void RBBIAPITest::TestBuilder() {
    588      UnicodeString rulesString1 = "$Letters = [:L:];\n"
    589                                   "$Numbers = [:N:];\n"
    590                                   "$Letters+;\n"
    591                                   "$Numbers+;\n"
    592                                   "[^$Letters $Numbers];\n"
    593                                   "!.*;\n";
    594      UnicodeString testString1  = "abc123..abc";
    595                                 // 01234567890
    596      int32_t bounds1[] = {0, 3, 6, 7, 8, 11};
    597      UErrorCode status=U_ZERO_ERROR;
    598      UParseError    parseError;
    599 
    600      RuleBasedBreakIterator *bi = new RuleBasedBreakIterator(rulesString1, parseError, status);
    601      if(U_FAILURE(status)) {
    602          dataerrln("Fail : in construction - %s", u_errorName(status));
    603      } else {
    604          bi->setText(testString1);
    605          doBoundaryTest(*bi, testString1, bounds1);
    606      }
    607      delete bi;
    608 }
    609 
    610 
    611 //
    612 //  TestQuoteGrouping
    613 //       Single quotes within rules imply a grouping, so that a modifier
    614 //       following the quoted text (* or +) applies to all of the quoted chars.
    615 //
    616 void RBBIAPITest::TestQuoteGrouping() {
    617      UnicodeString rulesString1 = "#Here comes the rule...\n"
    618                                   "'$@!'*;\n"   //  (\$\@\!)*
    619                                   ".;\n";
    620 
    621      UnicodeString testString1  = "$@!$@!X$@!!X";
    622                                 // 0123456789012
    623      int32_t bounds1[] = {0, 6, 7, 10, 11, 12};
    624      UErrorCode status=U_ZERO_ERROR;
    625      UParseError    parseError;
    626 
    627      RuleBasedBreakIterator *bi = new RuleBasedBreakIterator(rulesString1, parseError, status);
    628      if(U_FAILURE(status)) {
    629          dataerrln("Fail : in construction - %s", u_errorName(status));
    630      } else {
    631          bi->setText(testString1);
    632          doBoundaryTest(*bi, testString1, bounds1);
    633      }
    634      delete bi;
    635 }
    636 
    637 //
    638 //  TestRuleStatus
    639 //      Test word break rule status constants.
    640 //
    641 void RBBIAPITest::TestRuleStatus() {
    642      UChar str[30];
    643      //no longer test Han or hiragana breaking here: ruleStatusVec would return nothing
    644      // changed UBRK_WORD_KANA to UBRK_WORD_IDEO
    645      u_unescape("plain word 123.45 \\u30a1\\u30a2 ",
    646               // 012345678901234567  8      9    0
    647               //                     Katakana
    648                 str, 30);
    649      UnicodeString testString1(str);
    650      int32_t bounds1[] = {0, 5, 6, 10, 11, 17, 18, 20, 21};
    651      int32_t tag_lo[]  = {UBRK_WORD_NONE,     UBRK_WORD_LETTER, UBRK_WORD_NONE,    UBRK_WORD_LETTER,
    652                           UBRK_WORD_NONE,     UBRK_WORD_NUMBER, UBRK_WORD_NONE,
    653                           UBRK_WORD_IDEO,     UBRK_WORD_NONE};
    654 
    655      int32_t tag_hi[]  = {UBRK_WORD_NONE_LIMIT, UBRK_WORD_LETTER_LIMIT, UBRK_WORD_NONE_LIMIT, UBRK_WORD_LETTER_LIMIT,
    656                           UBRK_WORD_NONE_LIMIT, UBRK_WORD_NUMBER_LIMIT, UBRK_WORD_NONE_LIMIT,
    657                           UBRK_WORD_IDEO_LIMIT, UBRK_WORD_NONE_LIMIT};
    658 
    659      UErrorCode status=U_ZERO_ERROR;
    660 
    661      RuleBasedBreakIterator *bi = (RuleBasedBreakIterator *)BreakIterator::createWordInstance(Locale::getEnglish(), status);
    662      if(U_FAILURE(status)) {
    663          errcheckln(status, "Fail : in construction - %s", u_errorName(status));
    664      } else {
    665          bi->setText(testString1);
    666          // First test that the breaks are in the right spots.
    667          doBoundaryTest(*bi, testString1, bounds1);
    668 
    669          // Then go back and check tag values
    670          int32_t i = 0;
    671          int32_t pos, tag;
    672          for (pos = bi->first(); pos != BreakIterator::DONE; pos = bi->next(), i++) {
    673              if (pos != bounds1[i]) {
    674                  errln("FAIL: unexpected word break at postion %d", pos);
    675                  break;
    676              }
    677              tag = bi->getRuleStatus();
    678              if (tag < tag_lo[i] || tag >= tag_hi[i]) {
    679                  errln("FAIL: incorrect tag value %d at position %d", tag, pos);
    680                  break;
    681              }
    682 
    683              // Check that we get the same tag values from getRuleStatusVec()
    684              int32_t vec[10];
    685              int t = bi->getRuleStatusVec(vec, 10, status);
    686              TEST_ASSERT_SUCCESS(status);
    687              TEST_ASSERT(t==1);
    688              TEST_ASSERT(vec[0] == tag);
    689          }
    690      }
    691      delete bi;
    692 
    693      // Now test line break status.  This test mostly is to confirm that the status constants
    694      //                              are correctly declared in the header.
    695      testString1 =   "test line. \n";
    696      // break type    s    s     h
    697 
    698      bi = (RuleBasedBreakIterator *)
    699          BreakIterator::createLineInstance(Locale::getEnglish(), status);
    700      if(U_FAILURE(status)) {
    701          errcheckln(status, "failed to create word break iterator. - %s", u_errorName(status));
    702      } else {
    703          int32_t i = 0;
    704          int32_t pos, tag;
    705          UBool   success;
    706 
    707          bi->setText(testString1);
    708          pos = bi->current();
    709          tag = bi->getRuleStatus();
    710          for (i=0; i<3; i++) {
    711              switch (i) {
    712              case 0:
    713                  success = pos==0  && tag==UBRK_LINE_SOFT; break;
    714              case 1:
    715                  success = pos==5  && tag==UBRK_LINE_SOFT; break;
    716              case 2:
    717                  success = pos==12 && tag==UBRK_LINE_HARD; break;
    718              default:
    719                  success = FALSE; break;
    720              }
    721              if (success == FALSE) {
    722                  errln("Fail: incorrect word break status or position.  i=%d, pos=%d, tag=%d",
    723                      i, pos, tag);
    724                  break;
    725              }
    726              pos = bi->next();
    727              tag = bi->getRuleStatus();
    728          }
    729          if (UBRK_LINE_SOFT >= UBRK_LINE_SOFT_LIMIT ||
    730              UBRK_LINE_HARD >= UBRK_LINE_HARD_LIMIT ||
    731              (UBRK_LINE_HARD > UBRK_LINE_SOFT && UBRK_LINE_HARD < UBRK_LINE_SOFT_LIMIT)) {
    732              errln("UBRK_LINE_* constants from header are inconsistent.");
    733          }
    734      }
    735      delete bi;
    736 
    737 }
    738 
    739 
    740 //
    741 //  TestRuleStatusVec
    742 //      Test the vector form of  break rule status.
    743 //
    744 void RBBIAPITest::TestRuleStatusVec() {
    745     UnicodeString rulesString(   "[A-N]{100}; \n"
    746                                  "[a-w]{200}; \n"
    747                                  "[\\p{L}]{300}; \n"
    748                                  "[\\p{N}]{400}; \n"
    749                                  "[0-5]{500}; \n"
    750                                   "!.*;\n", -1, US_INV);
    751      UnicodeString testString1  = "Aapz5?";
    752      int32_t  statusVals[10];
    753      int32_t  numStatuses;
    754      int32_t  pos;
    755 
    756      UErrorCode status=U_ZERO_ERROR;
    757      UParseError    parseError;
    758 
    759      RuleBasedBreakIterator *bi = new RuleBasedBreakIterator(rulesString, parseError, status);
    760      if (U_FAILURE(status)) {
    761          dataerrln("Failure at file %s, line %d, error = %s", __FILE__, __LINE__, u_errorName(status));
    762      } else {
    763          bi->setText(testString1);
    764 
    765          // A
    766          pos = bi->next();
    767          TEST_ASSERT(pos==1);
    768          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
    769          TEST_ASSERT_SUCCESS(status);
    770          TEST_ASSERT(numStatuses == 2);
    771          TEST_ASSERT(statusVals[0] == 100);
    772          TEST_ASSERT(statusVals[1] == 300);
    773 
    774          // a
    775          pos = bi->next();
    776          TEST_ASSERT(pos==2);
    777          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
    778          TEST_ASSERT_SUCCESS(status);
    779          TEST_ASSERT(numStatuses == 2);
    780          TEST_ASSERT(statusVals[0] == 200);
    781          TEST_ASSERT(statusVals[1] == 300);
    782 
    783          // p
    784          pos = bi->next();
    785          TEST_ASSERT(pos==3);
    786          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
    787          TEST_ASSERT_SUCCESS(status);
    788          TEST_ASSERT(numStatuses == 2);
    789          TEST_ASSERT(statusVals[0] == 200);
    790          TEST_ASSERT(statusVals[1] == 300);
    791 
    792          // z
    793          pos = bi->next();
    794          TEST_ASSERT(pos==4);
    795          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
    796          TEST_ASSERT_SUCCESS(status);
    797          TEST_ASSERT(numStatuses == 1);
    798          TEST_ASSERT(statusVals[0] == 300);
    799 
    800          // 5
    801          pos = bi->next();
    802          TEST_ASSERT(pos==5);
    803          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
    804          TEST_ASSERT_SUCCESS(status);
    805          TEST_ASSERT(numStatuses == 2);
    806          TEST_ASSERT(statusVals[0] == 400);
    807          TEST_ASSERT(statusVals[1] == 500);
    808 
    809          // ?
    810          pos = bi->next();
    811          TEST_ASSERT(pos==6);
    812          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
    813          TEST_ASSERT_SUCCESS(status);
    814          TEST_ASSERT(numStatuses == 1);
    815          TEST_ASSERT(statusVals[0] == 0);
    816 
    817          //
    818          //  Check buffer overflow error handling.   Char == A
    819          //
    820          bi->first();
    821          pos = bi->next();
    822          TEST_ASSERT(pos==1);
    823          memset(statusVals, -1, sizeof(statusVals));
    824          numStatuses = bi->getRuleStatusVec(statusVals, 0, status);
    825          TEST_ASSERT(status == U_BUFFER_OVERFLOW_ERROR);
    826          TEST_ASSERT(numStatuses == 2);
    827          TEST_ASSERT(statusVals[0] == -1);
    828 
    829          status = U_ZERO_ERROR;
    830          memset(statusVals, -1, sizeof(statusVals));
    831          numStatuses = bi->getRuleStatusVec(statusVals, 1, status);
    832          TEST_ASSERT(status == U_BUFFER_OVERFLOW_ERROR);
    833          TEST_ASSERT(numStatuses == 2);
    834          TEST_ASSERT(statusVals[0] == 100);
    835          TEST_ASSERT(statusVals[1] == -1);
    836 
    837          status = U_ZERO_ERROR;
    838          memset(statusVals, -1, sizeof(statusVals));
    839          numStatuses = bi->getRuleStatusVec(statusVals, 2, status);
    840          TEST_ASSERT_SUCCESS(status);
    841          TEST_ASSERT(numStatuses == 2);
    842          TEST_ASSERT(statusVals[0] == 100);
    843          TEST_ASSERT(statusVals[1] == 300);
    844          TEST_ASSERT(statusVals[2] == -1);
    845      }
    846      delete bi;
    847 
    848 }
    849 
    850 //
    851 //   Bug 2190 Regression test.   Builder crash on rule consisting of only a
    852 //                               $variable reference
    853 void RBBIAPITest::TestBug2190() {
    854      UnicodeString rulesString1 = "$aaa = abcd;\n"
    855                                   "$bbb = $aaa;\n"
    856                                   "$bbb;\n";
    857      UnicodeString testString1  = "abcdabcd";
    858                                 // 01234567890
    859      int32_t bounds1[] = {0, 4, 8};
    860      UErrorCode status=U_ZERO_ERROR;
    861      UParseError    parseError;
    862 
    863      RuleBasedBreakIterator *bi = new RuleBasedBreakIterator(rulesString1, parseError, status);
    864      if(U_FAILURE(status)) {
    865          dataerrln("Fail : in construction - %s", u_errorName(status));
    866      } else {
    867          bi->setText(testString1);
    868          doBoundaryTest(*bi, testString1, bounds1);
    869      }
    870      delete bi;
    871 }
    872 
    873 
    874 void RBBIAPITest::TestRegistration() {
    875 #if !UCONFIG_NO_SERVICE
    876     UErrorCode status = U_ZERO_ERROR;
    877     BreakIterator* ja_word = BreakIterator::createWordInstance("ja_JP", status);
    878     // ok to not delete these if we exit because of error?
    879     BreakIterator* ja_char = BreakIterator::createCharacterInstance("ja_JP", status);
    880     BreakIterator* root_word = BreakIterator::createWordInstance("", status);
    881     BreakIterator* root_char = BreakIterator::createCharacterInstance("", status);
    882 
    883     if (status == U_MISSING_RESOURCE_ERROR || status == U_FILE_ACCESS_ERROR) {
    884         dataerrln("Error creating instances of break interactors - %s", u_errorName(status));
    885 
    886         delete ja_word;
    887         delete ja_char;
    888         delete root_word;
    889         delete root_char;
    890 
    891         return;
    892     }
    893 
    894     URegistryKey key = BreakIterator::registerInstance(ja_word, "xx", UBRK_WORD, status);
    895     {
    896 #if 0 // With a dictionary based word breaking, ja_word is identical to root.
    897         if (ja_word && *ja_word == *root_word) {
    898             errln("japan not different from root");
    899         }
    900 #endif
    901     }
    902 
    903     {
    904         BreakIterator* result = BreakIterator::createWordInstance("xx_XX", status);
    905         UBool fail = TRUE;
    906         if(result){
    907             fail = *result != *ja_word;
    908         }
    909         delete result;
    910         if (fail) {
    911             errln("bad result for xx_XX/word");
    912         }
    913     }
    914 
    915     {
    916         BreakIterator* result = BreakIterator::createCharacterInstance("ja_JP", status);
    917         UBool fail = TRUE;
    918         if(result){
    919             fail = *result != *ja_char;
    920         }
    921         delete result;
    922         if (fail) {
    923             errln("bad result for ja_JP/char");
    924         }
    925     }
    926 
    927     {
    928         BreakIterator* result = BreakIterator::createCharacterInstance("xx_XX", status);
    929         UBool fail = TRUE;
    930         if(result){
    931             fail = *result != *root_char;
    932         }
    933         delete result;
    934         if (fail) {
    935             errln("bad result for xx_XX/char");
    936         }
    937     }
    938 
    939     {
    940         StringEnumeration* avail = BreakIterator::getAvailableLocales();
    941         UBool found = FALSE;
    942         const UnicodeString* p;
    943         while ((p = avail->snext(status))) {
    944             if (p->compare("xx") == 0) {
    945                 found = TRUE;
    946                 break;
    947             }
    948         }
    949         delete avail;
    950         if (!found) {
    951             errln("did not find test locale");
    952         }
    953     }
    954 
    955     {
    956         UBool unreg = BreakIterator::unregister(key, status);
    957         if (!unreg) {
    958             errln("unable to unregister");
    959         }
    960     }
    961 
    962     {
    963         BreakIterator* result = BreakIterator::createWordInstance("en_US", status);
    964         BreakIterator* root = BreakIterator::createWordInstance("", status);
    965         UBool fail = TRUE;
    966         if(root){
    967           fail = *root != *result;
    968         }
    969         delete root;
    970         delete result;
    971         if (fail) {
    972             errln("did not get root break");
    973         }
    974     }
    975 
    976     {
    977         StringEnumeration* avail = BreakIterator::getAvailableLocales();
    978         UBool found = FALSE;
    979         const UnicodeString* p;
    980         while ((p = avail->snext(status))) {
    981             if (p->compare("xx") == 0) {
    982                 found = TRUE;
    983                 break;
    984             }
    985         }
    986         delete avail;
    987         if (found) {
    988             errln("found test locale");
    989         }
    990     }
    991 
    992     {
    993         int32_t count;
    994         UBool   foundLocale = FALSE;
    995         const Locale *avail = BreakIterator::getAvailableLocales(count);
    996         for (int i=0; i<count; i++) {
    997             if (avail[i] == Locale::getEnglish()) {
    998                 foundLocale = TRUE;
    999                 break;
   1000             }
   1001         }
   1002         if (foundLocale == FALSE) {
   1003             errln("BreakIterator::getAvailableLocales(&count), failed to find EN.");
   1004         }
   1005     }
   1006 
   1007 
   1008     // ja_word was adopted by factory
   1009     delete ja_char;
   1010     delete root_word;
   1011     delete root_char;
   1012 #endif
   1013 }
   1014 
   1015 void RBBIAPITest::RoundtripRule(const char *dataFile) {
   1016     UErrorCode status = U_ZERO_ERROR;
   1017     UParseError parseError;
   1018     parseError.line = 0;
   1019     parseError.offset = 0;
   1020     LocalUDataMemoryPointer data(udata_open(U_ICUDATA_BRKITR, "brk", dataFile, &status));
   1021     uint32_t length;
   1022     const UChar *builtSource;
   1023     const uint8_t *rbbiRules;
   1024     const uint8_t *builtRules;
   1025 
   1026     if (U_FAILURE(status)) {
   1027         errcheckln(status, "Can't open \"%s\" - %s", dataFile, u_errorName(status));
   1028         return;
   1029     }
   1030 
   1031     builtRules = (const uint8_t *)udata_getMemory(data.getAlias());
   1032     builtSource = (const UChar *)(builtRules + ((RBBIDataHeader*)builtRules)->fRuleSource);
   1033     RuleBasedBreakIterator *brkItr = new RuleBasedBreakIterator(builtSource, parseError, status);
   1034     if (U_FAILURE(status)) {
   1035         errln("createRuleBasedBreakIterator: ICU Error \"%s\"  at line %d, column %d\n",
   1036                 u_errorName(status), parseError.line, parseError.offset);
   1037         return;
   1038     };
   1039     rbbiRules = brkItr->getBinaryRules(length);
   1040     logln("Comparing \"%s\" len=%d", dataFile, length);
   1041     if (memcmp(builtRules, rbbiRules, (int32_t)length) != 0) {
   1042         errln("Built rules and rebuilt rules are different %s", dataFile);
   1043         return;
   1044     }
   1045     delete brkItr;
   1046 }
   1047 
   1048 void RBBIAPITest::TestRoundtripRules() {
   1049     RoundtripRule("word");
   1050     RoundtripRule("title");
   1051     RoundtripRule("sent");
   1052     RoundtripRule("line");
   1053     RoundtripRule("char");
   1054     if (!quick) {
   1055         RoundtripRule("word_POSIX");
   1056     }
   1057 }
   1058 
   1059 // Try out the RuleBasedBreakIterator constructors that take RBBIDataHeader*
   1060 // (these are protected so we access them via a local class RBBIWithProtectedFunctions).
   1061 // This is just a sanity check, not a thorough test (e.g. we don't check that the
   1062 // first delete actually frees rulesCopy).
   1063 void RBBIAPITest::TestCreateFromRBBIData() {
   1064     // Get some handy RBBIData
   1065     const char *brkName = "word"; // or "sent", "line", "char", etc.
   1066     UErrorCode status = U_ZERO_ERROR;
   1067     LocalUDataMemoryPointer data(udata_open(U_ICUDATA_BRKITR, "brk", brkName, &status));
   1068     if ( U_SUCCESS(status) ) {
   1069         const RBBIDataHeader * builtRules = (const RBBIDataHeader *)udata_getMemory(data.getAlias());
   1070         uint32_t length = builtRules->fLength;
   1071         RBBIWithProtectedFunctions * brkItr;
   1072 
   1073         // Try the memory-adopting constructor, need to copy the data first
   1074         RBBIDataHeader * rulesCopy = (RBBIDataHeader *) uprv_malloc(length);
   1075         if ( rulesCopy ) {
   1076             uprv_memcpy( rulesCopy, builtRules, length );
   1077 
   1078             brkItr = new RBBIWithProtectedFunctions(rulesCopy, status);
   1079             if ( U_SUCCESS(status) ) {
   1080                 delete brkItr; // this should free rulesCopy
   1081             } else {
   1082                 errln("create RuleBasedBreakIterator from RBBIData (adopted): ICU Error \"%s\"\n", u_errorName(status) );
   1083                 status = U_ZERO_ERROR;// reset for the next test
   1084                 uprv_free( rulesCopy );
   1085             }
   1086         }
   1087 
   1088         // Now try the non-adopting constructor
   1089         brkItr = new RBBIWithProtectedFunctions(builtRules, RBBIWithProtectedFunctions::kDontAdopt, status);
   1090         if ( U_SUCCESS(status) ) {
   1091             delete brkItr; // this should NOT attempt to free builtRules
   1092             if (builtRules->fLength != length) { // sanity check
   1093                 errln("create RuleBasedBreakIterator from RBBIData (non-adopted): delete affects data\n" );
   1094             }
   1095         } else {
   1096             errln("create RuleBasedBreakIterator from RBBIData (non-adopted): ICU Error \"%s\"\n", u_errorName(status) );
   1097         }
   1098     }
   1099 
   1100     // getBinaryRules() and RuleBasedBreakIterator(uint8_t binaryRules, ...)
   1101     //
   1102     status = U_ZERO_ERROR;
   1103     RuleBasedBreakIterator *rb = (RuleBasedBreakIterator *)BreakIterator::createWordInstance(Locale::getEnglish(), status);
   1104     if (rb == NULL || U_FAILURE(status)) {
   1105         dataerrln("Unable to create BreakIterator::createWordInstance (Locale::getEnglish) - %s", u_errorName(status));
   1106     } else {
   1107         uint32_t length;
   1108         const uint8_t *rules = rb->getBinaryRules(length);
   1109         RuleBasedBreakIterator *rb2 = new RuleBasedBreakIterator(rules, length, status);
   1110         TEST_ASSERT_SUCCESS(status);
   1111         TEST_ASSERT(*rb == *rb2);
   1112         UnicodeString words = "one two three ";
   1113         rb2->setText(words);
   1114         int wordCounter = 0;
   1115         while (rb2->next() != UBRK_DONE) {
   1116             wordCounter++;
   1117         }
   1118         TEST_ASSERT(wordCounter == 6);
   1119 
   1120         status = U_ZERO_ERROR;
   1121         RuleBasedBreakIterator *rb3 = new RuleBasedBreakIterator(rules, length-1, status);
   1122         TEST_ASSERT(status == U_ILLEGAL_ARGUMENT_ERROR);
   1123 
   1124         delete rb;
   1125         delete rb2;
   1126         delete rb3;
   1127     }
   1128 }
   1129 
   1130 
   1131 void RBBIAPITest::TestRefreshInputText() {
   1132     /*
   1133      *  RefreshInput changes out the input of a Break Iterator without
   1134      *    changing anything else in the iterator's state.  Used with Java JNI,
   1135      *    when Java moves the underlying string storage.   This test
   1136      *    runs BreakIterator::next() repeatedly, moving the text in the middle of the sequence.
   1137      *    The right set of boundaries should still be found.
   1138      */
   1139     UChar testStr[]  = {0x20, 0x41, 0x20, 0x42, 0x20, 0x43, 0x20, 0x44, 0x0};  /* = " A B C D"  */
   1140     UChar movedStr[] = {0x20, 0x20, 0x20, 0x20, 0x20, 0x20, 0x20, 0x20,  0};
   1141     UErrorCode status = U_ZERO_ERROR;
   1142     UText ut1 = UTEXT_INITIALIZER;
   1143     UText ut2 = UTEXT_INITIALIZER;
   1144     RuleBasedBreakIterator *bi = (RuleBasedBreakIterator *)BreakIterator::createLineInstance(Locale::getEnglish(), status);
   1145     TEST_ASSERT_SUCCESS(status);
   1146 
   1147     utext_openUChars(&ut1, testStr, -1, &status);
   1148     TEST_ASSERT_SUCCESS(status);
   1149 
   1150     if (U_SUCCESS(status)) {
   1151         bi->setText(&ut1, status);
   1152         TEST_ASSERT_SUCCESS(status);
   1153 
   1154         /* Line boundaries will occur before each letter in the original string */
   1155         TEST_ASSERT(1 == bi->next());
   1156         TEST_ASSERT(3 == bi->next());
   1157 
   1158         /* Move the string, kill the original string.  */
   1159         u_strcpy(movedStr, testStr);
   1160         u_memset(testStr, 0x20, u_strlen(testStr));
   1161         utext_openUChars(&ut2, movedStr, -1, &status);
   1162         TEST_ASSERT_SUCCESS(status);
   1163         RuleBasedBreakIterator *returnedBI = &bi->refreshInputText(&ut2, status);
   1164         TEST_ASSERT_SUCCESS(status);
   1165         TEST_ASSERT(bi == returnedBI);
   1166 
   1167         /* Find the following matches, now working in the moved string. */
   1168         TEST_ASSERT(5 == bi->next());
   1169         TEST_ASSERT(7 == bi->next());
   1170         TEST_ASSERT(8 == bi->next());
   1171         TEST_ASSERT(UBRK_DONE == bi->next());
   1172 
   1173         utext_close(&ut1);
   1174         utext_close(&ut2);
   1175     }
   1176     delete bi;
   1177 
   1178 }
   1179 
   1180 
   1181 //---------------------------------------------
   1182 // runIndexedTest
   1183 //---------------------------------------------
   1184 
   1185 void RBBIAPITest::runIndexedTest( int32_t index, UBool exec, const char* &name, char* /*par*/ )
   1186 {
   1187     if (exec) logln((UnicodeString)"TestSuite RuleBasedBreakIterator API ");
   1188     switch (index) {
   1189      //   case 0: name = "TestConstruction"; if (exec) TestConstruction(); break;
   1190 #if !UCONFIG_NO_FILE_IO
   1191         case  0: name = "TestCloneEquals"; if (exec) TestCloneEquals(); break;
   1192         case  1: name = "TestgetRules"; if (exec) TestgetRules(); break;
   1193         case  2: name = "TestHashCode"; if (exec) TestHashCode(); break;
   1194         case  3: name = "TestGetSetAdoptText"; if (exec) TestGetSetAdoptText(); break;
   1195         case  4: name = "TestIteration"; if (exec) TestIteration(); break;
   1196 #else
   1197         case  0: case  1: case  2: case  3: case  4: name = "skip"; break;
   1198 #endif
   1199         case  5: name = "TestBuilder"; if (exec) TestBuilder(); break;
   1200         case  6: name = "TestQuoteGrouping"; if (exec) TestQuoteGrouping(); break;
   1201         case  7: name = "TestRuleStatusVec"; if (exec) TestRuleStatusVec(); break;
   1202         case  8: name = "TestBug2190"; if (exec) TestBug2190(); break;
   1203 #if !UCONFIG_NO_FILE_IO
   1204         case  9: name = "TestRegistration"; if (exec) TestRegistration(); break;
   1205         case 10: name = "TestBoilerPlate"; if (exec) TestBoilerPlate(); break;
   1206         case 11: name = "TestRuleStatus"; if (exec) TestRuleStatus(); break;
   1207         case 12: name = "TestRoundtripRules"; if (exec) TestRoundtripRules(); break;
   1208         case 13: name = "TestCreateFromRBBIData"; if (exec) TestCreateFromRBBIData(); break;
   1209 #else
   1210         case  9: case 10: case 11: case 12: case 13: name = "skip"; break;
   1211 #endif
   1212         case 14: name = "TestRefreshInputText"; if (exec) TestRefreshInputText(); break;
   1213 
   1214         default: name = ""; break; // needed to end loop
   1215     }
   1216 }
   1217 
   1218 //---------------------------------------------
   1219 //Internal subroutines
   1220 //---------------------------------------------
   1221 
   1222 void RBBIAPITest::doBoundaryTest(RuleBasedBreakIterator& bi, UnicodeString& text, int32_t *boundaries){
   1223      logln((UnicodeString)"testIsBoundary():");
   1224         int32_t p = 0;
   1225         UBool isB;
   1226         for (int32_t i = 0; i < text.length(); i++) {
   1227             isB = bi.isBoundary(i);
   1228             logln((UnicodeString)"bi.isBoundary(" + i + ") -> " + isB);
   1229 
   1230             if (i == boundaries[p]) {
   1231                 if (!isB)
   1232                     errln((UnicodeString)"Wrong result from isBoundary() for " + i + (UnicodeString)": expected true, got false");
   1233                 p++;
   1234             }
   1235             else {
   1236                 if (isB)
   1237                     errln((UnicodeString)"Wrong result from isBoundary() for " + i + (UnicodeString)": expected false, got true");
   1238             }
   1239         }
   1240 }
   1241 void RBBIAPITest::doTest(UnicodeString& testString, int32_t start, int32_t gotoffset, int32_t expectedOffset, const char* expectedString){
   1242     UnicodeString selected;
   1243     UnicodeString expected=CharsToUnicodeString(expectedString);
   1244 
   1245     if(gotoffset != expectedOffset)
   1246          errln((UnicodeString)"ERROR:****returned #" + gotoffset + (UnicodeString)" instead of #" + expectedOffset);
   1247     if(start <= gotoffset){
   1248         testString.extractBetween(start, gotoffset, selected);
   1249     }
   1250     else{
   1251         testString.extractBetween(gotoffset, start, selected);
   1252     }
   1253     if(selected.compare(expected) != 0)
   1254          errln(prettify((UnicodeString)"ERROR:****selected \"" + selected + "\" instead of \"" + expected + "\""));
   1255     else
   1256         logln(prettify("****selected \"" + selected + "\""));
   1257 }
   1258 
   1259 //---------------------------------------------
   1260 //RBBIWithProtectedFunctions class functions
   1261 //---------------------------------------------
   1262 
   1263 RBBIWithProtectedFunctions::RBBIWithProtectedFunctions(RBBIDataHeader* data, UErrorCode &status)
   1264     : RuleBasedBreakIterator(data, status)
   1265 {
   1266 }
   1267 
   1268 RBBIWithProtectedFunctions::RBBIWithProtectedFunctions(const RBBIDataHeader* data, enum EDontAdopt, UErrorCode &status)
   1269     : RuleBasedBreakIterator(data, RuleBasedBreakIterator::kDontAdopt, status)
   1270 {
   1271 }
   1272 
   1273 #endif /* #if !UCONFIG_NO_BREAK_ITERATION */
   1274