Home | History | Annotate | Download | only in intltest
      1 /****************************************************************************************
      2  * COPYRIGHT:
      3  * Copyright (c) 1997-2014, International Business Machines Corporation and
      4  * others. All Rights Reserved.
      5  * Modification History:
      6  *
      7  *   Date          Name        Description
      8  *   05/22/2000    Madhu       Added tests for testing new API for utf16 support and more
      9  ****************************************************************************************/
     10 
     11 #include <string.h>
     12 #include "utypeinfo.h"  // for 'typeid' to work
     13 
     14 #include "unicode/chariter.h"
     15 #include "unicode/ustring.h"
     16 #include "unicode/unistr.h"
     17 #include "unicode/schriter.h"
     18 #include "unicode/uchriter.h"
     19 #include "unicode/uiter.h"
     20 #include "unicode/putil.h"
     21 #include "unicode/utf16.h"
     22 #include "citrtest.h"
     23 #include "cmemory.h"
     24 
     25 
     26 class  SCharacterIterator : public CharacterIterator {
     27 public:
     28     SCharacterIterator(const UnicodeString& textStr){
     29         text = textStr;
     30         pos=0;
     31         textLength = textStr.length();
     32         begin = 0;
     33         end=textLength;
     34 
     35     }
     36 
     37     virtual ~SCharacterIterator(){};
     38 
     39 
     40     void setText(const UnicodeString& newText){
     41         text = newText;
     42     }
     43 
     44     virtual void getText(UnicodeString& result) {
     45         text.extract(0,text.length(),result);
     46     }
     47     static UClassID getStaticClassID(void){
     48         return (UClassID)(&fgClassID);
     49     }
     50     virtual UClassID getDynamicClassID(void) const{
     51         return getStaticClassID();
     52     }
     53 
     54     virtual UBool operator==(const ForwardCharacterIterator& /*that*/) const{
     55         return TRUE;
     56     }
     57 
     58     virtual CharacterIterator* clone(void) const {
     59         return NULL;
     60     }
     61     virtual int32_t hashCode(void) const{
     62         return DONE;
     63     }
     64     virtual UChar nextPostInc(void){ return text.charAt(pos++);}
     65     virtual UChar32 next32PostInc(void){return text.char32At(pos++);}
     66     virtual UBool hasNext() { return TRUE;};
     67     virtual UChar first(){return DONE;};
     68     virtual UChar32 first32(){return DONE;};
     69     virtual UChar last(){return DONE;};
     70     virtual UChar32 last32(){return DONE;};
     71     virtual UChar setIndex(int32_t /*pos*/){return DONE;};
     72     virtual UChar32 setIndex32(int32_t /*pos*/){return DONE;};
     73     virtual UChar current() const{return DONE;};
     74     virtual UChar32 current32() const{return DONE;};
     75     virtual UChar next(){return DONE;};
     76     virtual UChar32 next32(){return DONE;};
     77     virtual UChar previous(){return DONE;};
     78     virtual UChar32 previous32(){return DONE;};
     79     virtual int32_t move(int32_t delta,CharacterIterator::EOrigin origin){
     80         switch(origin) {
     81         case kStart:
     82             pos = begin + delta;
     83             break;
     84         case kCurrent:
     85             pos += delta;
     86             break;
     87         case kEnd:
     88             pos = end + delta;
     89             break;
     90         default:
     91             break;
     92         }
     93 
     94         if(pos < begin) {
     95             pos = begin;
     96         } else if(pos > end) {
     97             pos = end;
     98         }
     99 
    100         return pos;
    101     };
    102     virtual int32_t move32(int32_t delta, CharacterIterator::EOrigin origin){
    103         switch(origin) {
    104         case kStart:
    105             pos = begin;
    106             if(delta > 0) {
    107                 U16_FWD_N(text, pos, end, delta);
    108             }
    109             break;
    110         case kCurrent:
    111             if(delta > 0) {
    112                 U16_FWD_N(text, pos, end, delta);
    113             } else {
    114                 U16_BACK_N(text, begin, pos, -delta);
    115             }
    116             break;
    117         case kEnd:
    118             pos = end;
    119             if(delta < 0) {
    120                 U16_BACK_N(text, begin, pos, -delta);
    121             }
    122             break;
    123         default:
    124             break;
    125         }
    126 
    127         return pos;
    128     };
    129     virtual UBool hasPrevious() {return TRUE;};
    130 
    131   SCharacterIterator&  operator=(const SCharacterIterator&    that){
    132      text = that.text;
    133      return *this;
    134   }
    135 
    136 
    137 private:
    138     UnicodeString text;
    139     static const char fgClassID;
    140 };
    141 const char SCharacterIterator::fgClassID=0;
    142 
    143 CharIterTest::CharIterTest()
    144 {
    145 }
    146 void CharIterTest::runIndexedTest( int32_t index, UBool exec, const char* &name, char* /*par*/ )
    147 {
    148     if (exec) logln("TestSuite CharIterTest: ");
    149     switch (index) {
    150         case 0: name = "TestConstructionAndEquality"; if (exec) TestConstructionAndEquality(); break;
    151         case 1: name = "TestConstructionAndEqualityUChariter"; if (exec) TestConstructionAndEqualityUChariter(); break;
    152         case 2: name = "TestIteration"; if (exec) TestIteration(); break;
    153         case 3: name = "TestIterationUChar32"; if (exec) TestIterationUChar32(); break;
    154         case 4: name = "TestUCharIterator"; if (exec) TestUCharIterator(); break;
    155         case 5: name = "TestCoverage"; if(exec) TestCoverage(); break;
    156         case 6: name = "TestCharIteratorSubClasses"; if (exec) TestCharIteratorSubClasses(); break;
    157         default: name = ""; break; //needed to end loop
    158     }
    159 }
    160 
    161 void CharIterTest::TestCoverage(){
    162     UnicodeString  testText("Now is the time for all good men to come to the aid of their country.");
    163     UnicodeString testText2("\\ud800\\udc01deadbeef");
    164     testText2 = testText2.unescape();
    165     SCharacterIterator* test = new SCharacterIterator(testText);
    166     if(test->firstPostInc()!= 0x004E){
    167         errln("Failed: firstPostInc() failed");
    168     }
    169     if(test->getIndex()!=1){
    170         errln("Failed: getIndex().");
    171     }
    172     if(test->getLength()!=testText.length()){
    173         errln("Failed: getLength()");
    174     }
    175     test->setToStart();
    176     if(test->getIndex()!=0){
    177         errln("Failed: setToStart().");
    178     }
    179     test->setToEnd();
    180     if(test->getIndex()!=testText.length()){
    181         errln("Failed: setToEnd().");
    182     }
    183     if(test->startIndex() != 0){
    184         errln("Failed: startIndex()");
    185     }
    186     test->setText(testText2);
    187     if(test->first32PostInc()!= testText2.char32At(0)){
    188         errln("Failed: first32PostInc() failed");
    189     }
    190 
    191     delete test;
    192 
    193 }
    194 void CharIterTest::TestConstructionAndEquality() {
    195     UnicodeString  testText("Now is the time for all good men to come to the aid of their country.");
    196     UnicodeString  testText2("Don't bother using this string.");
    197     UnicodeString result1, result2, result3;
    198 
    199     CharacterIterator* test1 = new StringCharacterIterator(testText);
    200     CharacterIterator* test1b= new StringCharacterIterator(testText, -1);
    201     CharacterIterator* test1c= new StringCharacterIterator(testText, 100);
    202     CharacterIterator* test1d= new StringCharacterIterator(testText, -2, 100, 5);
    203     CharacterIterator* test1e= new StringCharacterIterator(testText, 100, 20, 5);
    204     CharacterIterator* test2 = new StringCharacterIterator(testText, 5);
    205     CharacterIterator* test3 = new StringCharacterIterator(testText, 2, 20, 5);
    206     CharacterIterator* test4 = new StringCharacterIterator(testText2);
    207     CharacterIterator* test5 = test1->clone();
    208 
    209     if (test1d->startIndex() < 0)
    210         errln("Construction failed: startIndex is negative");
    211     if (test1d->endIndex() > testText.length())
    212         errln("Construction failed: endIndex is greater than the text length");
    213     if (test1d->getIndex() < test1d->startIndex() || test1d->endIndex() < test1d->getIndex())
    214         errln("Construction failed: index is invalid");
    215 
    216     if (*test1 == *test2 || *test1 == *test3 || *test1 == *test4)
    217         errln("Construction or operator== failed: Unequal objects compared equal");
    218     if (*test1 != *test5)
    219         errln("clone() or equals() failed: Two clones tested unequal");
    220 
    221     if (test1->hashCode() == test2->hashCode() || test1->hashCode() == test3->hashCode()
    222                     || test1->hashCode() == test4->hashCode())
    223         errln("hashCode() failed:  different objects have same hash code");
    224 
    225     if (test1->hashCode() != test5->hashCode())
    226         errln("hashCode() failed:  identical objects have different hash codes");
    227 
    228     if(test1->getLength() != testText.length()){
    229         errln("getLength of CharacterIterator failed");
    230     }
    231     test1->getText(result1);
    232     test1b->getText(result2);
    233     test1c->getText(result3);
    234     if(result1 != result2 ||  result1 != result3)
    235         errln("construction failed or getText() failed");
    236 
    237 
    238     test1->setIndex(5);
    239     if (*test1 != *test2 || *test1 == *test5)
    240         errln("setIndex() failed");
    241 
    242     *((StringCharacterIterator*)test1) = *((StringCharacterIterator*)test3);
    243     if (*test1 != *test3 || *test1 == *test5)
    244         errln("operator= failed");
    245 
    246     delete test2;
    247     delete test3;
    248     delete test4;
    249     delete test5;
    250     delete test1b;
    251     delete test1c;
    252     delete test1d;
    253     delete test1e;
    254 
    255 
    256     StringCharacterIterator* testChar1=new StringCharacterIterator(testText);
    257     StringCharacterIterator* testChar2=new StringCharacterIterator(testText2);
    258     StringCharacterIterator* testChar3=(StringCharacterIterator*)test1->clone();
    259 
    260     testChar1->getText(result1);
    261     testChar2->getText(result2);
    262     testChar3->getText(result3);
    263     if(result1 != result3 || result1 == result2)
    264         errln("getText() failed");
    265     testChar3->setText(testText2);
    266     testChar3->getText(result3);
    267     if(result1 == result3 || result2 != result3)
    268         errln("setText() or getText() failed");
    269     testChar3->setText(testText);
    270     testChar3->getText(result3);
    271     if(result1 != result3 || result1 == result2)
    272         errln("setText() or getText() round-trip failed");
    273 
    274     delete testChar1;
    275     delete testChar2;
    276     delete testChar3;
    277     delete test1;
    278 
    279 }
    280 void CharIterTest::TestConstructionAndEqualityUChariter() {
    281     U_STRING_DECL(testText, "Now is the time for all good men to come to the aid of their country.", 69);
    282     U_STRING_DECL(testText2, "Don't bother using this string.", 31);
    283 
    284     U_STRING_INIT(testText, "Now is the time for all good men to come to the aid of their country.", 69);
    285     U_STRING_INIT(testText2, "Don't bother using this string.", 31);
    286 
    287     UnicodeString result, result4, result5;
    288 
    289     UCharCharacterIterator* test1 = new UCharCharacterIterator(testText, u_strlen(testText));
    290     UCharCharacterIterator* test2 = new UCharCharacterIterator(testText, u_strlen(testText), 5);
    291     UCharCharacterIterator* test3 = new UCharCharacterIterator(testText, u_strlen(testText), 2, 20, 5);
    292     UCharCharacterIterator* test4 = new UCharCharacterIterator(testText2, u_strlen(testText2));
    293     UCharCharacterIterator* test5 = (UCharCharacterIterator*)test1->clone();
    294     UCharCharacterIterator* test6 = new UCharCharacterIterator(*test1);
    295 
    296     // j785: length=-1 will use u_strlen()
    297     UCharCharacterIterator* test7a = new UCharCharacterIterator(testText, -1);
    298     UCharCharacterIterator* test7b = new UCharCharacterIterator(testText, -1);
    299     UCharCharacterIterator* test7c = new UCharCharacterIterator(testText, -1, 2, 20, 5);
    300 
    301     // Bad parameters.
    302     UCharCharacterIterator* test8a = new UCharCharacterIterator(testText, -1, -1, 20, 5);
    303     UCharCharacterIterator* test8b = new UCharCharacterIterator(testText, -1, 2, 100, 5);
    304     UCharCharacterIterator* test8c = new UCharCharacterIterator(testText, -1, 2, 20, 100);
    305 
    306     if (test8a->startIndex() < 0)
    307         errln("Construction failed: startIndex is negative");
    308     if (test8b->endIndex() != u_strlen(testText))
    309         errln("Construction failed: endIndex is different from the text length");
    310     if (test8c->getIndex() < test8c->startIndex() || test8c->endIndex() < test8c->getIndex())
    311         errln("Construction failed: index is invalid");
    312 
    313     if (*test1 == *test2 || *test1 == *test3 || *test1 == *test4 )
    314         errln("Construction or operator== failed: Unequal objects compared equal");
    315     if (*test1 != *test5 )
    316         errln("clone() or equals() failed: Two clones tested unequal");
    317 
    318     if (*test6 != *test1 )
    319         errln("copy construction or equals() failed: Two copies tested unequal");
    320 
    321     if (test1->hashCode() == test2->hashCode() || test1->hashCode() == test3->hashCode()
    322                     || test1->hashCode() == test4->hashCode())
    323         errln("hashCode() failed:  different objects have same hash code");
    324 
    325     if (test1->hashCode() != test5->hashCode())
    326         errln("hashCode() failed:  identical objects have different hash codes");
    327 
    328     test7a->getText(result);
    329     test7b->getText(result4);
    330     test7c->getText(result5);
    331 
    332     if(result != UnicodeString(testText) || result4 != result || result5 != result)
    333         errln("error in construction");
    334 
    335     test1->getText(result);
    336     test4->getText(result4);
    337     test5->getText(result5);
    338     if(result != result5 || result == result4)
    339         errln("getText() failed");
    340     test5->setText(testText2, u_strlen(testText2));
    341     test5->getText(result5);
    342     if(result == result5 || result4 != result5)
    343         errln("setText() or getText() failed");
    344     test5->setText(testText, u_strlen(testText));
    345     test5->getText(result5);
    346     if(result != result5 || result == result4)
    347         errln("setText() or getText() round-trip failed");
    348 
    349 
    350     test1->setIndex(5);
    351     if (*test1 != *test2 || *test1 == *test5)
    352         errln("setIndex() failed");
    353     test8b->setIndex32(5);
    354     if (test8b->getIndex()!=5)
    355         errln("setIndex32() failed");
    356 
    357     *test1 = *test3;
    358     if (*test1 != *test3 || *test1 == *test5)
    359         errln("operator= failed");
    360 
    361     delete test1;
    362     delete test2;
    363     delete test3;
    364     delete test4;
    365     delete test5;
    366     delete test6;
    367     delete test7a;
    368     delete test7b;
    369     delete test7c;
    370     delete test8a;
    371     delete test8b;
    372     delete test8c;
    373 }
    374 
    375 
    376 void CharIterTest::TestIteration() {
    377     UnicodeString text("Now is the time for all good men to come to the aid of their country.");
    378 
    379     UChar c;
    380     int32_t i;
    381     {
    382         StringCharacterIterator   iter(text, 5);
    383 
    384         UnicodeString iterText;
    385         iter.getText(iterText);
    386         if (iterText != text)
    387           errln("iter.getText() failed");
    388 
    389         if (iter.current() != text[(int32_t)5])
    390             errln("Iterator didn't start out in the right place.");
    391 
    392         c = iter.first();
    393         i = 0;
    394 
    395         if (iter.startIndex() != 0 || iter.endIndex() != text.length())
    396             errln("startIndex() or endIndex() failed");
    397 
    398         logln("Testing forward iteration...");
    399         do {
    400             if (c == CharacterIterator::DONE && i != text.length())
    401                 errln("Iterator reached end prematurely");
    402             else if (c != text[i])
    403                 errln((UnicodeString)"Character mismatch at position " + i +
    404                                     ", iterator has " + UCharToUnicodeString(c) +
    405                                     ", string has " + UCharToUnicodeString(text[i]));
    406 
    407             if (iter.current() != c)
    408                 errln("current() isn't working right");
    409             if (iter.getIndex() != i)
    410                 errln("getIndex() isn't working right");
    411 
    412             if (c != CharacterIterator::DONE) {
    413                 c = iter.next();
    414                 i++;
    415             }
    416         } while (c != CharacterIterator::DONE);
    417         c=iter.next();
    418         if(c!= CharacterIterator::DONE)
    419             errln("next() didn't return DONE at the end");
    420         c=iter.setIndex(text.length()+1);
    421         if(c!= CharacterIterator::DONE)
    422             errln("setIndex(len+1) didn't return DONE");
    423 
    424         c = iter.last();
    425         i = text.length() - 1;
    426 
    427         logln("Testing backward iteration...");
    428         do {
    429             if (c == CharacterIterator::DONE && i >= 0)
    430                 errln("Iterator reached end prematurely");
    431             else if (c != text[i])
    432                 errln((UnicodeString)"Character mismatch at position " + i +
    433                                     ", iterator has " + UCharToUnicodeString(c) +
    434                                     ", string has " + UCharToUnicodeString(text[i]));
    435 
    436             if (iter.current() != c)
    437                 errln("current() isn't working right");
    438             if (iter.getIndex() != i)
    439                 errln("getIndex() isn't working right");
    440             if(iter.setIndex(i) != c)
    441                 errln("setIndex() isn't working right");
    442 
    443             if (c != CharacterIterator::DONE) {
    444                 c = iter.previous();
    445                 i--;
    446             }
    447         } while (c != CharacterIterator::DONE);
    448 
    449         c=iter.previous();
    450         if(c!= CharacterIterator::DONE)
    451             errln("previous didn't return DONE at the beginning");
    452 
    453 
    454         //testing firstPostInc, nextPostInc, setTostart
    455         i = 0;
    456         c=iter.firstPostInc();
    457         if(c != text[i])
    458             errln((UnicodeString)"firstPostInc failed.  Expected->" +
    459                          UCharToUnicodeString(text[i]) + " Got->" + UCharToUnicodeString(c));
    460         if(iter.getIndex() != i+1)
    461             errln((UnicodeString)"getIndex() after firstPostInc() failed");
    462 
    463         iter.setToStart();
    464         i=0;
    465         if (iter.startIndex() != 0)
    466             errln("setToStart failed");
    467 
    468         logln("Testing forward iteration...");
    469         do {
    470             if (c != CharacterIterator::DONE)
    471                 c = iter.nextPostInc();
    472 
    473             if(c != text[i])
    474                 errln((UnicodeString)"Character mismatch at position " + i +
    475                                     (UnicodeString)", iterator has " + UCharToUnicodeString(c) +
    476                                     (UnicodeString)", string has " + UCharToUnicodeString(text[i]));
    477 
    478             i++;
    479             if(iter.getIndex() != i)
    480                 errln("getIndex() aftr nextPostInc() isn't working right");
    481             if(iter.current() != text[i])
    482                 errln("current() after nextPostInc() isn't working right");
    483         } while (iter.hasNext());
    484         c=iter.nextPostInc();
    485         if(c!= CharacterIterator::DONE)
    486             errln("nextPostInc() didn't return DONE at the beginning");
    487     }
    488 
    489     {
    490         StringCharacterIterator iter(text, 5, 15, 10);
    491         if (iter.startIndex() != 5 || iter.endIndex() != 15)
    492             errln("creation of a restricted-range iterator failed");
    493 
    494         if (iter.getIndex() != 10 || iter.current() != text[(int32_t)10])
    495             errln("starting the iterator in the middle didn't work");
    496 
    497         c = iter.first();
    498         i = 5;
    499 
    500         logln("Testing forward iteration over a range...");
    501         do {
    502             if (c == CharacterIterator::DONE && i != 15)
    503                 errln("Iterator reached end prematurely");
    504             else if (c != text[i])
    505                 errln((UnicodeString)"Character mismatch at position " + i +
    506                                     ", iterator has " + UCharToUnicodeString(c) +
    507                                     ", string has " + UCharToUnicodeString(text[i]));
    508 
    509             if (iter.current() != c)
    510                 errln("current() isn't working right");
    511             if (iter.getIndex() != i)
    512                 errln("getIndex() isn't working right");
    513             if(iter.setIndex(i) != c)
    514                 errln("setIndex() isn't working right");
    515 
    516             if (c != CharacterIterator::DONE) {
    517                 c = iter.next();
    518                 i++;
    519             }
    520         } while (c != CharacterIterator::DONE);
    521 
    522         c = iter.last();
    523         i = 14;
    524 
    525         logln("Testing backward iteration over a range...");
    526         do {
    527             if (c == CharacterIterator::DONE && i >= 5)
    528                 errln("Iterator reached end prematurely");
    529             else if (c != text[i])
    530                 errln((UnicodeString)"Character mismatch at position " + i +
    531                                     ", iterator has " + UCharToUnicodeString(c) +
    532                                     ", string has " + UCharToUnicodeString(text[i]));
    533 
    534             if (iter.current() != c)
    535                 errln("current() isn't working right");
    536             if (iter.getIndex() != i)
    537                 errln("getIndex() isn't working right");
    538 
    539             if (c != CharacterIterator::DONE) {
    540                 c = iter.previous();
    541                 i--;
    542             }
    543         } while (c != CharacterIterator::DONE);
    544 
    545 
    546     }
    547 }
    548 
    549 //Tests for new API for utf-16 support
    550 void CharIterTest::TestIterationUChar32() {
    551     UChar textChars[]={ 0x0061, 0x0062, 0xd841, 0xdc02, 0x20ac, 0xd7ff, 0xd842, 0xdc06, 0xd801, 0xdc00, 0x0061, 0x0000};
    552     UnicodeString text(textChars);
    553     UChar32 c;
    554     int32_t i;
    555     {
    556         StringCharacterIterator   iter(text, 1);
    557 
    558         UnicodeString iterText;
    559         iter.getText(iterText);
    560         if (iterText != text)
    561           errln("iter.getText() failed");
    562 
    563         if (iter.current32() != text[(int32_t)1])
    564             errln("Iterator didn't start out in the right place.");
    565 
    566         c=iter.setToStart();
    567         i=0;
    568         i=iter.move32(1, CharacterIterator::kStart);
    569         c=iter.current32();
    570         if(c != text.char32At(1) || i!=1)
    571             errln("move32(1, kStart) didn't work correctly expected %X got %X", c, text.char32At(1) );
    572 
    573         i=iter.move32(2, CharacterIterator::kCurrent);
    574         c=iter.current32();
    575         if(c != text.char32At(4) || i!=4)
    576             errln("move32(2, kCurrent) didn't work correctly expected %X got %X i=%ld", c, text.char32At(4), i);
    577 
    578         i=iter.move32(-2, CharacterIterator::kCurrent);
    579         c=iter.current32();
    580         if(c != text.char32At(1) || i!=1)
    581             errln("move32(-2, kCurrent) didn't work correctly expected %X got %X i=%d", c, text.char32At(1), i);
    582 
    583 
    584         i=iter.move32(-2, CharacterIterator::kEnd);
    585         c=iter.current32();
    586         if(c != text.char32At((text.length()-3)) || i!=(text.length()-3))
    587             errln("move32(-2, kEnd) didn't work correctly expected %X got %X i=%d", c, text.char32At((text.length()-3)), i);
    588 
    589 
    590         c = iter.first32();
    591         i = 0;
    592 
    593         if (iter.startIndex() != 0 || iter.endIndex() != text.length())
    594             errln("startIndex() or endIndex() failed");
    595 
    596         logln("Testing forward iteration...");
    597         do {
    598             /* logln("c=%d i=%d char32At=%d", c, i, text.char32At(i)); */
    599             if (c == CharacterIterator::DONE && i != text.length())
    600                 errln("Iterator reached end prematurely");
    601             else if(iter.hasNext() == FALSE && i != text.length())
    602                 errln("Iterator reached end prematurely.  Failed at hasNext");
    603             else if (c != text.char32At(i))
    604                 errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
    605 
    606             if (iter.current32() != c)
    607                 errln("current32() isn't working right");
    608             if(iter.setIndex32(i) != c)
    609                 errln("setIndex32() isn't working right");
    610             if (c != CharacterIterator::DONE) {
    611                 c = iter.next32();
    612                 i=UTF16_NEED_MULTIPLE_UCHAR(c) ? i+2 : i+1;
    613             }
    614         } while (c != CharacterIterator::DONE);
    615         if(iter.hasNext() == TRUE)
    616            errln("hasNext() returned true at the end of the string");
    617 
    618 
    619 
    620         c=iter.setToEnd();
    621         if(iter.getIndex() != text.length() || iter.hasNext() != FALSE)
    622             errln("setToEnd failed");
    623 
    624         c=iter.next32();
    625         if(c!= CharacterIterator::DONE)
    626             errln("next32 didn't return DONE at the end");
    627         c=iter.setIndex32(text.length()+1);
    628         if(c!= CharacterIterator::DONE)
    629             errln("setIndex32(len+1) didn't return DONE");
    630 
    631 
    632         c = iter.last32();
    633         i = text.length()-1;
    634         logln("Testing backward iteration...");
    635         do {
    636             if (c == CharacterIterator::DONE && i >= 0)
    637                 errln((UnicodeString)"Iterator reached start prematurely for i=" + i);
    638             else if(iter.hasPrevious() == FALSE && i>0)
    639                 errln((UnicodeString)"Iterator reached start prematurely for i=" + i);
    640             else if (c != text.char32At(i))
    641                 errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
    642 
    643             if (iter.current32() != c)
    644                 errln("current32() isn't working right");
    645             if(iter.setIndex32(i) != c)
    646                 errln("setIndex32() isn't working right");
    647             if (iter.getIndex() != i)
    648                 errln("getIndex() isn't working right");
    649             if (c != CharacterIterator::DONE) {
    650                 c = iter.previous32();
    651                 i=UTF16_NEED_MULTIPLE_UCHAR(c) ? i-2 : i-1;
    652             }
    653         } while (c != CharacterIterator::DONE);
    654         if(iter.hasPrevious() == TRUE)
    655             errln("hasPrevious returned true after reaching the start");
    656 
    657         c=iter.previous32();
    658         if(c!= CharacterIterator::DONE)
    659             errln("previous32 didn't return DONE at the beginning");
    660 
    661 
    662 
    663 
    664         //testing first32PostInc, next32PostInc, setTostart
    665         i = 0;
    666         c=iter.first32PostInc();
    667         if(c != text.char32At(i))
    668             errln("first32PostInc failed.  Expected->%X Got->%X", text.char32At(i), c);
    669         if(iter.getIndex() != U16_LENGTH(c) + i)
    670             errln((UnicodeString)"getIndex() after first32PostInc() failed");
    671 
    672         iter.setToStart();
    673         i=0;
    674         if (iter.startIndex() != 0)
    675             errln("setToStart failed");
    676 
    677         logln("Testing forward iteration...");
    678         do {
    679             if (c != CharacterIterator::DONE)
    680                 c = iter.next32PostInc();
    681 
    682             if(c != text.char32At(i))
    683                 errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
    684 
    685             i=UTF16_NEED_MULTIPLE_UCHAR(c) ? i+2 : i+1;
    686             if(iter.getIndex() != i)
    687                 errln("getIndex() aftr next32PostInc() isn't working right");
    688             if(iter.current32() != text.char32At(i))
    689                 errln("current() after next32PostInc() isn't working right");
    690         } while (iter.hasNext());
    691         c=iter.next32PostInc();
    692         if(c!= CharacterIterator::DONE)
    693             errln("next32PostInc() didn't return DONE at the beginning");
    694 
    695 
    696     }
    697 
    698     {
    699         StringCharacterIterator iter(text, 1, 11, 10);
    700         if (iter.startIndex() != 1 || iter.endIndex() != 11)
    701             errln("creation of a restricted-range iterator failed");
    702 
    703         if (iter.getIndex() != 10 || iter.current32() != text.char32At(10))
    704             errln("starting the iterator in the middle didn't work");
    705 
    706         c = iter.first32();
    707 
    708         i = 1;
    709 
    710         logln("Testing forward iteration over a range...");
    711         do {
    712             if (c == CharacterIterator::DONE && i != 11)
    713                 errln("Iterator reached end prematurely");
    714             else if(iter.hasNext() == FALSE)
    715                 errln("Iterator reached end prematurely");
    716             else if (c != text.char32At(i))
    717                 errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
    718 
    719             if (iter.current32() != c)
    720                 errln("current32() isn't working right");
    721             if(iter.setIndex32(i) != c)
    722                 errln("setIndex32() isn't working right");
    723 
    724             if (c != CharacterIterator::DONE) {
    725                 c = iter.next32();
    726                 i=UTF16_NEED_MULTIPLE_UCHAR(c) ? i+2 : i+1;
    727             }
    728         } while (c != CharacterIterator::DONE);
    729         c=iter.next32();
    730         if(c != CharacterIterator::DONE)
    731             errln("error in next32()");
    732 
    733 
    734 
    735         c=iter.last32();
    736         i = 10;
    737         logln("Testing backward iteration over a range...");
    738         do {
    739             if (c == CharacterIterator::DONE && i >= 5)
    740                 errln("Iterator reached start prematurely");
    741             else if(iter.hasPrevious() == FALSE && i > 5)
    742                 errln("Iterator reached start prematurely");
    743             else if (c != text.char32At(i))
    744                 errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
    745             if (iter.current32() != c)
    746                 errln("current32() isn't working right");
    747             if (iter.getIndex() != i)
    748                 errln("getIndex() isn't working right");
    749             if(iter.setIndex32(i) != c)
    750                 errln("setIndex32() isn't working right");
    751 
    752             if (c != CharacterIterator::DONE) {
    753                 c = iter.previous32();
    754                 i=UTF16_NEED_MULTIPLE_UCHAR(c) ? i-2 : i-1;
    755             }
    756 
    757         } while (c != CharacterIterator::DONE);
    758         c=iter.previous32();
    759         if(c!= CharacterIterator::DONE)
    760             errln("error on previous32");
    761 
    762 
    763     }
    764 }
    765 
    766 void CharIterTest::TestUCharIterator(UCharIterator *iter, CharacterIterator &ci,
    767                                      const char *moves, const char *which) {
    768     int32_t m;
    769     UChar32 c, c2;
    770     UBool h, h2;
    771 
    772     for(m=0;; ++m) {
    773         // move both iter and s[index]
    774         switch(moves[m]) {
    775         case '0':
    776             h=iter->hasNext(iter);
    777             h2=ci.hasNext();
    778             c=iter->current(iter);
    779             c2=ci.current();
    780             break;
    781         case '|':
    782             h=iter->hasNext(iter);
    783             h2=ci.hasNext();
    784             c=uiter_current32(iter);
    785             c2=ci.current32();
    786             break;
    787 
    788         case '+':
    789             h=iter->hasNext(iter);
    790             h2=ci.hasNext();
    791             c=iter->next(iter);
    792             c2=ci.nextPostInc();
    793             break;
    794         case '>':
    795             h=iter->hasNext(iter);
    796             h2=ci.hasNext();
    797             c=uiter_next32(iter);
    798             c2=ci.next32PostInc();
    799             break;
    800 
    801         case '-':
    802             h=iter->hasPrevious(iter);
    803             h2=ci.hasPrevious();
    804             c=iter->previous(iter);
    805             c2=ci.previous();
    806             break;
    807         case '<':
    808             h=iter->hasPrevious(iter);
    809             h2=ci.hasPrevious();
    810             c=uiter_previous32(iter);
    811             c2=ci.previous32();
    812             break;
    813 
    814         case '2':
    815             h=h2=FALSE;
    816             c=(UChar32)iter->move(iter, 2, UITER_CURRENT);
    817             c2=(UChar32)ci.move(2, CharacterIterator::kCurrent);
    818             break;
    819 
    820         case '8':
    821             h=h2=FALSE;
    822             c=(UChar32)iter->move(iter, -2, UITER_CURRENT);
    823             c2=(UChar32)ci.move(-2, CharacterIterator::kCurrent);
    824             break;
    825 
    826         case 0:
    827             return;
    828         default:
    829             errln("error: unexpected move character '%c' in \"%s\"", moves[m], moves);
    830             return;
    831         }
    832 
    833         // compare results
    834         if(c2==0xffff) {
    835             c2=(UChar32)-1;
    836         }
    837         if(c!=c2 || h!=h2 || ci.getIndex()!=iter->getIndex(iter, UITER_CURRENT)) {
    838             errln("error: UCharIterator(%s) misbehaving at \"%s\"[%d]='%c'", which, moves, m, moves[m]);
    839         }
    840     }
    841 }
    842 
    843 void CharIterTest::TestUCharIterator() {
    844     // test string of length 8
    845     UnicodeString s=UnicodeString("a \\U00010001b\\U0010fffdz", "").unescape();
    846     const char *const moves=
    847         "0+++++++++" // 10 moves per line
    848         "----0-----"
    849         ">>|>>>>>>>"
    850         "<<|<<<<<<<"
    851         "22+>8>-8+2";
    852 
    853     StringCharacterIterator sci(s), compareCI(s);
    854 
    855     UCharIterator sIter, cIter, rIter;
    856 
    857     uiter_setString(&sIter, s.getBuffer(), s.length());
    858     uiter_setCharacterIterator(&cIter, &sci);
    859     uiter_setReplaceable(&rIter, &s);
    860 
    861     TestUCharIterator(&sIter, compareCI, moves, "uiter_setString");
    862     compareCI.setIndex(0);
    863     TestUCharIterator(&cIter, compareCI, moves, "uiter_setCharacterIterator");
    864     compareCI.setIndex(0);
    865     TestUCharIterator(&rIter, compareCI, moves, "uiter_setReplaceable");
    866 
    867     // test move & getIndex some more
    868     sIter.start=2;
    869     sIter.index=3;
    870     sIter.limit=5;
    871     if( sIter.getIndex(&sIter, UITER_ZERO)!=0 ||
    872         sIter.getIndex(&sIter, UITER_START)!=2 ||
    873         sIter.getIndex(&sIter, UITER_CURRENT)!=3 ||
    874         sIter.getIndex(&sIter, UITER_LIMIT)!=5 ||
    875         sIter.getIndex(&sIter, UITER_LENGTH)!=s.length()
    876     ) {
    877         errln("error: UCharIterator(string).getIndex returns wrong index");
    878     }
    879 
    880     if( sIter.move(&sIter, 4, UITER_ZERO)!=4 ||
    881         sIter.move(&sIter, 1, UITER_START)!=3 ||
    882         sIter.move(&sIter, 3, UITER_CURRENT)!=5 ||
    883         sIter.move(&sIter, -1, UITER_LIMIT)!=4 ||
    884         sIter.move(&sIter, -5, UITER_LENGTH)!=3 ||
    885         sIter.move(&sIter, 0, UITER_CURRENT)!=sIter.getIndex(&sIter, UITER_CURRENT) ||
    886         sIter.getIndex(&sIter, UITER_CURRENT)!=3
    887     ) {
    888         errln("error: UCharIterator(string).move sets/returns wrong index");
    889     }
    890 
    891     sci=StringCharacterIterator(s, 2, 5, 3);
    892     uiter_setCharacterIterator(&cIter, &sci);
    893     if( cIter.getIndex(&cIter, UITER_ZERO)!=0 ||
    894         cIter.getIndex(&cIter, UITER_START)!=2 ||
    895         cIter.getIndex(&cIter, UITER_CURRENT)!=3 ||
    896         cIter.getIndex(&cIter, UITER_LIMIT)!=5 ||
    897         cIter.getIndex(&cIter, UITER_LENGTH)!=s.length()
    898     ) {
    899         errln("error: UCharIterator(character iterator).getIndex returns wrong index");
    900     }
    901 
    902     if( cIter.move(&cIter, 4, UITER_ZERO)!=4 ||
    903         cIter.move(&cIter, 1, UITER_START)!=3 ||
    904         cIter.move(&cIter, 3, UITER_CURRENT)!=5 ||
    905         cIter.move(&cIter, -1, UITER_LIMIT)!=4 ||
    906         cIter.move(&cIter, -5, UITER_LENGTH)!=3 ||
    907         cIter.move(&cIter, 0, UITER_CURRENT)!=cIter.getIndex(&cIter, UITER_CURRENT) ||
    908         cIter.getIndex(&cIter, UITER_CURRENT)!=3
    909     ) {
    910         errln("error: UCharIterator(character iterator).move sets/returns wrong index");
    911     }
    912 
    913 
    914     if(cIter.getIndex(&cIter, (enum UCharIteratorOrigin)-1) != -1)
    915     {
    916         errln("error: UCharIterator(char iter).getIndex did not return error value");
    917     }
    918 
    919     if(cIter.move(&cIter, 0, (enum UCharIteratorOrigin)-1) != -1)
    920     {
    921         errln("error: UCharIterator(char iter).move did not return error value");
    922     }
    923 
    924 
    925     if(rIter.getIndex(&rIter, (enum UCharIteratorOrigin)-1) != -1)
    926     {
    927         errln("error: UCharIterator(repl iter).getIndex did not return error value");
    928     }
    929 
    930     if(rIter.move(&rIter, 0, (enum UCharIteratorOrigin)-1) != -1)
    931     {
    932         errln("error: UCharIterator(repl iter).move did not return error value");
    933     }
    934 
    935 
    936     if(sIter.getIndex(&sIter, (enum UCharIteratorOrigin)-1) != -1)
    937     {
    938         errln("error: UCharIterator(string iter).getIndex did not return error value");
    939     }
    940 
    941     if(sIter.move(&sIter, 0, (enum UCharIteratorOrigin)-1) != -1)
    942     {
    943         errln("error: UCharIterator(string iter).move did not return error value");
    944     }
    945 
    946     /* Testing function coverage on bad input */
    947     UErrorCode status = U_ZERO_ERROR;
    948     uiter_setString(&sIter, NULL, 1);
    949     uiter_setState(&sIter, 1, &status);
    950     if (status != U_UNSUPPORTED_ERROR) {
    951         errln("error: uiter_setState returned %s instead of U_UNSUPPORTED_ERROR", u_errorName(status));
    952     }
    953     status = U_ZERO_ERROR;
    954     uiter_setState(NULL, 1, &status);
    955     if (status != U_ILLEGAL_ARGUMENT_ERROR) {
    956         errln("error: uiter_setState returned %s instead of U_ILLEGAL_ARGUMENT_ERROR", u_errorName(status));
    957     }
    958     if (uiter_getState(&sIter) != UITER_NO_STATE) {
    959         errln("error: uiter_getState did not return UITER_NO_STATE on bad input");
    960     }
    961 }
    962 
    963 // subclass test, and completing API coverage -------------------------------
    964 
    965 class SubCharIter : public CharacterIterator {
    966 public:
    967     // public default constructor, to get coverage of CharacterIterator()
    968     SubCharIter() : CharacterIterator() {
    969         textLength=end=UPRV_LENGTHOF(s);
    970         s[0]=0x61;      // 'a'
    971         s[1]=0xd900;    // U+50400
    972         s[2]=0xdd00;
    973         s[3]=0x2029;    // PS
    974     }
    975 
    976     // useful stuff, mostly dummy but testing coverage and subclassability
    977     virtual UChar nextPostInc() {
    978         if(pos<UPRV_LENGTHOF(s)) {
    979             return s[pos++];
    980         } else {
    981             return DONE;
    982         }
    983     }
    984 
    985     virtual UChar32 next32PostInc() {
    986         if(pos<UPRV_LENGTHOF(s)) {
    987             UChar32 c;
    988             U16_NEXT(s, pos, UPRV_LENGTHOF(s), c);
    989             return c;
    990         } else {
    991             return DONE;
    992         }
    993     }
    994 
    995     virtual UBool hasNext() {
    996         return pos<UPRV_LENGTHOF(s);
    997     }
    998 
    999     virtual UChar first() {
   1000         pos=0;
   1001         return s[0];
   1002     }
   1003 
   1004     virtual UChar32 first32() {
   1005         UChar32 c;
   1006         pos=0;
   1007         U16_NEXT(s, pos, UPRV_LENGTHOF(s), c);
   1008         pos=0;
   1009         return c;
   1010     }
   1011 
   1012     virtual UChar setIndex(int32_t position) {
   1013         if(0<=position && position<=UPRV_LENGTHOF(s)) {
   1014             pos=position;
   1015             if(pos<UPRV_LENGTHOF(s)) {
   1016                 return s[pos];
   1017             }
   1018         }
   1019         return DONE;
   1020     }
   1021 
   1022     virtual UChar32 setIndex32(int32_t position) {
   1023         if(0<=position && position<=UPRV_LENGTHOF(s)) {
   1024             pos=position;
   1025             if(pos<UPRV_LENGTHOF(s)) {
   1026                 UChar32 c;
   1027                 U16_GET(s, 0, pos, UPRV_LENGTHOF(s), c);
   1028                 return c;
   1029             }
   1030         }
   1031         return DONE;
   1032     }
   1033 
   1034     virtual UChar current() const {
   1035         if(pos<UPRV_LENGTHOF(s)) {
   1036             return s[pos];
   1037         } else {
   1038             return DONE;
   1039         }
   1040     }
   1041 
   1042     virtual UChar32 current32() const {
   1043         if(pos<UPRV_LENGTHOF(s)) {
   1044             UChar32 c;
   1045             U16_GET(s, 0, pos, UPRV_LENGTHOF(s), c);
   1046             return c;
   1047         } else {
   1048             return DONE;
   1049         }
   1050     }
   1051 
   1052     virtual UChar next() {
   1053         if(pos<UPRV_LENGTHOF(s) && ++pos<UPRV_LENGTHOF(s)) {
   1054             return s[pos];
   1055         } else {
   1056             return DONE;
   1057         }
   1058     }
   1059 
   1060     virtual UChar32 next32() {
   1061         if(pos<UPRV_LENGTHOF(s)) {
   1062             U16_FWD_1(s, pos, UPRV_LENGTHOF(s));
   1063         }
   1064         if(pos<UPRV_LENGTHOF(s)) {
   1065             UChar32 c;
   1066             int32_t i=pos;
   1067             U16_NEXT(s, i, UPRV_LENGTHOF(s), c);
   1068             return c;
   1069         } else {
   1070             return DONE;
   1071         }
   1072     }
   1073 
   1074     virtual UBool hasPrevious() {
   1075         return pos>0;
   1076     }
   1077 
   1078     virtual void getText(UnicodeString &result) {
   1079         result.setTo(s, UPRV_LENGTHOF(s));
   1080     }
   1081 
   1082     // dummy implementations of other pure virtual base class functions
   1083     virtual UBool operator==(const ForwardCharacterIterator &that) const {
   1084         return
   1085             this==&that ||
   1086             (typeid(*this)==typeid(that) && pos==((SubCharIter &)that).pos);
   1087     }
   1088 
   1089     virtual int32_t hashCode() const {
   1090         return 2;
   1091     }
   1092 
   1093     virtual CharacterIterator *clone() const {
   1094         return NULL;
   1095     }
   1096 
   1097     virtual UChar last() {
   1098         return 0;
   1099     }
   1100 
   1101     virtual UChar32 last32() {
   1102         return 0;
   1103     }
   1104 
   1105     virtual UChar previous() {
   1106         return 0;
   1107     }
   1108 
   1109     virtual UChar32 previous32() {
   1110         return 0;
   1111     }
   1112 
   1113     virtual int32_t move(int32_t /*delta*/, EOrigin /*origin*/) {
   1114         return 0;
   1115     }
   1116 
   1117     virtual int32_t move32(int32_t /*delta*/, EOrigin /*origin*/) {
   1118         return 0;
   1119     }
   1120 
   1121     // RTTI
   1122     static UClassID getStaticClassID() {
   1123         return (UClassID)(&fgClassID);
   1124     }
   1125 
   1126     virtual UClassID getDynamicClassID() const {
   1127         return getStaticClassID();
   1128     }
   1129 
   1130 private:
   1131     // dummy string data
   1132     UChar s[4];
   1133 
   1134     static const char fgClassID;
   1135 };
   1136 
   1137 const char SubCharIter::fgClassID = 0;
   1138 
   1139 class SubStringCharIter : public StringCharacterIterator {
   1140 public:
   1141     SubStringCharIter() {
   1142         setText(UNICODE_STRING("abc", 3));
   1143     }
   1144 };
   1145 
   1146 class SubUCharCharIter : public UCharCharacterIterator {
   1147 public:
   1148     SubUCharCharIter() {
   1149         setText(u, 3);
   1150     }
   1151 
   1152 private:
   1153     static const UChar u[3];
   1154 };
   1155 
   1156 const UChar SubUCharCharIter::u[3]={ 0x61, 0x62, 0x63 };
   1157 
   1158 void CharIterTest::TestCharIteratorSubClasses() {
   1159     SubCharIter *p;
   1160 
   1161     // coverage - call functions that are not otherwise tested
   1162     // first[32]PostInc() are default implementations that are overridden
   1163     // in ICU's own CharacterIterator subclasses
   1164     p=new SubCharIter;
   1165     if(p->firstPostInc()!=0x61) {
   1166         errln("SubCharIter.firstPosInc() failed\n");
   1167     }
   1168     delete p;
   1169 
   1170     p=new SubCharIter[2];
   1171     if(p[1].first32PostInc()!=0x61) {
   1172         errln("SubCharIter.first32PosInc() failed\n");
   1173     }
   1174     delete [] p;
   1175 
   1176     // coverage: StringCharacterIterator default constructor
   1177     SubStringCharIter sci;
   1178     if(sci.firstPostInc()!=0x61) {
   1179         errln("SubStringCharIter.firstPostInc() failed\n");
   1180     }
   1181 
   1182     // coverage: UCharCharacterIterator default constructor
   1183     SubUCharCharIter uci;
   1184     if(uci.firstPostInc()!=0x61) {
   1185         errln("SubUCharCharIter.firstPostInc() failed\n");
   1186     }
   1187 }
   1188