Home | History | Annotate | Download | only in intltest
      1 /********************************************************************
      2  * COPYRIGHT:
      3  * Copyright (c) 1997-2014, International Business Machines Corporation and
      4  * others. All Rights Reserved.
      5  ********************************************************************/
      6 //===============================================================================
      7 //
      8 // File apicoll.cpp
      9 //
     10 //
     11 //
     12 // Created by: Helena Shih
     13 //
     14 // Modification History:
     15 //
     16 //  Date         Name          Description
     17 //  2/5/97      aliu        Added streamIn and streamOut methods.  Added
     18 //                          constructor which reads RuleBasedCollator object from
     19 //                          a binary file.  Added writeToFile method which streams
     20 //                          RuleBasedCollator out to a binary file.  The streamIn
     21 //                          and streamOut methods use istream and ostream objects
     22 //                          in binary mode.
     23 //  6/30/97     helena      Added tests for CollationElementIterator::setText, getOffset
     24 //                          setOffset and DecompositionIterator::getOffset, setOffset.
     25 //                          DecompositionIterator is made public so add class scope
     26 //                          testing.
     27 //  02/10/98    damiba      Added test for compare(UnicodeString&, UnicodeString&, int32_t)
     28 //===============================================================================
     29 
     30 #include "unicode/utypes.h"
     31 
     32 #if !UCONFIG_NO_COLLATION
     33 
     34 #include "unicode/localpointer.h"
     35 #include "unicode/coll.h"
     36 #include "unicode/tblcoll.h"
     37 #include "unicode/coleitr.h"
     38 #include "unicode/sortkey.h"
     39 #include "apicoll.h"
     40 #include "unicode/chariter.h"
     41 #include "unicode/schriter.h"
     42 #include "unicode/ustring.h"
     43 #include "unicode/ucol.h"
     44 
     45 #include "sfwdchit.h"
     46 #include "cmemory.h"
     47 #include <stdlib.h>
     48 
     49 #define LENGTHOF(array) (int32_t)(sizeof(array)/sizeof((array)[0]))
     50 
     51 void
     52 CollationAPITest::doAssert(UBool condition, const char *message)
     53 {
     54     if (!condition) {
     55         errln(UnicodeString("ERROR : ") + message);
     56     }
     57 }
     58 
     59 // Collator Class Properties
     60 // ctor, dtor, createInstance, compare, getStrength/setStrength
     61 // getDecomposition/setDecomposition, getDisplayName
     62 void
     63 CollationAPITest::TestProperty(/* char* par */)
     64 {
     65     UErrorCode success = U_ZERO_ERROR;
     66     Collator *col = 0;
     67     /*
     68      * Expected version of the English collator.
     69      * Currently, the major/minor version numbers change when the builder code
     70      * changes,
     71      * number 2 is from the tailoring data version and
     72      * number 3 is the UCA version.
     73      * This changes with every UCA version change, and the expected value
     74      * needs to be adjusted.
     75      * Same in cintltst/capitst.c.
     76      */
     77     UVersionInfo currVersionArray = {0x31, 0xC0, 0x05, 0x2A};  // from ICU 4.4/UCA 5.2
     78     UVersionInfo versionArray;
     79 
     80     logln("The property tests begin : ");
     81     logln("Test ctors : ");
     82     col = Collator::createInstance(Locale::getEnglish(), success);
     83     if (U_FAILURE(success)){
     84         errcheckln(success, "Default Collator creation failed. - %s", u_errorName(success));
     85         return;
     86     }
     87 
     88     StringEnumeration* kwEnum = col->getKeywordValuesForLocale("", Locale::getEnglish(),true,success);
     89     if (U_FAILURE(success)){
     90         errcheckln(success, "Get Keyword Values for Locale failed. - %s", u_errorName(success));
     91         return;
     92     }
     93     delete kwEnum;
     94 
     95     col->getVersion(versionArray);
     96     // Check for a version greater than some value rather than equality
     97     // so that we need not update the expected version each time.
     98     if (uprv_memcmp(versionArray, currVersionArray, 4)<0) {
     99       errln("Testing Collator::getVersion() - unexpected result: %02x.%02x.%02x.%02x",
    100             versionArray[0], versionArray[1], versionArray[2], versionArray[3]);
    101     } else {
    102       logln("Collator::getVersion() result: %02x.%02x.%02x.%02x",
    103             versionArray[0], versionArray[1], versionArray[2], versionArray[3]);
    104     }
    105 
    106     doAssert((col->compare("ab", "abc") == Collator::LESS), "ab < abc comparison failed");
    107     doAssert((col->compare("ab", "AB") == Collator::LESS), "ab < AB comparison failed");
    108     doAssert((col->compare("blackbird", "black-bird") == Collator::GREATER), "black-bird > blackbird comparison failed");
    109     doAssert((col->compare("black bird", "black-bird") == Collator::LESS), "black bird > black-bird comparison failed");
    110     doAssert((col->compare("Hello", "hello") == Collator::GREATER), "Hello > hello comparison failed");
    111     doAssert((col->compare("","",success) == UCOL_EQUAL), "Comparison between empty strings failed");
    112 
    113     doAssert((col->compareUTF8("\x61\x62\xc3\xa4", "\x61\x62\xc3\x9f", success) == UCOL_LESS), "ab a-umlaut < ab sharp-s UTF-8 comparison failed");
    114     success = U_ZERO_ERROR;
    115     {
    116         UnicodeString abau=UNICODE_STRING_SIMPLE("\\x61\\x62\\xe4").unescape();
    117         UnicodeString abss=UNICODE_STRING_SIMPLE("\\x61\\x62\\xdf").unescape();
    118         UCharIterator abauIter, abssIter;
    119         uiter_setReplaceable(&abauIter, &abau);
    120         uiter_setReplaceable(&abssIter, &abss);
    121         doAssert((col->compare(abauIter, abssIter, success) == UCOL_LESS), "ab a-umlaut < ab sharp-s UCharIterator comparison failed");
    122         success = U_ZERO_ERROR;
    123     }
    124 
    125     /*start of update [Bertrand A. D. 02/10/98]*/
    126     doAssert((col->compare("ab", "abc", 2) == Collator::EQUAL), "ab = abc with length 2 comparison failed");
    127     doAssert((col->compare("ab", "AB", 2) == Collator::LESS), "ab < AB  with length 2 comparison failed");
    128     doAssert((col->compare("ab", "Aa", 1) == Collator::LESS), "ab < Aa  with length 1 comparison failed");
    129     doAssert((col->compare("ab", "Aa", 2) == Collator::GREATER), "ab > Aa  with length 2 comparison failed");
    130     doAssert((col->compare("black-bird", "blackbird", 5) == Collator::EQUAL), "black-bird = blackbird with length of 5 comparison failed");
    131     doAssert((col->compare("black bird", "black-bird", 10) == Collator::LESS), "black bird < black-bird with length 10 comparison failed");
    132     doAssert((col->compare("Hello", "hello", 5) == Collator::GREATER), "Hello > hello with length 5 comparison failed");
    133     /*end of update [Bertrand A. D. 02/10/98]*/
    134 
    135 
    136     logln("Test ctors ends.");
    137     logln("testing Collator::getStrength() method ...");
    138     doAssert((col->getStrength() == Collator::TERTIARY), "collation object has the wrong strength");
    139     doAssert((col->getStrength() != Collator::PRIMARY), "collation object's strength is primary difference");
    140 
    141 
    142     logln("testing Collator::setStrength() method ...");
    143     col->setStrength(Collator::SECONDARY);
    144     doAssert((col->getStrength() != Collator::TERTIARY), "collation object's strength is secondary difference");
    145     doAssert((col->getStrength() != Collator::PRIMARY), "collation object's strength is primary difference");
    146     doAssert((col->getStrength() == Collator::SECONDARY), "collation object has the wrong strength");
    147 
    148     UnicodeString name;
    149 
    150     logln("Get display name for the US English collation in German : ");
    151     logln(Collator::getDisplayName(Locale::getUS(), Locale::getGerman(), name));
    152     doAssert((name == UnicodeString("Englisch (Vereinigte Staaten)")), "getDisplayName failed");
    153 
    154     logln("Get display name for the US English collation in English : ");
    155     logln(Collator::getDisplayName(Locale::getUS(), Locale::getEnglish(), name));
    156     doAssert((name == UnicodeString("English (United States)")), "getDisplayName failed");
    157 #if 0
    158     // weiv : this test is bogus if we're running on any machine that has different default locale than English.
    159     // Therefore, it is banned!
    160     logln("Get display name for the US English in default locale language : ");
    161     logln(Collator::getDisplayName(Locale::US, name));
    162     doAssert((name == UnicodeString("English (United States)")), "getDisplayName failed if this is an English machine");
    163 #endif
    164     delete col; col = 0;
    165     RuleBasedCollator *rcol = (RuleBasedCollator *)Collator::createInstance("da_DK",
    166                                                                             success);
    167     if (U_FAILURE(success)) {
    168         errcheckln(success, "Collator::createInstance(\"da_DK\") failed - %s", u_errorName(success));
    169         return;
    170     }
    171     const UnicodeString &daRules = rcol->getRules();
    172     if(daRules.isEmpty()) {
    173         dataerrln("missing da_DK tailoring rule string");
    174     } else {
    175         doAssert(daRules.indexOf("aa") >= 0, "da_DK rules do not contain 'aa'");
    176     }
    177     delete rcol;
    178 
    179     col = Collator::createInstance(Locale::getFrench(), success);
    180     if (U_FAILURE(success))
    181     {
    182         errln("Creating French collation failed.");
    183         return;
    184     }
    185 
    186     col->setStrength(Collator::PRIMARY);
    187     logln("testing Collator::getStrength() method again ...");
    188     doAssert((col->getStrength() != Collator::TERTIARY), "collation object has the wrong strength");
    189     doAssert((col->getStrength() == Collator::PRIMARY), "collation object's strength is not primary difference");
    190 
    191     logln("testing French Collator::setStrength() method ...");
    192     col->setStrength(Collator::TERTIARY);
    193     doAssert((col->getStrength() == Collator::TERTIARY), "collation object's strength is not tertiary difference");
    194     doAssert((col->getStrength() != Collator::PRIMARY), "collation object's strength is primary difference");
    195     doAssert((col->getStrength() != Collator::SECONDARY), "collation object's strength is secondary difference");
    196 
    197     logln("Create junk collation: ");
    198     Locale abcd("ab", "CD", "");
    199     success = U_ZERO_ERROR;
    200     Collator *junk = 0;
    201     junk = Collator::createInstance(abcd, success);
    202 
    203     if (U_FAILURE(success))
    204     {
    205         errln("Junk collation creation failed, should at least return default.");
    206         delete col;
    207         return;
    208     }
    209 
    210     delete col;
    211     col = Collator::createInstance(success);
    212     if (U_FAILURE(success))
    213     {
    214         errln("Creating default collator failed.");
    215         delete junk;
    216         return;
    217     }
    218 
    219     doAssert(((RuleBasedCollator *)col)->getRules() == ((RuleBasedCollator *)junk)->getRules(),
    220                "The default collation should be returned.");
    221     Collator *frCol = Collator::createInstance(Locale::getCanadaFrench(), success);
    222     if (U_FAILURE(success))
    223     {
    224         errln("Creating fr_CA collator failed.");
    225         delete col;
    226         delete junk;
    227         return;
    228     }
    229 
    230     // If the default locale isn't French, the French and non-French collators
    231     // should be different
    232     if (frCol->getLocale(ULOC_ACTUAL_LOCALE, success) != Locale::getCanadaFrench()) {
    233         doAssert((*frCol != *junk), "The junk is the same as the fr_CA collator.");
    234     }
    235     Collator *aFrCol = frCol->clone();
    236     doAssert((*frCol == *aFrCol), "The cloning of a fr_CA collator failed.");
    237     logln("Collator property test ended.");
    238 
    239     delete col;
    240     delete frCol;
    241     delete aFrCol;
    242     delete junk;
    243 }
    244 
    245 void
    246 CollationAPITest::TestRuleBasedColl()
    247 {
    248     RuleBasedCollator *col1, *col2, *col3, *col4;
    249     UErrorCode status = U_ZERO_ERROR;
    250 
    251     UnicodeString ruleset1("&9 < a, A < b, B < c, C; ch, cH, Ch, CH < d, D, e, E");
    252     UnicodeString ruleset2("&9 < a, A < b, B < c, C < d, D, e, E");
    253 
    254     col1 = new RuleBasedCollator(ruleset1, status);
    255     if (U_FAILURE(status)) {
    256         errcheckln(status, "RuleBased Collator creation failed. - %s", u_errorName(status));
    257         return;
    258     }
    259     else {
    260         logln("PASS: RuleBased Collator creation passed\n");
    261     }
    262 
    263     status = U_ZERO_ERROR;
    264     col2 = new RuleBasedCollator(ruleset2, status);
    265     if (U_FAILURE(status)) {
    266         errln("RuleBased Collator creation failed.\n");
    267         return;
    268     }
    269     else {
    270         logln("PASS: RuleBased Collator creation passed\n");
    271     }
    272 
    273     status = U_ZERO_ERROR;
    274     Locale locale("aa", "AA");
    275     col3 = (RuleBasedCollator *)Collator::createInstance(locale, status);
    276     if (U_FAILURE(status)) {
    277         errln("Fallback Collator creation failed.: %s\n");
    278         return;
    279     }
    280     else {
    281         logln("PASS: Fallback Collator creation passed\n");
    282     }
    283     delete col3;
    284 
    285     status = U_ZERO_ERROR;
    286     col3 = (RuleBasedCollator *)Collator::createInstance(status);
    287     if (U_FAILURE(status)) {
    288         errln("Default Collator creation failed.: %s\n");
    289         return;
    290     }
    291     else {
    292         logln("PASS: Default Collator creation passed\n");
    293     }
    294 
    295     UnicodeString rule1 = col1->getRules();
    296     UnicodeString rule2 = col2->getRules();
    297     UnicodeString rule3 = col3->getRules();
    298 
    299     doAssert(rule1 != rule2, "Default collator getRules failed");
    300     doAssert(rule2 != rule3, "Default collator getRules failed");
    301     doAssert(rule1 != rule3, "Default collator getRules failed");
    302 
    303     col4 = new RuleBasedCollator(rule2, status);
    304     if (U_FAILURE(status)) {
    305         errln("RuleBased Collator creation failed.\n");
    306         return;
    307     }
    308 
    309     UnicodeString rule4 = col4->getRules();
    310     doAssert(rule2 == rule4, "Default collator getRules failed");
    311     int32_t length4 = 0;
    312     uint8_t *clonedrule4 = col4->cloneRuleData(length4, status);
    313     if (U_FAILURE(status)) {
    314         errln("Cloned rule data failed.\n");
    315         return;
    316     }
    317 
    318  //   free(clonedrule4);     BAD API!!!!
    319     uprv_free(clonedrule4);
    320 
    321 
    322     delete col1;
    323     delete col2;
    324     delete col3;
    325     delete col4;
    326 }
    327 
    328 void
    329 CollationAPITest::TestRules()
    330 {
    331     RuleBasedCollator *coll;
    332     UErrorCode status = U_ZERO_ERROR;
    333     UnicodeString rules;
    334 
    335     coll = (RuleBasedCollator *)Collator::createInstance(Locale::getEnglish(), status);
    336     if (U_FAILURE(status)) {
    337         errcheckln(status, "English Collator creation failed. - %s", u_errorName(status));
    338         return;
    339     }
    340     else {
    341         logln("PASS: RuleBased Collator creation passed\n");
    342     }
    343 
    344     coll->getRules(UCOL_TAILORING_ONLY, rules);
    345     if (rules.length() != 0x00) {
    346       errln("English tailored rules failed - length is 0x%x expected 0x%x", rules.length(), 0x00);
    347     }
    348 
    349     coll->getRules(UCOL_FULL_RULES, rules);
    350     if (rules.length() < 0) {
    351         errln("English full rules failed");
    352     }
    353     delete coll;
    354 }
    355 
    356 void
    357 CollationAPITest::TestDecomposition() {
    358   UErrorCode status = U_ZERO_ERROR;
    359   Collator *en_US = Collator::createInstance("en_US", status),
    360     *el_GR = Collator::createInstance("el_GR", status),
    361     *vi_VN = Collator::createInstance("vi_VN", status);
    362 
    363   if (U_FAILURE(status)) {
    364     errcheckln(status, "ERROR: collation creation failed. - %s", u_errorName(status));
    365     return;
    366   }
    367 
    368   /* there is no reason to have canonical decomposition in en_US OR default locale */
    369   if (vi_VN->getAttribute(UCOL_NORMALIZATION_MODE, status) != UCOL_ON)
    370   {
    371     errln("ERROR: vi_VN collation did not have canonical decomposition for normalization!\n");
    372   }
    373 
    374   if (el_GR->getAttribute(UCOL_NORMALIZATION_MODE, status) != UCOL_ON)
    375   {
    376     errln("ERROR: el_GR collation did not have canonical decomposition for normalization!\n");
    377   }
    378 
    379   if (en_US->getAttribute(UCOL_NORMALIZATION_MODE, status) != UCOL_OFF)
    380   {
    381     errln("ERROR: en_US collation had canonical decomposition for normalization!\n");
    382   }
    383 
    384   delete en_US;
    385   delete el_GR;
    386   delete vi_VN;
    387 }
    388 
    389 void
    390 CollationAPITest::TestSafeClone() {
    391     static const int CLONETEST_COLLATOR_COUNT = 3;
    392     Collator *someCollators [CLONETEST_COLLATOR_COUNT];
    393     Collator *col;
    394     UErrorCode err = U_ZERO_ERROR;
    395     int index;
    396 
    397     UnicodeString test1("abCda");
    398     UnicodeString test2("abcda");
    399 
    400     /* one default collator & two complex ones */
    401     someCollators[0] = Collator::createInstance("en_US", err);
    402     someCollators[1] = Collator::createInstance("ko", err);
    403     someCollators[2] = Collator::createInstance("ja_JP", err);
    404     if(U_FAILURE(err)) {
    405       errcheckln(err, "Couldn't instantiate collators. Error: %s", u_errorName(err));
    406       delete someCollators[0];
    407       delete someCollators[1];
    408       delete someCollators[2];
    409       return;
    410     }
    411 
    412     /* change orig & clone & make sure they are independent */
    413 
    414     for (index = 0; index < CLONETEST_COLLATOR_COUNT; index++)
    415     {
    416         col = someCollators[index]->safeClone();
    417         if (col == 0) {
    418             errln("SafeClone of collator should not return null\n");
    419             break;
    420         }
    421         col->setStrength(Collator::TERTIARY);
    422         someCollators[index]->setStrength(Collator::PRIMARY);
    423         col->setAttribute(UCOL_CASE_LEVEL, UCOL_OFF, err);
    424         someCollators[index]->setAttribute(UCOL_CASE_LEVEL, UCOL_OFF, err);
    425 
    426         doAssert(col->greater(test1, test2), "Result should be \"abCda\" >>> \"abcda\" ");
    427         doAssert(someCollators[index]->equals(test1, test2), "Result should be \"abcda\" == \"abCda\"");
    428         delete col;
    429         delete someCollators[index];
    430     }
    431 }
    432 
    433 void
    434 CollationAPITest::TestHashCode(/* char* par */)
    435 {
    436     logln("hashCode tests begin.");
    437     UErrorCode success = U_ZERO_ERROR;
    438     Collator *col1 = 0;
    439     col1 = Collator::createInstance(Locale::getEnglish(), success);
    440     if (U_FAILURE(success))
    441     {
    442         errcheckln(success, "Default collation creation failed. - %s", u_errorName(success));
    443         return;
    444     }
    445 
    446     Collator *col2 = 0;
    447     Locale dk("da", "DK", "");
    448     col2 = Collator::createInstance(dk, success);
    449     if (U_FAILURE(success))
    450     {
    451         errln("Danish collation creation failed.");
    452         return;
    453     }
    454 
    455     Collator *col3 = 0;
    456     col3 = Collator::createInstance(Locale::getEnglish(), success);
    457     if (U_FAILURE(success))
    458     {
    459         errln("2nd default collation creation failed.");
    460         return;
    461     }
    462 
    463     logln("Collator::hashCode() testing ...");
    464 
    465     doAssert(col1->hashCode() != col2->hashCode(), "Hash test1 result incorrect" );
    466     doAssert(!(col1->hashCode() == col2->hashCode()), "Hash test2 result incorrect" );
    467     doAssert(col1->hashCode() == col3->hashCode(), "Hash result not equal" );
    468 
    469     logln("hashCode tests end.");
    470     delete col1;
    471     delete col2;
    472 
    473     UnicodeString test1("Abcda");
    474     UnicodeString test2("abcda");
    475 
    476     CollationKey sortk1, sortk2, sortk3;
    477     UErrorCode status = U_ZERO_ERROR;
    478 
    479     col3->getCollationKey(test1, sortk1, status);
    480     col3->getCollationKey(test2, sortk2, status);
    481     col3->getCollationKey(test2, sortk3, status);
    482 
    483     doAssert(sortk1.hashCode() != sortk2.hashCode(), "Hash test1 result incorrect");
    484     doAssert(sortk2.hashCode() == sortk3.hashCode(), "Hash result not equal" );
    485 
    486     delete col3;
    487 }
    488 
    489 //----------------------------------------------------------------------------
    490 // CollationKey -- Tests the CollationKey methods
    491 //
    492 void
    493 CollationAPITest::TestCollationKey(/* char* par */)
    494 {
    495     logln("testing CollationKey begins...");
    496     Collator *col = 0;
    497     UErrorCode success=U_ZERO_ERROR;
    498     col = Collator::createInstance(Locale::getEnglish(), success);
    499     if (U_FAILURE(success))
    500     {
    501         errcheckln(success, "Default collation creation failed. - %s", u_errorName(success));
    502         return;
    503     }
    504     col->setStrength(Collator::TERTIARY);
    505 
    506     CollationKey sortk1, sortk2;
    507     UnicodeString test1("Abcda"), test2("abcda");
    508     UErrorCode key1Status = U_ZERO_ERROR, key2Status = U_ZERO_ERROR;
    509 
    510     logln("Testing weird arguments");
    511     // No string vs. empty string vs. completely-ignorable string:
    512     // See ICU ticket #10495.
    513     CollationKey sortkNone;
    514     int32_t length;
    515     sortkNone.getByteArray(length);
    516     doAssert(!sortkNone.isBogus() && length == 0,
    517              "Default-constructed collation key should be empty");
    518     CollationKey sortkEmpty;
    519     col->getCollationKey(NULL, 0, sortkEmpty, key1Status);
    520     // key gets reset here
    521     const uint8_t* byteArrayEmpty = sortkEmpty.getByteArray(length);
    522     doAssert(sortkEmpty.isBogus() == FALSE && length == 3 &&
    523              byteArrayEmpty[0] == 1 && byteArrayEmpty[1] == 1 && byteArrayEmpty[2] == 0,
    524              "Empty string should return a collation key with empty levels");
    525     doAssert(sortkNone.compareTo(sortkEmpty) == Collator::LESS,
    526              "Expected no collation key < collation key for empty string");
    527     doAssert(sortkEmpty.compareTo(sortkNone) == Collator::GREATER,
    528              "Expected collation key for empty string > no collation key");
    529 
    530     CollationKey sortkIgnorable;
    531     // Most control codes and CGJ are completely ignorable.
    532     // A string with only completely ignorables must compare equal to an empty string.
    533     col->getCollationKey(UnicodeString((UChar)1).append((UChar)0x34f), sortkIgnorable, key1Status);
    534     sortkIgnorable.getByteArray(length);
    535     doAssert(!sortkIgnorable.isBogus() && length == 3,
    536              "Completely ignorable string should return a collation key with empty levels");
    537     doAssert(sortkIgnorable.compareTo(sortkEmpty) == Collator::EQUAL,
    538              "Completely ignorable string should compare equal to empty string");
    539 
    540     // bogus key returned here
    541     key1Status = U_ILLEGAL_ARGUMENT_ERROR;
    542     col->getCollationKey(NULL, 0, sortk1, key1Status);
    543     doAssert(sortk1.isBogus() && (sortk1.getByteArray(length), length) == 0,
    544         "Error code should return bogus collation key");
    545 
    546     key1Status = U_ZERO_ERROR;
    547     logln("Use tertiary comparison level testing ....");
    548 
    549     col->getCollationKey(test1, sortk1, key1Status);
    550     if (U_FAILURE(key1Status)) {
    551         errln("getCollationKey(Abcda) failed - %s", u_errorName(key1Status));
    552         return;
    553     }
    554     doAssert((sortk1.compareTo(col->getCollationKey(test2, sortk2, key2Status)))
    555                  == Collator::GREATER,
    556                 "Result should be \"Abcda\" >>> \"abcda\"");
    557 
    558     CollationKey sortk3(sortk2), sortkNew;
    559 
    560     sortkNew = sortk1;
    561     doAssert((sortk1 != sortk2), "The sort keys should be different");
    562     doAssert((sortk1.hashCode() != sortk2.hashCode()), "sort key hashCode() failed");
    563     doAssert((sortk2 == sortk3), "The sort keys should be the same");
    564     doAssert((sortk1 == sortkNew), "The sort keys assignment failed");
    565     doAssert((sortk1.hashCode() == sortkNew.hashCode()), "sort key hashCode() failed");
    566     doAssert((sortkNew != sortk3), "The sort keys should be different");
    567     doAssert(sortk1.compareTo(sortk3) == Collator::GREATER, "Result should be \"Abcda\" >>> \"abcda\"");
    568     doAssert(sortk2.compareTo(sortk3) == Collator::EQUAL, "Result should be \"abcda\" == \"abcda\"");
    569     doAssert(sortkEmpty.compareTo(sortk1) == Collator::LESS, "Result should be (empty key) <<< \"Abcda\"");
    570     doAssert(sortk1.compareTo(sortkEmpty) == Collator::GREATER, "Result should be \"Abcda\" >>> (empty key)");
    571     doAssert(sortkEmpty.compareTo(sortkEmpty) == Collator::EQUAL, "Result should be (empty key) == (empty key)");
    572     doAssert(sortk1.compareTo(sortk3, success) == UCOL_GREATER, "Result should be \"Abcda\" >>> \"abcda\"");
    573     doAssert(sortk2.compareTo(sortk3, success) == UCOL_EQUAL, "Result should be \"abcda\" == \"abcda\"");
    574     doAssert(sortkEmpty.compareTo(sortk1, success) == UCOL_LESS, "Result should be (empty key) <<< \"Abcda\"");
    575     doAssert(sortk1.compareTo(sortkEmpty, success) == UCOL_GREATER, "Result should be \"Abcda\" >>> (empty key)");
    576     doAssert(sortkEmpty.compareTo(sortkEmpty, success) == UCOL_EQUAL, "Result should be (empty key) == (empty key)");
    577 
    578     int32_t    cnt1, cnt2, cnt3, cnt4;
    579 
    580     const uint8_t* byteArray1 = sortk1.getByteArray(cnt1);
    581     const uint8_t* byteArray2 = sortk2.getByteArray(cnt2);
    582 
    583     const uint8_t* byteArray3 = 0;
    584     byteArray3 = sortk1.getByteArray(cnt3);
    585 
    586     const uint8_t* byteArray4 = 0;
    587     byteArray4 = sortk2.getByteArray(cnt4);
    588 
    589     CollationKey sortk4(byteArray1, cnt1), sortk5(byteArray2, cnt2);
    590     CollationKey sortk6(byteArray3, cnt3), sortk7(byteArray4, cnt4);
    591 
    592     doAssert(sortk1.compareTo(sortk4) == Collator::EQUAL, "CollationKey::toByteArray(sortk1) Failed.");
    593     doAssert(sortk2.compareTo(sortk5) == Collator::EQUAL, "CollationKey::toByteArray(sortk2) Failed.");
    594     doAssert(sortk4.compareTo(sortk5) == Collator::GREATER, "sortk4 >>> sortk5 Failed");
    595     doAssert(sortk1.compareTo(sortk6) == Collator::EQUAL, "CollationKey::getByteArray(sortk1) Failed.");
    596     doAssert(sortk2.compareTo(sortk7) == Collator::EQUAL, "CollationKey::getByteArray(sortk2) Failed.");
    597     doAssert(sortk6.compareTo(sortk7) == Collator::GREATER, "sortk6 >>> sortk7 Failed");
    598 
    599     logln("Equality tests : ");
    600     doAssert(sortk1 == sortk4, "sortk1 == sortk4 Failed.");
    601     doAssert(sortk2 == sortk5, "sortk2 == sortk5 Failed.");
    602     doAssert(sortk1 != sortk5, "sortk1 != sortk5 Failed.");
    603     doAssert(sortk1 == sortk6, "sortk1 == sortk6 Failed.");
    604     doAssert(sortk2 == sortk7, "sortk2 == sortk7 Failed.");
    605     doAssert(sortk1 != sortk7, "sortk1 != sortk7 Failed.");
    606 
    607     byteArray1 = 0;
    608     byteArray2 = 0;
    609 
    610     sortk3 = sortk1;
    611     doAssert(sortk1 == sortk3, "sortk1 = sortk3 assignment Failed.");
    612     doAssert(sortk2 != sortk3, "sortk2 != sortk3 Failed.");
    613     logln("testing sortkey ends...");
    614 
    615     col->setStrength(Collator::SECONDARY);
    616     doAssert(col->getCollationKey(test1, sortk1, key1Status).compareTo(
    617                                   col->getCollationKey(test2, sortk2, key2Status))
    618                                   == Collator::EQUAL,
    619                                   "Result should be \"Abcda\" == \"abcda\"");
    620     delete col;
    621 }
    622 
    623 //----------------------------------------------------------------------------
    624 // Tests the CollatorElementIterator class.
    625 // ctor, RuleBasedCollator::createCollationElementIterator(), operator==, operator!=
    626 //
    627 void
    628 CollationAPITest::TestElemIter(/* char* par */)
    629 {
    630     logln("testing sortkey begins...");
    631     Collator *col = 0;
    632     UErrorCode success = U_ZERO_ERROR;
    633     col = Collator::createInstance(Locale::getEnglish(), success);
    634     if (U_FAILURE(success))
    635     {
    636         errcheckln(success, "Default collation creation failed. - %s", u_errorName(success));
    637         return;
    638     }
    639 
    640     UnicodeString testString1("XFILE What subset of all possible test cases has the highest probability of detecting the most errors?");
    641     UnicodeString testString2("Xf_ile What subset of all possible test cases has the lowest probability of detecting the least errors?");
    642     logln("Constructors and comparison testing....");
    643     CollationElementIterator *iterator1 = ((RuleBasedCollator*)col)->createCollationElementIterator(testString1);
    644 
    645     CharacterIterator *chariter=new StringCharacterIterator(testString1);
    646     CollationElementIterator *coliter=((RuleBasedCollator*)col)->createCollationElementIterator(*chariter);
    647 
    648     // copy ctor
    649     CollationElementIterator *iterator2 = ((RuleBasedCollator*)col)->createCollationElementIterator(testString1);
    650     CollationElementIterator *iterator3 = ((RuleBasedCollator*)col)->createCollationElementIterator(testString2);
    651 
    652     int32_t offset = iterator1->getOffset();
    653     if (offset != 0) {
    654         errln("Error in getOffset for collation element iterator\n");
    655         return;
    656     }
    657     iterator1->setOffset(6, success);
    658     if (U_FAILURE(success)) {
    659         errln("Error in setOffset for collation element iterator\n");
    660         return;
    661     }
    662     iterator1->setOffset(0, success);
    663     int32_t order1, order2, order3;
    664     doAssert((*iterator1 == *iterator2), "The two iterators should be the same");
    665     doAssert((*iterator1 != *iterator3), "The two iterators should be different");
    666 
    667     doAssert((*coliter == *iterator1), "The two iterators should be the same");
    668     doAssert((*coliter == *iterator2), "The two iterators should be the same");
    669     doAssert((*coliter != *iterator3), "The two iterators should be different");
    670 
    671     order1 = iterator1->next(success);
    672     if (U_FAILURE(success))
    673     {
    674         errln("Somehow ran out of memory stepping through the iterator.");
    675         return;
    676     }
    677 
    678     doAssert((*iterator1 != *iterator2), "The first iterator advance failed");
    679     order2 = iterator2->getOffset();
    680     doAssert((order1 != order2), "The order result should not be the same");
    681     order2 = iterator2->next(success);
    682     if (U_FAILURE(success))
    683     {
    684         errln("Somehow ran out of memory stepping through the iterator.");
    685         return;
    686     }
    687 
    688     doAssert((*iterator1 == *iterator2), "The second iterator advance failed");
    689     doAssert((order1 == order2), "The order result should be the same");
    690     order3 = iterator3->next(success);
    691     if (U_FAILURE(success))
    692     {
    693         errln("Somehow ran out of memory stepping through the iterator.");
    694         return;
    695     }
    696 
    697     doAssert((CollationElementIterator::primaryOrder(order1) ==
    698         CollationElementIterator::primaryOrder(order3)), "The primary orders should be the same");
    699     doAssert((CollationElementIterator::secondaryOrder(order1) ==
    700         CollationElementIterator::secondaryOrder(order3)), "The secondary orders should be the same");
    701     doAssert((CollationElementIterator::tertiaryOrder(order1) ==
    702         CollationElementIterator::tertiaryOrder(order3)), "The tertiary orders should be the same");
    703 
    704     order1 = iterator1->next(success); order3 = iterator3->next(success);
    705     if (U_FAILURE(success))
    706     {
    707         errln("Somehow ran out of memory stepping through the iterator.");
    708         return;
    709     }
    710 
    711     doAssert((CollationElementIterator::primaryOrder(order1) ==
    712         CollationElementIterator::primaryOrder(order3)), "The primary orders should be identical");
    713     doAssert((CollationElementIterator::tertiaryOrder(order1) !=
    714         CollationElementIterator::tertiaryOrder(order3)), "The tertiary orders should be different");
    715 
    716     order1 = iterator1->next(success);
    717     order3 = iterator3->next(success);
    718     /* NO! Secondary orders of two CEs are not related, especially in the case of '_' vs 'I' */
    719     /*
    720     doAssert((CollationElementIterator::secondaryOrder(order1) !=
    721         CollationElementIterator::secondaryOrder(order3)), "The secondary orders should not be the same");
    722     */
    723     doAssert((order1 != CollationElementIterator::NULLORDER), "Unexpected end of iterator reached");
    724 
    725     iterator1->reset(); iterator2->reset(); iterator3->reset();
    726     order1 = iterator1->next(success);
    727     if (U_FAILURE(success))
    728     {
    729         errln("Somehow ran out of memory stepping through the iterator.");
    730         return;
    731     }
    732 
    733     doAssert((*iterator1 != *iterator2), "The first iterator advance failed");
    734 
    735     order2 = iterator2->next(success);
    736     if (U_FAILURE(success))
    737     {
    738         errln("Somehow ran out of memory stepping through the iterator.");
    739         return;
    740     }
    741 
    742     doAssert((*iterator1 == *iterator2), "The second iterator advance failed");
    743     doAssert((order1 == order2), "The order result should be the same");
    744 
    745     order3 = iterator3->next(success);
    746     if (U_FAILURE(success))
    747     {
    748         errln("Somehow ran out of memory stepping through the iterator.");
    749         return;
    750     }
    751 
    752     doAssert((CollationElementIterator::primaryOrder(order1) ==
    753         CollationElementIterator::primaryOrder(order3)), "The primary orders should be the same");
    754     doAssert((CollationElementIterator::secondaryOrder(order1) ==
    755         CollationElementIterator::secondaryOrder(order3)), "The secondary orders should be the same");
    756     doAssert((CollationElementIterator::tertiaryOrder(order1) ==
    757         CollationElementIterator::tertiaryOrder(order3)), "The tertiary orders should be the same");
    758 
    759     order1 = iterator1->next(success); order2 = iterator2->next(success); order3 = iterator3->next(success);
    760     if (U_FAILURE(success))
    761     {
    762         errln("Somehow ran out of memory stepping through the iterator.");
    763         return;
    764     }
    765 
    766     doAssert((CollationElementIterator::primaryOrder(order1) ==
    767         CollationElementIterator::primaryOrder(order3)), "The primary orders should be identical");
    768     doAssert((CollationElementIterator::tertiaryOrder(order1) !=
    769         CollationElementIterator::tertiaryOrder(order3)), "The tertiary orders should be different");
    770 
    771     order1 = iterator1->next(success); order3 = iterator3->next(success);
    772     if (U_FAILURE(success))
    773     {
    774         errln("Somehow ran out of memory stepping through the iterator.");
    775         return;
    776     }
    777 
    778     /* NO! Secondary orders of two CEs are not related, especially in the case of '_' vs 'I' */
    779     /*
    780     doAssert((CollationElementIterator::secondaryOrder(order1) !=
    781         CollationElementIterator::secondaryOrder(order3)), "The secondary orders should not be the same");
    782     */
    783     doAssert((order1 != CollationElementIterator::NULLORDER), "Unexpected end of iterator reached");
    784     doAssert((*iterator2 != *iterator3), "The iterators should be different");
    785 
    786 
    787     //test error values
    788     success=U_UNSUPPORTED_ERROR;
    789     Collator *colerror=NULL;
    790     colerror=Collator::createInstance(Locale::getEnglish(), success);
    791     if (colerror != 0 || success == U_ZERO_ERROR){
    792         errln("Error: createInstance(UErrorCode != U_ZERO_ERROR) should just return and not create an instance\n");
    793     }
    794     int32_t position=coliter->previous(success);
    795     if(position != CollationElementIterator::NULLORDER){
    796         errln((UnicodeString)"Expected NULLORDER got" + position);
    797     }
    798     coliter->reset();
    799     coliter->setText(*chariter, success);
    800     if(!U_FAILURE(success)){
    801         errln("Expeceted error");
    802     }
    803     iterator1->setText((UnicodeString)"hello there", success);
    804     if(!U_FAILURE(success)){
    805         errln("Expeceted error");
    806     }
    807 
    808     delete chariter;
    809     delete coliter;
    810     delete iterator1;
    811     delete iterator2;
    812     delete iterator3;
    813     delete col;
    814 
    815 
    816 
    817     logln("testing CollationElementIterator ends...");
    818 }
    819 
    820 // Test RuleBasedCollator ctor, dtor, operator==, operator!=, clone, copy, and getRules
    821 void
    822 CollationAPITest::TestOperators(/* char* par */)
    823 {
    824     UErrorCode success = U_ZERO_ERROR;
    825     UnicodeString ruleset1("&9 < a, A < b, B < c, C; ch, cH, Ch, CH < d, D, e, E");
    826     UnicodeString ruleset2("&9 < a, A < b, B < c, C < d, D, e, E");
    827     RuleBasedCollator *col1 = new RuleBasedCollator(ruleset1, success);
    828     if (U_FAILURE(success)) {
    829         errcheckln(success, "RuleBasedCollator creation failed. - %s", u_errorName(success));
    830         return;
    831     }
    832     success = U_ZERO_ERROR;
    833     RuleBasedCollator *col2 = new RuleBasedCollator(ruleset2, success);
    834     if (U_FAILURE(success)) {
    835         errln("The RuleBasedCollator constructor failed when building with the 2nd rule set.");
    836         return;
    837     }
    838     logln("The operator tests begin : ");
    839     logln("testing operator==, operator!=, clone  methods ...");
    840     doAssert((*col1 != *col2), "The two different table collations compared equal");
    841     *col1 = *col2;
    842     doAssert((*col1 == *col2), "Collator objects not equal after assignment (operator=)");
    843 
    844     success = U_ZERO_ERROR;
    845     Collator *col3 = Collator::createInstance(Locale::getEnglish(), success);
    846     if (U_FAILURE(success)) {
    847         errln("Default collation creation failed.");
    848         return;
    849     }
    850     doAssert((*col1 != *col3), "The two different table collations compared equal");
    851     Collator* col4 = col1->clone();
    852     Collator* col5 = col3->clone();
    853     doAssert((*col1 == *col4), "Cloned collation objects not equal");
    854     doAssert((*col3 != *col4), "Two different table collations compared equal");
    855     doAssert((*col3 == *col5), "Cloned collation objects not equal");
    856     doAssert((*col4 != *col5), "Two cloned collations compared equal");
    857 
    858     const UnicodeString& defRules = ((RuleBasedCollator*)col3)->getRules();
    859     RuleBasedCollator* col6 = new RuleBasedCollator(defRules, success);
    860     if (U_FAILURE(success)) {
    861         errln("Creating default collation with rules failed.");
    862         return;
    863     }
    864     doAssert((((RuleBasedCollator*)col3)->getRules() == col6->getRules()), "Default collator getRules failed");
    865 
    866     success = U_ZERO_ERROR;
    867     RuleBasedCollator *col7 = new RuleBasedCollator(ruleset2, Collator::TERTIARY, success);
    868     if (U_FAILURE(success)) {
    869         errln("The RuleBasedCollator constructor failed when building with the 2nd rule set with tertiary strength.");
    870         return;
    871     }
    872     success = U_ZERO_ERROR;
    873     RuleBasedCollator *col8 = new RuleBasedCollator(ruleset2, UCOL_OFF, success);
    874     if (U_FAILURE(success)) {
    875         errln("The RuleBasedCollator constructor failed when building with the 2nd rule set with Normalizer::NO_OP.");
    876         return;
    877     }
    878     success = U_ZERO_ERROR;
    879     RuleBasedCollator *col9 = new RuleBasedCollator(ruleset2, Collator::PRIMARY, UCOL_ON, success);
    880     if (U_FAILURE(success)) {
    881         errln("The RuleBasedCollator constructor failed when building with the 2nd rule set with tertiary strength and Normalizer::NO_OP.");
    882         return;
    883     }
    884   //  doAssert((*col7 == *col8), "The two equal table collations compared different");
    885     doAssert((*col7 != *col9), "The two different table collations compared equal");
    886     doAssert((*col8 != *col9), "The two different table collations compared equal");
    887 
    888     logln("operator tests ended.");
    889     delete col1;
    890     delete col2;
    891     delete col3;
    892     delete col4;
    893     delete col5;
    894     delete col6;
    895     delete col7;
    896     delete col8;
    897     delete col9;
    898 }
    899 
    900 // test clone and copy
    901 void
    902 CollationAPITest::TestDuplicate(/* char* par */)
    903 {
    904     UErrorCode status = U_ZERO_ERROR;
    905     Collator *col1 = Collator::createInstance(Locale::getEnglish(), status);
    906     if (U_FAILURE(status)) {
    907         logln("Default collator creation failed.");
    908         return;
    909     }
    910     Collator *col2 = col1->clone();
    911     doAssert((*col1 == *col2), "Cloned object is not equal to the orginal");
    912     UnicodeString ruleset("&9 < a, A < b, B < c, C < d, D, e, E");
    913     RuleBasedCollator *col3 = new RuleBasedCollator(ruleset, status);
    914     if (U_FAILURE(status)) {
    915         logln("Collation tailoring failed.");
    916         return;
    917     }
    918     doAssert((*col1 != *col3), "Cloned object is equal to some dummy");
    919     *col3 = *((RuleBasedCollator*)col1);
    920     doAssert((*col1 == *col3), "Copied object is not equal to the orginal");
    921 
    922     UCollationResult res;
    923     UnicodeString first((UChar)0x0061);
    924     UnicodeString second((UChar)0x0062);
    925     UnicodeString copiedEnglishRules(((RuleBasedCollator*)col1)->getRules());
    926 
    927     delete col1;
    928 
    929     // Try using the cloned collators after deleting the original data
    930     res = col2->compare(first, second, status);
    931     if(res != UCOL_LESS) {
    932         errln("a should be less then b after tailoring");
    933     }
    934     if (((RuleBasedCollator*)col2)->getRules() != copiedEnglishRules) {
    935         errln(UnicodeString("English rule difference. ")
    936             + copiedEnglishRules + UnicodeString("\ngetRules=") + ((RuleBasedCollator*)col2)->getRules());
    937     }
    938     res = col3->compare(first, second, status);
    939     if(res != UCOL_LESS) {
    940         errln("a should be less then b after tailoring");
    941     }
    942     if (col3->getRules() != copiedEnglishRules) {
    943         errln(UnicodeString("English rule difference. ")
    944             + copiedEnglishRules + UnicodeString("\ngetRules=") + col3->getRules());
    945     }
    946 
    947     delete col2;
    948     delete col3;
    949 }
    950 
    951 void
    952 CollationAPITest::TestCompare(/* char* par */)
    953 {
    954     logln("The compare tests begin : ");
    955     Collator *col = 0;
    956     UErrorCode success = U_ZERO_ERROR;
    957     col = Collator::createInstance(Locale::getEnglish(), success);
    958     if (U_FAILURE(success)) {
    959         errcheckln(success, "Default collation creation failed. - %s", u_errorName(success));
    960         return;
    961     }
    962     UnicodeString test1("Abcda"), test2("abcda");
    963     logln("Use tertiary comparison level testing ....");
    964 
    965     doAssert((!col->equals(test1, test2) ), "Result should be \"Abcda\" != \"abcda\"");
    966     doAssert((col->greater(test1, test2) ), "Result should be \"Abcda\" >>> \"abcda\"");
    967     doAssert((col->greaterOrEqual(test1, test2) ), "Result should be \"Abcda\" >>> \"abcda\"");
    968 
    969     col->setStrength(Collator::SECONDARY);
    970     logln("Use secondary comparison level testing ....");
    971 
    972     doAssert((col->equals(test1, test2) ), "Result should be \"Abcda\" == \"abcda\"");
    973     doAssert((!col->greater(test1, test2) ), "Result should be \"Abcda\" == \"abcda\"");
    974     doAssert((col->greaterOrEqual(test1, test2) ), "Result should be \"Abcda\" == \"abcda\"");
    975 
    976     col->setStrength(Collator::PRIMARY);
    977     logln("Use primary comparison level testing ....");
    978 
    979     doAssert((col->equals(test1, test2) ), "Result should be \"Abcda\" == \"abcda\"");
    980     doAssert((!col->greater(test1, test2) ), "Result should be \"Abcda\" == \"abcda\"");
    981     doAssert((col->greaterOrEqual(test1, test2) ), "Result should be \"Abcda\" == \"abcda\"");
    982 
    983     // Test different APIs
    984     const UChar* t1 = test1.getBuffer();
    985     int32_t t1Len = test1.length();
    986     const UChar* t2 = test2.getBuffer();
    987     int32_t t2Len = test2.length();
    988 
    989     doAssert((col->compare(test1, test2) == Collator::EQUAL), "Problem");
    990     doAssert((col->compare(test1, test2, success) == UCOL_EQUAL), "Problem");
    991     doAssert((col->compare(t1, t1Len, t2, t2Len) == Collator::EQUAL), "Problem");
    992     doAssert((col->compare(t1, t1Len, t2, t2Len, success) == UCOL_EQUAL), "Problem");
    993     doAssert((col->compare(test1, test2, t1Len) == Collator::EQUAL), "Problem");
    994     doAssert((col->compare(test1, test2, t1Len, success) == UCOL_EQUAL), "Problem");
    995 
    996     col->setAttribute(UCOL_STRENGTH, UCOL_TERTIARY, success);
    997     doAssert((col->compare(test1, test2) == Collator::GREATER), "Problem");
    998     doAssert((col->compare(test1, test2, success) == UCOL_GREATER), "Problem");
    999     doAssert((col->compare(t1, t1Len, t2, t2Len) == Collator::GREATER), "Problem");
   1000     doAssert((col->compare(t1, t1Len, t2, t2Len, success) == UCOL_GREATER), "Problem");
   1001     doAssert((col->compare(test1, test2, t1Len) == Collator::GREATER), "Problem");
   1002     doAssert((col->compare(test1, test2, t1Len, success) == UCOL_GREATER), "Problem");
   1003 
   1004 
   1005 
   1006     logln("The compare tests end.");
   1007     delete col;
   1008 }
   1009 
   1010 void
   1011 CollationAPITest::TestGetAll(/* char* par */)
   1012 {
   1013     if (logKnownIssue("10774","Side effects from utility/LocaleTest/TestGetLocale")) {
   1014         return;
   1015     }
   1016     int32_t count1, count2;
   1017     UErrorCode status = U_ZERO_ERROR;
   1018 
   1019     logln("Trying Collator::getAvailableLocales(int&)");
   1020 
   1021     const Locale* list = Collator::getAvailableLocales(count1);
   1022     for (int32_t i = 0; i < count1; ++i) {
   1023         UnicodeString dispName;
   1024         logln(UnicodeString("Locale name: ")
   1025             + UnicodeString(list[i].getName())
   1026             + UnicodeString(" , the display name is : ")
   1027             + UnicodeString(list[i].getDisplayName(dispName)));
   1028     }
   1029 
   1030     if (count1 == 0 || list == NULL) {
   1031         dataerrln("getAvailableLocales(int&) returned an empty list");
   1032     }
   1033 
   1034     logln("Trying Collator::getAvailableLocales()");
   1035     StringEnumeration* localeEnum = Collator::getAvailableLocales();
   1036     const UnicodeString* locStr;
   1037     const char *locCStr;
   1038     count2 = 0;
   1039 
   1040     if (localeEnum == NULL) {
   1041         dataerrln("getAvailableLocales() returned NULL");
   1042         return;
   1043     }
   1044 
   1045     while ((locStr = localeEnum->snext(status)) != NULL)
   1046     {
   1047         logln(UnicodeString("Locale name is: ") + *locStr);
   1048         count2++;
   1049     }
   1050     if (count1 != count2) {
   1051         errln("getAvailableLocales(int&) returned %d and getAvailableLocales() returned %d", count1, count2);
   1052     }
   1053 
   1054     logln("Trying Collator::getAvailableLocales() clone");
   1055     count1 = 0;
   1056     StringEnumeration* localeEnum2 = localeEnum->clone();
   1057     localeEnum2->reset(status);
   1058     while ((locCStr = localeEnum2->next(NULL, status)) != NULL)
   1059     {
   1060         logln(UnicodeString("Locale name is: ") + UnicodeString(locCStr));
   1061         count1++;
   1062     }
   1063     if (count1 != count2) {
   1064         errln("getAvailableLocales(3rd time) returned %d and getAvailableLocales(2nd time) returned %d", count1, count2);
   1065     }
   1066     if (localeEnum->count(status) != count1) {
   1067         errln("localeEnum->count() returned %d and getAvailableLocales() returned %d", localeEnum->count(status), count1);
   1068     }
   1069     delete localeEnum;
   1070     delete localeEnum2;
   1071 }
   1072 
   1073 void CollationAPITest::TestSortKey()
   1074 {
   1075     UErrorCode status = U_ZERO_ERROR;
   1076     /*
   1077     this is supposed to open default date format, but later on it treats
   1078     it like it is "en_US"
   1079     - very bad if you try to run the tests on machine where default
   1080       locale is NOT "en_US"
   1081     */
   1082     Collator *col = Collator::createInstance(Locale::getEnglish(), status);
   1083     if (U_FAILURE(status)) {
   1084         errcheckln(status, "ERROR: Default collation creation failed.: %s\n", u_errorName(status));
   1085         return;
   1086     }
   1087 
   1088     if (col->getStrength() != Collator::TERTIARY)
   1089     {
   1090         errln("ERROR: default collation did not have UCOL_DEFAULT_STRENGTH !\n");
   1091     }
   1092 
   1093     /* Need to use identical strength */
   1094     col->setAttribute(UCOL_STRENGTH, UCOL_IDENTICAL, status);
   1095 
   1096     UChar test1[6] = {0x41, 0x62, 0x63, 0x64, 0x61, 0},
   1097           test2[6] = {0x61, 0x62, 0x63, 0x64, 0x61, 0},
   1098           test3[6] = {0x61, 0x62, 0x63, 0x64, 0x61, 0};
   1099 
   1100     uint8_t sortkey1[64];
   1101     uint8_t sortkey2[64];
   1102     uint8_t sortkey3[64];
   1103 
   1104     logln("Use tertiary comparison level testing ....\n");
   1105 
   1106     CollationKey key1;
   1107     col->getCollationKey(test1, u_strlen(test1), key1, status);
   1108 
   1109     CollationKey key2;
   1110     col->getCollationKey(test2, u_strlen(test2), key2, status);
   1111 
   1112     CollationKey key3;
   1113     col->getCollationKey(test3, u_strlen(test3), key3, status);
   1114 
   1115     doAssert(key1.compareTo(key2) == Collator::GREATER,
   1116         "Result should be \"Abcda\" > \"abcda\"");
   1117     doAssert(key2.compareTo(key1) == Collator::LESS,
   1118         "Result should be \"abcda\" < \"Abcda\"");
   1119     doAssert(key2.compareTo(key3) == Collator::EQUAL,
   1120         "Result should be \"abcda\" ==  \"abcda\"");
   1121 
   1122     // Clone the key2 sortkey for later.
   1123     int32_t keylength = 0;
   1124     const uint8_t *key2primary_alias = key2.getByteArray(keylength);
   1125     LocalArray<uint8_t> key2primary(new uint8_t[keylength]);
   1126     memcpy(key2primary.getAlias(), key2primary_alias, keylength);
   1127 
   1128     col->getSortKey(test1, sortkey1, 64);
   1129     col->getSortKey(test2, sortkey2, 64);
   1130     col->getSortKey(test3, sortkey3, 64);
   1131 
   1132     const uint8_t *tempkey = key1.getByteArray(keylength);
   1133     doAssert(memcmp(tempkey, sortkey1, keylength) == 0,
   1134         "Test1 string should have the same collation key and sort key");
   1135     tempkey = key2.getByteArray(keylength);
   1136     doAssert(memcmp(tempkey, sortkey2, keylength) == 0,
   1137         "Test2 string should have the same collation key and sort key");
   1138     tempkey = key3.getByteArray(keylength);
   1139     doAssert(memcmp(tempkey, sortkey3, keylength) == 0,
   1140         "Test3 string should have the same collation key and sort key");
   1141 
   1142     col->getSortKey(test1, 5, sortkey1, 64);
   1143     col->getSortKey(test2, 5, sortkey2, 64);
   1144     col->getSortKey(test3, 5, sortkey3, 64);
   1145 
   1146     tempkey = key1.getByteArray(keylength);
   1147     doAssert(memcmp(tempkey, sortkey1, keylength) == 0,
   1148         "Test1 string should have the same collation key and sort key");
   1149     tempkey = key2.getByteArray(keylength);
   1150     doAssert(memcmp(tempkey, sortkey2, keylength) == 0,
   1151         "Test2 string should have the same collation key and sort key");
   1152     tempkey = key3.getByteArray(keylength);
   1153     doAssert(memcmp(tempkey, sortkey3, keylength) == 0,
   1154         "Test3 string should have the same collation key and sort key");
   1155 
   1156     UnicodeString strtest1(test1);
   1157     col->getSortKey(strtest1, sortkey1, 64);
   1158     UnicodeString strtest2(test2);
   1159     col->getSortKey(strtest2, sortkey2, 64);
   1160     UnicodeString strtest3(test3);
   1161     col->getSortKey(strtest3, sortkey3, 64);
   1162 
   1163     tempkey = key1.getByteArray(keylength);
   1164     doAssert(memcmp(tempkey, sortkey1, keylength) == 0,
   1165         "Test1 string should have the same collation key and sort key");
   1166     tempkey = key2.getByteArray(keylength);
   1167     doAssert(memcmp(tempkey, sortkey2, keylength) == 0,
   1168         "Test2 string should have the same collation key and sort key");
   1169     tempkey = key3.getByteArray(keylength);
   1170     doAssert(memcmp(tempkey, sortkey3, keylength) == 0,
   1171         "Test3 string should have the same collation key and sort key");
   1172 
   1173     logln("Use secondary comparision level testing ...\n");
   1174     col->setStrength(Collator::SECONDARY);
   1175 
   1176     col->getCollationKey(test1, u_strlen(test1), key1, status);
   1177     col->getCollationKey(test2, u_strlen(test2), key2, status);
   1178     col->getCollationKey(test3, u_strlen(test3), key3, status);
   1179 
   1180     doAssert(key1.compareTo(key2) == Collator::EQUAL,
   1181         "Result should be \"Abcda\" == \"abcda\"");
   1182     doAssert(key2.compareTo(key3) == Collator::EQUAL,
   1183         "Result should be \"abcda\" ==  \"abcda\"");
   1184 
   1185     tempkey = key2.getByteArray(keylength);
   1186     doAssert(memcmp(tempkey, key2primary.getAlias(), keylength - 1) == 0,
   1187              "Binary format for 'abcda' sortkey different for secondary strength!");
   1188 
   1189     col->getSortKey(test1, sortkey1, 64);
   1190     col->getSortKey(test2, sortkey2, 64);
   1191     col->getSortKey(test3, sortkey3, 64);
   1192 
   1193     tempkey = key1.getByteArray(keylength);
   1194     doAssert(memcmp(tempkey, sortkey1, keylength) == 0,
   1195         "Test1 string should have the same collation key and sort key");
   1196     tempkey = key2.getByteArray(keylength);
   1197     doAssert(memcmp(tempkey, sortkey2, keylength) == 0,
   1198         "Test2 string should have the same collation key and sort key");
   1199     tempkey = key3.getByteArray(keylength);
   1200     doAssert(memcmp(tempkey, sortkey3, keylength) == 0,
   1201         "Test3 string should have the same collation key and sort key");
   1202 
   1203     col->getSortKey(test1, 5, sortkey1, 64);
   1204     col->getSortKey(test2, 5, sortkey2, 64);
   1205     col->getSortKey(test3, 5, sortkey3, 64);
   1206 
   1207     tempkey = key1.getByteArray(keylength);
   1208     doAssert(memcmp(tempkey, sortkey1, keylength) == 0,
   1209         "Test1 string should have the same collation key and sort key");
   1210     tempkey = key2.getByteArray(keylength);
   1211     doAssert(memcmp(tempkey, sortkey2, keylength) == 0,
   1212         "Test2 string should have the same collation key and sort key");
   1213     tempkey = key3.getByteArray(keylength);
   1214     doAssert(memcmp(tempkey, sortkey3, keylength) == 0,
   1215         "Test3 string should have the same collation key and sort key");
   1216 
   1217     col->getSortKey(strtest1, sortkey1, 64);
   1218     col->getSortKey(strtest2, sortkey2, 64);
   1219     col->getSortKey(strtest3, sortkey3, 64);
   1220 
   1221     tempkey = key1.getByteArray(keylength);
   1222     doAssert(memcmp(tempkey, sortkey1, keylength) == 0,
   1223         "Test1 string should have the same collation key and sort key");
   1224     tempkey = key2.getByteArray(keylength);
   1225     doAssert(memcmp(tempkey, sortkey2, keylength) == 0,
   1226         "Test2 string should have the same collation key and sort key");
   1227     tempkey = key3.getByteArray(keylength);
   1228     doAssert(memcmp(tempkey, sortkey3, keylength) == 0,
   1229         "Test3 string should have the same collation key and sort key");
   1230 
   1231     logln("testing sortkey ends...");
   1232     delete col;
   1233 }
   1234 
   1235 void CollationAPITest::TestSortKeyOverflow() {
   1236     IcuTestErrorCode errorCode(*this, "TestSortKeyOverflow()");
   1237     LocalPointer<Collator> col(Collator::createInstance(Locale::getEnglish(), errorCode));
   1238     if (errorCode.logDataIfFailureAndReset("Collator::createInstance(English) failed")) {
   1239         return;
   1240     }
   1241     col->setAttribute(UCOL_STRENGTH, UCOL_PRIMARY, errorCode);
   1242     UChar i_and_phi[] = { 0x438, 0x3c6 };  // Cyrillic small i & Greek small phi.
   1243     // The sort key should be 6 bytes:
   1244     // 2 bytes for the Cyrillic i, 1 byte for the primary-compression terminator,
   1245     // 2 bytes for the Greek phi, and 1 byte for the NUL terminator.
   1246     uint8_t sortKey[12];
   1247     int32_t length = col->getSortKey(i_and_phi, 2, sortKey, LENGTHOF(sortKey));
   1248     uint8_t sortKey2[12];
   1249     for (int32_t capacity = 0; capacity < length; ++capacity) {
   1250         uprv_memset(sortKey2, 2, LENGTHOF(sortKey2));
   1251         int32_t length2 = col->getSortKey(i_and_phi, 2, sortKey2, capacity);
   1252         if (length2 != length || 0 != uprv_memcmp(sortKey, sortKey2, capacity)) {
   1253             errln("getSortKey(i_and_phi, capacity=%d) failed to write proper prefix", capacity);
   1254         } else if (sortKey2[capacity] != 2 || sortKey2[capacity + 1] != 2) {
   1255             errln("getSortKey(i_and_phi, capacity=%d) wrote beyond capacity", capacity);
   1256         }
   1257     }
   1258 
   1259     // Now try to break getCollationKey().
   1260     // Internally, it always starts with a large stack buffer.
   1261     // Since we cannot control the initial capacity, we throw an increasing number
   1262     // of characters at it, with the problematic part at the end.
   1263     const int32_t longCapacity = 2000;
   1264     // Each 'a' in the prefix should result in one primary sort key byte.
   1265     // For i_and_phi we expect 6 bytes, then the NUL terminator.
   1266     const int32_t maxPrefixLength = longCapacity - 6 - 1;
   1267     LocalArray<uint8_t> longSortKey(new uint8_t[longCapacity]);
   1268     UnicodeString s(FALSE, i_and_phi, 2);
   1269     for (int32_t prefixLength = 0; prefixLength < maxPrefixLength; ++prefixLength) {
   1270         length = col->getSortKey(s, longSortKey.getAlias(), longCapacity);
   1271         CollationKey collKey;
   1272         col->getCollationKey(s, collKey, errorCode);
   1273         int32_t collKeyLength;
   1274         const uint8_t *collSortKey = collKey.getByteArray(collKeyLength);
   1275         if (collKeyLength != length || 0 != uprv_memcmp(longSortKey.getAlias(), collSortKey, length)) {
   1276             errln("getCollationKey(prefix[%d]+i_and_phi) failed to write proper sort key", prefixLength);
   1277         }
   1278 
   1279         // Insert an 'a' to match ++prefixLength.
   1280         s.insert(prefixLength, (UChar)0x61);
   1281     }
   1282 }
   1283 
   1284 void CollationAPITest::TestMaxExpansion()
   1285 {
   1286     UErrorCode          status = U_ZERO_ERROR;
   1287     UChar               ch     = 0;
   1288     UChar32             unassigned = 0xEFFFD;
   1289     uint32_t            sorder = 0;
   1290     uint32_t            temporder = 0;
   1291 
   1292     UnicodeString rule("&a < ab < c/aba < d < z < ch");
   1293     RuleBasedCollator coll(rule, status);
   1294     if(U_FAILURE(status)) {
   1295       errcheckln(status, "Collator creation failed with error %s", u_errorName(status));
   1296       return;
   1297     }
   1298     UnicodeString str(ch);
   1299     CollationElementIterator *iter =
   1300                                   coll.createCollationElementIterator(str);
   1301 
   1302     while (ch < 0xFFFF && U_SUCCESS(status)) {
   1303         int      count = 1;
   1304         uint32_t order;
   1305         int32_t  size = 0;
   1306 
   1307         ch ++;
   1308 
   1309         str.setCharAt(0, ch);
   1310         iter->setText(str, status);
   1311         order = iter->previous(status);
   1312 
   1313         /* thai management */
   1314         if (order == 0)
   1315             order = iter->previous(status);
   1316 
   1317         while (U_SUCCESS(status) && iter->previous(status) != CollationElementIterator::NULLORDER) {
   1318             count ++;
   1319         }
   1320 
   1321         size = coll.getMaxExpansion(order);
   1322         if (U_FAILURE(status) || size < count) {
   1323             errln("Failure at codepoint U+%04X, maximum expansion count %d < %d",
   1324                   ch, size, count);
   1325         }
   1326     }
   1327 
   1328     /* testing for exact max expansion */
   1329     int32_t size;
   1330     ch = 0;
   1331     while (ch < 0x61) {
   1332         uint32_t order;
   1333         str.setCharAt(0, ch);
   1334         iter->setText(str, status);
   1335         order = iter->previous(status);
   1336         size  = coll.getMaxExpansion(order);
   1337         if (U_FAILURE(status) || size != 1) {
   1338             errln("Failure at codepoint U+%04X, maximum expansion count %d < %d",
   1339                   ch, size, 1);
   1340         }
   1341         ch ++;
   1342     }
   1343 
   1344     ch = 0x63;
   1345     str.setTo(ch);
   1346     iter->setText(str, status);
   1347     temporder = iter->previous(status);
   1348     size = coll.getMaxExpansion(temporder);
   1349     if (U_FAILURE(status) || size != 3) {
   1350         errln("Failure at codepoint U+%04X, CE %08x, maximum expansion count %d != %d",
   1351               ch, temporder, size, 3);
   1352     }
   1353 
   1354     ch = 0x64;
   1355     str.setTo(ch);
   1356     iter->setText(str, status);
   1357     temporder = iter->previous(status);
   1358     size = coll.getMaxExpansion(temporder);
   1359     if (U_FAILURE(status) || size != 1) {
   1360         errln("Failure at codepoint U+%04X, CE %08x, maximum expansion count %d != %d",
   1361               ch, temporder, size, 1);
   1362     }
   1363 
   1364     str.setTo(unassigned);
   1365     iter->setText(str, status);
   1366     sorder = iter->previous(status);
   1367     size = coll.getMaxExpansion(sorder);
   1368     if (U_FAILURE(status) || size != 2) {
   1369         errln("Failure at supplementary codepoints, maximum expansion count %d < %d",
   1370               size, 2);
   1371     }
   1372 
   1373     /* testing jamo */
   1374     ch = 0x1165;
   1375     str.setTo(ch);
   1376     iter->setText(str, status);
   1377     temporder = iter->previous(status);
   1378     size = coll.getMaxExpansion(temporder);
   1379     if (U_FAILURE(status) || size > 3) {
   1380         errln("Failure at codepoint U+%04X, maximum expansion count %d > %d",
   1381               ch, size, 3);
   1382     }
   1383 
   1384     delete iter;
   1385 
   1386     /* testing special jamo &a<\u1160 */
   1387     rule = CharsToUnicodeString("\\u0026\\u0071\\u003c\\u1165\\u002f\\u0071\\u0071\\u0071\\u0071");
   1388 
   1389     RuleBasedCollator jamocoll(rule, status);
   1390     iter = jamocoll.createCollationElementIterator(str);
   1391     temporder = iter->previous(status);
   1392     size = iter->getMaxExpansion(temporder);
   1393     if (U_FAILURE(status) || size != 6) {
   1394         errln("Failure at codepoint U+%04X, maximum expansion count %d > %d",
   1395               ch, size, 5);
   1396     }
   1397 
   1398     delete iter;
   1399 }
   1400 
   1401 void CollationAPITest::TestDisplayName()
   1402 {
   1403     UErrorCode error = U_ZERO_ERROR;
   1404     Collator *coll = Collator::createInstance("en_US", error);
   1405     if (U_FAILURE(error)) {
   1406         errcheckln(error, "Failure creating english collator - %s", u_errorName(error));
   1407         return;
   1408     }
   1409     UnicodeString name;
   1410     UnicodeString result;
   1411     coll->getDisplayName(Locale::getCanadaFrench(), result);
   1412     Locale::getCanadaFrench().getDisplayName(name);
   1413     if (result.compare(name)) {
   1414         errln("Failure getting the correct name for locale en_US");
   1415     }
   1416 
   1417     coll->getDisplayName(Locale::getSimplifiedChinese(), result);
   1418     Locale::getSimplifiedChinese().getDisplayName(name);
   1419     if (result.compare(name)) {
   1420         errln("Failure getting the correct name for locale zh_SG");
   1421     }
   1422     delete coll;
   1423 }
   1424 
   1425 void CollationAPITest::TestAttribute()
   1426 {
   1427     UErrorCode error = U_ZERO_ERROR;
   1428     Collator *coll = Collator::createInstance(error);
   1429 
   1430     if (U_FAILURE(error)) {
   1431         errcheckln(error, "Creation of default collator failed - %s", u_errorName(error));
   1432         return;
   1433     }
   1434 
   1435     coll->setAttribute(UCOL_FRENCH_COLLATION, UCOL_OFF, error);
   1436     if (coll->getAttribute(UCOL_FRENCH_COLLATION, error) != UCOL_OFF ||
   1437         U_FAILURE(error)) {
   1438         errln("Setting and retrieving of the french collation failed");
   1439     }
   1440 
   1441     coll->setAttribute(UCOL_FRENCH_COLLATION, UCOL_ON, error);
   1442     if (coll->getAttribute(UCOL_FRENCH_COLLATION, error) != UCOL_ON ||
   1443         U_FAILURE(error)) {
   1444         errln("Setting and retrieving of the french collation failed");
   1445     }
   1446 
   1447     coll->setAttribute(UCOL_ALTERNATE_HANDLING, UCOL_SHIFTED, error);
   1448     if (coll->getAttribute(UCOL_ALTERNATE_HANDLING, error) != UCOL_SHIFTED ||
   1449         U_FAILURE(error)) {
   1450         errln("Setting and retrieving of the alternate handling failed");
   1451     }
   1452 
   1453     coll->setAttribute(UCOL_ALTERNATE_HANDLING, UCOL_NON_IGNORABLE, error);
   1454     if (coll->getAttribute(UCOL_ALTERNATE_HANDLING, error) != UCOL_NON_IGNORABLE ||
   1455         U_FAILURE(error)) {
   1456         errln("Setting and retrieving of the alternate handling failed");
   1457     }
   1458 
   1459     coll->setAttribute(UCOL_CASE_FIRST, UCOL_LOWER_FIRST, error);
   1460     if (coll->getAttribute(UCOL_CASE_FIRST, error) != UCOL_LOWER_FIRST ||
   1461         U_FAILURE(error)) {
   1462         errln("Setting and retrieving of the case first attribute failed");
   1463     }
   1464 
   1465     coll->setAttribute(UCOL_CASE_FIRST, UCOL_UPPER_FIRST, error);
   1466     if (coll->getAttribute(UCOL_CASE_FIRST, error) != UCOL_UPPER_FIRST ||
   1467         U_FAILURE(error)) {
   1468         errln("Setting and retrieving of the case first attribute failed");
   1469     }
   1470 
   1471     coll->setAttribute(UCOL_CASE_LEVEL, UCOL_ON, error);
   1472     if (coll->getAttribute(UCOL_CASE_LEVEL, error) != UCOL_ON ||
   1473         U_FAILURE(error)) {
   1474         errln("Setting and retrieving of the case level attribute failed");
   1475     }
   1476 
   1477     coll->setAttribute(UCOL_CASE_LEVEL, UCOL_OFF, error);
   1478     if (coll->getAttribute(UCOL_CASE_LEVEL, error) != UCOL_OFF ||
   1479         U_FAILURE(error)) {
   1480         errln("Setting and retrieving of the case level attribute failed");
   1481     }
   1482 
   1483     coll->setAttribute(UCOL_NORMALIZATION_MODE, UCOL_ON, error);
   1484     if (coll->getAttribute(UCOL_NORMALIZATION_MODE, error) != UCOL_ON ||
   1485         U_FAILURE(error)) {
   1486         errln("Setting and retrieving of the normalization on/off attribute failed");
   1487     }
   1488 
   1489     coll->setAttribute(UCOL_NORMALIZATION_MODE, UCOL_OFF, error);
   1490     if (coll->getAttribute(UCOL_NORMALIZATION_MODE, error) != UCOL_OFF ||
   1491         U_FAILURE(error)) {
   1492         errln("Setting and retrieving of the normalization on/off attribute failed");
   1493     }
   1494 
   1495     coll->setAttribute(UCOL_STRENGTH, UCOL_PRIMARY, error);
   1496     if (coll->getAttribute(UCOL_STRENGTH, error) != UCOL_PRIMARY ||
   1497         U_FAILURE(error)) {
   1498         errln("Setting and retrieving of the collation strength failed");
   1499     }
   1500 
   1501     coll->setAttribute(UCOL_STRENGTH, UCOL_SECONDARY, error);
   1502     if (coll->getAttribute(UCOL_STRENGTH, error) != UCOL_SECONDARY ||
   1503         U_FAILURE(error)) {
   1504         errln("Setting and retrieving of the collation strength failed");
   1505     }
   1506 
   1507     coll->setAttribute(UCOL_STRENGTH, UCOL_TERTIARY, error);
   1508     if (coll->getAttribute(UCOL_STRENGTH, error) != UCOL_TERTIARY ||
   1509         U_FAILURE(error)) {
   1510         errln("Setting and retrieving of the collation strength failed");
   1511     }
   1512 
   1513     coll->setAttribute(UCOL_STRENGTH, UCOL_QUATERNARY, error);
   1514     if (coll->getAttribute(UCOL_STRENGTH, error) != UCOL_QUATERNARY ||
   1515         U_FAILURE(error)) {
   1516         errln("Setting and retrieving of the collation strength failed");
   1517     }
   1518 
   1519     coll->setAttribute(UCOL_STRENGTH, UCOL_IDENTICAL, error);
   1520     if (coll->getAttribute(UCOL_STRENGTH, error) != UCOL_IDENTICAL ||
   1521         U_FAILURE(error)) {
   1522         errln("Setting and retrieving of the collation strength failed");
   1523     }
   1524 
   1525     delete coll;
   1526 }
   1527 
   1528 void CollationAPITest::TestVariableTopSetting() {
   1529   UErrorCode status = U_ZERO_ERROR;
   1530 
   1531   UChar vt[256] = { 0 };
   1532 
   1533   // Use the root collator, not the default collator.
   1534   // This test fails with en_US_POSIX which tailors the dollar sign after 'A'.
   1535   Collator *coll = Collator::createInstance(Locale::getRoot(), status);
   1536   if(U_FAILURE(status)) {
   1537     delete coll;
   1538     errcheckln(status, "Collator creation failed with error %s", u_errorName(status));
   1539     return;
   1540   }
   1541 
   1542   uint32_t oldVarTop = coll->getVariableTop(status);
   1543 
   1544   // ICU 53+: The character must be in a supported reordering group,
   1545   // and the variable top is pinned to the end of that group.
   1546   vt[0] = 0x0041;
   1547 
   1548   (void)coll->setVariableTop(vt, 1, status);
   1549   if(status != U_ILLEGAL_ARGUMENT_ERROR) {
   1550     errln("setVariableTop(letter) did not detect illegal argument - %s", u_errorName(status));
   1551   }
   1552 
   1553   status = U_ZERO_ERROR;
   1554   vt[0] = 0x24;  // dollar sign (currency symbol)
   1555   uint32_t newVarTop = coll->setVariableTop(vt, 1, status);
   1556 
   1557   if(newVarTop != coll->getVariableTop(status)) {
   1558     errln("setVariableTop(dollar sign) != following getVariableTop()");
   1559   }
   1560 
   1561   UnicodeString dollar((UChar)0x24);
   1562   UnicodeString euro((UChar)0x20AC);
   1563   uint32_t newVarTop2 = coll->setVariableTop(euro, status);
   1564   assertEquals("setVariableTop(Euro sign) == following getVariableTop()",
   1565                (int64_t)newVarTop2, (int64_t)coll->getVariableTop(status));
   1566   assertEquals("setVariableTop(Euro sign) == setVariableTop(dollar sign) (should pin to top of currency group)",
   1567                (int64_t)newVarTop2, (int64_t)newVarTop);
   1568 
   1569   coll->setAttribute(UCOL_ALTERNATE_HANDLING, UCOL_SHIFTED, status);
   1570   assertEquals("empty==dollar", UCOL_EQUAL, coll->compare(UnicodeString(), dollar));
   1571   assertEquals("empty==euro", UCOL_EQUAL, coll->compare(UnicodeString(), euro));
   1572   assertEquals("dollar<zero", UCOL_LESS, coll->compare(dollar, UnicodeString((UChar)0x30)));
   1573 
   1574   coll->setVariableTop(oldVarTop, status);
   1575 
   1576   uint32_t newerVarTop = coll->setVariableTop(UnicodeString(vt, 1), status);
   1577 
   1578   if(newVarTop != newerVarTop) {
   1579     errln("Didn't set vartop properly from UnicodeString!\n");
   1580   }
   1581 
   1582   delete coll;
   1583 
   1584 }
   1585 
   1586 void CollationAPITest::TestMaxVariable() {
   1587   UErrorCode errorCode = U_ZERO_ERROR;
   1588   LocalPointer<Collator> coll(Collator::createInstance(Locale::getRoot(), errorCode));
   1589   if(U_FAILURE(errorCode)) {
   1590     errcheckln(errorCode, "Collator creation failed with error %s", u_errorName(errorCode));
   1591     return;
   1592   }
   1593 
   1594   (void)coll->setMaxVariable(UCOL_REORDER_CODE_OTHERS, errorCode);
   1595   if(errorCode != U_ILLEGAL_ARGUMENT_ERROR) {
   1596     errln("setMaxVariable(others) did not detect illegal argument - %s", u_errorName(errorCode));
   1597   }
   1598 
   1599   errorCode = U_ZERO_ERROR;
   1600   (void)coll->setMaxVariable(UCOL_REORDER_CODE_CURRENCY, errorCode);
   1601 
   1602   if(UCOL_REORDER_CODE_CURRENCY != coll->getMaxVariable()) {
   1603     errln("setMaxVariable(currency) != following getMaxVariable()");
   1604   }
   1605 
   1606   coll->setAttribute(UCOL_ALTERNATE_HANDLING, UCOL_SHIFTED, errorCode);
   1607   assertEquals("empty==dollar", UCOL_EQUAL, coll->compare(UnicodeString(), UnicodeString((UChar)0x24)));
   1608   assertEquals("empty==euro", UCOL_EQUAL, coll->compare(UnicodeString(), UnicodeString((UChar)0x20AC)));
   1609   assertEquals("dollar<zero", UCOL_LESS, coll->compare(UnicodeString((UChar)0x24), UnicodeString((UChar)0x30)));
   1610 }
   1611 
   1612 void CollationAPITest::TestGetLocale() {
   1613   UErrorCode status = U_ZERO_ERROR;
   1614   const char *rules = "&a<x<y<z";
   1615   UChar rlz[256] = {0};
   1616 
   1617   Collator *coll = Collator::createInstance("root", status);
   1618   if(U_FAILURE(status)) {
   1619     dataerrln("Failed to open collator for \"root\" with %s", u_errorName(status));
   1620     return;
   1621   }
   1622   Locale locale = coll->getLocale(ULOC_ACTUAL_LOCALE, status);
   1623   if(locale != Locale::getRoot()) {
   1624     errln("Collator::createInstance(\"root\").getLocale(actual) != Locale::getRoot(); "
   1625           "getLocale().getName() = \"%s\"",
   1626           locale.getName());
   1627   }
   1628   delete coll;
   1629 
   1630   coll = Collator::createInstance("", status);
   1631   if(U_FAILURE(status)) {
   1632     dataerrln("Failed to open collator for \"\" with %s", u_errorName(status));
   1633     return;
   1634   }
   1635   locale = coll->getLocale(ULOC_ACTUAL_LOCALE, status);
   1636   if(locale != Locale::getRoot()) {
   1637     errln("Collator::createInstance(\"\").getLocale(actual) != Locale::getRoot(); "
   1638           "getLocale().getName() = \"%s\"",
   1639           locale.getName());
   1640   }
   1641   delete coll;
   1642 
   1643   int32_t i = 0;
   1644 
   1645   static const struct {
   1646     const char* requestedLocale;
   1647     const char* validLocale;
   1648     const char* actualLocale;
   1649   } testStruct[] = {
   1650     // Note: Locale::getRoot().getName() == "" not "root".
   1651     { "de_DE", "de", "" },
   1652     { "sr_RS", "sr_Cyrl_RS", "sr" },
   1653     { "en_US_CALIFORNIA", "en_US", "" },
   1654     { "fr_FR_NONEXISTANT", "fr", "" },
   1655     // pinyin is the default, therefore suppressed.
   1656     { "zh_CN", "zh_Hans_CN", "zh" },
   1657     // zh_Hant has default=stroke but the data is in zh.
   1658     { "zh_TW", "zh_Hant_TW", "zh@collation=stroke" },
   1659     { "zh_TW@collation=pinyin", "zh_Hant_TW@collation=pinyin", "zh" },
   1660     { "zh_CN@collation=stroke", "zh_Hans_CN@collation=stroke", "zh@collation=stroke" }
   1661   };
   1662 
   1663   u_unescape(rules, rlz, 256);
   1664 
   1665   /* test opening collators for different locales */
   1666   for(i = 0; i<(int32_t)LENGTHOF(testStruct); i++) {
   1667     status = U_ZERO_ERROR;
   1668     coll = Collator::createInstance(testStruct[i].requestedLocale, status);
   1669     if(U_FAILURE(status)) {
   1670       errln("Failed to open collator for %s with %s", testStruct[i].requestedLocale, u_errorName(status));
   1671       delete coll;
   1672       continue;
   1673     }
   1674     // The requested locale may be the same as the valid locale,
   1675     // or may not be supported at all. See ticket #10477.
   1676     locale = coll->getLocale(ULOC_REQUESTED_LOCALE, status);
   1677     if(locale != testStruct[i].requestedLocale && locale != testStruct[i].validLocale) {
   1678       errln("[Coll %s]: Error in requested locale, expected %s or %s, got %s",
   1679             testStruct[i].requestedLocale,
   1680             testStruct[i].requestedLocale, testStruct[i].validLocale, locale.getName());
   1681     }
   1682     locale = coll->getLocale(ULOC_VALID_LOCALE, status);
   1683     if(locale != testStruct[i].validLocale) {
   1684       errln("[Coll %s]: Error in valid locale, expected %s, got %s",
   1685             testStruct[i].requestedLocale, testStruct[i].validLocale, locale.getName());
   1686     }
   1687     locale = coll->getLocale(ULOC_ACTUAL_LOCALE, status);
   1688     if(locale != testStruct[i].actualLocale) {
   1689       errln("[Coll %s]: Error in actual locale, expected %s, got %s",
   1690             testStruct[i].requestedLocale, testStruct[i].actualLocale, locale.getName());
   1691     }
   1692     // If we open a collator for the actual locale, we should get an equivalent one again.
   1693     LocalPointer<Collator> coll2(Collator::createInstance(locale, status));
   1694     if(U_FAILURE(status)) {
   1695       errln("Failed to open collator for actual locale \"%s\" with %s",
   1696             locale.getName(), u_errorName(status));
   1697     } else {
   1698       Locale actual2 = coll2->getLocale(ULOC_ACTUAL_LOCALE, status);
   1699       if(actual2 != locale) {
   1700         errln("[Coll actual \"%s\"]: Error in actual locale, got different one: \"%s\"",
   1701               locale.getName(), actual2.getName());
   1702       }
   1703       if(*coll2 != *coll) {
   1704         errln("[Coll actual \"%s\"]: Got different collator than before", locale.getName());
   1705       }
   1706     }
   1707     delete coll;
   1708   }
   1709 
   1710   /* completely non-existant locale for collator should get a default collator */
   1711   {
   1712     Collator *defaultColl = Collator::createInstance((const Locale)NULL, status);
   1713     coll = Collator::createInstance("blahaha", status);
   1714     if(U_FAILURE(status)) {
   1715       errln("Failed to open collator with %s", u_errorName(status));
   1716       delete coll;
   1717       delete defaultColl;
   1718       return;
   1719     }
   1720     if(coll->getLocale(ULOC_VALID_LOCALE, status) !=
   1721       defaultColl->getLocale(ULOC_VALID_LOCALE, status)) {
   1722       errln("Valid locale for nonexisting locale locale collator differs "
   1723         "from valid locale for default collator");
   1724     }
   1725     if(coll->getLocale(ULOC_ACTUAL_LOCALE, status) !=
   1726       defaultColl->getLocale(ULOC_ACTUAL_LOCALE, status)) {
   1727       errln("Actual locale for nonexisting locale locale collator differs "
   1728         "from actual locale for default collator");
   1729     }
   1730     delete coll;
   1731     delete defaultColl;
   1732   }
   1733 
   1734 
   1735 
   1736   /* collator instantiated from rules should have all three locales NULL */
   1737   coll = new RuleBasedCollator(rlz, status);
   1738   locale = coll->getLocale(ULOC_REQUESTED_LOCALE, status);
   1739   if(!locale.isBogus()) {
   1740     errln("For collator instantiated from rules, requested locale %s is not bogus", locale.getName());
   1741   }
   1742   locale = coll->getLocale(ULOC_VALID_LOCALE, status);
   1743   if(!locale.isBogus()) {
   1744     errln("For collator instantiated from rules, valid locale %s is not bogus", locale.getName());
   1745   }
   1746   locale = coll->getLocale(ULOC_ACTUAL_LOCALE, status);
   1747   if(!locale.isBogus()) {
   1748     errln("For collator instantiated from rules, actual locale %s is not bogus", locale.getName());
   1749   }
   1750   delete coll;
   1751 }
   1752 
   1753 struct teststruct {
   1754     const char *original;
   1755     uint8_t key[256];
   1756 };
   1757 
   1758 
   1759 
   1760 U_CDECL_BEGIN
   1761 static int U_CALLCONV
   1762 compare_teststruct(const void *string1, const void *string2) {
   1763   return(strcmp((const char *)((struct teststruct *)string1)->key, (const char *)((struct teststruct *)string2)->key));
   1764 }
   1765 U_CDECL_END
   1766 
   1767 
   1768 void CollationAPITest::TestBounds(void) {
   1769     UErrorCode status = U_ZERO_ERROR;
   1770 
   1771     Collator *coll = Collator::createInstance(Locale("sh"), status);
   1772     if(U_FAILURE(status)) {
   1773       delete coll;
   1774       errcheckln(status, "Collator creation failed with %s", u_errorName(status));
   1775       return;
   1776     }
   1777 
   1778     uint8_t sortkey[512], lower[512], upper[512];
   1779     UChar buffer[512];
   1780 
   1781     static const char * const test[] = {
   1782         "John Smith",
   1783         "JOHN SMITH",
   1784         "john SMITH",
   1785         "j\\u00F6hn sm\\u00EFth",
   1786         "J\\u00F6hn Sm\\u00EFth",
   1787         "J\\u00D6HN SM\\u00CFTH",
   1788         "john smithsonian",
   1789         "John Smithsonian"
   1790     };
   1791 
   1792     struct teststruct tests[] = {
   1793         {"\\u010CAKI MIHALJ", {0}},
   1794         {"\\u010CAKI MIHALJ", {0}},
   1795         {"\\u010CAKI PIRO\\u0160KA", {0}},
   1796         {"\\u010CABAI ANDRIJA", {0}},
   1797         {"\\u010CABAI LAJO\\u0160", {0}},
   1798         {"\\u010CABAI MARIJA", {0}},
   1799         {"\\u010CABAI STEVAN", {0}},
   1800         {"\\u010CABAI STEVAN", {0}},
   1801         {"\\u010CABARKAPA BRANKO", {0}},
   1802         {"\\u010CABARKAPA MILENKO", {0}},
   1803         {"\\u010CABARKAPA MIROSLAV", {0}},
   1804         {"\\u010CABARKAPA SIMO", {0}},
   1805         {"\\u010CABARKAPA STANKO", {0}},
   1806         {"\\u010CABARKAPA TAMARA", {0}},
   1807         {"\\u010CABARKAPA TOMA\\u0160", {0}},
   1808         {"\\u010CABDARI\\u0106 NIKOLA", {0}},
   1809         {"\\u010CABDARI\\u0106 ZORICA", {0}},
   1810         {"\\u010CABI NANDOR", {0}},
   1811         {"\\u010CABOVI\\u0106 MILAN", {0}},
   1812         {"\\u010CABRADI AGNEZIJA", {0}},
   1813         {"\\u010CABRADI IVAN", {0}},
   1814         {"\\u010CABRADI JELENA", {0}},
   1815         {"\\u010CABRADI LJUBICA", {0}},
   1816         {"\\u010CABRADI STEVAN", {0}},
   1817         {"\\u010CABRDA MARTIN", {0}},
   1818         {"\\u010CABRILO BOGDAN", {0}},
   1819         {"\\u010CABRILO BRANISLAV", {0}},
   1820         {"\\u010CABRILO LAZAR", {0}},
   1821         {"\\u010CABRILO LJUBICA", {0}},
   1822         {"\\u010CABRILO SPASOJA", {0}},
   1823         {"\\u010CADE\\u0160 ZDENKA", {0}},
   1824         {"\\u010CADESKI BLAGOJE", {0}},
   1825         {"\\u010CADOVSKI VLADIMIR", {0}},
   1826         {"\\u010CAGLJEVI\\u0106 TOMA", {0}},
   1827         {"\\u010CAGOROVI\\u0106 VLADIMIR", {0}},
   1828         {"\\u010CAJA VANKA", {0}},
   1829         {"\\u010CAJI\\u0106 BOGOLJUB", {0}},
   1830         {"\\u010CAJI\\u0106 BORISLAV", {0}},
   1831         {"\\u010CAJI\\u0106 RADOSLAV", {0}},
   1832         {"\\u010CAK\\u0160IRAN MILADIN", {0}},
   1833         {"\\u010CAKAN EUGEN", {0}},
   1834         {"\\u010CAKAN EVGENIJE", {0}},
   1835         {"\\u010CAKAN IVAN", {0}},
   1836         {"\\u010CAKAN JULIJAN", {0}},
   1837         {"\\u010CAKAN MIHAJLO", {0}},
   1838         {"\\u010CAKAN STEVAN", {0}},
   1839         {"\\u010CAKAN VLADIMIR", {0}},
   1840         {"\\u010CAKAN VLADIMIR", {0}},
   1841         {"\\u010CAKAN VLADIMIR", {0}},
   1842         {"\\u010CAKARA ANA", {0}},
   1843         {"\\u010CAKAREVI\\u0106 MOMIR", {0}},
   1844         {"\\u010CAKAREVI\\u0106 NEDELJKO", {0}},
   1845         {"\\u010CAKI \\u0160ANDOR", {0}},
   1846         {"\\u010CAKI AMALIJA", {0}},
   1847         {"\\u010CAKI ANDRA\\u0160", {0}},
   1848         {"\\u010CAKI LADISLAV", {0}},
   1849         {"\\u010CAKI LAJO\\u0160", {0}},
   1850         {"\\u010CAKI LASLO", {0}}
   1851     };
   1852 
   1853 
   1854 
   1855     int32_t i = 0, j = 0, k = 0, buffSize = 0, skSize = 0, lowerSize = 0, upperSize = 0;
   1856     int32_t arraySize = sizeof(tests)/sizeof(tests[0]);
   1857 
   1858     (void)lowerSize;  // Suppress unused variable warnings.
   1859     (void)upperSize;
   1860 
   1861     for(i = 0; i<arraySize; i++) {
   1862         buffSize = u_unescape(tests[i].original, buffer, 512);
   1863         skSize = coll->getSortKey(buffer, buffSize, tests[i].key, 512);
   1864     }
   1865 
   1866     qsort(tests, arraySize, sizeof(struct teststruct), compare_teststruct);
   1867 
   1868     for(i = 0; i < arraySize-1; i++) {
   1869         for(j = i+1; j < arraySize; j++) {
   1870             lowerSize = coll->getBound(tests[i].key, -1, UCOL_BOUND_LOWER, 1, lower, 512, status);
   1871             upperSize = coll->getBound(tests[j].key, -1, UCOL_BOUND_UPPER, 1, upper, 512, status);
   1872             for(k = i; k <= j; k++) {
   1873                 if(strcmp((const char *)lower, (const char *)tests[k].key) > 0) {
   1874                     errln("Problem with lower! j = %i (%s vs %s)", k, tests[k].original, tests[i].original);
   1875                 }
   1876                 if(strcmp((const char *)upper, (const char *)tests[k].key) <= 0) {
   1877                     errln("Problem with upper! j = %i (%s vs %s)", k, tests[k].original, tests[j].original);
   1878                 }
   1879             }
   1880         }
   1881     }
   1882 
   1883 
   1884     for(i = 0; i<(int32_t)(sizeof(test)/sizeof(test[0])); i++) {
   1885         buffSize = u_unescape(test[i], buffer, 512);
   1886         skSize = coll->getSortKey(buffer, buffSize, sortkey, 512);
   1887         lowerSize = ucol_getBound(sortkey, skSize, UCOL_BOUND_LOWER, 1, lower, 512, &status);
   1888         upperSize = ucol_getBound(sortkey, skSize, UCOL_BOUND_UPPER_LONG, 1, upper, 512, &status);
   1889         for(j = i+1; j<(int32_t)(sizeof(test)/sizeof(test[0])); j++) {
   1890             buffSize = u_unescape(test[j], buffer, 512);
   1891             skSize = coll->getSortKey(buffer, buffSize, sortkey, 512);
   1892             if(strcmp((const char *)lower, (const char *)sortkey) > 0) {
   1893                 errln("Problem with lower! i = %i, j = %i (%s vs %s)", i, j, test[i], test[j]);
   1894             }
   1895             if(strcmp((const char *)upper, (const char *)sortkey) <= 0) {
   1896                 errln("Problem with upper! i = %i, j = %i (%s vs %s)", i, j, test[i], test[j]);
   1897             }
   1898         }
   1899     }
   1900     delete coll;
   1901 }
   1902 
   1903 
   1904 void CollationAPITest::TestGetTailoredSet()
   1905 {
   1906   struct {
   1907     const char *rules;
   1908     const char *tests[20];
   1909     int32_t testsize;
   1910   } setTest[] = {
   1911     { "&a < \\u212b", { "\\u212b", "A\\u030a", "\\u00c5" }, 3},
   1912     { "& S < \\u0161 <<< \\u0160", { "\\u0161", "s\\u030C", "\\u0160", "S\\u030C" }, 4}
   1913   };
   1914 
   1915   int32_t i = 0, j = 0;
   1916   UErrorCode status = U_ZERO_ERROR;
   1917 
   1918   UnicodeString buff;
   1919   UnicodeSet *set = NULL;
   1920 
   1921   for(i = 0; i < LENGTHOF(setTest); i++) {
   1922     buff = UnicodeString(setTest[i].rules, -1, US_INV).unescape();
   1923     RuleBasedCollator coll(buff, status);
   1924     if(U_SUCCESS(status)) {
   1925       set = coll.getTailoredSet(status);
   1926       if(set->size() < setTest[i].testsize) {
   1927         errln("Tailored set size smaller (%d) than expected (%d)", set->size(), setTest[i].testsize);
   1928       }
   1929       for(j = 0; j < setTest[i].testsize; j++) {
   1930         buff = UnicodeString(setTest[i].tests[j], -1, US_INV).unescape();
   1931         if(!set->contains(buff)) {
   1932           errln("Tailored set doesn't contain %s... It should", setTest[i].tests[j]);
   1933         }
   1934       }
   1935       delete set;
   1936     } else {
   1937       errcheckln(status, "Couldn't open collator with rules %s - %s", setTest[i].rules, u_errorName(status));
   1938     }
   1939   }
   1940 }
   1941 
   1942 void CollationAPITest::TestUClassID()
   1943 {
   1944     char id = *((char *)RuleBasedCollator::getStaticClassID());
   1945     if (id != 0) {
   1946         errln("Static class id for RuleBasedCollator should be 0");
   1947     }
   1948     UErrorCode status = U_ZERO_ERROR;
   1949     RuleBasedCollator *coll
   1950         = (RuleBasedCollator *)Collator::createInstance(status);
   1951     if(U_FAILURE(status)) {
   1952       delete coll;
   1953       errcheckln(status, "Collator creation failed with %s", u_errorName(status));
   1954       return;
   1955     }
   1956     id = *((char *)coll->getDynamicClassID());
   1957     if (id != 0) {
   1958         errln("Dynamic class id for RuleBasedCollator should be 0");
   1959     }
   1960     id = *((char *)CollationKey::getStaticClassID());
   1961     if (id != 0) {
   1962         errln("Static class id for CollationKey should be 0");
   1963     }
   1964     CollationKey *key = new CollationKey();
   1965     id = *((char *)key->getDynamicClassID());
   1966     if (id != 0) {
   1967         errln("Dynamic class id for CollationKey should be 0");
   1968     }
   1969     id = *((char *)CollationElementIterator::getStaticClassID());
   1970     if (id != 0) {
   1971         errln("Static class id for CollationElementIterator should be 0");
   1972     }
   1973     UnicodeString str("testing");
   1974     CollationElementIterator *iter = coll->createCollationElementIterator(str);
   1975     id = *((char *)iter->getDynamicClassID());
   1976     if (id != 0) {
   1977         errln("Dynamic class id for CollationElementIterator should be 0");
   1978     }
   1979     delete key;
   1980     delete iter;
   1981     delete coll;
   1982 }
   1983 
   1984 class TestCollator  : public Collator
   1985 {
   1986 public:
   1987     virtual Collator* clone(void) const;
   1988 
   1989     using Collator::compare;
   1990 
   1991     virtual UCollationResult compare(const UnicodeString& source,
   1992                                       const UnicodeString& target,
   1993                                       UErrorCode& status) const;
   1994     virtual UCollationResult compare(const UnicodeString& source,
   1995                                       const UnicodeString& target,
   1996                                       int32_t length,
   1997                                       UErrorCode& status) const;
   1998     virtual UCollationResult compare(const UChar* source,
   1999                                       int32_t sourceLength,
   2000                                       const UChar* target,
   2001                                       int32_t targetLength,
   2002                                       UErrorCode& status) const;
   2003     virtual CollationKey& getCollationKey(const UnicodeString&  source,
   2004                                           CollationKey& key,
   2005                                           UErrorCode& status) const;
   2006     virtual CollationKey& getCollationKey(const UChar*source,
   2007                                           int32_t sourceLength,
   2008                                           CollationKey& key,
   2009                                           UErrorCode& status) const;
   2010     virtual int32_t hashCode(void) const;
   2011     virtual Locale getLocale(ULocDataLocaleType type, UErrorCode& status) const;
   2012     virtual ECollationStrength getStrength(void) const;
   2013     virtual void setStrength(ECollationStrength newStrength);
   2014     virtual UClassID getDynamicClassID(void) const;
   2015     virtual void getVersion(UVersionInfo info) const;
   2016     virtual void setAttribute(UColAttribute attr, UColAttributeValue value,
   2017                               UErrorCode &status);
   2018     virtual UColAttributeValue getAttribute(UColAttribute attr,
   2019                                             UErrorCode &status) const;
   2020     virtual uint32_t setVariableTop(const UChar *varTop, int32_t len,
   2021                                     UErrorCode &status);
   2022     virtual uint32_t setVariableTop(const UnicodeString &varTop,
   2023                                     UErrorCode &status);
   2024     virtual void setVariableTop(uint32_t varTop, UErrorCode &status);
   2025     virtual uint32_t getVariableTop(UErrorCode &status) const;
   2026     virtual int32_t getSortKey(const UnicodeString& source,
   2027                             uint8_t* result,
   2028                             int32_t resultLength) const;
   2029     virtual int32_t getSortKey(const UChar*source, int32_t sourceLength,
   2030                              uint8_t*result, int32_t resultLength) const;
   2031     virtual UnicodeSet *getTailoredSet(UErrorCode &status) const;
   2032     virtual UBool operator==(const Collator& other) const;
   2033     // Collator::operator!= calls !Collator::operator== which works for all subclasses.
   2034     virtual void setLocales(const Locale& requestedLocale, const Locale& validLocale, const Locale& actualLocale);
   2035     TestCollator() : Collator() {};
   2036     TestCollator(UCollationStrength collationStrength,
   2037            UNormalizationMode decompositionMode) : Collator(collationStrength, decompositionMode) {};
   2038 };
   2039 
   2040 inline UBool TestCollator::operator==(const Collator& other) const {
   2041     // TestCollator has no fields, so we test for identity.
   2042     return this == &other;
   2043 
   2044     // Normally, subclasses should do something like the following:
   2045     //    if (this == &other) { return TRUE; }
   2046     //    if (!Collator::operator==(other)) { return FALSE; }  // not the same class
   2047     //
   2048     //    const TestCollator &o = (const TestCollator&)other;
   2049     //    (compare this vs. o's subclass fields)
   2050 }
   2051 
   2052 Collator* TestCollator::clone() const
   2053 {
   2054     return new TestCollator();
   2055 }
   2056 
   2057 UCollationResult TestCollator::compare(const UnicodeString& source,
   2058                                         const UnicodeString& target,
   2059                                         UErrorCode& status) const
   2060 {
   2061   if(U_SUCCESS(status)) {
   2062     return UCollationResult(source.compare(target));
   2063   } else {
   2064     return UCOL_EQUAL;
   2065   }
   2066 }
   2067 
   2068 UCollationResult TestCollator::compare(const UnicodeString& source,
   2069                                         const UnicodeString& target,
   2070                                         int32_t length,
   2071                                         UErrorCode& status) const
   2072 {
   2073   if(U_SUCCESS(status)) {
   2074     return UCollationResult(source.compare(0, length, target));
   2075   } else {
   2076     return UCOL_EQUAL;
   2077   }
   2078 }
   2079 
   2080 UCollationResult TestCollator::compare(const UChar* source,
   2081                                         int32_t sourceLength,
   2082                                         const UChar* target,
   2083                                         int32_t targetLength,
   2084                                         UErrorCode& status) const
   2085 {
   2086     UnicodeString s(source, sourceLength);
   2087     UnicodeString t(target, targetLength);
   2088     return compare(s, t, status);
   2089 }
   2090 
   2091 CollationKey& TestCollator::getCollationKey(const UnicodeString& source,
   2092                                             CollationKey& key,
   2093                                             UErrorCode& status) const
   2094 {
   2095     char temp[100];
   2096     int length = 100;
   2097     length = source.extract(temp, length, NULL, status);
   2098     temp[length] = 0;
   2099     CollationKey tempkey((uint8_t*)temp, length);
   2100     key = tempkey;
   2101     return key;
   2102 }
   2103 
   2104 CollationKey& TestCollator::getCollationKey(const UChar*source,
   2105                                           int32_t sourceLength,
   2106                                           CollationKey& key,
   2107                                           UErrorCode& status) const
   2108 {
   2109     //s tack allocation used since collationkey does not keep the unicodestring
   2110     UnicodeString str(source, sourceLength);
   2111     return getCollationKey(str, key, status);
   2112 }
   2113 
   2114 int32_t TestCollator::getSortKey(const UnicodeString& source, uint8_t* result,
   2115                                  int32_t resultLength) const
   2116 {
   2117     UErrorCode status = U_ZERO_ERROR;
   2118     int32_t length = source.extract((char *)result, resultLength, NULL,
   2119                                     status);
   2120     result[length] = 0;
   2121     return length;
   2122 }
   2123 
   2124 int32_t TestCollator::getSortKey(const UChar*source, int32_t sourceLength,
   2125                                  uint8_t*result, int32_t resultLength) const
   2126 {
   2127     UnicodeString str(source, sourceLength);
   2128     return getSortKey(str, result, resultLength);
   2129 }
   2130 
   2131 int32_t TestCollator::hashCode() const
   2132 {
   2133     return 0;
   2134 }
   2135 
   2136 Locale TestCollator::getLocale(ULocDataLocaleType type, UErrorCode& status) const
   2137 {
   2138     // api not used, this is to make the compiler happy
   2139     if (U_FAILURE(status)) {
   2140         (void)type;
   2141     }
   2142     return NULL;
   2143 }
   2144 
   2145 Collator::ECollationStrength TestCollator::getStrength() const
   2146 {
   2147     return TERTIARY;
   2148 }
   2149 
   2150 void TestCollator::setStrength(Collator::ECollationStrength newStrength)
   2151 {
   2152     // api not used, this is to make the compiler happy
   2153     (void)newStrength;
   2154 }
   2155 
   2156 UClassID TestCollator::getDynamicClassID(void) const
   2157 {
   2158     return 0;
   2159 }
   2160 
   2161 void TestCollator::getVersion(UVersionInfo info) const
   2162 {
   2163     // api not used, this is to make the compiler happy
   2164     memset(info, 0, U_MAX_VERSION_LENGTH);
   2165 }
   2166 
   2167 void TestCollator::setAttribute(UColAttribute /*attr*/, UColAttributeValue /*value*/,
   2168                                 UErrorCode & /*status*/)
   2169 {
   2170 }
   2171 
   2172 UColAttributeValue TestCollator::getAttribute(UColAttribute attr,
   2173                                               UErrorCode &status) const
   2174 {
   2175     // api not used, this is to make the compiler happy
   2176     if (U_FAILURE(status) || attr == UCOL_ATTRIBUTE_COUNT) {
   2177         return UCOL_OFF;
   2178     }
   2179     return UCOL_DEFAULT;
   2180 }
   2181 
   2182 uint32_t TestCollator::setVariableTop(const UChar *varTop, int32_t len,
   2183                                   UErrorCode &status)
   2184 {
   2185     // api not used, this is to make the compiler happy
   2186     if (U_SUCCESS(status) && (varTop == 0 || len < -1)) {
   2187         status = U_ILLEGAL_ARGUMENT_ERROR;
   2188     }
   2189     return 0;
   2190 }
   2191 
   2192 uint32_t TestCollator::setVariableTop(const UnicodeString &varTop,
   2193                                   UErrorCode &status)
   2194 {
   2195     // api not used, this is to make the compiler happy
   2196     if (U_SUCCESS(status) && varTop.length() == 0) {
   2197         status = U_ILLEGAL_ARGUMENT_ERROR;
   2198     }
   2199     return 0;
   2200 }
   2201 
   2202 void TestCollator::setVariableTop(uint32_t varTop, UErrorCode &status)
   2203 {
   2204     // api not used, this is to make the compiler happy
   2205     if (U_SUCCESS(status) && varTop == 0) {
   2206         status = U_ILLEGAL_ARGUMENT_ERROR;
   2207     }
   2208 }
   2209 
   2210 uint32_t TestCollator::getVariableTop(UErrorCode &status) const
   2211 {
   2212 
   2213     // api not used, this is to make the compiler happy
   2214     if (U_SUCCESS(status)) {
   2215         return 0;
   2216     }
   2217     return (uint32_t)(0xFFFFFFFFu);
   2218 }
   2219 
   2220 UnicodeSet * TestCollator::getTailoredSet(UErrorCode &status) const
   2221 {
   2222     return Collator::getTailoredSet(status);
   2223 }
   2224 
   2225 void TestCollator::setLocales(const Locale& requestedLocale, const Locale& validLocale, const Locale& actualLocale)
   2226 {
   2227     Collator::setLocales(requestedLocale, validLocale, actualLocale);
   2228 }
   2229 
   2230 
   2231 void CollationAPITest::TestSubclass()
   2232 {
   2233     TestCollator col1;
   2234     TestCollator col2;
   2235     doAssert(col1 != col2, "2 instances of TestCollator should be different");
   2236     if (col1.hashCode() != col2.hashCode()) {
   2237         errln("Every TestCollator has the same hashcode");
   2238     }
   2239     UnicodeString abc("abc", 3);
   2240     UnicodeString bcd("bcd", 3);
   2241     if (col1.compare(abc, bcd) != abc.compare(bcd)) {
   2242         errln("TestCollator compare should be the same as the default "
   2243               "string comparison");
   2244     }
   2245     CollationKey key;
   2246     UErrorCode status = U_ZERO_ERROR;
   2247     col1.getCollationKey(abc, key, status);
   2248     int32_t length = 0;
   2249     const char* bytes = (const char *)key.getByteArray(length);
   2250     UnicodeString keyarray(bytes, length, NULL, status);
   2251     if (abc != keyarray) {
   2252         errln("TestCollator collationkey API is returning wrong values");
   2253     }
   2254 
   2255     UnicodeSet expectedset(0, 0x10FFFF);
   2256     UnicodeSet *defaultset = col1.getTailoredSet(status);
   2257     if (!defaultset->containsAll(expectedset)
   2258         || !expectedset.containsAll(*defaultset)) {
   2259         errln("Error: expected default tailoring to be 0 to 0x10ffff");
   2260     }
   2261     delete defaultset;
   2262 
   2263     // use base class implementation
   2264     Locale loc1 = Locale::getGermany();
   2265     Locale loc2 = Locale::getFrance();
   2266     col1.setLocales(loc1, loc2, loc2); // default implementation has no effect
   2267 
   2268     UnicodeString displayName;
   2269     col1.getDisplayName(loc1, loc2, displayName); // de_DE collator in fr_FR locale
   2270 
   2271     TestCollator col3(UCOL_TERTIARY, UNORM_NONE);
   2272     UnicodeString a("a");
   2273     UnicodeString b("b");
   2274     Collator::EComparisonResult result = Collator::EComparisonResult(a.compare(b));
   2275     if(col1.compare(a, b) != result) {
   2276       errln("Collator doesn't give default result");
   2277     }
   2278     if(col1.compare(a, b, 1) != result) {
   2279       errln("Collator doesn't give default result");
   2280     }
   2281     if(col1.compare(a.getBuffer(), a.length(), b.getBuffer(), b.length()) != result) {
   2282       errln("Collator doesn't give default result");
   2283     }
   2284 }
   2285 
   2286 void CollationAPITest::TestNULLCharTailoring()
   2287 {
   2288     UErrorCode status = U_ZERO_ERROR;
   2289     UChar buf[256] = {0};
   2290     int32_t len = u_unescape("&a < '\\u0000'", buf, 256);
   2291     UnicodeString first((UChar)0x0061);
   2292     UnicodeString second((UChar)0);
   2293     RuleBasedCollator *coll = new RuleBasedCollator(UnicodeString(buf, len), status);
   2294     if(U_FAILURE(status)) {
   2295         delete coll;
   2296         errcheckln(status, "Failed to open collator - %s", u_errorName(status));
   2297         return;
   2298     }
   2299     UCollationResult res = coll->compare(first, second, status);
   2300     if(res != UCOL_LESS) {
   2301         errln("a should be less then NULL after tailoring");
   2302     }
   2303     delete coll;
   2304 }
   2305 
   2306 void CollationAPITest::TestClone() {
   2307     logln("\ninit c0");
   2308     UErrorCode status = U_ZERO_ERROR;
   2309     RuleBasedCollator* c0 = (RuleBasedCollator*)Collator::createInstance(status);
   2310 
   2311     if (U_FAILURE(status)) {
   2312         errcheckln(status, "Collator::CreateInstance(status) failed with %s", u_errorName(status));
   2313         return;
   2314     }
   2315 
   2316     c0->setStrength(Collator::TERTIARY);
   2317     dump("c0", c0, status);
   2318 
   2319     logln("\ninit c1");
   2320     RuleBasedCollator* c1 = (RuleBasedCollator*)Collator::createInstance(status);
   2321     c1->setStrength(Collator::TERTIARY);
   2322     UColAttributeValue val = c1->getAttribute(UCOL_CASE_FIRST, status);
   2323     if(val == UCOL_LOWER_FIRST){
   2324         c1->setAttribute(UCOL_CASE_FIRST, UCOL_UPPER_FIRST, status);
   2325     }else{
   2326         c1->setAttribute(UCOL_CASE_FIRST, UCOL_LOWER_FIRST, status);
   2327     }
   2328     dump("c0", c0, status);
   2329     dump("c1", c1, status);
   2330 
   2331     logln("\ninit c2");
   2332     RuleBasedCollator* c2 = (RuleBasedCollator*)c1->clone();
   2333     val = c2->getAttribute(UCOL_CASE_FIRST, status);
   2334     if(val == UCOL_LOWER_FIRST){
   2335         c2->setAttribute(UCOL_CASE_FIRST, UCOL_UPPER_FIRST, status);
   2336     }else{
   2337         c2->setAttribute(UCOL_CASE_FIRST, UCOL_LOWER_FIRST, status);
   2338     }
   2339     if(U_FAILURE(status)){
   2340         errln("set and get attributes of collator failed. %s\n", u_errorName(status));
   2341         return;
   2342     }
   2343     dump("c0", c0, status);
   2344     dump("c1", c1, status);
   2345     dump("c2", c2, status);
   2346     if(*c1 == *c2){
   2347         errln("The cloned objects refer to same data");
   2348     }
   2349     delete c0;
   2350     delete c1;
   2351     delete c2;
   2352 }
   2353 
   2354 void CollationAPITest::TestCloneBinary() {
   2355     IcuTestErrorCode errorCode(*this, "TestCloneBinary");
   2356     LocalPointer<Collator> root(Collator::createInstance(Locale::getRoot(), errorCode));
   2357     LocalPointer<Collator> coll(Collator::createInstance("de@collation=phonebook", errorCode));
   2358     if(errorCode.logDataIfFailureAndReset("Collator::createInstance(de@collation=phonebook)")) {
   2359         return;
   2360     }
   2361     RuleBasedCollator *rbRoot = dynamic_cast<RuleBasedCollator *>(root.getAlias());
   2362     RuleBasedCollator *rbc = dynamic_cast<RuleBasedCollator *>(coll.getAlias());
   2363     if(rbRoot == NULL || rbc == NULL) {
   2364         infoln("root or de@collation=phonebook is not a RuleBasedCollator");
   2365         return;
   2366     }
   2367     rbc->setAttribute(UCOL_STRENGTH, UCOL_PRIMARY, errorCode);
   2368     UnicodeString uUmlaut((UChar)0xfc);
   2369     UnicodeString ue = UNICODE_STRING_SIMPLE("ue");
   2370     assertEquals("rbc/primary: u-umlaut==ue", UCOL_EQUAL, rbc->compare(uUmlaut, ue, errorCode));
   2371     uint8_t bin[25000];
   2372     int32_t binLength = rbc->cloneBinary(bin, LENGTHOF(bin), errorCode);
   2373     if(errorCode.logDataIfFailureAndReset("rbc->cloneBinary()")) {
   2374         return;
   2375     }
   2376     logln("rbc->cloneBinary() -> %d bytes", (int)binLength);
   2377 
   2378     RuleBasedCollator rbc2(bin, binLength, rbRoot, errorCode);
   2379     if(errorCode.logDataIfFailureAndReset("RuleBasedCollator(rbc binary)")) {
   2380         return;
   2381     }
   2382     assertEquals("rbc2.strength==primary", UCOL_PRIMARY, rbc2.getAttribute(UCOL_STRENGTH, errorCode));
   2383     assertEquals("rbc2: u-umlaut==ue", UCOL_EQUAL, rbc2.compare(uUmlaut, ue, errorCode));
   2384     assertTrue("rbc==rbc2", *rbc == rbc2);
   2385     uint8_t bin2[25000];
   2386     int32_t bin2Length = rbc2.cloneBinary(bin2, LENGTHOF(bin2), errorCode);
   2387     assertEquals("len(rbc binary)==len(rbc2 binary)", binLength, bin2Length);
   2388     assertTrue("rbc binary==rbc2 binary", binLength == bin2Length && memcmp(bin, bin2, binLength) == 0);
   2389 }
   2390 
   2391 void CollationAPITest::TestIterNumeric() {
   2392     // Regression test for ticket #9915.
   2393     // The collation code sometimes masked the continuation marker away
   2394     // but later tested the result for isContinuation().
   2395     // This test case failed because the third bytes of the computed numeric-collation primaries
   2396     // were permutated with the script reordering table.
   2397     // It should have been possible to reproduce this with the root collator
   2398     // and characters with appropriate 3-byte primary weights.
   2399     // The effectiveness of this test depends completely on the collation elements
   2400     // and on the implementation code.
   2401     IcuTestErrorCode errorCode(*this, "TestIterNumeric");
   2402     RuleBasedCollator coll(UnicodeString("[reorder Hang Hani]"), errorCode);
   2403     if(errorCode.logDataIfFailureAndReset("RuleBasedCollator constructor")) {
   2404         return;
   2405     }
   2406     coll.setAttribute(UCOL_NUMERIC_COLLATION, UCOL_ON, errorCode);
   2407     UCharIterator iter40, iter72;
   2408     uiter_setUTF8(&iter40, "\x34\x30", 2);
   2409     uiter_setUTF8(&iter72, "\x37\x32", 2);
   2410     UCollationResult result = coll.compare(iter40, iter72, errorCode);
   2411     assertEquals("40<72", (int32_t)UCOL_LESS, (int32_t)result);
   2412 }
   2413 
   2414 void CollationAPITest::TestBadKeywords() {
   2415     // Test locale IDs with errors.
   2416     // Valid locale IDs are tested via data-driven tests.
   2417     UErrorCode errorCode = U_ZERO_ERROR;
   2418     Locale bogusLocale(Locale::getRoot());
   2419     bogusLocale.setToBogus();
   2420     LocalPointer<Collator> coll(Collator::createInstance(bogusLocale, errorCode));
   2421     if(errorCode != U_ILLEGAL_ARGUMENT_ERROR) {
   2422         errln("Collator::createInstance(bogus locale) did not fail as expected - %s",
   2423               u_errorName(errorCode));
   2424     }
   2425 
   2426     // Unknown value.
   2427     const char *localeID = "it-u-ks-xyz";
   2428     errorCode = U_ZERO_ERROR;
   2429     coll.adoptInstead(Collator::createInstance(localeID, errorCode));
   2430     if(errorCode != U_ILLEGAL_ARGUMENT_ERROR) {
   2431         errln("Collator::createInstance(%s) did not fail as expected - %s",
   2432               localeID, u_errorName(errorCode));
   2433     }
   2434 
   2435     // Unsupported attributes.
   2436     localeID = "it@colHiraganaQuaternary=true";
   2437     errorCode = U_ZERO_ERROR;
   2438     coll.adoptInstead(Collator::createInstance(localeID, errorCode));
   2439     if(errorCode != U_UNSUPPORTED_ERROR) {
   2440         errln("Collator::createInstance(%s) did not fail as expected - %s",
   2441               localeID, u_errorName(errorCode));
   2442     }
   2443 
   2444     localeID = "it-u-vt-u24";
   2445     errorCode = U_ZERO_ERROR;
   2446     coll.adoptInstead(Collator::createInstance(localeID, errorCode));
   2447     if(errorCode != U_UNSUPPORTED_ERROR) {
   2448         errln("Collator::createInstance(%s) did not fail as expected - %s",
   2449               localeID, u_errorName(errorCode));
   2450     }
   2451 }
   2452 
   2453  void CollationAPITest::dump(UnicodeString msg, RuleBasedCollator* c, UErrorCode& status) {
   2454     const char* bigone = "One";
   2455     const char* littleone = "one";
   2456 
   2457     logln(msg + " " + c->compare(bigone, littleone) +
   2458                         " s: " + c->getStrength() +
   2459                         " u: " + c->getAttribute(UCOL_CASE_FIRST, status));
   2460 }
   2461 void CollationAPITest::runIndexedTest( int32_t index, UBool exec, const char* &name, char* /*par */)
   2462 {
   2463     if (exec) logln("TestSuite CollationAPITest: ");
   2464     TESTCASE_AUTO_BEGIN;
   2465     TESTCASE_AUTO(TestProperty);
   2466     TESTCASE_AUTO(TestOperators);
   2467     TESTCASE_AUTO(TestDuplicate);
   2468     TESTCASE_AUTO(TestCompare);
   2469     TESTCASE_AUTO(TestHashCode);
   2470     TESTCASE_AUTO(TestCollationKey);
   2471     TESTCASE_AUTO(TestElemIter);
   2472     TESTCASE_AUTO(TestGetAll);
   2473     TESTCASE_AUTO(TestRuleBasedColl);
   2474     TESTCASE_AUTO(TestDecomposition);
   2475     TESTCASE_AUTO(TestSafeClone);
   2476     TESTCASE_AUTO(TestSortKey);
   2477     TESTCASE_AUTO(TestSortKeyOverflow);
   2478     TESTCASE_AUTO(TestMaxExpansion);
   2479     TESTCASE_AUTO(TestDisplayName);
   2480     TESTCASE_AUTO(TestAttribute);
   2481     TESTCASE_AUTO(TestVariableTopSetting);
   2482     TESTCASE_AUTO(TestMaxVariable);
   2483     TESTCASE_AUTO(TestRules);
   2484     TESTCASE_AUTO(TestGetLocale);
   2485     TESTCASE_AUTO(TestBounds);
   2486     TESTCASE_AUTO(TestGetTailoredSet);
   2487     TESTCASE_AUTO(TestUClassID);
   2488     TESTCASE_AUTO(TestSubclass);
   2489     TESTCASE_AUTO(TestNULLCharTailoring);
   2490     TESTCASE_AUTO(TestClone);
   2491     TESTCASE_AUTO(TestCloneBinary);
   2492     TESTCASE_AUTO(TestIterNumeric);
   2493     TESTCASE_AUTO(TestBadKeywords);
   2494     TESTCASE_AUTO_END;
   2495 }
   2496 
   2497 #endif /* #if !UCONFIG_NO_COLLATION */
   2498