Home | History | Annotate | Download | only in cintltst
      1 /********************************************************************
      2  * COPYRIGHT:
      3  * Copyright (c) 1997-2010, International Business Machines Corporation and
      4  * others. All Rights Reserved.
      5  ********************************************************************/
      6 
      7 #include "cintltst.h"
      8 #include "unicode/ures.h"
      9 #include "unicode/ucurr.h"
     10 #include "unicode/ustring.h"
     11 #include "unicode/uset.h"
     12 #include "unicode/udat.h"
     13 #include "unicode/uscript.h"
     14 #include "unicode/ulocdata.h"
     15 #include "cstring.h"
     16 #include "locmap.h"
     17 #include "uresimp.h"
     18 
     19 /*
     20 returns a new UnicodeSet that is a flattened form of the original
     21 UnicodeSet.
     22 */
     23 static USet*
     24 createFlattenSet(USet *origSet, UErrorCode *status) {
     25 
     26 
     27     USet *newSet = NULL;
     28     int32_t origItemCount = 0;
     29     int32_t idx, graphmeSize;
     30     UChar32 start, end;
     31     UChar graphme[64];
     32     if (U_FAILURE(*status)) {
     33         log_err("createFlattenSet called with %s\n", u_errorName(*status));
     34         return NULL;
     35     }
     36     newSet = uset_open(1, 0);
     37     origItemCount = uset_getItemCount(origSet);
     38     for (idx = 0; idx < origItemCount; idx++) {
     39         graphmeSize = uset_getItem(origSet, idx,
     40             &start, &end,
     41             graphme, (int32_t)(sizeof(graphme)/sizeof(graphme[0])),
     42             status);
     43         if (U_FAILURE(*status)) {
     44             log_err("ERROR: uset_getItem returned %s\n", u_errorName(*status));
     45             *status = U_ZERO_ERROR;
     46         }
     47         if (graphmeSize) {
     48             uset_addAllCodePoints(newSet, graphme, graphmeSize);
     49         }
     50         else {
     51             uset_addRange(newSet, start, end);
     52         }
     53     }
     54     return newSet;
     55 }
     56 static UBool
     57 isCurrencyPreEuro(const char* currencyKey){
     58     if( strcmp(currencyKey, "PTE") == 0 ||
     59         strcmp(currencyKey, "ESP") == 0 ||
     60         strcmp(currencyKey, "LUF") == 0 ||
     61         strcmp(currencyKey, "GRD") == 0 ||
     62         strcmp(currencyKey, "BEF") == 0 ||
     63         strcmp(currencyKey, "ITL") == 0 ||
     64         strcmp(currencyKey, "EEK") == 0){
     65             return TRUE;
     66     }
     67     return FALSE;
     68 }
     69 static void
     70 TestKeyInRootRecursive(UResourceBundle *root, const char *rootName,
     71                        UResourceBundle *currentBundle, const char *locale) {
     72     UErrorCode errorCode = U_ZERO_ERROR;
     73     UResourceBundle *subRootBundle = NULL, *subBundle = NULL, *arr = NULL;
     74 
     75     ures_resetIterator(root);
     76     ures_resetIterator(currentBundle);
     77     while (ures_hasNext(currentBundle)) {
     78         const char *subBundleKey = NULL;
     79         const char *currentBundleKey = NULL;
     80 
     81         errorCode = U_ZERO_ERROR;
     82         currentBundleKey = ures_getKey(currentBundle);
     83         subBundle = ures_getNextResource(currentBundle, NULL, &errorCode);
     84         if (U_FAILURE(errorCode)) {
     85             log_err("Can't open a resource for lnocale %s. Error: %s\n", locale, u_errorName(errorCode));
     86             continue;
     87         }
     88         subBundleKey = ures_getKey(subBundle);
     89 
     90 
     91         subRootBundle = ures_getByKey(root, subBundleKey, NULL, &errorCode);
     92         if (U_FAILURE(errorCode)) {
     93             log_err("Can't open a resource with key \"%s\" in \"%s\" from %s for locale \"%s\"\n",
     94                     subBundleKey,
     95                     ures_getKey(currentBundle),
     96                     rootName,
     97                     locale);
     98             ures_close(subBundle);
     99             continue;
    100         }
    101         if (ures_getType(subRootBundle) != ures_getType(subBundle)) {
    102             log_err("key \"%s\" in \"%s\" has a different type from root for locale \"%s\"\n"
    103                     "\troot=%d, locale=%d\n",
    104                     subBundleKey,
    105                     ures_getKey(currentBundle),
    106                     locale,
    107                     ures_getType(subRootBundle),
    108                     ures_getType(subBundle));
    109             ures_close(subBundle);
    110             continue;
    111         }
    112         else if (ures_getType(subBundle) == URES_INT_VECTOR) {
    113             int32_t minSize;
    114             int32_t subBundleSize;
    115             int32_t idx;
    116             UBool sameArray = TRUE;
    117             const int32_t *subRootBundleArr = ures_getIntVector(subRootBundle, &minSize, &errorCode);
    118             const int32_t *subBundleArr = ures_getIntVector(subBundle, &subBundleSize, &errorCode);
    119 
    120             if (minSize > subBundleSize) {
    121                 minSize = subBundleSize;
    122                 log_err("Arrays are different size with key \"%s\" in \"%s\" from root for locale \"%s\"\n",
    123                         subBundleKey,
    124                         ures_getKey(currentBundle),
    125                         locale);
    126             }
    127 
    128             for (idx = 0; idx < minSize && sameArray; idx++) {
    129                 if (subRootBundleArr[idx] != subBundleArr[idx]) {
    130                     sameArray = FALSE;
    131                 }
    132                 if (strcmp(subBundleKey, "DateTimeElements") == 0
    133                     && (subBundleArr[idx] < 1 || 7 < subBundleArr[idx]))
    134                 {
    135                     log_err("Value out of range with key \"%s\" at index %d in \"%s\" for locale \"%s\"\n",
    136                             subBundleKey,
    137                             idx,
    138                             ures_getKey(currentBundle),
    139                             locale);
    140                 }
    141             }
    142             /* Special exception es_US and DateTimeElements */
    143             if (sameArray
    144                 && !(strcmp(locale, "es_US") == 0 && strcmp(subBundleKey, "DateTimeElements") == 0))
    145             {
    146                 log_err("Integer vectors are the same with key \"%s\" in \"%s\" from root for locale \"%s\"\n",
    147                         subBundleKey,
    148                         ures_getKey(currentBundle),
    149                         locale);
    150             }
    151         }
    152         else if (ures_getType(subBundle) == URES_ARRAY) {
    153             UResourceBundle *subSubBundle = ures_getByIndex(subBundle, 0, NULL, &errorCode);
    154             UResourceBundle *subSubRootBundle = ures_getByIndex(subRootBundle, 0, NULL, &errorCode);
    155 
    156             if (U_SUCCESS(errorCode)
    157                 && (ures_getType(subSubBundle) == URES_ARRAY || ures_getType(subSubRootBundle) == URES_ARRAY))
    158             {
    159                 /* Here is one of the recursive parts */
    160                 TestKeyInRootRecursive(subRootBundle, rootName, subBundle, locale);
    161             }
    162             else {
    163                 int32_t minSize = ures_getSize(subRootBundle);
    164                 int32_t idx;
    165                 UBool sameArray = TRUE;
    166 
    167                 if (minSize > ures_getSize(subBundle)) {
    168                     minSize = ures_getSize(subBundle);
    169                 }
    170 
    171                 if ((subBundleKey == NULL
    172                     || (subBundleKey != NULL &&  strcmp(subBundleKey, "LocaleScript") != 0 && !isCurrencyPreEuro(subBundleKey)))
    173                     && ures_getSize(subRootBundle) != ures_getSize(subBundle))
    174                 {
    175                     log_err("Different size array with key \"%s\" in \"%s\" from root for locale \"%s\"\n"
    176                             "\troot array size=%d, locale array size=%d\n",
    177                             subBundleKey,
    178                             ures_getKey(currentBundle),
    179                             locale,
    180                             ures_getSize(subRootBundle),
    181                             ures_getSize(subBundle));
    182                 }
    183                 /*
    184                 if(isCurrencyPreEuro(subBundleKey) && ures_getSize(subBundle)!=3){
    185                     log_err("Different size array with key \"%s\" in \"%s\" for locale \"%s\" the expected size is 3 got size=%d\n",
    186                             subBundleKey,
    187                             ures_getKey(currentBundle),
    188                             locale,
    189                             ures_getSize(subBundle));
    190                 }
    191                 */
    192                 for (idx = 0; idx < minSize; idx++) {
    193                     int32_t rootStrLen, localeStrLen;
    194                     const UChar *rootStr = ures_getStringByIndex(subRootBundle,idx,&rootStrLen,&errorCode);
    195                     const UChar *localeStr = ures_getStringByIndex(subBundle,idx,&localeStrLen,&errorCode);
    196                     if (rootStr && localeStr && U_SUCCESS(errorCode)) {
    197                         if (u_strcmp(rootStr, localeStr) != 0) {
    198                             sameArray = FALSE;
    199                         }
    200                     }
    201                     else {
    202                         if ( rootStrLen > 1 && rootStr[0] == 0x41 && rootStr[1] >= 0x30 && rootStr[1] <= 0x39 ) {
    203                            /* A2 or A4 in the root string indicates that the resource can optionally be an array instead of a */
    204                            /* string.  Attempt to read it as an array. */
    205                           errorCode = U_ZERO_ERROR;
    206                           arr = ures_getByIndex(subBundle,idx,NULL,&errorCode);
    207                           if (U_FAILURE(errorCode)) {
    208                               log_err("Got a NULL string with key \"%s\" in \"%s\" at index %d for root or locale \"%s\"\n",
    209                                       subBundleKey,
    210                                       ures_getKey(currentBundle),
    211                                       idx,
    212                                       locale);
    213                               continue;
    214                           }
    215                           if (ures_getType(arr) != URES_ARRAY || ures_getSize(arr) != (int32_t)rootStr[1] - 0x30) {
    216                               log_err("Got something other than a string or array of size %d for key \"%s\" in \"%s\" at index %d for root or locale \"%s\"\n",
    217                                       rootStr[1] - 0x30,
    218                                       subBundleKey,
    219                                       ures_getKey(currentBundle),
    220                                       idx,
    221                                       locale);
    222                               ures_close(arr);
    223                               continue;
    224                           }
    225                           localeStr = ures_getStringByIndex(arr,0,&localeStrLen,&errorCode);
    226                           ures_close(arr);
    227                           if (U_FAILURE(errorCode)) {
    228                               log_err("Got something other than a string or array for key \"%s\" in \"%s\" at index %d for root or locale \"%s\"\n",
    229                                       subBundleKey,
    230                                       ures_getKey(currentBundle),
    231                                       idx,
    232                                       locale);
    233                               continue;
    234                           }
    235                         } else {
    236                             log_err("Got a NULL string with key \"%s\" in \"%s\" at index %d for root or locale \"%s\"\n",
    237                                 subBundleKey,
    238                                 ures_getKey(currentBundle),
    239                                 idx,
    240                                 locale);
    241                             continue;
    242                         }
    243                     }
    244                     if (localeStr[0] == (UChar)0x20) {
    245                         log_err("key \"%s\" at index %d in \"%s\" starts with a space in locale \"%s\"\n",
    246                                 subBundleKey,
    247                                 idx,
    248                                 ures_getKey(currentBundle),
    249                                 locale);
    250                     }
    251                     else if ((localeStr[localeStrLen - 1] == (UChar)0x20) && (strcmp(subBundleKey,"separator") != 0)) {
    252                         log_err("key \"%s\" at index %d in \"%s\" ends with a space in locale \"%s\"\n",
    253                                 subBundleKey,
    254                                 idx,
    255                                 ures_getKey(currentBundle),
    256                                 locale);
    257                     }
    258                     else if (subBundleKey != NULL
    259                         && strcmp(subBundleKey, "DateTimePatterns") == 0)
    260                     {
    261                         int32_t quoted = 0;
    262                         const UChar *localeStrItr = localeStr;
    263                         while (*localeStrItr) {
    264                             if (*localeStrItr == (UChar)0x27 /* ' */) {
    265                                 quoted++;
    266                             }
    267                             else if ((quoted % 2) == 0) {
    268                                 /* Search for unquoted characters */
    269                                 if (4 <= idx && idx <= 7
    270                                     && (*localeStrItr == (UChar)0x6B /* k */
    271                                     || *localeStrItr == (UChar)0x48 /* H */
    272                                     || *localeStrItr == (UChar)0x6D /* m */
    273                                     || *localeStrItr == (UChar)0x73 /* s */
    274                                     || *localeStrItr == (UChar)0x53 /* S */
    275                                     || *localeStrItr == (UChar)0x61 /* a */
    276                                     || *localeStrItr == (UChar)0x68 /* h */
    277                                     || *localeStrItr == (UChar)0x7A /* z */))
    278                                 {
    279                                     log_err("key \"%s\" at index %d has time pattern chars in date for locale \"%s\"\n",
    280                                             subBundleKey,
    281                                             idx,
    282                                             locale);
    283                                 }
    284                                 else if (0 <= idx && idx <= 3
    285                                     && (*localeStrItr == (UChar)0x47 /* G */
    286                                     || *localeStrItr == (UChar)0x79 /* y */
    287                                     || *localeStrItr == (UChar)0x4D /* M */
    288                                     || *localeStrItr == (UChar)0x64 /* d */
    289                                     || *localeStrItr == (UChar)0x45 /* E */
    290                                     || *localeStrItr == (UChar)0x44 /* D */
    291                                     || *localeStrItr == (UChar)0x46 /* F */
    292                                     || *localeStrItr == (UChar)0x77 /* w */
    293                                     || *localeStrItr == (UChar)0x57 /* W */))
    294                                 {
    295                                     log_err("key \"%s\" at index %d has date pattern chars in time for locale \"%s\"\n",
    296                                             subBundleKey,
    297                                             idx,
    298                                             locale);
    299                                 }
    300                             }
    301                             localeStrItr++;
    302                         }
    303                     }
    304                     else if (idx == 4 && subBundleKey != NULL
    305                         && strcmp(subBundleKey, "NumberElements") == 0
    306                         && u_charDigitValue(localeStr[0]) != 0)
    307                     {
    308                         log_err("key \"%s\" at index %d has a non-zero based number for locale \"%s\"\n",
    309                                 subBundleKey,
    310                                 idx,
    311                                 locale);
    312                     }
    313                 }
    314 /*                if (sameArray && strcmp(rootName, "root") == 0) {
    315                     log_err("Arrays are the same with key \"%s\" in \"%s\" from root for locale \"%s\"\n",
    316                             subBundleKey,
    317                             ures_getKey(currentBundle),
    318                             locale);
    319                 }*/
    320             }
    321             ures_close(subSubBundle);
    322             ures_close(subSubRootBundle);
    323         }
    324         else if (ures_getType(subBundle) == URES_STRING) {
    325             int32_t len = 0;
    326             const UChar *string = ures_getString(subBundle, &len, &errorCode);
    327             if (U_FAILURE(errorCode) || string == NULL) {
    328                 log_err("Can't open a string with key \"%s\" in \"%s\" for locale \"%s\"\n",
    329                         subBundleKey,
    330                         ures_getKey(currentBundle),
    331                         locale);
    332             } else if (string[0] == (UChar)0x20) {
    333                 log_err("key \"%s\" in \"%s\" starts with a space in locale \"%s\"\n",
    334                         subBundleKey,
    335                         ures_getKey(currentBundle),
    336                         locale);
    337             /* localeDisplayPattern/separator can end with a space */
    338             } else if (string[len - 1] == (UChar)0x20 && (strcmp(subBundleKey,"separator"))) {
    339                 log_err("key \"%s\" in \"%s\" ends with a space in locale \"%s\"\n",
    340                         subBundleKey,
    341                         ures_getKey(currentBundle),
    342                         locale);
    343             } else if (strcmp(subBundleKey, "localPatternChars") == 0) {
    344                 /* Note: We no longer import localPatternChars data starting
    345                  * ICU 3.8.  So it never comes into this else if block. (ticket#5597)
    346                  */
    347 
    348                 /* Check well-formedness of localPatternChars.  First, the
    349                  * length must match the number of fields defined by
    350                  * DateFormat.  Second, each character in the string must
    351                  * be in the set [A-Za-z].  Finally, each character must be
    352                  * unique.
    353                  */
    354                 int32_t i,j;
    355 #if !UCONFIG_NO_FORMATTING
    356                 if (len != UDAT_FIELD_COUNT) {
    357                     log_err("key \"%s\" has the wrong number of characters in locale \"%s\"\n",
    358                             subBundleKey,
    359                             locale);
    360                 }
    361 #endif
    362                 /* Check char validity. */
    363                 for (i=0; i<len; ++i) {
    364                     if (!((string[i] >= 65/*'A'*/ && string[i] <= 90/*'Z'*/) ||
    365                           (string[i] >= 97/*'a'*/ && string[i] <= 122/*'z'*/))) {
    366                         log_err("key \"%s\" has illegal character '%c' in locale \"%s\"\n",
    367                                 subBundleKey,
    368                                 (char) string[i],
    369                                 locale);
    370                     }
    371                     /* Do O(n^2) check for duplicate chars. */
    372                     for (j=0; j<i; ++j) {
    373                         if (string[j] == string[i]) {
    374                             log_err("key \"%s\" has duplicate character '%c' in locale \"%s\"\n",
    375                                     subBundleKey,
    376                                     (char) string[i],
    377                                     locale);
    378                         }
    379                     }
    380                 }
    381             }
    382             /* No fallback was done. Check for duplicate data */
    383             /* The ures_* API does not do fallback of sub-resource bundles,
    384                So we can't do this now. */
    385 #if 0
    386             else if (strcmp(locale, "root") != 0 && errorCode == U_ZERO_ERROR) {
    387 
    388                 const UChar *rootString = ures_getString(subRootBundle, &len, &errorCode);
    389                 if (U_FAILURE(errorCode) || rootString == NULL) {
    390                     log_err("Can't open a string with key \"%s\" in \"%s\" in root\n",
    391                             ures_getKey(subRootBundle),
    392                             ures_getKey(currentBundle));
    393                     continue;
    394                 } else if (u_strcmp(string, rootString) == 0) {
    395                     if (strcmp(locale, "de_CH") != 0 && strcmp(subBundleKey, "Countries") != 0 &&
    396                         strcmp(subBundleKey, "Version") != 0) {
    397                         log_err("Found duplicate data with key \"%s\" in \"%s\" in locale \"%s\"\n",
    398                                 ures_getKey(subRootBundle),
    399                                 ures_getKey(currentBundle),
    400                                 locale);
    401                     }
    402                     else {
    403                         /* Ignore for now. */
    404                         /* Can be fixed if fallback through de locale was done. */
    405                         log_verbose("Skipping key %s in %s\n", subBundleKey, locale);
    406                     }
    407                 }
    408             }
    409 #endif
    410         }
    411         else if (ures_getType(subBundle) == URES_TABLE) {
    412             if (strcmp(subBundleKey, "availableFormats")!=0) {
    413                 /* Here is one of the recursive parts */
    414                 TestKeyInRootRecursive(subRootBundle, rootName, subBundle, locale);
    415             }
    416             else {
    417                 log_verbose("Skipping key %s in %s\n", subBundleKey, locale);
    418             }
    419         }
    420         else if (ures_getType(subBundle) == URES_BINARY || ures_getType(subBundle) == URES_INT) {
    421             /* Can't do anything to check it */
    422             /* We'll assume it's all correct */
    423             if (strcmp(subBundleKey, "MeasurementSystem") != 0) {
    424                 log_verbose("Skipping key \"%s\" in \"%s\" for locale \"%s\"\n",
    425                         subBundleKey,
    426                         ures_getKey(currentBundle),
    427                         locale);
    428             }
    429             /* Testing for MeasurementSystem is done in VerifyTranslation */
    430         }
    431         else {
    432             log_err("Type %d for key \"%s\" in \"%s\" is unknown for locale \"%s\"\n",
    433                     ures_getType(subBundle),
    434                     subBundleKey,
    435                     ures_getKey(currentBundle),
    436                     locale);
    437         }
    438         ures_close(subRootBundle);
    439         ures_close(subBundle);
    440     }
    441 }
    442 
    443 
    444 static void
    445 testLCID(UResourceBundle *currentBundle,
    446          const char *localeName)
    447 {
    448     UErrorCode status = U_ZERO_ERROR;
    449     uint32_t expectedLCID;
    450     char lcidStringC[64] = {0};
    451 
    452     expectedLCID = uloc_getLCID(localeName);
    453     if (expectedLCID == 0) {
    454         log_verbose("INFO:    %-5s does not have any LCID mapping\n",
    455             localeName);
    456         return;
    457     }
    458 
    459     status = U_ZERO_ERROR;
    460     uprv_strcpy(lcidStringC, uprv_convertToPosix(expectedLCID, &status));
    461     if (U_FAILURE(status)) {
    462         log_err("ERROR:   %.4x does not have a POSIX mapping due to %s\n",
    463             expectedLCID, u_errorName(status));
    464     }
    465 
    466     if(strcmp(localeName, lcidStringC) != 0) {
    467         char langName[1024];
    468         char langLCID[1024];
    469         uloc_getLanguage(localeName, langName, sizeof(langName), &status);
    470         uloc_getLanguage(lcidStringC, langLCID, sizeof(langLCID), &status);
    471 
    472         if (strcmp(langName, langLCID) == 0) {
    473             log_verbose("WARNING: %-5s resolves to %s (0x%.4x)\n",
    474                 localeName, lcidStringC, expectedLCID);
    475         }
    476         else {
    477             log_err("ERROR:   %-5s has 0x%.4x and the number resolves wrongfully to %s\n",
    478                 localeName, expectedLCID, lcidStringC);
    479         }
    480     }
    481 }
    482 
    483 static void
    484 TestLocaleStructure(void) {
    485     UResourceBundle *root, *currentLocale;
    486     int32_t locCount = uloc_countAvailable();
    487     int32_t locIndex;
    488     UErrorCode errorCode = U_ZERO_ERROR;
    489     const char *currLoc, *resolvedLoc;
    490 
    491     /* TODO: Compare against parent's data too. This code can't handle fallbacks that some tools do already. */
    492 /*    char locName[ULOC_FULLNAME_CAPACITY];
    493     char *locNamePtr;
    494 
    495     for (locIndex = 0; locIndex < locCount; locIndex++) {
    496         errorCode=U_ZERO_ERROR;
    497         strcpy(locName, uloc_getAvailable(locIndex));
    498         locNamePtr = strrchr(locName, '_');
    499         if (locNamePtr) {
    500             *locNamePtr = 0;
    501         }
    502         else {
    503             strcpy(locName, "root");
    504         }
    505 
    506         root = ures_openDirect(NULL, locName, &errorCode);
    507         if(U_FAILURE(errorCode)) {
    508             log_err("Can't open %s\n", locName);
    509             continue;
    510         }
    511 */
    512     if (locCount <= 1) {
    513         log_data_err("At least root needs to be installed\n");
    514     }
    515 
    516     root = ures_openDirect(loadTestData(&errorCode), "structLocale", &errorCode);
    517     if(U_FAILURE(errorCode)) {
    518         log_data_err("Can't open structLocale\n");
    519         return;
    520     }
    521     for (locIndex = 0; locIndex < locCount; locIndex++) {
    522         errorCode=U_ZERO_ERROR;
    523         currLoc = uloc_getAvailable(locIndex);
    524         currentLocale = ures_open(NULL, currLoc, &errorCode);
    525         if(errorCode != U_ZERO_ERROR) {
    526             if(U_SUCCESS(errorCode)) {
    527                 /* It's installed, but there is no data.
    528                    It's installed for the g18n white paper [grhoten] */
    529                 log_err("ERROR: Locale %-5s not installed, and it should be, err %s\n",
    530                     uloc_getAvailable(locIndex), u_errorName(errorCode));
    531             } else {
    532                 log_err("%%%%%%% Unexpected error %d in %s %%%%%%%",
    533                     u_errorName(errorCode),
    534                     uloc_getAvailable(locIndex));
    535             }
    536             ures_close(currentLocale);
    537             continue;
    538         }
    539         ures_getStringByKey(currentLocale, "Version", NULL, &errorCode);
    540         if(errorCode != U_ZERO_ERROR) {
    541             log_err("No version information is available for locale %s, and it should be!\n",
    542                 currLoc);
    543         }
    544         else if (ures_getStringByKey(currentLocale, "Version", NULL, &errorCode)[0] == (UChar)(0x78)) {
    545             log_verbose("WARNING: The locale %s is experimental! It shouldn't be listed as an installed locale.\n",
    546                 currLoc);
    547         }
    548         resolvedLoc = ures_getLocaleByType(currentLocale, ULOC_ACTUAL_LOCALE, &errorCode);
    549         if (strcmp(resolvedLoc, currLoc) != 0) {
    550             /* All locales have at least a Version resource.
    551                If it's absolutely empty, then the previous test will fail too.*/
    552             log_err("Locale resolves to different locale. Is %s an alias of %s?\n",
    553                 currLoc, resolvedLoc);
    554         }
    555         TestKeyInRootRecursive(root, "root", currentLocale, currLoc);
    556 
    557         testLCID(currentLocale, currLoc);
    558 
    559         ures_close(currentLocale);
    560     }
    561 
    562     ures_close(root);
    563 }
    564 
    565 static void
    566 compareArrays(const char *keyName,
    567               UResourceBundle *fromArray, const char *fromLocale,
    568               UResourceBundle *toArray, const char *toLocale,
    569               int32_t start, int32_t end)
    570 {
    571     int32_t fromSize = ures_getSize(fromArray);
    572     int32_t toSize = ures_getSize(fromArray);
    573     int32_t idx;
    574     UErrorCode errorCode = U_ZERO_ERROR;
    575 
    576     if (fromSize > toSize) {
    577         fromSize = toSize;
    578         log_err("Arrays are different size from \"%s\" to \"%s\"\n",
    579                 fromLocale,
    580                 toLocale);
    581     }
    582 
    583     for (idx = start; idx <= end; idx++) {
    584         const UChar *fromBundleStr = ures_getStringByIndex(fromArray, idx, NULL, &errorCode);
    585         const UChar *toBundleStr = ures_getStringByIndex(toArray, idx, NULL, &errorCode);
    586         if (fromBundleStr && toBundleStr && u_strcmp(fromBundleStr, toBundleStr) != 0)
    587         {
    588             log_err("Difference for %s at index %d from %s= \"%s\" to %s= \"%s\"\n",
    589                     keyName,
    590                     idx,
    591                     fromLocale,
    592                     austrdup(fromBundleStr),
    593                     toLocale,
    594                     austrdup(toBundleStr));
    595         }
    596     }
    597 }
    598 
    599 static void
    600 compareConsistentCountryInfo(const char *fromLocale, const char *toLocale) {
    601     UErrorCode errorCode = U_ZERO_ERROR;
    602     UResourceBundle *fromDateTimeElements, *toDateTimeElements, *fromWeekendData = NULL, *toWeekendData = NULL;
    603     UResourceBundle *fromArray, *toArray;
    604     UResourceBundle *fromLocaleBund = ures_open(NULL, fromLocale, &errorCode);
    605     UResourceBundle *toLocaleBund = ures_open(NULL, toLocale, &errorCode);
    606     UResourceBundle *toCalendar, *fromCalendar, *toGregorian, *fromGregorian;
    607 
    608     if(U_FAILURE(errorCode)) {
    609         log_err("Can't open resource bundle %s or %s - %s\n", fromLocale, toLocale, u_errorName(errorCode));
    610         return;
    611     }
    612     fromCalendar = ures_getByKey(fromLocaleBund, "calendar", NULL, &errorCode);
    613     fromGregorian = ures_getByKeyWithFallback(fromCalendar, "gregorian", NULL, &errorCode);
    614     fromDateTimeElements = ures_getByKeyWithFallback(fromGregorian, "DateTimeElements", NULL, &errorCode);
    615 
    616     toCalendar = ures_getByKey(toLocaleBund, "calendar", NULL, &errorCode);
    617     toGregorian = ures_getByKeyWithFallback(toCalendar, "gregorian", NULL, &errorCode);
    618     toDateTimeElements = ures_getByKeyWithFallback(toGregorian, "DateTimeElements", NULL, &errorCode);
    619 
    620     if(U_FAILURE(errorCode)){
    621         log_err("Did not get DateTimeElements from the bundle %s or %s\n", fromLocale, toLocale);
    622         goto cleanup;
    623     }
    624 
    625     fromWeekendData = ures_getByKeyWithFallback(fromGregorian, "weekend", NULL, &errorCode);
    626     if(U_FAILURE(errorCode)){
    627         log_err("Did not get weekend data from the bundle %s to compare against %s\n", fromLocale, toLocale);
    628         goto cleanup;
    629     }
    630     toWeekendData = ures_getByKeyWithFallback(toGregorian, "weekend", NULL, &errorCode);
    631     if(U_FAILURE(errorCode)){
    632         log_err("Did not get weekend data from the bundle %s to compare against %s\n", toLocale, fromLocale);
    633         goto cleanup;
    634     }
    635 
    636     if (strcmp(fromLocale, "ar_IN") != 0)
    637     {
    638         int32_t fromSize;
    639         int32_t toSize;
    640         int32_t idx;
    641         const int32_t *fromBundleArr = ures_getIntVector(fromDateTimeElements, &fromSize, &errorCode);
    642         const int32_t *toBundleArr = ures_getIntVector(toDateTimeElements, &toSize, &errorCode);
    643 
    644         if (fromSize > toSize) {
    645             fromSize = toSize;
    646             log_err("Arrays are different size with key \"DateTimeElements\" from \"%s\" to \"%s\"\n",
    647                     fromLocale,
    648                     toLocale);
    649         }
    650 
    651         for (idx = 0; idx < fromSize; idx++) {
    652             if (fromBundleArr[idx] != toBundleArr[idx]) {
    653                 log_err("Difference with key \"DateTimeElements\" at index %d from \"%s\" to \"%s\"\n",
    654                         idx,
    655                         fromLocale,
    656                         toLocale);
    657             }
    658         }
    659     }
    660 
    661     /* test for weekend data */
    662     {
    663         int32_t fromSize;
    664         int32_t toSize;
    665         int32_t idx;
    666         const int32_t *fromBundleArr = ures_getIntVector(fromWeekendData, &fromSize, &errorCode);
    667         const int32_t *toBundleArr = ures_getIntVector(toWeekendData, &toSize, &errorCode);
    668 
    669         if (fromSize > toSize) {
    670             fromSize = toSize;
    671             log_err("Arrays are different size with key \"weekend\" data from \"%s\" to \"%s\"\n",
    672                     fromLocale,
    673                     toLocale);
    674         }
    675 
    676         for (idx = 0; idx < fromSize; idx++) {
    677             if (fromBundleArr[idx] != toBundleArr[idx]) {
    678                 log_err("Difference with key \"weekend\" data at index %d from \"%s\" to \"%s\"\n",
    679                         idx,
    680                         fromLocale,
    681                         toLocale);
    682             }
    683         }
    684     }
    685 
    686     fromArray = ures_getByKey(fromLocaleBund, "CurrencyElements", NULL, &errorCode);
    687     toArray = ures_getByKey(toLocaleBund, "CurrencyElements", NULL, &errorCode);
    688     if (strcmp(fromLocale, "en_CA") != 0)
    689     {
    690         /* The first one is probably localized. */
    691         compareArrays("CurrencyElements", fromArray, fromLocale, toArray, toLocale, 1, 2);
    692     }
    693     ures_close(fromArray);
    694     ures_close(toArray);
    695 
    696     fromArray = ures_getByKey(fromLocaleBund, "NumberPatterns", NULL, &errorCode);
    697     toArray = ures_getByKey(toLocaleBund, "NumberPatterns", NULL, &errorCode);
    698     if (strcmp(fromLocale, "en_CA") != 0)
    699     {
    700         compareArrays("NumberPatterns", fromArray, fromLocale, toArray, toLocale, 0, 3);
    701     }
    702     ures_close(fromArray);
    703     ures_close(toArray);
    704 
    705     /* Difficult to test properly */
    706 /*
    707     fromArray = ures_getByKey(fromLocaleBund, "DateTimePatterns", NULL, &errorCode);
    708     toArray = ures_getByKey(toLocaleBund, "DateTimePatterns", NULL, &errorCode);
    709     {
    710         compareArrays("DateTimePatterns", fromArray, fromLocale, toArray, toLocale);
    711     }
    712     ures_close(fromArray);
    713     ures_close(toArray);*/
    714 
    715     fromArray = ures_getByKey(fromLocaleBund, "NumberElements", NULL, &errorCode);
    716     toArray = ures_getByKey(toLocaleBund, "NumberElements", NULL, &errorCode);
    717     if (strcmp(fromLocale, "en_CA") != 0)
    718     {
    719         compareArrays("NumberElements", fromArray, fromLocale, toArray, toLocale, 0, 3);
    720         /* Index 4 is a script based 0 */
    721         compareArrays("NumberElements", fromArray, fromLocale, toArray, toLocale, 5, 10);
    722     }
    723     ures_close(fromArray);
    724     ures_close(toArray);
    725 
    726 cleanup:
    727     ures_close(fromDateTimeElements);
    728     ures_close(toDateTimeElements);
    729     ures_close(fromWeekendData);
    730     ures_close(toWeekendData);
    731 
    732     ures_close(fromCalendar);
    733     ures_close(toCalendar);
    734     ures_close(fromGregorian);
    735     ures_close(toGregorian);
    736 
    737     ures_close(fromLocaleBund);
    738     ures_close(toLocaleBund);
    739 }
    740 
    741 static void
    742 TestConsistentCountryInfo(void) {
    743 /*    UResourceBundle *fromLocale, *toLocale;*/
    744     int32_t locCount = uloc_countAvailable();
    745     int32_t fromLocIndex, toLocIndex;
    746 
    747     int32_t fromCountryLen, toCountryLen;
    748     char fromCountry[ULOC_FULLNAME_CAPACITY], toCountry[ULOC_FULLNAME_CAPACITY];
    749 
    750     int32_t fromVariantLen, toVariantLen;
    751     char fromVariant[ULOC_FULLNAME_CAPACITY], toVariant[ULOC_FULLNAME_CAPACITY];
    752 
    753     UErrorCode errorCode = U_ZERO_ERROR;
    754 
    755     for (fromLocIndex = 0; fromLocIndex < locCount; fromLocIndex++) {
    756         const char *fromLocale = uloc_getAvailable(fromLocIndex);
    757 
    758         errorCode=U_ZERO_ERROR;
    759         fromCountryLen = uloc_getCountry(fromLocale, fromCountry, ULOC_FULLNAME_CAPACITY, &errorCode);
    760         if (fromCountryLen <= 0) {
    761             /* Ignore countryless locales */
    762             continue;
    763         }
    764         fromVariantLen = uloc_getVariant(fromLocale, fromVariant, ULOC_FULLNAME_CAPACITY, &errorCode);
    765         if (fromVariantLen > 0) {
    766             /* Most variants are ignorable like PREEURO, or collation variants. */
    767             continue;
    768         }
    769         /* Start comparing only after the current index.
    770            Previous loop should have already compared fromLocIndex.
    771         */
    772         for (toLocIndex = fromLocIndex + 1; toLocIndex < locCount; toLocIndex++) {
    773             const char *toLocale = uloc_getAvailable(toLocIndex);
    774 
    775             toCountryLen = uloc_getCountry(toLocale, toCountry, ULOC_FULLNAME_CAPACITY, &errorCode);
    776             if(U_FAILURE(errorCode)) {
    777                 log_err("Unknown failure fromLocale=%s toLocale=%s errorCode=%s\n",
    778                     fromLocale, toLocale, u_errorName(errorCode));
    779                 continue;
    780             }
    781 
    782             if (toCountryLen <= 0) {
    783                 /* Ignore countryless locales */
    784                 continue;
    785             }
    786             toVariantLen = uloc_getVariant(toLocale, toVariant, ULOC_FULLNAME_CAPACITY, &errorCode);
    787             if (toVariantLen > 0) {
    788                 /* Most variants are ignorable like PREEURO, or collation variants. */
    789                 /* They're a variant for a reason. */
    790                 continue;
    791             }
    792             if (strcmp(fromCountry, toCountry) == 0) {
    793                 log_verbose("comparing fromLocale=%s toLocale=%s\n",
    794                     fromLocale, toLocale);
    795                 compareConsistentCountryInfo(fromLocale, toLocale);
    796             }
    797         }
    798     }
    799 }
    800 
    801 static int32_t
    802 findStringSetMismatch(const char *currLoc, const UChar *string, int32_t langSize,
    803                       const UChar *exemplarCharacters, int32_t exemplarLen,
    804                       UBool ignoreNumbers, UChar* badCharPtr) {
    805     UErrorCode errorCode = U_ZERO_ERROR;
    806     USet *origSet = uset_openPatternOptions(exemplarCharacters, exemplarLen, USET_CASE_INSENSITIVE, &errorCode);
    807     USet *exemplarSet = createFlattenSet(origSet, &errorCode);
    808     int32_t strIdx;
    809     uset_close(origSet);
    810     if (U_FAILURE(errorCode)) {
    811         log_err("%s: error uset_openPattern returned %s\n", currLoc, u_errorName(errorCode));
    812         return -1;
    813     }
    814 
    815     for (strIdx = 0; strIdx < langSize; strIdx++) {
    816         if (!uset_contains(exemplarSet, string[strIdx])
    817             && string[strIdx] != 0x0020 && string[strIdx] != 0x00A0 && string[strIdx] != 0x002e && string[strIdx] != 0x002c && string[strIdx] != 0x002d && string[strIdx] != 0x0027 && string[strIdx] != 0x2019 && string[strIdx] != 0x0f0b
    818             && string[strIdx] != 0x200C && string[strIdx] != 0x200D) {
    819             if (!ignoreNumbers || (ignoreNumbers && (string[strIdx] < 0x30 || string[strIdx] > 0x39))) {
    820                 uset_close(exemplarSet);
    821                 if (badCharPtr) {
    822                     *badCharPtr = string[strIdx];
    823                 }
    824                 return strIdx;
    825             }
    826         }
    827     }
    828     uset_close(exemplarSet);
    829     if (badCharPtr) {
    830         *badCharPtr = 0;
    831     }
    832     return -1;
    833 }
    834 /* include non-invariant chars */
    835 static int32_t
    836 myUCharsToChars(const UChar* us, char* cs, int32_t len){
    837     int32_t i=0;
    838     for(; i< len; i++){
    839         if(us[i] < 0x7f){
    840             cs[i] = (char)us[i];
    841         }else{
    842             return -1;
    843         }
    844     }
    845     return i;
    846 }
    847 static void
    848 findSetMatch( UScriptCode *scriptCodes, int32_t scriptsLen,
    849               USet *exemplarSet,
    850               const char  *locale){
    851     USet *scripts[10]= {0};
    852     char pattern[256] = { '[', ':', 0x000 };
    853     int32_t patternLen;
    854     UChar uPattern[256] = {0};
    855     UErrorCode status = U_ZERO_ERROR;
    856     int32_t i;
    857 
    858     /* create the sets with script codes */
    859     for(i = 0; i<scriptsLen; i++){
    860         strcat(pattern, uscript_getShortName(scriptCodes[i]));
    861         strcat(pattern, ":]");
    862         patternLen = (int32_t)strlen(pattern);
    863         u_charsToUChars(pattern, uPattern, patternLen);
    864         scripts[i] = uset_openPattern(uPattern, patternLen, &status);
    865         if(U_FAILURE(status)){
    866             log_err("Could not create set for pattern %s. Error: %s\n", pattern, u_errorName(status));
    867             return;
    868         }
    869         pattern[2] = 0;
    870     }
    871     if (strcmp(locale, "uk") == 0 || strcmp(locale, "uk_UA") == 0) {
    872         /* Special addition. Add the modifying apostrophe, which isn't in Cyrillic. */
    873         uset_add(scripts[0], 0x2bc);
    874     }
    875     if(U_SUCCESS(status)){
    876         UBool existsInScript = FALSE;
    877         /* iterate over the exemplarSet and ascertain if all
    878          * UChars in exemplarSet belong to the scripts returned
    879          * by getScript
    880          */
    881         int32_t count = uset_getItemCount(exemplarSet);
    882 
    883         for( i=0; i < count; i++){
    884             UChar32 start = 0;
    885             UChar32 end = 0;
    886             UChar *str = NULL;
    887             int32_t strCapacity = 0;
    888 
    889             strCapacity = uset_getItem(exemplarSet, i, &start, &end, str, strCapacity, &status);
    890             if(U_SUCCESS(status)){
    891                 int32_t j;
    892                 if(strCapacity == 0){
    893                     /* ok the item is a range */
    894                      for( j = 0; j < scriptsLen; j++){
    895                         if(uset_containsRange(scripts[j], start, end) == TRUE){
    896                             existsInScript = TRUE;
    897                         }
    898                     }
    899                     if(existsInScript == FALSE){
    900                         for( j = 0; j < scriptsLen; j++){
    901                             UChar toPattern[500]={'\0'};
    902                             char pat[500]={'\0'};
    903                             int32_t len = uset_toPattern(scripts[j], toPattern, 500, TRUE, &status);
    904                             len = myUCharsToChars(toPattern, pat, len);
    905                             log_err("uset_indexOf(\\u%04X)=%i uset_indexOf(\\u%04X)=%i\n", start, uset_indexOf(scripts[0], start), end, uset_indexOf(scripts[0], end));
    906                             if(len!=-1){
    907                                 log_err("Pattern: %s\n",pat);
    908                             }
    909                         }
    910                         log_err("ExemplarCharacters and LocaleScript containment test failed for locale %s. \n", locale);
    911                     }
    912                 }else{
    913                     strCapacity++; /* increment for NUL termination */
    914                     /* allocate the str and call the api again */
    915                     str = (UChar*) malloc(U_SIZEOF_UCHAR * strCapacity);
    916                     strCapacity =  uset_getItem(exemplarSet, i, &start, &end, str, strCapacity, &status);
    917                     /* iterate over the scripts and figure out if the string contained is actually
    918                      * in the script set
    919                      */
    920                     for( j = 0; j < scriptsLen; j++){
    921                         if(uset_containsString(scripts[j],str, strCapacity) == TRUE){
    922                             existsInScript = TRUE;
    923                         }
    924                     }
    925                     if(existsInScript == FALSE){
    926                         log_err("ExemplarCharacters and LocaleScript containment test failed for locale %s. \n", locale);
    927                     }
    928                 }
    929             }
    930         }
    931 
    932     }
    933 
    934     /* close the sets */
    935     for(i = 0; i<scriptsLen; i++){
    936         uset_close(scripts[i]);
    937     }
    938 }
    939 
    940 static void VerifyTranslation(void) {
    941     static const UVersionInfo icu47 = { 4, 7, 0, 0 };
    942     UResourceBundle *root, *currentLocale;
    943     int32_t locCount = uloc_countAvailable();
    944     int32_t locIndex;
    945     UErrorCode errorCode = U_ZERO_ERROR;
    946     int32_t exemplarLen;
    947     const UChar *exemplarCharacters;
    948     const char *currLoc;
    949     UScriptCode scripts[USCRIPT_CODE_LIMIT];
    950     int32_t numScripts;
    951     int32_t idx;
    952     int32_t end;
    953     UResourceBundle *resArray;
    954 
    955     if (locCount <= 1) {
    956         log_data_err("At least root needs to be installed\n");
    957     }
    958 
    959     root = ures_openDirect(NULL, "root", &errorCode);
    960     if(U_FAILURE(errorCode)) {
    961         log_data_err("Can't open root\n");
    962         return;
    963     }
    964     for (locIndex = 0; locIndex < locCount; locIndex++) {
    965         errorCode=U_ZERO_ERROR;
    966         currLoc = uloc_getAvailable(locIndex);
    967         currentLocale = ures_open(NULL, currLoc, &errorCode);
    968         if(errorCode != U_ZERO_ERROR) {
    969             if(U_SUCCESS(errorCode)) {
    970                 /* It's installed, but there is no data.
    971                    It's installed for the g18n white paper [grhoten] */
    972                 log_err("ERROR: Locale %-5s not installed, and it should be!\n",
    973                     uloc_getAvailable(locIndex));
    974             } else {
    975                 log_err("%%%%%%% Unexpected error %d in %s %%%%%%%",
    976                     u_errorName(errorCode),
    977                     uloc_getAvailable(locIndex));
    978             }
    979             ures_close(currentLocale);
    980             continue;
    981         }
    982         exemplarCharacters = ures_getStringByKey(currentLocale, "ExemplarCharacters", &exemplarLen, &errorCode);
    983         if (U_FAILURE(errorCode)) {
    984             log_err("error ures_getStringByKey returned %s\n", u_errorName(errorCode));
    985         }
    986         else if (getTestOption(QUICK_OPTION) && exemplarLen > 2048) {
    987             log_verbose("skipping test for %s\n", currLoc);
    988         }
    989         else if (uprv_strncmp(currLoc,"bem",3) == 0) {
    990             log_verbose("skipping test for %s, some month and country names known to use aux exemplars\n", currLoc);
    991         }
    992         else {
    993             UChar langBuffer[128];
    994             int32_t langSize;
    995             int32_t strIdx;
    996             UChar badChar;
    997             langSize = uloc_getDisplayLanguage(currLoc, currLoc, langBuffer, sizeof(langBuffer)/sizeof(langBuffer[0]), &errorCode);
    998             if (U_FAILURE(errorCode)) {
    999                 log_err("error uloc_getDisplayLanguage returned %s\n", u_errorName(errorCode));
   1000             }
   1001             else {
   1002                 strIdx = findStringSetMismatch(currLoc, langBuffer, langSize, exemplarCharacters, exemplarLen, FALSE, &badChar);
   1003                 if (strIdx >= 0) {
   1004                     log_err("getDisplayLanguage(%s) at index %d returned characters not in the exemplar characters: %04X.\n",
   1005                         currLoc, strIdx, badChar);
   1006                 }
   1007             }
   1008             langSize = uloc_getDisplayCountry(currLoc, currLoc, langBuffer, sizeof(langBuffer)/sizeof(langBuffer[0]), &errorCode);
   1009             if (U_FAILURE(errorCode)) {
   1010                 log_err("error uloc_getDisplayCountry returned %s\n", u_errorName(errorCode));
   1011             }
   1012             else if (uprv_strstr(currLoc, "ti_") != currLoc || isICUVersionAtLeast(icu47)) { /* TODO: restore DisplayCountry test for ti_* when cldrbug 3058 is fixed) */
   1013               strIdx = findStringSetMismatch(currLoc, langBuffer, langSize, exemplarCharacters, exemplarLen, FALSE, &badChar);
   1014                 if (strIdx >= 0) {
   1015                     log_err("getDisplayCountry(%s) at index %d returned characters not in the exemplar characters: %04X.\n",
   1016                         currLoc, strIdx, badChar);
   1017                 }
   1018             }
   1019             {
   1020                 UResourceBundle* cal = ures_getByKey(currentLocale, "calendar", NULL, &errorCode);
   1021                 UResourceBundle* greg = ures_getByKeyWithFallback(cal, "gregorian", NULL, &errorCode);
   1022                 UResourceBundle* names = ures_getByKeyWithFallback(greg,  "dayNames", NULL, &errorCode);
   1023                 UResourceBundle* format = ures_getByKeyWithFallback(names,  "format", NULL, &errorCode);
   1024                 resArray = ures_getByKeyWithFallback(format,  "wide", NULL, &errorCode);
   1025 
   1026                 if (U_FAILURE(errorCode)) {
   1027                     log_err("error ures_getByKey returned %s\n", u_errorName(errorCode));
   1028                 }
   1029                 if (getTestOption(QUICK_OPTION)) {
   1030                     end = 1;
   1031                 }
   1032                 else {
   1033                     end = ures_getSize(resArray);
   1034                 }
   1035 
   1036 
   1037                 for (idx = 0; idx < end; idx++) {
   1038                     const UChar *fromBundleStr = ures_getStringByIndex(resArray, idx, &langSize, &errorCode);
   1039                     if (U_FAILURE(errorCode)) {
   1040                         log_err("error ures_getStringByIndex(%d) returned %s\n", idx, u_errorName(errorCode));
   1041                         continue;
   1042                     }
   1043                     strIdx = findStringSetMismatch(currLoc, fromBundleStr, langSize, exemplarCharacters, exemplarLen, TRUE, &badChar);
   1044                     if (strIdx >= 0) {
   1045                         log_err("getDayNames(%s, %d) at index %d returned characters not in the exemplar characters: %04X.\n",
   1046                             currLoc, idx, strIdx, badChar);
   1047                     }
   1048                 }
   1049                 ures_close(resArray);
   1050                 ures_close(format);
   1051                 ures_close(names);
   1052 
   1053                 names = ures_getByKeyWithFallback(greg, "monthNames", NULL, &errorCode);
   1054                 format = ures_getByKeyWithFallback(names,"format", NULL, &errorCode);
   1055                 resArray = ures_getByKeyWithFallback(format, "wide", NULL, &errorCode);
   1056                 if (U_FAILURE(errorCode)) {
   1057                     log_err("error ures_getByKey returned %s\n", u_errorName(errorCode));
   1058                 }
   1059                 if (getTestOption(QUICK_OPTION)) {
   1060                     end = 1;
   1061                 }
   1062                 else {
   1063                     end = ures_getSize(resArray);
   1064                 }
   1065 
   1066                 for (idx = 0; idx < end; idx++) {
   1067                     const UChar *fromBundleStr = ures_getStringByIndex(resArray, idx, &langSize, &errorCode);
   1068                     if (U_FAILURE(errorCode)) {
   1069                         log_err("error ures_getStringByIndex(%d) returned %s\n", idx, u_errorName(errorCode));
   1070                         continue;
   1071                     }
   1072                     strIdx = findStringSetMismatch(currLoc, fromBundleStr, langSize, exemplarCharacters, exemplarLen, TRUE, &badChar);
   1073                     if (strIdx >= 0) {
   1074                         log_err("getMonthNames(%s, %d) at index %d returned characters not in the exemplar characters: %04X.\n",
   1075                             currLoc, idx, strIdx, badChar);
   1076                     }
   1077                 }
   1078                 ures_close(resArray);
   1079                 ures_close(format);
   1080                 ures_close(names);
   1081                 ures_close(greg);
   1082                 ures_close(cal);
   1083             }
   1084             errorCode = U_ZERO_ERROR;
   1085             numScripts = uscript_getCode(currLoc, scripts, sizeof(scripts)/sizeof(scripts[0]), &errorCode);
   1086             if (numScripts == 0) {
   1087                 log_err("uscript_getCode(%s) doesn't work.\n", currLoc);
   1088             }else if(scripts[0] == USCRIPT_COMMON){
   1089                 log_err("uscript_getCode(%s) returned USCRIPT_COMMON.\n", currLoc);
   1090             }
   1091 
   1092             /* test that the scripts are a superset of exemplar characters. */
   1093            {
   1094                 ULocaleData *uld = ulocdata_open(currLoc,&errorCode);
   1095                 USet *exemplarSet =  ulocdata_getExemplarSet(uld, NULL, 0, ULOCDATA_ES_STANDARD, &errorCode);
   1096                 /* test if exemplar characters are part of script code */
   1097                 findSetMatch(scripts, numScripts, exemplarSet, currLoc);
   1098                 uset_close(exemplarSet);
   1099                 ulocdata_close(uld);
   1100             }
   1101 
   1102            /* test that the paperSize API works */
   1103            {
   1104                int32_t height=0, width=0;
   1105                ulocdata_getPaperSize(currLoc, &height, &width, &errorCode);
   1106                if(U_FAILURE(errorCode)){
   1107                    log_err("ulocdata_getPaperSize failed for locale %s with error: %s \n", currLoc, u_errorName(errorCode));
   1108                }
   1109                if(strstr(currLoc, "_US")!=NULL && height != 279 && width != 216 ){
   1110                    log_err("ulocdata_getPaperSize did not return expected data for locale %s \n", currLoc);
   1111                }
   1112            }
   1113             /* test that the MeasurementSystem works API works */
   1114            {
   1115                UMeasurementSystem measurementSystem = ulocdata_getMeasurementSystem(currLoc, &errorCode);
   1116                if(U_FAILURE(errorCode)){
   1117                    log_err("ulocdata_getMeasurementSystem failed for locale %s with error: %s \n", currLoc, u_errorName(errorCode));
   1118                }
   1119                if(strstr(currLoc, "_US")!=NULL || strstr(currLoc, "_MM")!=NULL || strstr(currLoc, "_LR")!=NULL){
   1120                    if(measurementSystem != UMS_US){
   1121                         log_err("ulocdata_getMeasurementSystem did not return expected data for locale %s \n", currLoc);
   1122                    }
   1123                }else if(measurementSystem != UMS_SI){
   1124                    log_err("ulocdata_getMeasurementSystem did not return expected data for locale %s \n", currLoc);
   1125                }
   1126            }
   1127         }
   1128         ures_close(currentLocale);
   1129     }
   1130 
   1131     ures_close(root);
   1132 }
   1133 
   1134 /* adjust this limit as appropriate */
   1135 #define MAX_SCRIPTS_PER_LOCALE 8
   1136 
   1137 static void TestExemplarSet(void){
   1138     int32_t i, j, k, m, n;
   1139     int32_t equalCount = 0;
   1140     UErrorCode ec = U_ZERO_ERROR;
   1141     UEnumeration* avail;
   1142     USet* exemplarSets[2];
   1143     USet* unassignedSet;
   1144     UScriptCode code[MAX_SCRIPTS_PER_LOCALE];
   1145     USet* codeSets[MAX_SCRIPTS_PER_LOCALE];
   1146     int32_t codeLen;
   1147     char cbuf[32]; /* 9 should be enough */
   1148     UChar ubuf[64]; /* adjust as needed */
   1149     UBool existsInScript;
   1150     int32_t itemCount;
   1151     int32_t strLen;
   1152     UChar32 start, end;
   1153 
   1154     unassignedSet = NULL;
   1155     exemplarSets[0] = NULL;
   1156     exemplarSets[1] = NULL;
   1157     for (i=0; i<MAX_SCRIPTS_PER_LOCALE; ++i) {
   1158         codeSets[i] = NULL;
   1159     }
   1160 
   1161     avail = ures_openAvailableLocales(NULL, &ec);
   1162     if (!assertSuccess("ures_openAvailableLocales", &ec)) goto END;
   1163     n = uenum_count(avail, &ec);
   1164     if (!assertSuccess("uenum_count", &ec)) goto END;
   1165 
   1166     u_uastrcpy(ubuf, "[:unassigned:]");
   1167     unassignedSet = uset_openPattern(ubuf, -1, &ec);
   1168     if (!assertSuccess("uset_openPattern", &ec)) goto END;
   1169 
   1170     for(i=0; i<n; i++){
   1171         const char* locale = uenum_next(avail, NULL, &ec);
   1172         if (!assertSuccess("uenum_next", &ec)) goto END;
   1173         log_verbose("%s\n", locale);
   1174         for (k=0; k<2; ++k) {
   1175             uint32_t option = (k==0) ? 0 : USET_CASE_INSENSITIVE;
   1176             ULocaleData *uld = ulocdata_open(locale,&ec);
   1177             USet* exemplarSet = ulocdata_getExemplarSet(uld,NULL, option, ULOCDATA_ES_STANDARD, &ec);
   1178             uset_close(exemplarSets[k]);
   1179             ulocdata_close(uld);
   1180             exemplarSets[k] = exemplarSet;
   1181             if (!assertSuccess("ulocaledata_getExemplarSet", &ec)) goto END;
   1182 
   1183             if (uset_containsSome(exemplarSet, unassignedSet)) {
   1184                 log_err("ExemplarSet contains unassigned characters for locale : %s\n", locale);
   1185             }
   1186             codeLen = uscript_getCode(locale, code, 8, &ec);
   1187             if (!assertSuccess("uscript_getCode", &ec)) goto END;
   1188 
   1189             for (j=0; j<MAX_SCRIPTS_PER_LOCALE; ++j) {
   1190                 uset_close(codeSets[j]);
   1191                 codeSets[j] = NULL;
   1192             }
   1193             for (j=0; j<codeLen; ++j) {
   1194                 uprv_strcpy(cbuf, "[:");
   1195                 if(code[j]==-1){
   1196                     log_err("USCRIPT_INVALID_CODE returned for locale: %s\n", locale);
   1197                     continue;
   1198                 }
   1199                 uprv_strcat(cbuf, uscript_getShortName(code[j]));
   1200                 uprv_strcat(cbuf, ":]");
   1201                 u_uastrcpy(ubuf, cbuf);
   1202                 codeSets[j] = uset_openPattern(ubuf, -1, &ec);
   1203             }
   1204             if (!assertSuccess("uset_openPattern", &ec)) goto END;
   1205 
   1206             existsInScript = FALSE;
   1207             itemCount = uset_getItemCount(exemplarSet);
   1208             for (m=0; m<itemCount && !existsInScript; ++m) {
   1209                 strLen = uset_getItem(exemplarSet, m, &start, &end, ubuf,
   1210                                       sizeof(ubuf)/sizeof(ubuf[0]), &ec);
   1211                 /* failure here might mean str[] needs to be larger */
   1212                 if (!assertSuccess("uset_getItem", &ec)) goto END;
   1213                 if (strLen == 0) {
   1214                     for (j=0; j<codeLen; ++j) {
   1215                         if (codeSets[j]!=NULL && uset_containsRange(codeSets[j], start, end)) {
   1216                             existsInScript = TRUE;
   1217                             break;
   1218                         }
   1219                     }
   1220                 } else {
   1221                     for (j=0; j<codeLen; ++j) {
   1222                         if (codeSets[j]!=NULL && uset_containsString(codeSets[j], ubuf, strLen)) {
   1223                             existsInScript = TRUE;
   1224                             break;
   1225                         }
   1226                     }
   1227                 }
   1228             }
   1229 
   1230             if (existsInScript == FALSE){
   1231                 log_err("ExemplarSet containment failed for locale : %s\n", locale);
   1232             }
   1233         }
   1234         assertTrue("case-folded is a superset",
   1235                    uset_containsAll(exemplarSets[1], exemplarSets[0]));
   1236         if (uset_equals(exemplarSets[1], exemplarSets[0])) {
   1237             ++equalCount;
   1238         }
   1239     }
   1240     /* Note: The case-folded set should sometimes be a strict superset
   1241        and sometimes be equal. */
   1242     assertTrue("case-folded is sometimes a strict superset, and sometimes equal",
   1243                equalCount > 0 && equalCount < n);
   1244 
   1245  END:
   1246     uenum_close(avail);
   1247     uset_close(exemplarSets[0]);
   1248     uset_close(exemplarSets[1]);
   1249     uset_close(unassignedSet);
   1250     for (i=0; i<MAX_SCRIPTS_PER_LOCALE; ++i) {
   1251         uset_close(codeSets[i]);
   1252     }
   1253 }
   1254 
   1255 static void TestLocaleDisplayPattern(void){
   1256     UErrorCode status = U_ZERO_ERROR;
   1257     UChar pattern[32] = {0,};
   1258     UChar separator[32] = {0,};
   1259     ULocaleData *uld = ulocdata_open(uloc_getDefault(), &status);
   1260 
   1261     if(U_FAILURE(status)){
   1262         log_data_err("ulocdata_open error");
   1263         return;
   1264     }
   1265     ulocdata_getLocaleDisplayPattern(uld, pattern, 32, &status);
   1266     if (U_FAILURE(status)){
   1267         log_err("ulocdata_getLocaleDisplayPattern error!");
   1268     }
   1269     status = U_ZERO_ERROR;
   1270     ulocdata_getLocaleSeparator(uld, separator, 32, &status);
   1271     if (U_FAILURE(status)){
   1272         log_err("ulocdata_getLocaleSeparator error!");
   1273     }
   1274     ulocdata_close(uld);
   1275 }
   1276 
   1277 static void TestCoverage(void){
   1278     ULocaleDataDelimiterType types[] = {
   1279      ULOCDATA_QUOTATION_START,     /* Quotation start */
   1280      ULOCDATA_QUOTATION_END,       /* Quotation end */
   1281      ULOCDATA_ALT_QUOTATION_START, /* Alternate quotation start */
   1282      ULOCDATA_ALT_QUOTATION_END,   /* Alternate quotation end */
   1283      ULOCDATA_DELIMITER_COUNT
   1284     };
   1285     int i;
   1286     UBool sub;
   1287     UErrorCode status = U_ZERO_ERROR;
   1288     ULocaleData *uld = ulocdata_open(uloc_getDefault(), &status);
   1289 
   1290     if(U_FAILURE(status)){
   1291         log_data_err("ulocdata_open error");
   1292         return;
   1293     }
   1294 
   1295 
   1296     for(i = 0; i < ULOCDATA_DELIMITER_COUNT; i++){
   1297         UChar result[32] = {0,};
   1298         status = U_ZERO_ERROR;
   1299         ulocdata_getDelimiter(uld, types[i], result, 32, &status);
   1300         if (U_FAILURE(status)){
   1301             log_err("ulocdata_getgetDelimiter error with type %d", types[i]);
   1302         }
   1303     }
   1304 
   1305     sub = ulocdata_getNoSubstitute(uld);
   1306     ulocdata_setNoSubstitute(uld,sub);
   1307     ulocdata_close(uld);
   1308 }
   1309 
   1310 static void TestCurrencyList(void){
   1311 #if !UCONFIG_NO_FORMATTING
   1312     UErrorCode errorCode = U_ZERO_ERROR;
   1313     int32_t structLocaleCount, currencyCount;
   1314     UEnumeration *en = ucurr_openISOCurrencies(UCURR_ALL, &errorCode);
   1315     const char *isoCode, *structISOCode;
   1316     UResourceBundle *subBundle;
   1317     UResourceBundle *currencies = ures_openDirect(loadTestData(&errorCode), "structLocale", &errorCode);
   1318     if(U_FAILURE(errorCode)) {
   1319         log_data_err("Can't open structLocale\n");
   1320         return;
   1321     }
   1322     currencies = ures_getByKey(currencies, "Currencies", currencies, &errorCode);
   1323     currencyCount = uenum_count(en, &errorCode);
   1324     structLocaleCount = ures_getSize(currencies);
   1325     if (currencyCount != structLocaleCount) {
   1326         log_err("structLocale(%d) and ISO4217(%d) currency list are out of sync.\n", structLocaleCount, currencyCount);
   1327 #if U_CHARSET_FAMILY == U_ASCII_FAMILY
   1328         ures_resetIterator(currencies);
   1329         while ((isoCode = uenum_next(en, NULL, &errorCode)) != NULL && ures_hasNext(currencies)) {
   1330             subBundle = ures_getNextResource(currencies, NULL, &errorCode);
   1331             structISOCode = ures_getKey(subBundle);
   1332             ures_close(subBundle);
   1333             if (strcmp(structISOCode, isoCode) != 0) {
   1334                 log_err("First difference found at structLocale(%s) and ISO4217(%s).\n", structISOCode, isoCode);
   1335                 break;
   1336             }
   1337         }
   1338 #endif
   1339     }
   1340     ures_close(currencies);
   1341     uenum_close(en);
   1342 #endif
   1343 }
   1344 
   1345 #define TESTCASE(name) addTest(root, &name, "tsutil/cldrtest/" #name)
   1346 
   1347 void addCLDRTest(TestNode** root);
   1348 
   1349 void addCLDRTest(TestNode** root)
   1350 {
   1351 #if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
   1352     TESTCASE(TestLocaleStructure);
   1353     TESTCASE(TestCurrencyList);
   1354 #endif
   1355     TESTCASE(TestConsistentCountryInfo);
   1356     TESTCASE(VerifyTranslation);
   1357     TESTCASE(TestExemplarSet);
   1358     TESTCASE(TestLocaleDisplayPattern);
   1359     TESTCASE(TestCoverage);
   1360 }
   1361