1 /********************************************************************
2  * COPYRIGHT:
3  * Copyright (c) 1997-2015, International Business Machines Corporation and
4  * others. All Rights Reserved.
5  ********************************************************************/
6 
7 #include "cintltst.h"
8 #include "unicode/ures.h"
9 #include "unicode/ucurr.h"
10 #include "unicode/ustring.h"
11 #include "unicode/uset.h"
12 #include "unicode/udat.h"
13 #include "unicode/uscript.h"
14 #include "unicode/ulocdata.h"
15 #include "cstring.h"
16 #include "locmap.h"
17 #include "uresimp.h"
18 
19 /*
20 returns a new UnicodeSet that is a flattened form of the original
21 UnicodeSet.
22 */
23 static USet*
createFlattenSet(USet * origSet,UErrorCode * status)24 createFlattenSet(USet *origSet, UErrorCode *status) {
25 
26 
27     USet *newSet = NULL;
28     int32_t origItemCount = 0;
29     int32_t idx, graphmeSize;
30     UChar32 start, end;
31     UChar graphme[64];
32     if (U_FAILURE(*status)) {
33         log_err("createFlattenSet called with %s\n", u_errorName(*status));
34         return NULL;
35     }
36     newSet = uset_open(1, 0);
37     origItemCount = uset_getItemCount(origSet);
38     for (idx = 0; idx < origItemCount; idx++) {
39         graphmeSize = uset_getItem(origSet, idx,
40             &start, &end,
41             graphme, (int32_t)(sizeof(graphme)/sizeof(graphme[0])),
42             status);
43         if (U_FAILURE(*status)) {
44             log_err("ERROR: uset_getItem returned %s\n", u_errorName(*status));
45             *status = U_ZERO_ERROR;
46         }
47         if (graphmeSize) {
48             uset_addAllCodePoints(newSet, graphme, graphmeSize);
49         }
50         else {
51             uset_addRange(newSet, start, end);
52         }
53     }
54     uset_closeOver(newSet,USET_CASE_INSENSITIVE);
55     return newSet;
56 }
57 
58 static UBool
isCurrencyPreEuro(const char * currencyKey)59 isCurrencyPreEuro(const char* currencyKey){
60     if( strcmp(currencyKey, "PTE") == 0 ||
61         strcmp(currencyKey, "ESP") == 0 ||
62         strcmp(currencyKey, "LUF") == 0 ||
63         strcmp(currencyKey, "GRD") == 0 ||
64         strcmp(currencyKey, "BEF") == 0 ||
65         strcmp(currencyKey, "ITL") == 0 ||
66         strcmp(currencyKey, "EEK") == 0){
67             return TRUE;
68     }
69     return FALSE;
70 }
71 #if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
72 static void
TestKeyInRootRecursive(UResourceBundle * root,const char * rootName,UResourceBundle * currentBundle,const char * locale)73 TestKeyInRootRecursive(UResourceBundle *root, const char *rootName,
74                        UResourceBundle *currentBundle, const char *locale) {
75     UErrorCode errorCode = U_ZERO_ERROR;
76     UResourceBundle *subRootBundle = NULL, *subBundle = NULL, *arr = NULL;
77 
78     ures_resetIterator(root);
79     ures_resetIterator(currentBundle);
80     while (ures_hasNext(currentBundle)) {
81         const char *subBundleKey = NULL;
82         const char *currentBundleKey = NULL;
83 
84         errorCode = U_ZERO_ERROR;
85         currentBundleKey = ures_getKey(currentBundle);
86         (void)currentBundleKey;    /* Suppress set but not used warning. */
87         subBundle = ures_getNextResource(currentBundle, NULL, &errorCode);
88         if (U_FAILURE(errorCode)) {
89             log_err("Can't open a resource for lnocale %s. Error: %s\n", locale, u_errorName(errorCode));
90             continue;
91         }
92         subBundleKey = ures_getKey(subBundle);
93 
94 
95         subRootBundle = ures_getByKey(root, subBundleKey, NULL, &errorCode);
96         if (U_FAILURE(errorCode)) {
97             log_err("Can't open a resource with key \"%s\" in \"%s\" from %s for locale \"%s\"\n",
98                     subBundleKey,
99                     ures_getKey(currentBundle),
100                     rootName,
101                     locale);
102             ures_close(subBundle);
103             continue;
104         }
105         if (ures_getType(subRootBundle) != ures_getType(subBundle)) {
106             log_err("key \"%s\" in \"%s\" has a different type from root for locale \"%s\"\n"
107                     "\troot=%d, locale=%d\n",
108                     subBundleKey,
109                     ures_getKey(currentBundle),
110                     locale,
111                     ures_getType(subRootBundle),
112                     ures_getType(subBundle));
113             ures_close(subBundle);
114             continue;
115         }
116         else if (ures_getType(subBundle) == URES_INT_VECTOR) {
117             int32_t minSize;
118             int32_t subBundleSize;
119             int32_t idx;
120             UBool sameArray = TRUE;
121             const int32_t *subRootBundleArr = ures_getIntVector(subRootBundle, &minSize, &errorCode);
122             const int32_t *subBundleArr = ures_getIntVector(subBundle, &subBundleSize, &errorCode);
123 
124             if (minSize > subBundleSize) {
125                 minSize = subBundleSize;
126                 log_err("Arrays are different size with key \"%s\" in \"%s\" from root for locale \"%s\"\n",
127                         subBundleKey,
128                         ures_getKey(currentBundle),
129                         locale);
130             }
131 
132             for (idx = 0; idx < minSize && sameArray; idx++) {
133                 if (subRootBundleArr[idx] != subBundleArr[idx]) {
134                     sameArray = FALSE;
135                 }
136                 if (strcmp(subBundleKey, "DateTimeElements") == 0
137                     && (subBundleArr[idx] < 1 || 7 < subBundleArr[idx]))
138                 {
139                     log_err("Value out of range with key \"%s\" at index %d in \"%s\" for locale \"%s\"\n",
140                             subBundleKey,
141                             idx,
142                             ures_getKey(currentBundle),
143                             locale);
144                 }
145             }
146             /* Special exception es_US and DateTimeElements */
147             if (sameArray
148                 && !(strcmp(locale, "es_US") == 0 && strcmp(subBundleKey, "DateTimeElements") == 0))
149             {
150                 log_err("Integer vectors are the same with key \"%s\" in \"%s\" from root for locale \"%s\"\n",
151                         subBundleKey,
152                         ures_getKey(currentBundle),
153                         locale);
154             }
155         }
156         else if (ures_getType(subBundle) == URES_ARRAY) {
157             UResourceBundle *subSubBundle = ures_getByIndex(subBundle, 0, NULL, &errorCode);
158             UResourceBundle *subSubRootBundle = ures_getByIndex(subRootBundle, 0, NULL, &errorCode);
159 
160             if (U_SUCCESS(errorCode)
161                 && (ures_getType(subSubBundle) == URES_ARRAY || ures_getType(subSubRootBundle) == URES_ARRAY))
162             {
163                 /* Here is one of the recursive parts */
164                 TestKeyInRootRecursive(subRootBundle, rootName, subBundle, locale);
165             }
166             else {
167                 int32_t minSize = ures_getSize(subRootBundle);
168                 int32_t idx;
169                 UBool sameArray = TRUE;
170 
171                 if (minSize > ures_getSize(subBundle)) {
172                     minSize = ures_getSize(subBundle);
173                 }
174 
175                 if ((subBundleKey == NULL
176                     || (subBundleKey != NULL &&  strcmp(subBundleKey, "LocaleScript") != 0 && !isCurrencyPreEuro(subBundleKey)))
177                     && ures_getSize(subRootBundle) != ures_getSize(subBundle))
178                 {
179                     log_err("Different size array with key \"%s\" in \"%s\" from root for locale \"%s\"\n"
180                             "\troot array size=%d, locale array size=%d\n",
181                             subBundleKey,
182                             ures_getKey(currentBundle),
183                             locale,
184                             ures_getSize(subRootBundle),
185                             ures_getSize(subBundle));
186                 }
187                 /*
188                 if(isCurrencyPreEuro(subBundleKey) && ures_getSize(subBundle)!=3){
189                     log_err("Different size array with key \"%s\" in \"%s\" for locale \"%s\" the expected size is 3 got size=%d\n",
190                             subBundleKey,
191                             ures_getKey(currentBundle),
192                             locale,
193                             ures_getSize(subBundle));
194                 }
195                 */
196                 for (idx = 0; idx < minSize; idx++) {
197                     int32_t rootStrLen, localeStrLen;
198                     const UChar *rootStr = ures_getStringByIndex(subRootBundle,idx,&rootStrLen,&errorCode);
199                     const UChar *localeStr = ures_getStringByIndex(subBundle,idx,&localeStrLen,&errorCode);
200                     if (rootStr && localeStr && U_SUCCESS(errorCode)) {
201                         if (u_strcmp(rootStr, localeStr) != 0) {
202                             sameArray = FALSE;
203                         }
204                     }
205                     else {
206                         if ( rootStrLen > 1 && rootStr[0] == 0x41 && rootStr[1] >= 0x30 && rootStr[1] <= 0x39 ) {
207                            /* A2 or A4 in the root string indicates that the resource can optionally be an array instead of a */
208                            /* string.  Attempt to read it as an array. */
209                           errorCode = U_ZERO_ERROR;
210                           arr = ures_getByIndex(subBundle,idx,NULL,&errorCode);
211                           if (U_FAILURE(errorCode)) {
212                               log_err("Got a NULL string with key \"%s\" in \"%s\" at index %d for root or locale \"%s\"\n",
213                                       subBundleKey,
214                                       ures_getKey(currentBundle),
215                                       idx,
216                                       locale);
217                               continue;
218                           }
219                           if (ures_getType(arr) != URES_ARRAY || ures_getSize(arr) != (int32_t)rootStr[1] - 0x30) {
220                               log_err("Got something other than a string or array of size %d for key \"%s\" in \"%s\" at index %d for root or locale \"%s\"\n",
221                                       rootStr[1] - 0x30,
222                                       subBundleKey,
223                                       ures_getKey(currentBundle),
224                                       idx,
225                                       locale);
226                               ures_close(arr);
227                               continue;
228                           }
229                           localeStr = ures_getStringByIndex(arr,0,&localeStrLen,&errorCode);
230                           ures_close(arr);
231                           if (U_FAILURE(errorCode)) {
232                               log_err("Got something other than a string or array for key \"%s\" in \"%s\" at index %d for root or locale \"%s\"\n",
233                                       subBundleKey,
234                                       ures_getKey(currentBundle),
235                                       idx,
236                                       locale);
237                               continue;
238                           }
239                         } else {
240                             log_err("Got a NULL string with key \"%s\" in \"%s\" at index %d for root or locale \"%s\"\n",
241                                 subBundleKey,
242                                 ures_getKey(currentBundle),
243                                 idx,
244                                 locale);
245                             continue;
246                         }
247                     }
248                     if (localeStr[0] == (UChar)0x20) {
249                         log_err("key \"%s\" at index %d in \"%s\" starts with a space in locale \"%s\"\n",
250                                 subBundleKey,
251                                 idx,
252                                 ures_getKey(currentBundle),
253                                 locale);
254                     }
255                     else if ((localeStr[localeStrLen - 1] == (UChar)0x20) && (strcmp(subBundleKey,"separator") != 0)) {
256                         log_err("key \"%s\" at index %d in \"%s\" ends with a space in locale \"%s\"\n",
257                                 subBundleKey,
258                                 idx,
259                                 ures_getKey(currentBundle),
260                                 locale);
261                     }
262                     else if (subBundleKey != NULL
263                         && strcmp(subBundleKey, "DateTimePatterns") == 0)
264                     {
265                         int32_t quoted = 0;
266                         const UChar *localeStrItr = localeStr;
267                         while (*localeStrItr) {
268                             if (*localeStrItr == (UChar)0x27 /* ' */) {
269                                 quoted++;
270                             }
271                             else if ((quoted % 2) == 0) {
272                                 /* Search for unquoted characters */
273                                 if (4 <= idx && idx <= 7
274                                     && (*localeStrItr == (UChar)0x6B /* k */
275                                     || *localeStrItr == (UChar)0x48 /* H */
276                                     || *localeStrItr == (UChar)0x6D /* m */
277                                     || *localeStrItr == (UChar)0x73 /* s */
278                                     || *localeStrItr == (UChar)0x53 /* S */
279                                     || *localeStrItr == (UChar)0x61 /* a */
280                                     || *localeStrItr == (UChar)0x68 /* h */
281                                     || *localeStrItr == (UChar)0x7A /* z */))
282                                 {
283                                     log_err("key \"%s\" at index %d has time pattern chars in date for locale \"%s\"\n",
284                                             subBundleKey,
285                                             idx,
286                                             locale);
287                                 }
288                                 else if (0 <= idx && idx <= 3
289                                     && (*localeStrItr == (UChar)0x47 /* G */
290                                     || *localeStrItr == (UChar)0x79 /* y */
291                                     || *localeStrItr == (UChar)0x4D /* M */
292                                     || *localeStrItr == (UChar)0x64 /* d */
293                                     || *localeStrItr == (UChar)0x45 /* E */
294                                     || *localeStrItr == (UChar)0x44 /* D */
295                                     || *localeStrItr == (UChar)0x46 /* F */
296                                     || *localeStrItr == (UChar)0x77 /* w */
297                                     || *localeStrItr == (UChar)0x57 /* W */))
298                                 {
299                                     log_err("key \"%s\" at index %d has date pattern chars in time for locale \"%s\"\n",
300                                             subBundleKey,
301                                             idx,
302                                             locale);
303                                 }
304                             }
305                             localeStrItr++;
306                         }
307                     }
308                     else if (idx == 4 && subBundleKey != NULL
309                         && strcmp(subBundleKey, "NumberElements") == 0
310                         && u_charDigitValue(localeStr[0]) != 0)
311                     {
312                         log_err("key \"%s\" at index %d has a non-zero based number for locale \"%s\"\n",
313                                 subBundleKey,
314                                 idx,
315                                 locale);
316                     }
317                 }
318                 (void)sameArray;    /* Suppress set but not used warning. */
319 /*                if (sameArray && strcmp(rootName, "root") == 0) {
320                     log_err("Arrays are the same with key \"%s\" in \"%s\" from root for locale \"%s\"\n",
321                             subBundleKey,
322                             ures_getKey(currentBundle),
323                             locale);
324                 }*/
325             }
326             ures_close(subSubBundle);
327             ures_close(subSubRootBundle);
328         }
329         else if (ures_getType(subBundle) == URES_STRING) {
330             int32_t len = 0;
331             const UChar *string = ures_getString(subBundle, &len, &errorCode);
332             if (U_FAILURE(errorCode) || string == NULL) {
333                 log_err("Can't open a string with key \"%s\" in \"%s\" for locale \"%s\"\n",
334                         subBundleKey,
335                         ures_getKey(currentBundle),
336                         locale);
337             } else if (string[0] == (UChar)0x20) {
338                 log_err("key \"%s\" in \"%s\" starts with a space in locale \"%s\"\n",
339                         subBundleKey,
340                         ures_getKey(currentBundle),
341                         locale);
342             /* localeDisplayPattern/separator can end with a space */
343             } else if (string[len - 1] == (UChar)0x20 && (strcmp(subBundleKey,"separator"))) {
344                 log_err("key \"%s\" in \"%s\" ends with a space in locale \"%s\"\n",
345                         subBundleKey,
346                         ures_getKey(currentBundle),
347                         locale);
348             } else if (strcmp(subBundleKey, "localPatternChars") == 0) {
349                 /* Note: We no longer import localPatternChars data starting
350                  * ICU 3.8.  So it never comes into this else if block. (ticket#5597)
351                  */
352 
353                 /* Check well-formedness of localPatternChars.  First, the
354                  * length must match the number of fields defined by
355                  * DateFormat.  Second, each character in the string must
356                  * be in the set [A-Za-z].  Finally, each character must be
357                  * unique.
358                  */
359                 int32_t i,j;
360 #if !UCONFIG_NO_FORMATTING
361                 if (len != UDAT_FIELD_COUNT) {
362                     log_err("key \"%s\" has the wrong number of characters in locale \"%s\"\n",
363                             subBundleKey,
364                             locale);
365                 }
366 #endif
367                 /* Check char validity. */
368                 for (i=0; i<len; ++i) {
369                     if (!((string[i] >= 65/*'A'*/ && string[i] <= 90/*'Z'*/) ||
370                           (string[i] >= 97/*'a'*/ && string[i] <= 122/*'z'*/))) {
371                         log_err("key \"%s\" has illegal character '%c' in locale \"%s\"\n",
372                                 subBundleKey,
373                                 (char) string[i],
374                                 locale);
375                     }
376                     /* Do O(n^2) check for duplicate chars. */
377                     for (j=0; j<i; ++j) {
378                         if (string[j] == string[i]) {
379                             log_err("key \"%s\" has duplicate character '%c' in locale \"%s\"\n",
380                                     subBundleKey,
381                                     (char) string[i],
382                                     locale);
383                         }
384                     }
385                 }
386             }
387             /* No fallback was done. Check for duplicate data */
388             /* The ures_* API does not do fallback of sub-resource bundles,
389                So we can't do this now. */
390 #if 0
391             else if (strcmp(locale, "root") != 0 && errorCode == U_ZERO_ERROR) {
392 
393                 const UChar *rootString = ures_getString(subRootBundle, &len, &errorCode);
394                 if (U_FAILURE(errorCode) || rootString == NULL) {
395                     log_err("Can't open a string with key \"%s\" in \"%s\" in root\n",
396                             ures_getKey(subRootBundle),
397                             ures_getKey(currentBundle));
398                     continue;
399                 } else if (u_strcmp(string, rootString) == 0) {
400                     if (strcmp(locale, "de_CH") != 0 && strcmp(subBundleKey, "Countries") != 0 &&
401                         strcmp(subBundleKey, "Version") != 0) {
402                         log_err("Found duplicate data with key \"%s\" in \"%s\" in locale \"%s\"\n",
403                                 ures_getKey(subRootBundle),
404                                 ures_getKey(currentBundle),
405                                 locale);
406                     }
407                     else {
408                         /* Ignore for now. */
409                         /* Can be fixed if fallback through de locale was done. */
410                         log_verbose("Skipping key %s in %s\n", subBundleKey, locale);
411                     }
412                 }
413             }
414 #endif
415         }
416         else if (ures_getType(subBundle) == URES_TABLE) {
417             if (strcmp(subBundleKey, "availableFormats")!=0) {
418                 /* Here is one of the recursive parts */
419                 TestKeyInRootRecursive(subRootBundle, rootName, subBundle, locale);
420             }
421             else {
422                 log_verbose("Skipping key %s in %s\n", subBundleKey, locale);
423             }
424         }
425         else if (ures_getType(subBundle) == URES_BINARY || ures_getType(subBundle) == URES_INT) {
426             /* Can't do anything to check it */
427             /* We'll assume it's all correct */
428             if (strcmp(subBundleKey, "MeasurementSystem") != 0) {
429                 log_verbose("Skipping key \"%s\" in \"%s\" for locale \"%s\"\n",
430                         subBundleKey,
431                         ures_getKey(currentBundle),
432                         locale);
433             }
434             /* Testing for MeasurementSystem is done in VerifyTranslation */
435         }
436         else {
437             log_err("Type %d for key \"%s\" in \"%s\" is unknown for locale \"%s\"\n",
438                     ures_getType(subBundle),
439                     subBundleKey,
440                     ures_getKey(currentBundle),
441                     locale);
442         }
443         ures_close(subRootBundle);
444         ures_close(subBundle);
445     }
446 }
447 #endif
448 
449 static void
testLCID(UResourceBundle * currentBundle,const char * localeName)450 testLCID(UResourceBundle *currentBundle,
451          const char *localeName)
452 {
453     UErrorCode status = U_ZERO_ERROR;
454     uint32_t expectedLCID;
455     char lcidStringC[64] = {0};
456     int32_t len;
457 
458     expectedLCID = uloc_getLCID(localeName);
459     if (expectedLCID == 0) {
460         log_verbose("INFO:    %-5s does not have any LCID mapping\n",
461             localeName);
462         return;
463     }
464 
465     status = U_ZERO_ERROR;
466     len = uprv_convertToPosix(expectedLCID, lcidStringC, sizeof(lcidStringC)/sizeof(lcidStringC[0]) - 1, &status);
467     if (U_FAILURE(status)) {
468         log_err("ERROR:   %.4x does not have a POSIX mapping due to %s\n",
469             expectedLCID, u_errorName(status));
470     }
471     lcidStringC[len] = 0;
472 
473     if(strcmp(localeName, lcidStringC) != 0) {
474         char langName[1024];
475         char langLCID[1024];
476         uloc_getLanguage(localeName, langName, sizeof(langName), &status);
477         uloc_getLanguage(lcidStringC, langLCID, sizeof(langLCID), &status);
478 
479         if (strcmp(langName, langLCID) == 0) {
480             log_verbose("WARNING: %-5s resolves to %s (0x%.4x)\n",
481                 localeName, lcidStringC, expectedLCID);
482         }
483         else {
484             log_err("ERROR:   %-5s has 0x%.4x and the number resolves wrongfully to %s\n",
485                 localeName, expectedLCID, lcidStringC);
486         }
487     }
488 }
489 
490 #if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
491 static void
TestLocaleStructure(void)492 TestLocaleStructure(void) {
493     // This test checks the locale structure against a key file located
494     // at source/test/testdata/structLocale.txt. When adding new data to
495     // a locale file such as en.txt, the structLocale.txt file must be changed
496     // too to include the the template of the new data. Otherwise this test
497     // will fail!
498 
499     UResourceBundle *root, *currentLocale;
500     int32_t locCount = uloc_countAvailable();
501     int32_t locIndex;
502     UErrorCode errorCode = U_ZERO_ERROR;
503     const char *currLoc, *resolvedLoc;
504 
505     /* TODO: Compare against parent's data too. This code can't handle fallbacks that some tools do already. */
506 /*    char locName[ULOC_FULLNAME_CAPACITY];
507     char *locNamePtr;
508 
509     for (locIndex = 0; locIndex < locCount; locIndex++) {
510         errorCode=U_ZERO_ERROR;
511         strcpy(locName, uloc_getAvailable(locIndex));
512         locNamePtr = strrchr(locName, '_');
513         if (locNamePtr) {
514             *locNamePtr = 0;
515         }
516         else {
517             strcpy(locName, "root");
518         }
519 
520         root = ures_openDirect(NULL, locName, &errorCode);
521         if(U_FAILURE(errorCode)) {
522             log_err("Can't open %s\n", locName);
523             continue;
524         }
525 */
526     if (locCount <= 1) {
527         log_data_err("At least root needs to be installed\n");
528     }
529 
530     root = ures_openDirect(loadTestData(&errorCode), "structLocale", &errorCode);
531     if(U_FAILURE(errorCode)) {
532         log_data_err("Can't open structLocale\n");
533         return;
534     }
535     for (locIndex = 0; locIndex < locCount; locIndex++) {
536         errorCode=U_ZERO_ERROR;
537         currLoc = uloc_getAvailable(locIndex);
538         currentLocale = ures_open(NULL, currLoc, &errorCode);
539         if(errorCode != U_ZERO_ERROR) {
540             if(U_SUCCESS(errorCode)) {
541                 /* It's installed, but there is no data.
542                    It's installed for the g18n white paper [grhoten] */
543                 log_err("ERROR: Locale %-5s not installed, and it should be, err %s\n",
544                     uloc_getAvailable(locIndex), u_errorName(errorCode));
545             } else {
546                 log_err("%%%%%%% Unexpected error %d in %s %%%%%%%",
547                     u_errorName(errorCode),
548                     uloc_getAvailable(locIndex));
549             }
550             ures_close(currentLocale);
551             continue;
552         }
553         ures_getStringByKey(currentLocale, "Version", NULL, &errorCode);
554         if(errorCode != U_ZERO_ERROR) {
555             log_err("No version information is available for locale %s, and it should be!\n",
556                 currLoc);
557         }
558         else if (ures_getStringByKey(currentLocale, "Version", NULL, &errorCode)[0] == (UChar)(0x78)) {
559             log_verbose("WARNING: The locale %s is experimental! It shouldn't be listed as an installed locale.\n",
560                 currLoc);
561         }
562         resolvedLoc = ures_getLocaleByType(currentLocale, ULOC_ACTUAL_LOCALE, &errorCode);
563         if (strcmp(resolvedLoc, currLoc) != 0) {
564             /* All locales have at least a Version resource.
565                If it's absolutely empty, then the previous test will fail too.*/
566             log_err("Locale resolves to different locale. Is %s an alias of %s?\n",
567                 currLoc, resolvedLoc);
568         }
569         TestKeyInRootRecursive(root, "root", currentLocale, currLoc);
570 
571         testLCID(currentLocale, currLoc);
572 
573         ures_close(currentLocale);
574     }
575 
576     ures_close(root);
577 }
578 #endif
579 
580 static void
compareArrays(const char * keyName,UResourceBundle * fromArray,const char * fromLocale,UResourceBundle * toArray,const char * toLocale,int32_t start,int32_t end)581 compareArrays(const char *keyName,
582               UResourceBundle *fromArray, const char *fromLocale,
583               UResourceBundle *toArray, const char *toLocale,
584               int32_t start, int32_t end)
585 {
586     int32_t fromSize = ures_getSize(fromArray);
587     int32_t toSize = ures_getSize(fromArray);
588     int32_t idx;
589     UErrorCode errorCode = U_ZERO_ERROR;
590 
591     if (fromSize > toSize) {
592         fromSize = toSize;
593         log_err("Arrays are different size from \"%s\" to \"%s\"\n",
594                 fromLocale,
595                 toLocale);
596     }
597 
598     for (idx = start; idx <= end; idx++) {
599         const UChar *fromBundleStr = ures_getStringByIndex(fromArray, idx, NULL, &errorCode);
600         const UChar *toBundleStr = ures_getStringByIndex(toArray, idx, NULL, &errorCode);
601         if (fromBundleStr && toBundleStr && u_strcmp(fromBundleStr, toBundleStr) != 0)
602         {
603             log_err("Difference for %s at index %d from %s= \"%s\" to %s= \"%s\"\n",
604                     keyName,
605                     idx,
606                     fromLocale,
607                     austrdup(fromBundleStr),
608                     toLocale,
609                     austrdup(toBundleStr));
610         }
611     }
612 }
613 
614 static void
compareConsistentCountryInfo(const char * fromLocale,const char * toLocale)615 compareConsistentCountryInfo(const char *fromLocale, const char *toLocale) {
616     UErrorCode errorCode = U_ZERO_ERROR;
617     UResourceBundle *fromArray, *toArray;
618     UResourceBundle *fromLocaleBund = ures_open(NULL, fromLocale, &errorCode);
619     UResourceBundle *toLocaleBund = ures_open(NULL, toLocale, &errorCode);
620     UResourceBundle *toCalendar, *fromCalendar, *toGregorian, *fromGregorian;
621 
622     if(U_FAILURE(errorCode)) {
623         log_err("Can't open resource bundle %s or %s - %s\n", fromLocale, toLocale, u_errorName(errorCode));
624         return;
625     }
626     fromCalendar = ures_getByKey(fromLocaleBund, "calendar", NULL, &errorCode);
627     fromGregorian = ures_getByKeyWithFallback(fromCalendar, "gregorian", NULL, &errorCode);
628 
629     toCalendar = ures_getByKey(toLocaleBund, "calendar", NULL, &errorCode);
630     toGregorian = ures_getByKeyWithFallback(toCalendar, "gregorian", NULL, &errorCode);
631 
632     fromArray = ures_getByKey(fromLocaleBund, "CurrencyElements", NULL, &errorCode);
633     toArray = ures_getByKey(toLocaleBund, "CurrencyElements", NULL, &errorCode);
634     if (strcmp(fromLocale, "en_CA") != 0)
635     {
636         /* The first one is probably localized. */
637         compareArrays("CurrencyElements", fromArray, fromLocale, toArray, toLocale, 1, 2);
638     }
639     ures_close(fromArray);
640     ures_close(toArray);
641 
642     fromArray = ures_getByKey(fromLocaleBund, "NumberPatterns", NULL, &errorCode);
643     toArray = ures_getByKey(toLocaleBund, "NumberPatterns", NULL, &errorCode);
644     if (strcmp(fromLocale, "en_CA") != 0)
645     {
646         compareArrays("NumberPatterns", fromArray, fromLocale, toArray, toLocale, 0, 3);
647     }
648     ures_close(fromArray);
649     ures_close(toArray);
650 
651     /* Difficult to test properly */
652 /*
653     fromArray = ures_getByKey(fromLocaleBund, "DateTimePatterns", NULL, &errorCode);
654     toArray = ures_getByKey(toLocaleBund, "DateTimePatterns", NULL, &errorCode);
655     {
656         compareArrays("DateTimePatterns", fromArray, fromLocale, toArray, toLocale);
657     }
658     ures_close(fromArray);
659     ures_close(toArray);*/
660 
661     fromArray = ures_getByKey(fromLocaleBund, "NumberElements", NULL, &errorCode);
662     toArray = ures_getByKey(toLocaleBund, "NumberElements", NULL, &errorCode);
663     if (strcmp(fromLocale, "en_CA") != 0)
664     {
665         compareArrays("NumberElements", fromArray, fromLocale, toArray, toLocale, 0, 3);
666         /* Index 4 is a script based 0 */
667         compareArrays("NumberElements", fromArray, fromLocale, toArray, toLocale, 5, 10);
668     }
669     ures_close(fromArray);
670     ures_close(toArray);
671     ures_close(fromCalendar);
672     ures_close(toCalendar);
673     ures_close(fromGregorian);
674     ures_close(toGregorian);
675 
676     ures_close(fromLocaleBund);
677     ures_close(toLocaleBund);
678 }
679 
680 static void
TestConsistentCountryInfo(void)681 TestConsistentCountryInfo(void) {
682 /*    UResourceBundle *fromLocale, *toLocale;*/
683     int32_t locCount = uloc_countAvailable();
684     int32_t fromLocIndex, toLocIndex;
685 
686     int32_t fromCountryLen, toCountryLen;
687     char fromCountry[ULOC_FULLNAME_CAPACITY], toCountry[ULOC_FULLNAME_CAPACITY];
688 
689     int32_t fromVariantLen, toVariantLen;
690     char fromVariant[ULOC_FULLNAME_CAPACITY], toVariant[ULOC_FULLNAME_CAPACITY];
691 
692     UErrorCode errorCode = U_ZERO_ERROR;
693 
694     for (fromLocIndex = 0; fromLocIndex < locCount; fromLocIndex++) {
695         const char *fromLocale = uloc_getAvailable(fromLocIndex);
696 
697         errorCode=U_ZERO_ERROR;
698         fromCountryLen = uloc_getCountry(fromLocale, fromCountry, ULOC_FULLNAME_CAPACITY, &errorCode);
699         if (fromCountryLen <= 0) {
700             /* Ignore countryless locales */
701             continue;
702         }
703         fromVariantLen = uloc_getVariant(fromLocale, fromVariant, ULOC_FULLNAME_CAPACITY, &errorCode);
704         if (fromVariantLen > 0) {
705             /* Most variants are ignorable like PREEURO, or collation variants. */
706             continue;
707         }
708         /* Start comparing only after the current index.
709            Previous loop should have already compared fromLocIndex.
710         */
711         for (toLocIndex = fromLocIndex + 1; toLocIndex < locCount; toLocIndex++) {
712             const char *toLocale = uloc_getAvailable(toLocIndex);
713 
714             toCountryLen = uloc_getCountry(toLocale, toCountry, ULOC_FULLNAME_CAPACITY, &errorCode);
715             if(U_FAILURE(errorCode)) {
716                 log_err("Unknown failure fromLocale=%s toLocale=%s errorCode=%s\n",
717                     fromLocale, toLocale, u_errorName(errorCode));
718                 continue;
719             }
720 
721             if (toCountryLen <= 0) {
722                 /* Ignore countryless locales */
723                 continue;
724             }
725             toVariantLen = uloc_getVariant(toLocale, toVariant, ULOC_FULLNAME_CAPACITY, &errorCode);
726             if (toVariantLen > 0) {
727                 /* Most variants are ignorable like PREEURO, or collation variants. */
728                 /* They're a variant for a reason. */
729                 continue;
730             }
731             if (strcmp(fromCountry, toCountry) == 0) {
732                 log_verbose("comparing fromLocale=%s toLocale=%s\n",
733                     fromLocale, toLocale);
734                 compareConsistentCountryInfo(fromLocale, toLocale);
735             }
736         }
737     }
738 }
739 
740 static int32_t
findStringSetMismatch(const char * currLoc,const UChar * string,int32_t langSize,USet * mergedExemplarSet,UBool ignoreNumbers,UChar * badCharPtr)741 findStringSetMismatch(const char *currLoc, const UChar *string, int32_t langSize,
742                       USet * mergedExemplarSet,
743                       UBool ignoreNumbers, UChar* badCharPtr) {
744     UErrorCode errorCode = U_ZERO_ERROR;
745     USet *exemplarSet;
746     int32_t strIdx;
747     if (mergedExemplarSet == NULL) {
748         return -1;
749     }
750     exemplarSet = createFlattenSet(mergedExemplarSet, &errorCode);
751     if (U_FAILURE(errorCode)) {
752         log_err("%s: error createFlattenSet returned %s\n", currLoc, u_errorName(errorCode));
753         return -1;
754     }
755 
756     for (strIdx = 0; strIdx < langSize; strIdx++) {
757         if (!uset_contains(exemplarSet, string[strIdx])
758             && string[strIdx] != 0x0020 && string[strIdx] != 0x00A0 && string[strIdx] != 0x002e && string[strIdx] != 0x002c && string[strIdx] != 0x002d && string[strIdx] != 0x0027 && string[strIdx] != 0x005B && string[strIdx] != 0x005D && string[strIdx] != 0x2019 && string[strIdx] != 0x0f0b
759             && string[strIdx] != 0x200C && string[strIdx] != 0x200D) {
760             if (!ignoreNumbers || (ignoreNumbers && (string[strIdx] < 0x30 || string[strIdx] > 0x39))) {
761                 uset_close(exemplarSet);
762                 if (badCharPtr) {
763                     *badCharPtr = string[strIdx];
764                 }
765                 return strIdx;
766             }
767         }
768     }
769     uset_close(exemplarSet);
770     if (badCharPtr) {
771         *badCharPtr = 0;
772     }
773     return -1;
774 }
775 /* include non-invariant chars */
776 static int32_t
myUCharsToChars(const UChar * us,char * cs,int32_t len)777 myUCharsToChars(const UChar* us, char* cs, int32_t len){
778     int32_t i=0;
779     for(; i< len; i++){
780         if(us[i] < 0x7f){
781             cs[i] = (char)us[i];
782         }else{
783             return -1;
784         }
785     }
786     return i;
787 }
788 static void
findSetMatch(UScriptCode * scriptCodes,int32_t scriptsLen,USet * exemplarSet,const char * locale)789 findSetMatch( UScriptCode *scriptCodes, int32_t scriptsLen,
790               USet *exemplarSet,
791               const char  *locale){
792     USet *scripts[10]= {0};
793     char pattern[256] = { '[', ':', 0x000 };
794     int32_t patternLen;
795     UChar uPattern[256] = {0};
796     UErrorCode status = U_ZERO_ERROR;
797     int32_t i;
798 
799     /* create the sets with script codes */
800     for(i = 0; i<scriptsLen; i++){
801         strcat(pattern, uscript_getShortName(scriptCodes[i]));
802         strcat(pattern, ":]");
803         patternLen = (int32_t)strlen(pattern);
804         u_charsToUChars(pattern, uPattern, patternLen);
805         scripts[i] = uset_openPattern(uPattern, patternLen, &status);
806         if(U_FAILURE(status)){
807             log_err("Could not create set for pattern %s. Error: %s\n", pattern, u_errorName(status));
808             return;
809         }
810         pattern[2] = 0;
811     }
812     if (strcmp(locale, "uk") == 0 || strcmp(locale, "uk_UA") == 0) {
813         /* Special addition. Add the modifying apostrophe, which isn't in Cyrillic. */
814         uset_add(scripts[0], 0x2bc);
815     }
816     if(U_SUCCESS(status)){
817         UBool existsInScript = FALSE;
818         /* iterate over the exemplarSet and ascertain if all
819          * UChars in exemplarSet belong to the scripts returned
820          * by getScript
821          */
822         int32_t count = uset_getItemCount(exemplarSet);
823 
824         for( i=0; i < count; i++){
825             UChar32 start = 0;
826             UChar32 end = 0;
827             UChar *str = NULL;
828             int32_t strCapacity = 0;
829 
830             strCapacity = uset_getItem(exemplarSet, i, &start, &end, str, strCapacity, &status);
831             if(U_SUCCESS(status)){
832                 int32_t j;
833                 if(strCapacity == 0){
834                     /* ok the item is a range */
835                      for( j = 0; j < scriptsLen; j++){
836                         if(uset_containsRange(scripts[j], start, end) == TRUE){
837                             existsInScript = TRUE;
838                         }
839                     }
840                     if(existsInScript == FALSE){
841                         for( j = 0; j < scriptsLen; j++){
842                             UChar toPattern[500]={'\0'};
843                             char pat[500]={'\0'};
844                             int32_t len = uset_toPattern(scripts[j], toPattern, 500, TRUE, &status);
845                             len = myUCharsToChars(toPattern, pat, len);
846                             log_err("uset_indexOf(\\u%04X)=%i uset_indexOf(\\u%04X)=%i\n", start, uset_indexOf(scripts[0], start), end, uset_indexOf(scripts[0], end));
847                             if(len!=-1){
848                                 log_err("Pattern: %s\n",pat);
849                             }
850                         }
851                         log_err("ExemplarCharacters and LocaleScript containment test failed for locale %s. \n", locale);
852                     }
853                 }else{
854                     strCapacity++; /* increment for NUL termination */
855                     /* allocate the str and call the api again */
856                     str = (UChar*) malloc(U_SIZEOF_UCHAR * strCapacity);
857                     strCapacity =  uset_getItem(exemplarSet, i, &start, &end, str, strCapacity, &status);
858                     /* iterate over the scripts and figure out if the string contained is actually
859                      * in the script set
860                      */
861                     for( j = 0; j < scriptsLen; j++){
862                         if(uset_containsString(scripts[j],str, strCapacity) == TRUE){
863                             existsInScript = TRUE;
864                         }
865                     }
866                     if(existsInScript == FALSE){
867                         log_err("ExemplarCharacters and LocaleScript containment test failed for locale %s. \n", locale);
868                     }
869                 }
870             }
871         }
872 
873     }
874 
875     /* close the sets */
876     for(i = 0; i<scriptsLen; i++){
877         uset_close(scripts[i]);
878     }
879 }
880 
VerifyTranslation(void)881 static void VerifyTranslation(void) {
882     UResourceBundle *root, *currentLocale;
883     int32_t locCount = uloc_countAvailable();
884     int32_t locIndex;
885     UErrorCode errorCode = U_ZERO_ERROR;
886     const char *currLoc;
887     UScriptCode scripts[USCRIPT_CODE_LIMIT];
888     int32_t numScripts;
889     int32_t idx;
890     int32_t end;
891     UResourceBundle *resArray;
892 
893     if (locCount <= 1) {
894         log_data_err("At least root needs to be installed\n");
895     }
896 
897     root = ures_openDirect(NULL, "root", &errorCode);
898     if(U_FAILURE(errorCode)) {
899         log_data_err("Can't open root\n");
900         return;
901     }
902     for (locIndex = 0; locIndex < locCount; locIndex++) {
903         USet * mergedExemplarSet = NULL;
904         errorCode=U_ZERO_ERROR;
905         currLoc = uloc_getAvailable(locIndex);
906         currentLocale = ures_open(NULL, currLoc, &errorCode);
907         if(errorCode != U_ZERO_ERROR) {
908             if(U_SUCCESS(errorCode)) {
909                 /* It's installed, but there is no data.
910                    It's installed for the g18n white paper [grhoten] */
911                 log_err("ERROR: Locale %-5s not installed, and it should be!\n",
912                     uloc_getAvailable(locIndex));
913             } else {
914                 log_err("%%%%%%% Unexpected error %d in %s %%%%%%%",
915                     u_errorName(errorCode),
916                     uloc_getAvailable(locIndex));
917             }
918             ures_close(currentLocale);
919             continue;
920         }
921         {
922             UErrorCode exemplarStatus = U_ZERO_ERROR;
923             ULocaleData * uld = ulocdata_open(currLoc, &exemplarStatus);
924             if (U_SUCCESS(exemplarStatus)) {
925                 USet * exemplarSet = ulocdata_getExemplarSet(uld, NULL, USET_ADD_CASE_MAPPINGS, ULOCDATA_ES_STANDARD, &exemplarStatus);
926                 if (U_SUCCESS(exemplarStatus)) {
927                     mergedExemplarSet = uset_cloneAsThawed(exemplarSet);
928                     uset_close(exemplarSet);
929                     exemplarSet = ulocdata_getExemplarSet(uld, NULL, USET_ADD_CASE_MAPPINGS, ULOCDATA_ES_AUXILIARY, &exemplarStatus);
930                     if (U_SUCCESS(exemplarStatus)) {
931                         uset_addAll(mergedExemplarSet, exemplarSet);
932                         uset_close(exemplarSet);
933                     }
934                     exemplarStatus = U_ZERO_ERROR;
935                     exemplarSet = ulocdata_getExemplarSet(uld, NULL, 0, ULOCDATA_ES_PUNCTUATION, &exemplarStatus);
936                     if (U_SUCCESS(exemplarStatus)) {
937                         uset_addAll(mergedExemplarSet, exemplarSet);
938                         uset_close(exemplarSet);
939                     }
940                 } else {
941                     log_err("error ulocdata_getExemplarSet (main) for locale %s returned %s\n", currLoc, u_errorName(errorCode));
942                 }
943                 ulocdata_close(uld);
944             } else {
945                 log_err("error ulocdata_open for locale %s returned %s\n", currLoc, u_errorName(errorCode));
946             }
947         }
948         if (mergedExemplarSet == NULL /*|| (getTestOption(QUICK_OPTION) && uset_size() > 2048)*/) {
949             log_verbose("skipping test for %s\n", currLoc);
950         }
951         //else if (uprv_strncmp(currLoc,"bem",3) == 0 || uprv_strncmp(currLoc,"mgo",3) == 0 || uprv_strncmp(currLoc,"nl",2) == 0) {
952         //    log_verbose("skipping test for %s, some month and country names known to use aux exemplars\n", currLoc);
953         //}
954         else {
955             UChar langBuffer[128];
956             int32_t langSize;
957             int32_t strIdx;
958             UChar badChar;
959             langSize = uloc_getDisplayLanguage(currLoc, currLoc, langBuffer, sizeof(langBuffer)/sizeof(langBuffer[0]), &errorCode);
960             if (U_FAILURE(errorCode)) {
961                 log_err("error uloc_getDisplayLanguage returned %s\n", u_errorName(errorCode));
962             }
963             else {
964                 strIdx = findStringSetMismatch(currLoc, langBuffer, langSize, mergedExemplarSet, FALSE, &badChar);
965                 if (strIdx >= 0) {
966                     log_err("getDisplayLanguage(%s) at index %d returned characters not in the exemplar characters: %04X.\n",
967                         currLoc, strIdx, badChar);
968                 }
969             }
970             langSize = uloc_getDisplayCountry(currLoc, currLoc, langBuffer, sizeof(langBuffer)/sizeof(langBuffer[0]), &errorCode);
971             if (U_FAILURE(errorCode)) {
972                 log_err("error uloc_getDisplayCountry returned %s\n", u_errorName(errorCode));
973             }
974             {
975                 UResourceBundle* cal = ures_getByKey(currentLocale, "calendar", NULL, &errorCode);
976                 UResourceBundle* greg = ures_getByKeyWithFallback(cal, "gregorian", NULL, &errorCode);
977                 UResourceBundle* names = ures_getByKeyWithFallback(greg,  "dayNames", NULL, &errorCode);
978                 UResourceBundle* format = ures_getByKeyWithFallback(names,  "format", NULL, &errorCode);
979                 resArray = ures_getByKeyWithFallback(format,  "wide", NULL, &errorCode);
980 
981                 if (U_FAILURE(errorCode)) {
982                     log_err("error ures_getByKey returned %s\n", u_errorName(errorCode));
983                 }
984                 if (getTestOption(QUICK_OPTION)) {
985                     end = 1;
986                 }
987                 else {
988                     end = ures_getSize(resArray);
989                 }
990 
991                 if ((uprv_strncmp(currLoc,"lrc",3) == 0 || uprv_strncmp(currLoc,"mzn",3) == 0) &&
992                         log_knownIssue("cldrbug:8899", "lrc and mzn locales don't have translated day names")) {
993                     end = 0;
994                 }
995 
996                 for (idx = 0; idx < end; idx++) {
997                     const UChar *fromBundleStr = ures_getStringByIndex(resArray, idx, &langSize, &errorCode);
998                     if (U_FAILURE(errorCode)) {
999                         log_err("error ures_getStringByIndex(%d) returned %s\n", idx, u_errorName(errorCode));
1000                         continue;
1001                     }
1002                     strIdx = findStringSetMismatch(currLoc, fromBundleStr, langSize, mergedExemplarSet, TRUE, &badChar);
1003                     if ( strIdx >= 0 ) {
1004                         log_err("getDayNames(%s, %d) at index %d returned characters not in the exemplar characters: %04X.\n",
1005                             currLoc, idx, strIdx, badChar);
1006                     }
1007                 }
1008                 ures_close(resArray);
1009                 ures_close(format);
1010                 ures_close(names);
1011 
1012                 names = ures_getByKeyWithFallback(greg, "monthNames", NULL, &errorCode);
1013                 format = ures_getByKeyWithFallback(names,"format", NULL, &errorCode);
1014                 resArray = ures_getByKeyWithFallback(format, "wide", NULL, &errorCode);
1015                 if (U_FAILURE(errorCode)) {
1016                     log_err("error ures_getByKey returned %s\n", u_errorName(errorCode));
1017                 }
1018                 if (getTestOption(QUICK_OPTION)) {
1019                     end = 1;
1020                 }
1021                 else {
1022                     end = ures_getSize(resArray);
1023                 }
1024 
1025                 for (idx = 0; idx < end; idx++) {
1026                     const UChar *fromBundleStr = ures_getStringByIndex(resArray, idx, &langSize, &errorCode);
1027                     if (U_FAILURE(errorCode)) {
1028                         log_err("error ures_getStringByIndex(%d) returned %s\n", idx, u_errorName(errorCode));
1029                         continue;
1030                     }
1031                     strIdx = findStringSetMismatch(currLoc, fromBundleStr, langSize, mergedExemplarSet, TRUE, &badChar);
1032                     if (strIdx >= 0) {
1033                         log_err("getMonthNames(%s, %d) at index %d returned characters not in the exemplar characters: %04X.\n",
1034                             currLoc, idx, strIdx, badChar);
1035                     }
1036                 }
1037                 ures_close(resArray);
1038                 ures_close(format);
1039                 ures_close(names);
1040                 ures_close(greg);
1041                 ures_close(cal);
1042             }
1043             errorCode = U_ZERO_ERROR;
1044             numScripts = uscript_getCode(currLoc, scripts, sizeof(scripts)/sizeof(scripts[0]), &errorCode);
1045             if (strcmp(currLoc, "yi") == 0 && numScripts > 0 && log_knownIssue("11217", "Fix result of uscript_getCode for yi: USCRIPT_YI -> USCRIPT_HEBREW")) {
1046                 scripts[0] = USCRIPT_HEBREW;
1047             }
1048             if (numScripts == 0) {
1049                 log_err("uscript_getCode(%s) doesn't work.\n", currLoc);
1050             }else if(scripts[0] == USCRIPT_COMMON){
1051                 log_err("uscript_getCode(%s) returned USCRIPT_COMMON.\n", currLoc);
1052             }
1053 
1054             /* test that the scripts are a superset of exemplar characters. */
1055            {
1056                 ULocaleData *uld = ulocdata_open(currLoc,&errorCode);
1057                 USet *exemplarSet =  ulocdata_getExemplarSet(uld, NULL, 0, ULOCDATA_ES_STANDARD, &errorCode);
1058                 /* test if exemplar characters are part of script code */
1059                 findSetMatch(scripts, numScripts, exemplarSet, currLoc);
1060                 uset_close(exemplarSet);
1061                 ulocdata_close(uld);
1062             }
1063 
1064            /* test that the paperSize API works */
1065            {
1066                int32_t height=0, width=0;
1067                ulocdata_getPaperSize(currLoc, &height, &width, &errorCode);
1068                if(U_FAILURE(errorCode)){
1069                    log_err("ulocdata_getPaperSize failed for locale %s with error: %s \n", currLoc, u_errorName(errorCode));
1070                }
1071                if(strstr(currLoc, "_US")!=NULL && height != 279 && width != 216 ){
1072                    log_err("ulocdata_getPaperSize did not return expected data for locale %s \n", currLoc);
1073                }
1074            }
1075             /* test that the MeasurementSystem API works */
1076            {
1077                char fullLoc[ULOC_FULLNAME_CAPACITY];
1078                UMeasurementSystem measurementSystem;
1079                int32_t height = 0, width = 0;
1080 
1081                uloc_addLikelySubtags(currLoc, fullLoc, ULOC_FULLNAME_CAPACITY, &errorCode);
1082 
1083                errorCode = U_ZERO_ERROR;
1084                measurementSystem = ulocdata_getMeasurementSystem(currLoc, &errorCode);
1085                if (U_FAILURE(errorCode)) {
1086                    log_err("ulocdata_getMeasurementSystem failed for locale %s with error: %s \n", currLoc, u_errorName(errorCode));
1087                } else {
1088                    if ( strstr(fullLoc, "_US")!=NULL || strstr(fullLoc, "_MM")!=NULL || strstr(fullLoc, "_LR")!=NULL ) {
1089                        if(measurementSystem != UMS_US){
1090                             log_err("ulocdata_getMeasurementSystem did not return expected data for locale %s \n", currLoc);
1091                        }
1092                    } else if ( strstr(fullLoc, "_GB")!=NULL ) {
1093                        if(measurementSystem != UMS_UK){
1094                             log_err("ulocdata_getMeasurementSystem did not return expected data for locale %s \n", currLoc);
1095                        }
1096                    } else if (measurementSystem != UMS_SI) {
1097                        log_err("ulocdata_getMeasurementSystem did not return expected data for locale %s \n", currLoc);
1098                    }
1099                }
1100 
1101                errorCode = U_ZERO_ERROR;
1102                ulocdata_getPaperSize(currLoc, &height, &width, &errorCode);
1103                if (U_FAILURE(errorCode)) {
1104                    log_err("ulocdata_getPaperSize failed for locale %s with error: %s \n", currLoc, u_errorName(errorCode));
1105                } else {
1106                    if ( strstr(fullLoc, "_US")!=NULL || strstr(fullLoc, "_BZ")!=NULL || strstr(fullLoc, "_CA")!=NULL || strstr(fullLoc, "_CL")!=NULL ||
1107                         strstr(fullLoc, "_CO")!=NULL || strstr(fullLoc, "_CR")!=NULL || strstr(fullLoc, "_GT")!=NULL || strstr(fullLoc, "_MX")!=NULL ||
1108                         strstr(fullLoc, "_NI")!=NULL || strstr(fullLoc, "_PA")!=NULL || strstr(fullLoc, "_PH")!=NULL || strstr(fullLoc, "_PR")!=NULL ||
1109                         strstr(fullLoc, "_SV")!=NULL || strstr(fullLoc, "_VE")!=NULL ) {
1110                        if (height != 279 || width != 216) {
1111                             log_err("ulocdata_getPaperSize did not return expected data for locale %s \n", currLoc);
1112                        }
1113                    } else if (height != 297 || width != 210) {
1114                        log_err("ulocdata_getPaperSize did not return expected data for locale %s \n", currLoc);
1115                    }
1116                }
1117            }
1118         }
1119         if (mergedExemplarSet != NULL) {
1120             uset_close(mergedExemplarSet);
1121         }
1122         ures_close(currentLocale);
1123     }
1124 
1125     ures_close(root);
1126 }
1127 
1128 /* adjust this limit as appropriate */
1129 #define MAX_SCRIPTS_PER_LOCALE 8
1130 
TestExemplarSet(void)1131 static void TestExemplarSet(void){
1132     int32_t i, j, k, m, n;
1133     int32_t equalCount = 0;
1134     UErrorCode ec = U_ZERO_ERROR;
1135     UEnumeration* avail;
1136     USet* exemplarSets[2];
1137     USet* unassignedSet;
1138     UScriptCode code[MAX_SCRIPTS_PER_LOCALE];
1139     USet* codeSets[MAX_SCRIPTS_PER_LOCALE];
1140     int32_t codeLen;
1141     char cbuf[32]; /* 9 should be enough */
1142     UChar ubuf[64]; /* adjust as needed */
1143     UBool existsInScript;
1144     int32_t itemCount;
1145     int32_t strLen;
1146     UChar32 start, end;
1147 
1148     unassignedSet = NULL;
1149     exemplarSets[0] = NULL;
1150     exemplarSets[1] = NULL;
1151     for (i=0; i<MAX_SCRIPTS_PER_LOCALE; ++i) {
1152         codeSets[i] = NULL;
1153     }
1154 
1155     avail = ures_openAvailableLocales(NULL, &ec);
1156     if (!assertSuccess("ures_openAvailableLocales", &ec)) goto END;
1157     n = uenum_count(avail, &ec);
1158     if (!assertSuccess("uenum_count", &ec)) goto END;
1159 
1160     u_uastrcpy(ubuf, "[:unassigned:]");
1161     unassignedSet = uset_openPattern(ubuf, -1, &ec);
1162     if (!assertSuccess("uset_openPattern", &ec)) goto END;
1163 
1164     for(i=0; i<n; i++){
1165         const char* locale = uenum_next(avail, NULL, &ec);
1166         if (!assertSuccess("uenum_next", &ec)) goto END;
1167         log_verbose("%s\n", locale);
1168         for (k=0; k<2; ++k) {
1169             uint32_t option = (k==0) ? 0 : USET_CASE_INSENSITIVE;
1170             ULocaleData *uld = ulocdata_open(locale,&ec);
1171             USet* exemplarSet = ulocdata_getExemplarSet(uld,NULL, option, ULOCDATA_ES_STANDARD, &ec);
1172             uset_close(exemplarSets[k]);
1173             ulocdata_close(uld);
1174             exemplarSets[k] = exemplarSet;
1175             if (!assertSuccess("ulocaledata_getExemplarSet", &ec)) goto END;
1176 
1177             if (uset_containsSome(exemplarSet, unassignedSet)) {
1178                 log_err("ExemplarSet contains unassigned characters for locale : %s\n", locale);
1179             }
1180             codeLen = uscript_getCode(locale, code, 8, &ec);
1181             if (strcmp(locale, "yi") == 0 && codeLen > 0 && log_knownIssue("11217", "Fix result of uscript_getCode for yi: USCRIPT_YI -> USCRIPT_HEBREW")) {
1182                 code[0] = USCRIPT_HEBREW;
1183             }
1184             if (!assertSuccess("uscript_getCode", &ec)) goto END;
1185 
1186             for (j=0; j<MAX_SCRIPTS_PER_LOCALE; ++j) {
1187                 uset_close(codeSets[j]);
1188                 codeSets[j] = NULL;
1189             }
1190             for (j=0; j<codeLen; ++j) {
1191                 uprv_strcpy(cbuf, "[:");
1192                 if(code[j]==-1){
1193                     log_err("USCRIPT_INVALID_CODE returned for locale: %s\n", locale);
1194                     continue;
1195                 }
1196                 uprv_strcat(cbuf, uscript_getShortName(code[j]));
1197                 uprv_strcat(cbuf, ":]");
1198                 u_uastrcpy(ubuf, cbuf);
1199                 codeSets[j] = uset_openPattern(ubuf, -1, &ec);
1200             }
1201             if (!assertSuccess("uset_openPattern", &ec)) goto END;
1202 
1203             existsInScript = FALSE;
1204             itemCount = uset_getItemCount(exemplarSet);
1205             for (m=0; m<itemCount && !existsInScript; ++m) {
1206                 strLen = uset_getItem(exemplarSet, m, &start, &end, ubuf,
1207                                       sizeof(ubuf)/sizeof(ubuf[0]), &ec);
1208                 /* failure here might mean str[] needs to be larger */
1209                 if (!assertSuccess("uset_getItem", &ec)) goto END;
1210                 if (strLen == 0) {
1211                     for (j=0; j<codeLen; ++j) {
1212                         if (codeSets[j]!=NULL && uset_containsRange(codeSets[j], start, end)) {
1213                             existsInScript = TRUE;
1214                             break;
1215                         }
1216                     }
1217                 } else {
1218                     for (j=0; j<codeLen; ++j) {
1219                         if (codeSets[j]!=NULL && uset_containsString(codeSets[j], ubuf, strLen)) {
1220                             existsInScript = TRUE;
1221                             break;
1222                         }
1223                     }
1224                 }
1225             }
1226 
1227             if (existsInScript == FALSE){
1228                 log_err("ExemplarSet containment failed for locale : %s\n", locale);
1229             }
1230         }
1231         assertTrue("case-folded is a superset",
1232                    uset_containsAll(exemplarSets[1], exemplarSets[0]));
1233         if (uset_equals(exemplarSets[1], exemplarSets[0])) {
1234             ++equalCount;
1235         }
1236     }
1237     /* Note: The case-folded set should sometimes be a strict superset
1238        and sometimes be equal. */
1239     assertTrue("case-folded is sometimes a strict superset, and sometimes equal",
1240                equalCount > 0 && equalCount < n);
1241 
1242  END:
1243     uenum_close(avail);
1244     uset_close(exemplarSets[0]);
1245     uset_close(exemplarSets[1]);
1246     uset_close(unassignedSet);
1247     for (i=0; i<MAX_SCRIPTS_PER_LOCALE; ++i) {
1248         uset_close(codeSets[i]);
1249     }
1250 }
1251 
1252 enum { kUBufMax = 32 };
TestLocaleDisplayPattern(void)1253 static void TestLocaleDisplayPattern(void){
1254     UErrorCode status;
1255     UChar pattern[kUBufMax] = {0,};
1256     UChar separator[kUBufMax] = {0,};
1257     ULocaleData *uld;
1258     static const UChar enExpectPat[] = { 0x007B,0x0030,0x007D,0x0020,0x0028,0x007B,0x0031,0x007D,0x0029,0 }; /* "{0} ({1})" */
1259     static const UChar enExpectSep[] = { 0x002C,0x0020,0 }; /* ", " */
1260     static const UChar zhExpectPat[] = { 0x007B,0x0030,0x007D,0xFF08,0x007B,0x0031,0x007D,0xFF09,0 };
1261     static const UChar zhExpectSep[] = { 0x3001,0 };
1262 
1263     status = U_ZERO_ERROR;
1264     uld = ulocdata_open("en", &status);
1265     if(U_FAILURE(status)){
1266         log_data_err("ulocdata_open en error %s", u_errorName(status));
1267     } else {
1268         ulocdata_getLocaleDisplayPattern(uld, pattern, kUBufMax, &status);
1269         if (U_FAILURE(status)){
1270             log_err("ulocdata_getLocaleDisplayPattern en error %s", u_errorName(status));
1271         } else if (u_strcmp(pattern, enExpectPat) != 0) {
1272              log_err("ulocdata_getLocaleDisplayPattern en returns unexpected pattern");
1273         }
1274         status = U_ZERO_ERROR;
1275         ulocdata_getLocaleSeparator(uld, separator, kUBufMax, &status);
1276         if (U_FAILURE(status)){
1277             log_err("ulocdata_getLocaleSeparator en error %s", u_errorName(status));
1278         } else if (u_strcmp(separator, enExpectSep) != 0) {
1279              log_err("ulocdata_getLocaleSeparator en returns unexpected string ");
1280         }
1281         ulocdata_close(uld);
1282     }
1283 
1284     status = U_ZERO_ERROR;
1285     uld = ulocdata_open("zh", &status);
1286     if(U_FAILURE(status)){
1287         log_data_err("ulocdata_open zh error %s", u_errorName(status));
1288     } else {
1289         ulocdata_getLocaleDisplayPattern(uld, pattern, kUBufMax, &status);
1290         if (U_FAILURE(status)){
1291             log_err("ulocdata_getLocaleDisplayPattern zh error %s", u_errorName(status));
1292         } else if (u_strcmp(pattern, zhExpectPat) != 0) {
1293              log_err("ulocdata_getLocaleDisplayPattern zh returns unexpected pattern");
1294         }
1295         status = U_ZERO_ERROR;
1296         ulocdata_getLocaleSeparator(uld, separator, kUBufMax, &status);
1297         if (U_FAILURE(status)){
1298             log_err("ulocdata_getLocaleSeparator zh error %s", u_errorName(status));
1299         } else if (u_strcmp(separator, zhExpectSep) != 0) {
1300              log_err("ulocdata_getLocaleSeparator zh returns unexpected string ");
1301         }
1302         ulocdata_close(uld);
1303     }
1304 }
1305 
TestCoverage(void)1306 static void TestCoverage(void){
1307     ULocaleDataDelimiterType types[] = {
1308      ULOCDATA_QUOTATION_START,     /* Quotation start */
1309      ULOCDATA_QUOTATION_END,       /* Quotation end */
1310      ULOCDATA_ALT_QUOTATION_START, /* Alternate quotation start */
1311      ULOCDATA_ALT_QUOTATION_END,   /* Alternate quotation end */
1312      ULOCDATA_DELIMITER_COUNT
1313     };
1314     int i;
1315     UBool sub;
1316     UErrorCode status = U_ZERO_ERROR;
1317     ULocaleData *uld = ulocdata_open(uloc_getDefault(), &status);
1318 
1319     if(U_FAILURE(status)){
1320         log_data_err("ulocdata_open error");
1321         return;
1322     }
1323 
1324 
1325     for(i = 0; i < ULOCDATA_DELIMITER_COUNT; i++){
1326         UChar result[32] = {0,};
1327         status = U_ZERO_ERROR;
1328         ulocdata_getDelimiter(uld, types[i], result, 32, &status);
1329         if (U_FAILURE(status)){
1330             log_err("ulocdata_getgetDelimiter error with type %d", types[i]);
1331         }
1332     }
1333 
1334     sub = ulocdata_getNoSubstitute(uld);
1335     ulocdata_setNoSubstitute(uld,sub);
1336     ulocdata_close(uld);
1337 }
1338 
TestIndexChars(void)1339 static void TestIndexChars(void) {
1340     /* Very basic test of ULOCDATA_ES_INDEX.
1341      * No comprehensive test of data, just basic check that the code path is alive.
1342      */
1343     UErrorCode status = U_ZERO_ERROR;
1344     ULocaleData  *uld;
1345     USet *exemplarChars;
1346     USet *indexChars;
1347 
1348     uld = ulocdata_open("en", &status);
1349     exemplarChars = uset_openEmpty();
1350     indexChars = uset_openEmpty();
1351     ulocdata_getExemplarSet(uld, exemplarChars, 0, ULOCDATA_ES_STANDARD, &status);
1352     ulocdata_getExemplarSet(uld, indexChars, 0, ULOCDATA_ES_INDEX, &status);
1353     if (U_FAILURE(status)) {
1354         log_data_err("File %s, line %d, Failure opening exemplar chars: %s", __FILE__, __LINE__, u_errorName(status));
1355         goto close_sets;
1356     }
1357     /* en data, standard exemplars are [a-z], lower case. */
1358     /* en data, index characters are [A-Z], upper case. */
1359     if ((uset_contains(exemplarChars, (UChar32)0x41) || uset_contains(indexChars, (UChar32)0x61))) {
1360         log_err("File %s, line %d, Exemplar characters incorrect.", __FILE__, __LINE__ );
1361         goto close_sets;
1362     }
1363     if (!(uset_contains(exemplarChars, (UChar32)0x61) && uset_contains(indexChars, (UChar32)0x41) )) {
1364         log_err("File %s, line %d, Exemplar characters incorrect.", __FILE__, __LINE__ );
1365         goto close_sets;
1366     }
1367 
1368   close_sets:
1369     uset_close(exemplarChars);
1370     uset_close(indexChars);
1371     ulocdata_close(uld);
1372 }
1373 
1374 
1375 
1376 #if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
TestCurrencyList(void)1377 static void TestCurrencyList(void){
1378 #if !UCONFIG_NO_FORMATTING
1379     UErrorCode errorCode = U_ZERO_ERROR;
1380     int32_t structLocaleCount, currencyCount;
1381     UEnumeration *en = ucurr_openISOCurrencies(UCURR_ALL, &errorCode);
1382     const char *isoCode, *structISOCode;
1383     UResourceBundle *subBundle;
1384     UResourceBundle *currencies = ures_openDirect(loadTestData(&errorCode), "structLocale", &errorCode);
1385     if(U_FAILURE(errorCode)) {
1386         log_data_err("Can't open structLocale\n");
1387         return;
1388     }
1389     currencies = ures_getByKey(currencies, "Currencies", currencies, &errorCode);
1390     currencyCount = uenum_count(en, &errorCode);
1391     structLocaleCount = ures_getSize(currencies);
1392     if (currencyCount != structLocaleCount) {
1393         log_err("structLocale(%d) and ISO4217(%d) currency list are out of sync.\n", structLocaleCount, currencyCount);
1394 #if U_CHARSET_FAMILY == U_ASCII_FAMILY
1395         ures_resetIterator(currencies);
1396         while ((isoCode = uenum_next(en, NULL, &errorCode)) != NULL && ures_hasNext(currencies)) {
1397             subBundle = ures_getNextResource(currencies, NULL, &errorCode);
1398             structISOCode = ures_getKey(subBundle);
1399             ures_close(subBundle);
1400             if (strcmp(structISOCode, isoCode) != 0) {
1401                 log_err("First difference found at structLocale(%s) and ISO4217(%s).\n", structISOCode, isoCode);
1402                 break;
1403             }
1404         }
1405 #endif
1406     }
1407     ures_close(currencies);
1408     uenum_close(en);
1409 #endif
1410 }
1411 #endif
1412 
TestAvailableIsoCodes(void)1413 static void TestAvailableIsoCodes(void){
1414 #if !UCONFIG_NO_FORMATTING
1415     UErrorCode errorCode = U_ZERO_ERROR;
1416     const char* eurCode = "EUR";
1417     const char* usdCode = "USD";
1418     const char* lastCode = "RHD";
1419     const char* zzzCode = "ZZZ";
1420     UDate date1950 = (UDate)-630720000000.0;/* year 1950 */
1421     UDate date1970 = (UDate)0.0;            /* year 1970 */
1422     UDate date1975 = (UDate)173448000000.0; /* year 1975 */
1423     UDate date1978 = (UDate)260172000000.0; /* year 1978 */
1424     UDate date1981 = (UDate)346896000000.0; /* year 1981 */
1425     UDate date1992 = (UDate)693792000000.0; /* year 1992 */
1426     UChar* isoCode = (UChar*)malloc(sizeof(UChar) * (uprv_strlen(usdCode) + 1));
1427 
1428     /* testing available codes with no time ranges */
1429     u_charsToUChars(eurCode, isoCode, uprv_strlen(usdCode) + 1);
1430     if (ucurr_isAvailable(isoCode, U_DATE_MIN, U_DATE_MAX, &errorCode) == FALSE) {
1431        log_data_err("FAIL: ISO code (%s) is not found.\n", eurCode);
1432     }
1433 
1434     u_charsToUChars(usdCode, isoCode, uprv_strlen(zzzCode) + 1);
1435     if (ucurr_isAvailable(isoCode, U_DATE_MIN, U_DATE_MAX, &errorCode) == FALSE) {
1436        log_data_err("FAIL: ISO code (%s) is not found.\n", usdCode);
1437     }
1438 
1439     u_charsToUChars(zzzCode, isoCode, uprv_strlen(zzzCode) + 1);
1440     if (ucurr_isAvailable(isoCode, U_DATE_MIN, U_DATE_MAX, &errorCode) == TRUE) {
1441        log_err("FAIL: ISO code (%s) is reported as available, but it doesn't exist.\n", zzzCode);
1442     }
1443 
1444     u_charsToUChars(lastCode, isoCode, uprv_strlen(zzzCode) + 1);
1445     if (ucurr_isAvailable(isoCode, U_DATE_MIN, U_DATE_MAX, &errorCode) == FALSE) {
1446        log_data_err("FAIL: ISO code (%s) is not found.\n", lastCode);
1447     }
1448 
1449     /* RHD was used from 1970-02-17  to 1980-04-18*/
1450 
1451     /* to = null */
1452     if (ucurr_isAvailable(isoCode, date1970, U_DATE_MAX, &errorCode) == FALSE) {
1453        log_data_err("FAIL: ISO code (%s) was available in time range >1970-01-01.\n", lastCode);
1454     }
1455 
1456     if (ucurr_isAvailable(isoCode, date1975, U_DATE_MAX, &errorCode) == FALSE) {
1457        log_data_err("FAIL: ISO code (%s) was available in time range >1975.\n", lastCode);
1458     }
1459 
1460     if (ucurr_isAvailable(isoCode, date1981, U_DATE_MAX, &errorCode) == TRUE) {
1461        log_err("FAIL: ISO code (%s) was not available in time range >1981.\n", lastCode);
1462     }
1463 
1464     /* from = null */
1465     if (ucurr_isAvailable(isoCode, U_DATE_MIN, date1970, &errorCode) == TRUE) {
1466        log_err("FAIL: ISO code (%s) was not available in time range <1970.\n", lastCode);
1467     }
1468 
1469     if (ucurr_isAvailable(isoCode, U_DATE_MIN, date1975, &errorCode) == FALSE) {
1470        log_data_err("FAIL: ISO code (%s) was available in time range <1975.\n", lastCode);
1471     }
1472 
1473     if (ucurr_isAvailable(isoCode, U_DATE_MIN, date1981, &errorCode) == FALSE) {
1474        log_data_err("FAIL: ISO code (%s) was available in time range <1981.\n", lastCode);
1475     }
1476 
1477     /* full ranges */
1478     if (ucurr_isAvailable(isoCode, date1975, date1978, &errorCode) == FALSE) {
1479        log_data_err("FAIL: ISO code (%s) was available in time range 1975-1978.\n", lastCode);
1480     }
1481 
1482     if (ucurr_isAvailable(isoCode, date1970, date1975, &errorCode) == FALSE) {
1483        log_data_err("FAIL: ISO code (%s) was available in time range 1970-1975.\n", lastCode);
1484     }
1485 
1486     if (ucurr_isAvailable(isoCode, date1975, date1981, &errorCode) == FALSE) {
1487        log_data_err("FAIL: ISO code (%s) was available in time range 1975-1981.\n", lastCode);
1488     }
1489 
1490     if (ucurr_isAvailable(isoCode, date1970,  date1981, &errorCode) == FALSE) {
1491        log_data_err("FAIL: ISO code (%s) was available in time range 1970-1981.\n", lastCode);
1492     }
1493 
1494     if (ucurr_isAvailable(isoCode, date1981,  date1992, &errorCode) == TRUE) {
1495        log_err("FAIL: ISO code (%s) was not available in time range 1981-1992.\n", lastCode);
1496     }
1497 
1498     if (ucurr_isAvailable(isoCode, date1950,  date1970, &errorCode) == TRUE) {
1499        log_err("FAIL: ISO code (%s) was not available in time range 1950-1970.\n", lastCode);
1500     }
1501 
1502     /* wrong range - from > to*/
1503     if (ucurr_isAvailable(isoCode, date1975,  date1970, &errorCode) == TRUE) {
1504        log_err("FAIL: Wrong range 1975-1970 for ISO code (%s) was not reported.\n", lastCode);
1505     } else if (errorCode != U_ILLEGAL_ARGUMENT_ERROR) {
1506        log_data_err("FAIL: Error code not reported for wrong range 1975-1970 for ISO code (%s).\n", lastCode);
1507     }
1508 
1509     free(isoCode);
1510 #endif
1511 }
1512 
1513 #define TESTCASE(name) addTest(root, &name, "tsutil/cldrtest/" #name)
1514 
1515 void addCLDRTest(TestNode** root);
1516 
addCLDRTest(TestNode ** root)1517 void addCLDRTest(TestNode** root)
1518 {
1519 #if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
1520     TESTCASE(TestLocaleStructure);
1521     TESTCASE(TestCurrencyList);
1522 #endif
1523     TESTCASE(TestConsistentCountryInfo);
1524     TESTCASE(VerifyTranslation);
1525     TESTCASE(TestExemplarSet);
1526     TESTCASE(TestLocaleDisplayPattern);
1527     TESTCASE(TestCoverage);
1528     TESTCASE(TestIndexChars);
1529     TESTCASE(TestAvailableIsoCodes);
1530 }
1531 
1532