1 // © 2019 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 
4 // localematchertest.cpp
5 // created: 2019jul04 Markus W. Scherer
6 
7 #include <string>
8 #include <vector>
9 #include <utility>
10 
11 #include "unicode/utypes.h"
12 #include "unicode/localematcher.h"
13 #include "unicode/locid.h"
14 #include "charstr.h"
15 #include "cmemory.h"
16 #include "intltest.h"
17 #include "localeprioritylist.h"
18 #include "ucbuf.h"
19 
20 #define ARRAY_RANGE(array) (array), ((array) + UPRV_LENGTHOF(array))
21 
22 namespace {
23 
locString(const Locale * loc)24 const char *locString(const Locale *loc) {
25     return loc != nullptr ? loc->getName() : "(null)";
26 }
27 
28 struct TestCase {
29     int32_t lineNr = 0;
30 
31     CharString supported;
32     CharString def;
33     UnicodeString favor;
34     UnicodeString threshold;
35     CharString desired;
36     CharString expMatch;
37     CharString expDesired;
38     CharString expCombined;
39 
reset__anon53c202e20111::TestCase40     void reset() {
41         supported.clear();
42         def.clear();
43         favor.remove();
44         threshold.remove();
45     }
46 };
47 
48 }  // namespace
49 
50 class LocaleMatcherTest : public IntlTest {
51 public:
LocaleMatcherTest()52     LocaleMatcherTest() {}
53 
54     void runIndexedTest(int32_t index, UBool exec, const char *&name, char *par=NULL);
55 
56     void testEmpty();
57     void testCopyErrorTo();
58     void testBasics();
59     void testSupportedDefault();
60     void testUnsupportedDefault();
61     void testNoDefault();
62     void testDemotion();
63     void testDirection();
64     void testMaxDistanceAndIsMatch();
65     void testMatch();
66     void testResolvedLocale();
67     void testDataDriven();
68 
69 private:
70     UBool dataDriven(const TestCase &test, IcuTestErrorCode &errorCode);
71 };
72 
createLocaleMatcherTest()73 extern IntlTest *createLocaleMatcherTest() {
74     return new LocaleMatcherTest();
75 }
76 
runIndexedTest(int32_t index,UBool exec,const char * & name,char *)77 void LocaleMatcherTest::runIndexedTest(int32_t index, UBool exec, const char *&name, char * /*par*/) {
78     if(exec) {
79         logln("TestSuite LocaleMatcherTest: ");
80     }
81     TESTCASE_AUTO_BEGIN;
82     TESTCASE_AUTO(testEmpty);
83     TESTCASE_AUTO(testCopyErrorTo);
84     TESTCASE_AUTO(testBasics);
85     TESTCASE_AUTO(testSupportedDefault);
86     TESTCASE_AUTO(testUnsupportedDefault);
87     TESTCASE_AUTO(testNoDefault);
88     TESTCASE_AUTO(testDemotion);
89     TESTCASE_AUTO(testDirection);
90     TESTCASE_AUTO(testMaxDistanceAndIsMatch);
91     TESTCASE_AUTO(testMatch);
92     TESTCASE_AUTO(testResolvedLocale);
93     TESTCASE_AUTO(testDataDriven);
94     TESTCASE_AUTO_END;
95 }
96 
testEmpty()97 void LocaleMatcherTest::testEmpty() {
98     IcuTestErrorCode errorCode(*this, "testEmpty");
99     LocaleMatcher matcher = LocaleMatcher::Builder().build(errorCode);
100     const Locale *best = matcher.getBestMatch(Locale::getFrench(), errorCode);
101     assertEquals("getBestMatch(fr)", "(null)", locString(best));
102     LocaleMatcher::Result result = matcher.getBestMatchResult("fr", errorCode);
103     assertEquals("getBestMatchResult(fr).des", "(null)", locString(result.getDesiredLocale()));
104     assertEquals("getBestMatchResult(fr).desIndex", -1, result.getDesiredIndex());
105     assertEquals("getBestMatchResult(fr).supp",
106                  "(null)", locString(result.getSupportedLocale()));
107     assertEquals("getBestMatchResult(fr).suppIndex",
108                  -1, result.getSupportedIndex());
109 }
110 
testCopyErrorTo()111 void LocaleMatcherTest::testCopyErrorTo() {
112     IcuTestErrorCode errorCode(*this, "testCopyErrorTo");
113     // The builder does not set any errors except out-of-memory.
114     // Test what we can.
115     LocaleMatcher::Builder builder;
116     UErrorCode success = U_ZERO_ERROR;
117     assertFalse("no error", builder.copyErrorTo(success));
118     assertTrue("still success", U_SUCCESS(success));
119     UErrorCode failure = U_INVALID_FORMAT_ERROR;
120     assertTrue("failure passed in", builder.copyErrorTo(failure));
121     assertEquals("same failure", U_INVALID_FORMAT_ERROR, failure);
122 }
123 
testBasics()124 void LocaleMatcherTest::testBasics() {
125     IcuTestErrorCode errorCode(*this, "testBasics");
126     Locale locales[] = { "fr", "en_GB", "en" };
127     {
128         LocaleMatcher matcher = LocaleMatcher::Builder().
129             setSupportedLocales(ARRAY_RANGE(locales)).build(errorCode);
130         const Locale *best = matcher.getBestMatch("en_GB", errorCode);
131         assertEquals("fromRange.getBestMatch(en_GB)", "en_GB", locString(best));
132         best = matcher.getBestMatch("en_US", errorCode);
133         assertEquals("fromRange.getBestMatch(en_US)", "en", locString(best));
134         best = matcher.getBestMatch("fr_FR", errorCode);
135         assertEquals("fromRange.getBestMatch(fr_FR)", "fr", locString(best));
136         best = matcher.getBestMatch("ja_JP", errorCode);
137         assertEquals("fromRange.getBestMatch(ja_JP)", "fr", locString(best));
138     }
139     // Code coverage: Variations of setting supported locales.
140     {
141         std::vector<Locale> locales{ "fr", "en_GB", "en" };
142         LocaleMatcher matcher = LocaleMatcher::Builder().
143             setSupportedLocales(locales.begin(), locales.end()).build(errorCode);
144         const Locale *best = matcher.getBestMatch("en_GB", errorCode);
145         assertEquals("fromRange.getBestMatch(en_GB)", "en_GB", locString(best));
146         best = matcher.getBestMatch("en_US", errorCode);
147         assertEquals("fromRange.getBestMatch(en_US)", "en", locString(best));
148         best = matcher.getBestMatch("fr_FR", errorCode);
149         assertEquals("fromRange.getBestMatch(fr_FR)", "fr", locString(best));
150         best = matcher.getBestMatch("ja_JP", errorCode);
151         assertEquals("fromRange.getBestMatch(ja_JP)", "fr", locString(best));
152     }
153     {
154         Locale::RangeIterator<Locale *> iter(ARRAY_RANGE(locales));
155         LocaleMatcher matcher = LocaleMatcher::Builder().
156             setSupportedLocales(iter).build(errorCode);
157         const Locale *best = matcher.getBestMatch("en_GB", errorCode);
158         assertEquals("fromIter.getBestMatch(en_GB)", "en_GB", locString(best));
159         best = matcher.getBestMatch("en_US", errorCode);
160         assertEquals("fromIter.getBestMatch(en_US)", "en", locString(best));
161         best = matcher.getBestMatch("fr_FR", errorCode);
162         assertEquals("fromIter.getBestMatch(fr_FR)", "fr", locString(best));
163         best = matcher.getBestMatch("ja_JP", errorCode);
164         assertEquals("fromIter.getBestMatch(ja_JP)", "fr", locString(best));
165     }
166     {
167         Locale *pointers[] = { locales, locales + 1, locales + 2 };
168         // Lambda with explicit reference return type to prevent copy-constructing a temporary
169         // which would be destructed right away.
170         LocaleMatcher matcher = LocaleMatcher::Builder().
171             setSupportedLocalesViaConverter(
172                 ARRAY_RANGE(pointers), [](const Locale *p) -> const Locale & { return *p; }).
173             build(errorCode);
174         const Locale *best = matcher.getBestMatch("en_GB", errorCode);
175         assertEquals("viaConverter.getBestMatch(en_GB)", "en_GB", locString(best));
176         best = matcher.getBestMatch("en_US", errorCode);
177         assertEquals("viaConverter.getBestMatch(en_US)", "en", locString(best));
178         best = matcher.getBestMatch("fr_FR", errorCode);
179         assertEquals("viaConverter.getBestMatch(fr_FR)", "fr", locString(best));
180         best = matcher.getBestMatch("ja_JP", errorCode);
181         assertEquals("viaConverter.getBestMatch(ja_JP)", "fr", locString(best));
182     }
183     {
184         LocaleMatcher matcher = LocaleMatcher::Builder().
185             addSupportedLocale(locales[0]).
186             addSupportedLocale(locales[1]).
187             addSupportedLocale(locales[2]).
188             build(errorCode);
189         const Locale *best = matcher.getBestMatch("en_GB", errorCode);
190         assertEquals("added.getBestMatch(en_GB)", "en_GB", locString(best));
191         best = matcher.getBestMatch("en_US", errorCode);
192         assertEquals("added.getBestMatch(en_US)", "en", locString(best));
193         best = matcher.getBestMatch("fr_FR", errorCode);
194         assertEquals("added.getBestMatch(fr_FR)", "fr", locString(best));
195         best = matcher.getBestMatch("ja_JP", errorCode);
196         assertEquals("added.getBestMatch(ja_JP)", "fr", locString(best));
197     }
198     {
199         LocaleMatcher matcher = LocaleMatcher::Builder().
200             setSupportedLocalesFromListString(
201                 " el, fr;q=0.555555, en-GB ; q = 0.88  , el; q =0, en;q=0.88 , fr ").
202             build(errorCode);
203         const Locale *best = matcher.getBestMatchForListString("el, fr, fr;q=0, en-GB", errorCode);
204         assertEquals("fromList.getBestMatch(en_GB)", "en_GB", locString(best));
205         best = matcher.getBestMatch("en_US", errorCode);
206         assertEquals("fromList.getBestMatch(en_US)", "en", locString(best));
207         best = matcher.getBestMatch("fr_FR", errorCode);
208         assertEquals("fromList.getBestMatch(fr_FR)", "fr", locString(best));
209         best = matcher.getBestMatch("ja_JP", errorCode);
210         assertEquals("fromList.getBestMatch(ja_JP)", "fr", locString(best));
211     }
212     // more API coverage
213     {
214         LocalePriorityList list("fr, en-GB", errorCode);
215         LocalePriorityList::Iterator iter(list.iterator());
216         LocaleMatcher matcher = LocaleMatcher::Builder().
217             setSupportedLocales(iter).
218             addSupportedLocale(Locale::getEnglish()).
219             setDefaultLocale(&Locale::getGerman()).
220             build(errorCode);
221         const Locale *best = matcher.getBestMatch("en_GB", errorCode);
222         assertEquals("withDefault.getBestMatch(en_GB)", "en_GB", locString(best));
223         best = matcher.getBestMatch("en_US", errorCode);
224         assertEquals("withDefault.getBestMatch(en_US)", "en", locString(best));
225         best = matcher.getBestMatch("fr_FR", errorCode);
226         assertEquals("withDefault.getBestMatch(fr_FR)", "fr", locString(best));
227         best = matcher.getBestMatch("ja_JP", errorCode);
228         assertEquals("withDefault.getBestMatch(ja_JP)", "de", locString(best));
229 
230         Locale desired("en_GB");  // distinct object from Locale.UK
231         LocaleMatcher::Result result = matcher.getBestMatchResult(desired, errorCode);
232         assertTrue("withDefault: exactly desired en-GB object",
233                    &desired == result.getDesiredLocale());
234         assertEquals("withDefault: en-GB desired index", 0, result.getDesiredIndex());
235         assertEquals("withDefault: en-GB supported",
236                      "en_GB", locString(result.getSupportedLocale()));
237         assertEquals("withDefault: en-GB supported index", 1, result.getSupportedIndex());
238 
239         LocalePriorityList list2("ja-JP, en-US", errorCode);
240         LocalePriorityList::Iterator iter2(list2.iterator());
241         result = matcher.getBestMatchResult(iter2, errorCode);
242         assertEquals("withDefault: ja-JP, en-US desired index", 1, result.getDesiredIndex());
243         assertEquals("withDefault: ja-JP, en-US desired",
244                      "en_US", locString(result.getDesiredLocale()));
245 
246         desired = Locale("en", "US");  // distinct object from Locale.US
247         result = matcher.getBestMatchResult(desired, errorCode);
248         assertTrue("withDefault: exactly desired en-US object",
249                    &desired == result.getDesiredLocale());
250         assertEquals("withDefault: en-US desired index", 0, result.getDesiredIndex());
251         assertEquals("withDefault: en-US supported", "en", locString(result.getSupportedLocale()));
252         assertEquals("withDefault: en-US supported index", 2, result.getSupportedIndex());
253 
254         result = matcher.getBestMatchResult("ja_JP", errorCode);
255         assertEquals("withDefault: ja-JP desired", "(null)", locString(result.getDesiredLocale()));
256         assertEquals("withDefault: ja-JP desired index", -1, result.getDesiredIndex());
257         assertEquals("withDefault: ja-JP supported", "de", locString(result.getSupportedLocale()));
258         assertEquals("withDefault: ja-JP supported index", -1, result.getSupportedIndex());
259     }
260 }
261 
testSupportedDefault()262 void LocaleMatcherTest::testSupportedDefault() {
263     // The default locale is one of the supported locales.
264     IcuTestErrorCode errorCode(*this, "testSupportedDefault");
265     Locale locales[] = { "fr", "en_GB", "en" };
266     LocaleMatcher matcher = LocaleMatcher::Builder().
267         setSupportedLocales(ARRAY_RANGE(locales)).
268         setDefaultLocale(&locales[1]).
269         build(errorCode);
270     const Locale *best = matcher.getBestMatch("en_GB", errorCode);
271     assertEquals("getBestMatch(en_GB)", "en_GB", locString(best));
272     best = matcher.getBestMatch("en_US", errorCode);
273     assertEquals("getBestMatch(en_US)", "en", locString(best));
274     best = matcher.getBestMatch("fr_FR", errorCode);
275     assertEquals("getBestMatch(fr_FR)", "fr", locString(best));
276     best = matcher.getBestMatch("ja_JP", errorCode);
277     assertEquals("getBestMatch(ja_JP)", "en_GB", locString(best));
278     LocaleMatcher::Result result = matcher.getBestMatchResult("ja_JP", errorCode);
279     assertEquals("getBestMatchResult(ja_JP).supp",
280                  "en_GB", locString(result.getSupportedLocale()));
281     assertEquals("getBestMatchResult(ja_JP).suppIndex",
282                  -1, result.getSupportedIndex());
283 }
284 
testUnsupportedDefault()285 void LocaleMatcherTest::testUnsupportedDefault() {
286     // The default locale does not match any of the supported locales.
287     IcuTestErrorCode errorCode(*this, "testUnsupportedDefault");
288     Locale locales[] = { "fr", "en_GB", "en" };
289     Locale def("de");
290     LocaleMatcher matcher = LocaleMatcher::Builder().
291         setSupportedLocales(ARRAY_RANGE(locales)).
292         setDefaultLocale(&def).
293         build(errorCode);
294     const Locale *best = matcher.getBestMatch("en_GB", errorCode);
295     assertEquals("getBestMatch(en_GB)", "en_GB", locString(best));
296     best = matcher.getBestMatch("en_US", errorCode);
297     assertEquals("getBestMatch(en_US)", "en", locString(best));
298     best = matcher.getBestMatch("fr_FR", errorCode);
299     assertEquals("getBestMatch(fr_FR)", "fr", locString(best));
300     best = matcher.getBestMatch("ja_JP", errorCode);
301     assertEquals("getBestMatch(ja_JP)", "de", locString(best));
302     LocaleMatcher::Result result = matcher.getBestMatchResult("ja_JP", errorCode);
303     assertEquals("getBestMatchResult(ja_JP).supp",
304                  "de", locString(result.getSupportedLocale()));
305     assertEquals("getBestMatchResult(ja_JP).suppIndex",
306                  -1, result.getSupportedIndex());
307 }
308 
testNoDefault()309 void LocaleMatcherTest::testNoDefault() {
310     // We want nullptr instead of any default locale.
311     IcuTestErrorCode errorCode(*this, "testNoDefault");
312     Locale locales[] = { "fr", "en_GB", "en" };
313     LocaleMatcher matcher = LocaleMatcher::Builder().
314         setSupportedLocales(ARRAY_RANGE(locales)).
315         setNoDefaultLocale().
316         build(errorCode);
317     const Locale *best = matcher.getBestMatch("en_GB", errorCode);
318     assertEquals("getBestMatch(en_GB)", "en_GB", locString(best));
319     best = matcher.getBestMatch("en_US", errorCode);
320     assertEquals("getBestMatch(en_US)", "en", locString(best));
321     best = matcher.getBestMatch("fr_FR", errorCode);
322     assertEquals("getBestMatch(fr_FR)", "fr", locString(best));
323     best = matcher.getBestMatch("ja_JP", errorCode);
324     assertEquals("getBestMatch(ja_JP)", "(null)", locString(best));
325     LocaleMatcher::Result result = matcher.getBestMatchResult("ja_JP", errorCode);
326     assertEquals("getBestMatchResult(ja_JP).supp",
327                  "(null)", locString(result.getSupportedLocale()));
328     assertEquals("getBestMatchResult(ja_JP).suppIndex",
329                  -1, result.getSupportedIndex());
330 }
331 
testDemotion()332 void LocaleMatcherTest::testDemotion() {
333     IcuTestErrorCode errorCode(*this, "testDemotion");
334     Locale supported[] = { "fr", "de-CH", "it" };
335     Locale desired[] = { "fr-CH", "de-CH", "it" };
336     {
337         LocaleMatcher noDemotion = LocaleMatcher::Builder().
338             setSupportedLocales(ARRAY_RANGE(supported)).
339             setDemotionPerDesiredLocale(ULOCMATCH_DEMOTION_NONE).build(errorCode);
340         Locale::RangeIterator<Locale *> desiredIter(ARRAY_RANGE(desired));
341         assertEquals("no demotion",
342                      "de_CH", locString(noDemotion.getBestMatch(desiredIter, errorCode)));
343     }
344 
345     {
346         LocaleMatcher regionDemotion = LocaleMatcher::Builder().
347             setSupportedLocales(ARRAY_RANGE(supported)).
348             setDemotionPerDesiredLocale(ULOCMATCH_DEMOTION_REGION).build(errorCode);
349         Locale::RangeIterator<Locale *> desiredIter(ARRAY_RANGE(desired));
350         assertEquals("region demotion",
351                      "fr", locString(regionDemotion.getBestMatch(desiredIter, errorCode)));
352     }
353 }
354 
testDirection()355 void LocaleMatcherTest::testDirection() {
356     IcuTestErrorCode errorCode(*this, "testDirection");
357     Locale supported[] = { "ar", "nn" };
358     Locale desired[] = { "arz-EG", "nb-DK" };
359     LocaleMatcher::Builder builder;
360     builder.setSupportedLocales(ARRAY_RANGE(supported));
361     {
362         // arz is a close one-way match to ar, and the region matches.
363         // (Egyptian Arabic vs. Arabic)
364         // Also explicitly exercise the move copy constructor.
365         LocaleMatcher built = builder.build(errorCode);
366         LocaleMatcher withOneWay(std::move(built));
367         Locale::RangeIterator<Locale *> desiredIter(ARRAY_RANGE(desired));
368         assertEquals("with one-way", "ar",
369                      locString(withOneWay.getBestMatch(desiredIter, errorCode)));
370     }
371     {
372         // nb is a less close two-way match to nn, and the regions differ.
373         // (Norwegian Bokmal vs. Nynorsk)
374         // Also explicitly exercise the move assignment operator.
375         LocaleMatcher onlyTwoWay = builder.build(errorCode);
376         LocaleMatcher built =
377             builder.setDirection(ULOCMATCH_DIRECTION_ONLY_TWO_WAY).build(errorCode);
378         onlyTwoWay = std::move(built);
379         Locale::RangeIterator<Locale *> desiredIter(ARRAY_RANGE(desired));
380         assertEquals("only two-way", "nn",
381                      locString(onlyTwoWay.getBestMatch(desiredIter, errorCode)));
382     }
383 }
384 
testMaxDistanceAndIsMatch()385 void LocaleMatcherTest::testMaxDistanceAndIsMatch() {
386     IcuTestErrorCode errorCode(*this, "testMaxDistanceAndIsMatch");
387     LocaleMatcher::Builder builder;
388     LocaleMatcher standard = builder.build(errorCode);
389     Locale germanLux("de-LU");
390     Locale germanPhoenician("de-Phnx-AT");
391     Locale greek("el");
392     assertTrue("standard de-LU / de", standard.isMatch(germanLux, Locale::getGerman(), errorCode));
393     assertFalse("standard de-Phnx-AT / de",
394                 standard.isMatch(germanPhoenician, Locale::getGerman(), errorCode));
395 
396     // Allow a script difference to still match.
397     LocaleMatcher loose =
398         builder.setMaxDistance(germanPhoenician, Locale::getGerman()).build(errorCode);
399     assertTrue("loose de-LU / de", loose.isMatch(germanLux, Locale::getGerman(), errorCode));
400     assertTrue("loose de-Phnx-AT / de",
401                loose.isMatch(germanPhoenician, Locale::getGerman(), errorCode));
402     assertFalse("loose el / de", loose.isMatch(greek, Locale::getGerman(), errorCode));
403 
404     // Allow at most a regional difference.
405     LocaleMatcher regional =
406         builder.setMaxDistance(Locale("de-AT"), Locale::getGerman()).build(errorCode);
407     assertTrue("regional de-LU / de",
408                regional.isMatch(Locale("de-LU"), Locale::getGerman(), errorCode));
409     assertFalse("regional da / no", regional.isMatch(Locale("da"), Locale("no"), errorCode));
410     assertFalse("regional zh-Hant / zh",
411                 regional.isMatch(Locale::getChinese(), Locale::getTraditionalChinese(), errorCode));
412 }
413 
414 
testMatch()415 void LocaleMatcherTest::testMatch() {
416     IcuTestErrorCode errorCode(*this, "testMatch");
417     LocaleMatcher matcher = LocaleMatcher::Builder().build(errorCode);
418 
419     // Java test function testMatch_exact()
420     Locale en_CA("en_CA");
421     assertEquals("exact match", 1.0, matcher.internalMatch(en_CA, en_CA, errorCode));
422 
423     // testMatch_none
424     Locale ar_MK("ar_MK");
425     double match = matcher.internalMatch(ar_MK, en_CA, errorCode);
426     assertTrue("mismatch: 0<=match<0.2", 0 <= match && match < 0.2);
427 
428     // testMatch_matchOnMaximized
429     Locale und_TW("und_TW");
430     Locale zh("zh");
431     Locale zh_Hant("zh_Hant");
432     double matchZh = matcher.internalMatch(und_TW, zh, errorCode);
433     double matchZhHant = matcher.internalMatch(und_TW, zh_Hant, errorCode);
434     assertTrue("und_TW should be closer to zh_Hant than to zh",
435                matchZh < matchZhHant);
436     Locale en_Hant_TW("en_Hant_TW");
437     double matchEnHantTw = matcher.internalMatch(en_Hant_TW, zh_Hant, errorCode);
438     assertTrue("zh_Hant should be closer to und_TW than to en_Hant_TW",
439                matchEnHantTw < matchZhHant);
440     assertTrue("zh should be closer to und_TW than to en_Hant_TW",
441                matchEnHantTw < matchZh);
442 }
443 
testResolvedLocale()444 void LocaleMatcherTest::testResolvedLocale() {
445     IcuTestErrorCode errorCode(*this, "testResolvedLocale");
446     LocaleMatcher matcher = LocaleMatcher::Builder().
447         addSupportedLocale("ar-EG").
448         build(errorCode);
449     Locale desired("ar-SA-u-nu-latn");
450     LocaleMatcher::Result result = matcher.getBestMatchResult(desired, errorCode);
451     assertEquals("best", "ar_EG", locString(result.getSupportedLocale()));
452     Locale resolved = result.makeResolvedLocale(errorCode);
453     assertEquals("ar-EG + ar-SA-u-nu-latn = ar-SA-u-nu-latn",
454                  "ar-SA-u-nu-latn",
455                  resolved.toLanguageTag<std::string>(errorCode).data());
456 }
457 
458 namespace {
459 
toInvariant(const UnicodeString & s,CharString & inv,ErrorCode & errorCode)460 bool toInvariant(const UnicodeString &s, CharString &inv, ErrorCode &errorCode) {
461     if (errorCode.isSuccess()) {
462         inv.clear().appendInvariantChars(s, errorCode);
463         return errorCode.isSuccess();
464     }
465     return false;
466 }
467 
getSuffixAfterPrefix(const UnicodeString & s,int32_t limit,const UnicodeString & prefix,UnicodeString & suffix)468 bool getSuffixAfterPrefix(const UnicodeString &s, int32_t limit,
469                           const UnicodeString &prefix, UnicodeString &suffix) {
470     if (prefix.length() <= limit && s.startsWith(prefix)) {
471         suffix.setTo(s, prefix.length(), limit - prefix.length());
472         return true;
473     } else {
474         return false;
475     }
476 }
477 
getInvariantSuffixAfterPrefix(const UnicodeString & s,int32_t limit,const UnicodeString & prefix,CharString & suffix,ErrorCode & errorCode)478 bool getInvariantSuffixAfterPrefix(const UnicodeString &s, int32_t limit,
479                                    const UnicodeString &prefix, CharString &suffix,
480                                    ErrorCode &errorCode) {
481     UnicodeString u_suffix;
482     return getSuffixAfterPrefix(s, limit, prefix, u_suffix) &&
483         toInvariant(u_suffix, suffix, errorCode);
484 }
485 
readTestCase(const UnicodeString & line,TestCase & test,IcuTestErrorCode & errorCode)486 bool readTestCase(const UnicodeString &line, TestCase &test, IcuTestErrorCode &errorCode) {
487     if (errorCode.isFailure()) { return false; }
488     ++test.lineNr;
489     // Start of comment, or end of line, minus trailing spaces.
490     int32_t limit = line.indexOf(u'#');
491     if (limit < 0) {
492         limit = line.length();
493         // Remove trailing CR LF.
494         char16_t c;
495         while (limit > 0 && ((c = line.charAt(limit - 1)) == u'\n' || c == u'\r')) {
496             --limit;
497         }
498     }
499     // Remove spaces before comment or at the end of the line.
500     char16_t c;
501     while (limit > 0 && ((c = line.charAt(limit - 1)) == u' ' || c == u'\t')) {
502         --limit;
503     }
504     if (limit == 0) {  // empty line
505         return false;
506     }
507     if (line.startsWith(u"** test: ")) {
508         test.reset();
509     } else if (getInvariantSuffixAfterPrefix(line, limit, u"@supported=",
510                                              test.supported, errorCode)) {
511     } else if (getInvariantSuffixAfterPrefix(line, limit, u"@default=",
512                                              test.def, errorCode)) {
513     } else if (getSuffixAfterPrefix(line, limit, u"@favor=", test.favor)) {
514     } else if (getSuffixAfterPrefix(line, limit, u"@threshold=", test.threshold)) {
515     } else {
516         int32_t matchSep = line.indexOf(u">>");
517         // >> before an inline comment, and followed by more than white space.
518         if (0 <= matchSep && (matchSep + 2) < limit) {
519             toInvariant(line.tempSubStringBetween(0, matchSep).trim(), test.desired, errorCode);
520             test.expDesired.clear();
521             test.expCombined.clear();
522             int32_t start = matchSep + 2;
523             int32_t expLimit = line.indexOf(u'|', start);
524             if (expLimit < 0) {
525                 toInvariant(line.tempSubStringBetween(start, limit).trim(),
526                             test.expMatch, errorCode);
527             } else {
528                 toInvariant(line.tempSubStringBetween(start, expLimit).trim(),
529                             test.expMatch, errorCode);
530                 start = expLimit + 1;
531                 expLimit = line.indexOf(u'|', start);
532                 if (expLimit < 0) {
533                     toInvariant(line.tempSubStringBetween(start, limit).trim(),
534                                 test.expDesired, errorCode);
535                 } else {
536                     toInvariant(line.tempSubStringBetween(start, expLimit).trim(),
537                                 test.expDesired, errorCode);
538                     toInvariant(line.tempSubStringBetween(expLimit + 1, limit).trim(),
539                                 test.expCombined, errorCode);
540                 }
541             }
542             return errorCode.isSuccess();
543         } else {
544             errorCode.set(U_INVALID_FORMAT_ERROR);
545         }
546     }
547     return false;
548 }
549 
getLocaleOrNull(const CharString & s,Locale & locale)550 Locale *getLocaleOrNull(const CharString &s, Locale &locale) {
551     if (s == "null") {
552         return nullptr;
553     } else {
554         return &(locale = Locale(s.data()));
555     }
556 }
557 
558 }  // namespace
559 
dataDriven(const TestCase & test,IcuTestErrorCode & errorCode)560 UBool LocaleMatcherTest::dataDriven(const TestCase &test, IcuTestErrorCode &errorCode) {
561     LocaleMatcher::Builder builder;
562     builder.setSupportedLocalesFromListString(test.supported.toStringPiece());
563     if (!test.def.isEmpty()) {
564         Locale defaultLocale(test.def.data());
565         builder.setDefaultLocale(&defaultLocale);
566     }
567     if (!test.favor.isEmpty()) {
568         ULocMatchFavorSubtag favor;
569         if (test.favor == u"normal") {
570             favor = ULOCMATCH_FAVOR_LANGUAGE;
571         } else if (test.favor == u"script") {
572             favor = ULOCMATCH_FAVOR_SCRIPT;
573         } else {
574             errln(UnicodeString(u"unsupported FavorSubtag value ") + test.favor);
575             return FALSE;
576         }
577         builder.setFavorSubtag(favor);
578     }
579     if (!test.threshold.isEmpty()) {
580         infoln("skipping test case on line %d with non-default threshold: not exposed via API",
581                (int)test.lineNr);
582         return TRUE;
583         // int32_t threshold = Integer.valueOf(test.threshold);
584         // builder.internalSetThresholdDistance(threshold);
585     }
586     LocaleMatcher matcher = builder.build(errorCode);
587     if (errorCode.errIfFailureAndReset("LocaleMatcher::Builder::build()")) {
588         return FALSE;
589     }
590 
591     Locale expMatchLocale("");
592     Locale *expMatch = getLocaleOrNull(test.expMatch, expMatchLocale);
593     if (test.expDesired.isEmpty() && test.expCombined.isEmpty()) {
594         StringPiece desiredSP = test.desired.toStringPiece();
595         const Locale *bestSupported = matcher.getBestMatchForListString(desiredSP, errorCode);
596         if (!assertEquals("bestSupported from string",
597                           locString(expMatch), locString(bestSupported))) {
598             return FALSE;
599         }
600         LocalePriorityList desired(test.desired.toStringPiece(), errorCode);
601         LocalePriorityList::Iterator desiredIter = desired.iterator();
602         if (desired.getLength() == 1) {
603             const Locale &desiredLocale = desiredIter.next();
604             bestSupported = matcher.getBestMatch(desiredLocale, errorCode);
605             UBool ok = assertEquals("bestSupported from Locale",
606                                     locString(expMatch), locString(bestSupported));
607 
608             LocaleMatcher::Result result = matcher.getBestMatchResult(desiredLocale, errorCode);
609             return ok & assertEquals("result.getSupportedLocale from Locale",
610                                      locString(expMatch), locString(result.getSupportedLocale()));
611         } else {
612             bestSupported = matcher.getBestMatch(desiredIter, errorCode);
613             return assertEquals("bestSupported from Locale iterator",
614                                 locString(expMatch), locString(bestSupported));
615         }
616     } else {
617         LocalePriorityList desired(test.desired.toStringPiece(), errorCode);
618         LocalePriorityList::Iterator desiredIter = desired.iterator();
619         LocaleMatcher::Result result = matcher.getBestMatchResult(desiredIter, errorCode);
620         UBool ok = assertEquals("result.getSupportedLocale from Locales",
621                                 locString(expMatch), locString(result.getSupportedLocale()));
622         if (!test.expDesired.isEmpty()) {
623             Locale expDesiredLocale("");
624             Locale *expDesired = getLocaleOrNull(test.expDesired, expDesiredLocale);
625             ok &= assertEquals("result.getDesiredLocale from Locales",
626                                locString(expDesired), locString(result.getDesiredLocale()));
627         }
628         if (!test.expCombined.isEmpty()) {
629             if (test.expMatch.contains("-u-")) {
630                 logKnownIssue("20727",
631                               UnicodeString(u"ignoring makeResolvedLocale() line ") + test.lineNr);
632                 return ok;
633             }
634             Locale expCombinedLocale("");
635             Locale *expCombined = getLocaleOrNull(test.expCombined, expCombinedLocale);
636             Locale combined = result.makeResolvedLocale(errorCode);
637             ok &= assertEquals("combined Locale from Locales",
638                                locString(expCombined), locString(&combined));
639         }
640         return ok;
641     }
642 }
643 
testDataDriven()644 void LocaleMatcherTest::testDataDriven() {
645     IcuTestErrorCode errorCode(*this, "testDataDriven");
646     CharString path(getSourceTestData(errorCode), errorCode);
647     path.appendPathPart("localeMatcherTest.txt", errorCode);
648     const char *codePage = "UTF-8";
649     LocalUCHARBUFPointer f(ucbuf_open(path.data(), &codePage, TRUE, FALSE, errorCode));
650     if(errorCode.errIfFailureAndReset("ucbuf_open(localeMatcherTest.txt)")) {
651         return;
652     }
653     int32_t lineLength;
654     const UChar *p;
655     UnicodeString line;
656     TestCase test;
657     int32_t numPassed = 0;
658     while ((p = ucbuf_readline(f.getAlias(), &lineLength, errorCode)) != nullptr &&
659             errorCode.isSuccess()) {
660         line.setTo(FALSE, p, lineLength);
661         if (!readTestCase(line, test, errorCode)) {
662             if (errorCode.errIfFailureAndReset(
663                     "test data syntax error on line %d", (int)test.lineNr)) {
664                 infoln(line);
665             }
666             continue;
667         }
668         UBool ok = dataDriven(test, errorCode);
669         if (errorCode.errIfFailureAndReset("test error on line %d", (int)test.lineNr)) {
670             infoln(line);
671         } else if (!ok) {
672             infoln("test failure on line %d", (int)test.lineNr);
673             infoln(line);
674         } else {
675             ++numPassed;
676         }
677     }
678     infoln("number of passing test cases: %d", (int)numPassed);
679 }
680