1 /***********************************************************************
2 * COPYRIGHT:
3 * Copyright (c) 1997-2015, International Business Machines Corporation
4 * and others. All Rights Reserved.
5 ***********************************************************************/
6
7 #include "unicode/utypes.h"
8
9 #if !UCONFIG_NO_FORMATTING
10
11 #include "unicode/datefmt.h"
12 #include "unicode/smpdtfmt.h"
13 #include "unicode/gregocal.h"
14 #include "dtfmtrtts.h"
15 #include "caltest.h"
16 #include "cstring.h"
17
18 #include <stdio.h>
19 #include <string.h>
20
21 // *****************************************************************************
22 // class DateFormatRoundTripTest
23 // *****************************************************************************
24
// Useful for turning up subtle bugs: define INFINITE to a nonzero value (e.g. TRUE),
// recompile, and run while at lunch.
// Warning -- this makes the test run in an infinite loop!!!
28 #ifndef INFINITE
29 #define INFINITE 0
30 #endif
31
32 // Define this to test just a single locale
33 //#define TEST_ONE_LOC "cs_CZ"
34
35 // If SPARSENESS is > 0, we don't run each exhaustive possibility.
36 // There are 24 total possible tests per each locale. A SPARSENESS
37 // of 12 means we run half of them. A SPARSENESS of 23 means we run
38 // 1 of them. SPARSENESS _must_ be in the range 0..23.
// Number of the 24 per-locale style combinations to skip; must stay within 0..23.
int32_t DateFormatRoundTripTest::SPARSENESS = 0;
// Number of randomly generated starting dates tried for each DateFormat under test.
int32_t DateFormatRoundTripTest::TRIALS = 4;
// Maximum number of format/parse iterations per trial while waiting for the
// date and its string form to stop changing.
int32_t DateFormatRoundTripTest::DEPTH = 5;
42
DateFormatRoundTripTest()43 DateFormatRoundTripTest::DateFormatRoundTripTest() : dateFormat(0) {
44 }
45
~DateFormatRoundTripTest()46 DateFormatRoundTripTest::~DateFormatRoundTripTest() {
47 delete dateFormat;
48 }
49
50 #define CASE(id,test) case id: name = #test; if (exec) { logln(#test "---"); logln((UnicodeString)""); test(); } break;
51
52 void
runIndexedTest(int32_t index,UBool exec,const char * & name,char * par)53 DateFormatRoundTripTest::runIndexedTest( int32_t index, UBool exec, const char* &name, char* par )
54 {
55 optionv = (par && *par=='v');
56 switch (index) {
57 CASE(0,TestDateFormatRoundTrip)
58 CASE(1, TestCentury)
59 default: name = ""; break;
60 }
61 }
62
63 UBool
failure(UErrorCode status,const char * msg)64 DateFormatRoundTripTest::failure(UErrorCode status, const char* msg)
65 {
66 if(U_FAILURE(status)) {
67 errln(UnicodeString("FAIL: ") + msg + " failed, error " + u_errorName(status));
68 return TRUE;
69 }
70
71 return FALSE;
72 }
73
74 UBool
failure(UErrorCode status,const char * msg,const UnicodeString & str)75 DateFormatRoundTripTest::failure(UErrorCode status, const char* msg, const UnicodeString& str)
76 {
77 if(U_FAILURE(status)) {
78 UnicodeString escaped;
79 escape(str,escaped);
80 errln(UnicodeString("FAIL: ") + msg + " failed, error " + u_errorName(status) + ", str=" + escaped);
81 return TRUE;
82 }
83
84 return FALSE;
85 }
86
TestCentury()87 void DateFormatRoundTripTest::TestCentury()
88 {
89 UErrorCode status = U_ZERO_ERROR;
90 Locale locale("es_PA");
91 UnicodeString pattern = "MM/dd/yy hh:mm:ss a z";
92 SimpleDateFormat fmt(pattern, locale, status);
93 if (U_FAILURE(status)) {
94 dataerrln("Fail: construct SimpleDateFormat: %s", u_errorName(status));
95 return;
96 }
97 UDate date[] = {-55018555891590.05, 0, 0};
98 UnicodeString result[2];
99
100 fmt.format(date[0], result[0]);
101 date[1] = fmt.parse(result[0], status);
102 fmt.format(date[1], result[1]);
103 date[2] = fmt.parse(result[1], status);
104
105 /* This test case worked OK by accident before. date[1] != date[0],
106 * because we use -80/+20 year window for 2-digit year parsing.
107 * (date[0] is in year 1926, date[1] is in year 2026.) result[1] set
108 * by the first format call returns "07/13/26 07:48:28 p.m. PST",
109 * which is correct, because DST was not used in year 1926 in zone
110 * America/Los_Angeles. When this is parsed, date[1] becomes a time
111 * in 2026, which is "07/13/26 08:48:28 p.m. PDT". There was a zone
112 * offset calculation bug that observed DST in 1926, which was resolved.
113 * Before the bug was resolved, result[0] == result[1] was true,
114 * but after the bug fix, the expected result is actually
115 * result[0] != result[1]. -Yoshito
116 */
117 /* TODO: We need to review this code and clarify what we really
118 * want to test here.
119 */
120 //if (date[1] != date[2] || result[0] != result[1]) {
121 if (date[1] != date[2]) {
122 errln("Round trip failure: \"%S\" (%f), \"%S\" (%f)", result[0].getBuffer(), date[1], result[1].getBuffer(), date[2]);
123 }
124 }
125
126 // ==
127
TestDateFormatRoundTrip()128 void DateFormatRoundTripTest::TestDateFormatRoundTrip()
129 {
130 UErrorCode status = U_ZERO_ERROR;
131
132 getFieldCal = Calendar::createInstance(status);
133 if (U_FAILURE(status)) {
134 dataerrln("Fail: Calendar::createInstance: %s", u_errorName(status));
135 return;
136 }
137
138
139 int32_t locCount = 0;
140 const Locale *avail = DateFormat::getAvailableLocales(locCount);
141 logln("DateFormat available locales: %d", locCount);
142 if(quick) {
143 SPARSENESS = 18;
144 logln("Quick mode: only testing SPARSENESS = 18");
145 }
146 TimeZone *tz = TimeZone::createDefault();
147 UnicodeString temp;
148 logln("Default TimeZone: " + tz->getID(temp));
149 delete tz;
150
151 #ifdef TEST_ONE_LOC // define this to just test ONE locale.
152 Locale loc(TEST_ONE_LOC);
153 test(loc);
154 #if INFINITE
155 for(;;) {
156 test(loc);
157 }
158 #endif
159
160 #else
161 # if INFINITE
162 // Special infinite loop test mode for finding hard to reproduce errors
163 Locale loc = Locale::getDefault();
164 logln("ENTERING INFINITE TEST LOOP FOR Locale: " + loc.getDisplayName(temp));
165 for(;;)
166 test(loc);
167 # else
168 test(Locale::getDefault());
169
170 #if 1
171 // installed locales
172 for (int i=0; i < locCount; ++i) {
173 test(avail[i]);
174 }
175 #endif
176
177 #if 1
178 // special locales
179 int32_t jCount = CalendarTest::testLocaleCount();
180 for (int32_t j=0; j < jCount; ++j) {
181 test(Locale(CalendarTest::testLocaleID(j)));
182 }
183 #endif
184
185 # endif
186 #endif
187
188 delete getFieldCal;
189 }
190
styleName(DateFormat::EStyle s)191 static const char *styleName(DateFormat::EStyle s)
192 {
193 switch(s)
194 {
195 case DateFormat::SHORT: return "SHORT";
196 case DateFormat::MEDIUM: return "MEDIUM";
197 case DateFormat::LONG: return "LONG";
198 case DateFormat::FULL: return "FULL";
199 // case DateFormat::DEFAULT: return "DEFAULT";
200 case DateFormat::DATE_OFFSET: return "DATE_OFFSET";
201 case DateFormat::NONE: return "NONE";
202 case DateFormat::DATE_TIME: return "DATE_TIME";
203 default: return "Unknown";
204 }
205 }
206
test(const Locale & loc)207 void DateFormatRoundTripTest::test(const Locale& loc)
208 {
209 UnicodeString temp;
210 #if !INFINITE
211 logln("Locale: " + loc.getDisplayName(temp));
212 #endif
213
214 // Total possibilities = 24
215 // 4 date
216 // 4 time
217 // 16 date-time
218 UBool TEST_TABLE [24];//= new boolean[24];
219 int32_t i = 0;
220 for(i = 0; i < 24; ++i)
221 TEST_TABLE[i] = TRUE;
222
223 // If we have some sparseness, implement it here. Sparseness decreases
224 // test time by eliminating some tests, up to 23.
225 for(i = 0; i < SPARSENESS; ) {
226 int random = (int)(randFraction() * 24);
227 if (random >= 0 && random < 24 && TEST_TABLE[i]) {
228 TEST_TABLE[i] = FALSE;
229 ++i;
230 }
231 }
232
233 int32_t itable = 0;
234 int32_t style = 0;
235 for(style = DateFormat::FULL; style <= DateFormat::SHORT; ++style) {
236 if(TEST_TABLE[itable++]) {
237 logln("Testing style " + UnicodeString(styleName((DateFormat::EStyle)style)));
238 DateFormat *df = DateFormat::createDateInstance((DateFormat::EStyle)style, loc);
239 if(df == NULL) {
240 errln(UnicodeString("Could not DF::createDateInstance ") + UnicodeString(styleName((DateFormat::EStyle)style)) + " Locale: " + loc.getDisplayName(temp));
241 } else {
242 test(df, loc);
243 delete df;
244 }
245 }
246 }
247
248 for(style = DateFormat::FULL; style <= DateFormat::SHORT; ++style) {
249 if (TEST_TABLE[itable++]) {
250 logln("Testing style " + UnicodeString(styleName((DateFormat::EStyle)style)));
251 DateFormat *df = DateFormat::createTimeInstance((DateFormat::EStyle)style, loc);
252 if(df == NULL) {
253 errln(UnicodeString("Could not DF::createTimeInstance ") + UnicodeString(styleName((DateFormat::EStyle)style)) + " Locale: " + loc.getDisplayName(temp));
254 } else {
255 test(df, loc, TRUE);
256 delete df;
257 }
258 }
259 }
260
261 for(int32_t dstyle = DateFormat::FULL; dstyle <= DateFormat::SHORT; ++dstyle) {
262 for(int32_t tstyle = DateFormat::FULL; tstyle <= DateFormat::SHORT; ++tstyle) {
263 if(TEST_TABLE[itable++]) {
264 logln("Testing dstyle" + UnicodeString(styleName((DateFormat::EStyle)dstyle)) + ", tstyle" + UnicodeString(styleName((DateFormat::EStyle)tstyle)) );
265 DateFormat *df = DateFormat::createDateTimeInstance((DateFormat::EStyle)dstyle, (DateFormat::EStyle)tstyle, loc);
266 if(df == NULL) {
267 dataerrln(UnicodeString("Could not DF::createDateTimeInstance ") + UnicodeString(styleName((DateFormat::EStyle)dstyle)) + ", tstyle" + UnicodeString(styleName((DateFormat::EStyle)tstyle)) + "Locale: " + loc.getDisplayName(temp));
268 } else {
269 test(df, loc);
270 delete df;
271 }
272 }
273 }
274 }
275 }
276
test(DateFormat * fmt,const Locale & origLocale,UBool timeOnly)277 void DateFormatRoundTripTest::test(DateFormat *fmt, const Locale &origLocale, UBool timeOnly)
278 {
279 UnicodeString pat;
280 if(fmt->getDynamicClassID() != SimpleDateFormat::getStaticClassID()) {
281 errln("DateFormat wasn't a SimpleDateFormat");
282 return;
283 }
284
285 UBool isGregorian = FALSE;
286 UErrorCode minStatus = U_ZERO_ERROR;
287 if(fmt->getCalendar() == NULL) {
288 errln((UnicodeString)"DateFormatRoundTripTest::test, DateFormat getCalendar() returns null for " + origLocale.getName());
289 return;
290 }
291 UDate minDate = CalendarTest::minDateOfCalendar(*fmt->getCalendar(), isGregorian, minStatus);
292 if(U_FAILURE(minStatus)) {
293 errln((UnicodeString)"Failure getting min date for " + origLocale.getName());
294 return;
295 }
296 //logln(UnicodeString("Min date is ") + fullFormat(minDate) + " for " + origLocale.getName());
297
298 pat = ((SimpleDateFormat*)fmt)->toPattern(pat);
299
300 // NOTE TO MAINTAINER
301 // This indexOf check into the pattern needs to be refined to ignore
302 // quoted characters. Currently, this isn't a problem with the locale
303 // patterns we have, but it may be a problem later.
304
305 UBool hasEra = (pat.indexOf(UnicodeString("G")) != -1);
306 UBool hasZoneDisplayName = (pat.indexOf(UnicodeString("z")) != -1) || (pat.indexOf(UnicodeString("v")) != -1)
307 || (pat.indexOf(UnicodeString("V")) != -1);
308
309 // Because patterns contain incomplete data representing the Date,
310 // we must be careful of how we do the roundtrip. We start with
311 // a randomly generated Date because they're easier to generate.
312 // From this we get a string. The string is our real starting point,
313 // because this string should parse the same way all the time. Note
314 // that it will not necessarily parse back to the original date because
315 // of incompleteness in patterns. For example, a time-only pattern won't
316 // parse back to the same date.
317
318 //try {
319 for(int i = 0; i < TRIALS; ++i) {
320 UDate *d = new UDate [DEPTH];
321 UnicodeString *s = new UnicodeString[DEPTH];
322
323 if(isGregorian == TRUE) {
324 d[0] = generateDate();
325 } else {
326 d[0] = generateDate(minDate);
327 }
328
329 UErrorCode status = U_ZERO_ERROR;
330
331 // We go through this loop until we achieve a match or until
332 // the maximum loop count is reached. We record the points at
333 // which the date and the string starts to match. Once matching
334 // starts, it should continue.
335 int loop;
336 int dmatch = 0; // d[dmatch].getTime() == d[dmatch-1].getTime()
337 int smatch = 0; // s[smatch].equals(s[smatch-1])
338 for(loop = 0; loop < DEPTH; ++loop) {
339 if (loop > 0) {
340 d[loop] = fmt->parse(s[loop-1], status);
341 failure(status, "fmt->parse", s[loop-1]+" in locale: " + origLocale.getName() + " with pattern: " + pat);
342 status = U_ZERO_ERROR; /* any error would have been reported */
343 }
344
345 s[loop] = fmt->format(d[loop], s[loop]);
346
347 // For displaying which date is being tested
348 //logln(s[loop] + " = " + fullFormat(d[loop]));
349
350 if(s[loop].length() == 0) {
351 errln("FAIL: fmt->format gave 0-length string in " + pat + " with number " + d[loop] + " in locale " + origLocale.getName());
352 }
353
354 if(loop > 0) {
355 if(smatch == 0) {
356 UBool match = s[loop] == s[loop-1];
357 if(smatch == 0) {
358 if(match)
359 smatch = loop;
360 }
361 else if( ! match)
362 errln("FAIL: String mismatch after match");
363 }
364
365 if(dmatch == 0) {
366 // {sfb} watch out here, this might not work
367 UBool match = d[loop]/*.getTime()*/ == d[loop-1]/*.getTime()*/;
368 if(dmatch == 0) {
369 if(match)
370 dmatch = loop;
371 }
372 else if( ! match)
373 errln("FAIL: Date mismatch after match");
374 }
375
376 if(smatch != 0 && dmatch != 0)
377 break;
378 }
379 }
380 // At this point loop == DEPTH if we've failed, otherwise loop is the
381 // max(smatch, dmatch), that is, the index at which we have string and
382 // date matching.
383
384 // Date usually matches in 2. Exceptions handled below.
385 int maxDmatch = 2;
386 int maxSmatch = 1;
387 if (dmatch > maxDmatch) {
388 // Time-only pattern with zone information and a starting date in PST.
389 if(timeOnly && hasZoneDisplayName) {
390 int32_t startRaw, startDst;
391 fmt->getTimeZone().getOffset(d[0], FALSE, startRaw, startDst, status);
392 failure(status, "TimeZone::getOffset");
393 // if the start offset is greater than the offset on Jan 1, 1970
394 // in PST, then need one more round trip. There are two cases
395 // fall into this category. The start date is 1) DST or
396 // 2) LMT (GMT-07:52:58).
397 if (startRaw + startDst > -28800000) {
398 maxDmatch = 3;
399 maxSmatch = 2;
400 }
401 }
402 }
403
404 // String usually matches in 1. Exceptions are checked for here.
405 if(smatch > maxSmatch) { // Don't compute unless necessary
406 UBool in0;
407 // Starts in BC, with no era in pattern
408 if( ! hasEra && getField(d[0], UCAL_ERA) == GregorianCalendar::BC)
409 maxSmatch = 2;
410 // Starts in DST, no year in pattern
411 else if((in0=fmt->getTimeZone().inDaylightTime(d[0], status)) && ! failure(status, "gettingDaylightTime") &&
412 pat.indexOf(UnicodeString("yyyy")) == -1)
413 maxSmatch = 2;
414 // If we start not in DST, but transition into DST
415 else if (!in0 &&
416 fmt->getTimeZone().inDaylightTime(d[1], status) && !failure(status, "gettingDaylightTime"))
417 maxSmatch = 2;
418 // Two digit year with no time zone change,
419 // unless timezone isn't used or we aren't close to the DST changover
420 else if (pat.indexOf(UnicodeString("y")) != -1
421 && pat.indexOf(UnicodeString("yyyy")) == -1
422 && getField(d[0], UCAL_YEAR)
423 != getField(d[dmatch], UCAL_YEAR)
424 && !failure(status, "error status [smatch>maxSmatch]")
425 && ((hasZoneDisplayName
426 && (fmt->getTimeZone().inDaylightTime(d[0], status)
427 == fmt->getTimeZone().inDaylightTime(d[dmatch], status)
428 || getField(d[0], UCAL_MONTH) == UCAL_APRIL
429 || getField(d[0], UCAL_MONTH) == UCAL_OCTOBER))
430 || !hasZoneDisplayName)
431 )
432 {
433 maxSmatch = 2;
434 }
435 // If zone display name is used, fallback format might be used before 1970
436 else if (hasZoneDisplayName && d[0] < 0) {
437 maxSmatch = 2;
438 }
439 else if (timeOnly && !isGregorian && hasZoneDisplayName && maxSmatch == 1) {
440 int32_t startRaw, startDst;
441 fmt->getTimeZone().getOffset(d[1], FALSE, startRaw, startDst, status);
442 failure(status, "TimeZone::getOffset");
443 // If the calendar type is not Gregorian and the pattern is time only,
444 // the calendar implementation may use a date before 1970 as day 0.
445 // In this case, time zone offset of the default year might be
446 // different from the one at 1970-01-01 in PST and string match requires
447 // one more iteration.
448 if (startRaw + startDst != -28800000) {
449 maxSmatch = 2;
450 }
451 }
452 }
453
454 /*
455 * Special case for Japanese and Buddhist (could have large negative years)
456 * Also, Hebrew calendar need help handling leap month.
457 */
458 if(dmatch > maxDmatch || smatch > maxSmatch) {
459 const char *type = fmt->getCalendar()->getType();
460 if(!strcmp(type,"japanese") || (!strcmp(type,"buddhist"))) {
461 maxSmatch = 4;
462 maxDmatch = 4;
463 } else if(!strcmp(type,"hebrew")) {
464 maxSmatch = 3;
465 maxDmatch = 3;
466 }
467 }
468
469 // Use @v to see verbose results on successful cases
470 UBool fail = (dmatch > maxDmatch || smatch > maxSmatch);
471 if (optionv || fail) {
472 if (fail) {
473 errln(UnicodeString("\nFAIL: Pattern: ") + pat +
474 " in Locale: " + origLocale.getName());
475 } else {
476 errln(UnicodeString("\nOk: Pattern: ") + pat +
477 " in Locale: " + origLocale.getName());
478 }
479
480 logln("Date iters until match=%d (max allowed=%d), string iters until match=%d (max allowed=%d)",
481 dmatch,maxDmatch, smatch, maxSmatch);
482
483 for(int j = 0; j <= loop && j < DEPTH; ++j) {
484 UnicodeString temp;
485 FieldPosition pos(FieldPosition::DONT_CARE);
486 errln((j>0?" P> ":" ") + fullFormat(d[j]) + " F> " +
487 escape(s[j], temp) + UnicodeString(" d=") + d[j] +
488 (j > 0 && d[j]/*.getTime()*/==d[j-1]/*.getTime()*/?" d==":"") +
489 (j > 0 && s[j] == s[j-1]?" s==":""));
490 }
491 }
492 delete[] d;
493 delete[] s;
494 }
495 /*}
496 catch (ParseException e) {
497 errln("Exception: " + e.getMessage());
498 logln(e.toString());
499 }*/
500 }
501
fullFormat(UDate d)502 const UnicodeString& DateFormatRoundTripTest::fullFormat(UDate d) {
503 UErrorCode ec = U_ZERO_ERROR;
504 if (dateFormat == 0) {
505 dateFormat = new SimpleDateFormat((UnicodeString)"EEE MMM dd HH:mm:ss.SSS zzz yyyy G", ec);
506 if (U_FAILURE(ec) || dateFormat == 0) {
507 fgStr = "[FAIL: SimpleDateFormat constructor]";
508 delete dateFormat;
509 dateFormat = 0;
510 return fgStr;
511 }
512 }
513 fgStr.truncate(0);
514 dateFormat->format(d, fgStr);
515 return fgStr;
516 }
517
518 /**
519 * Return a field of the given date
520 */
getField(UDate d,int32_t f)521 int32_t DateFormatRoundTripTest::getField(UDate d, int32_t f) {
522 // Should be synchronized, but we're single threaded so it's ok
523 UErrorCode status = U_ZERO_ERROR;
524 getFieldCal->setTime(d, status);
525 failure(status, "getfieldCal->setTime");
526 int32_t ret = getFieldCal->get((UCalendarDateFields)f, status);
527 failure(status, "getfieldCal->get");
528 return ret;
529 }
530
/**
 * Writes an ASCII-only rendering of src into dst: code units below 0x80 are
 * copied as-is, all others are written as "[0x....]" in hexadecimal.
 *
 * @param src text to escape
 * @param dst receives the escaped text; previous contents are discarded
 * @return dst
 */
UnicodeString& DateFormatRoundTripTest::escape(const UnicodeString& src, UnicodeString& dst )
{
    dst.remove();
    for (int32_t pos = 0; pos < src.length(); ++pos) {
        const UChar unit = src[pos];
        if (unit >= 0x0080) {
            // A 16-bit unit prints as at most "0xffff": 6 chars plus NUL.
            char hex [8];
            sprintf(hex, "%#x", unit);
            dst += UnicodeString("[");
            dst += UnicodeString(hex);
            dst += UnicodeString("]");
        } else {
            dst += unit;
        }
    }

    return dst;
}
549
550 #define U_MILLIS_PER_YEAR (365.25 * 24 * 60 * 60 * 1000)
551
generateDate(UDate minDate)552 UDate DateFormatRoundTripTest::generateDate(UDate minDate)
553 {
554 // Bring range in conformance to generateDate() below.
555 if(minDate < (U_MILLIS_PER_YEAR * -(4000-1970))) {
556 minDate = (U_MILLIS_PER_YEAR * -(4000-1970));
557 }
558 for(int i=0;i<8;i++) {
559 double a = randFraction();
560
561 // Range from (min) to (8000-1970) AD
562 double dateRange = (0.0 - minDate) + (U_MILLIS_PER_YEAR + (8000-1970));
563
564 a *= dateRange;
565
566 // Now offset from minDate
567 a += minDate;
568
569 // Last sanity check
570 if(a>=minDate) {
571 return a;
572 }
573 }
574 return minDate;
575 }
576
generateDate()577 UDate DateFormatRoundTripTest::generateDate()
578 {
579 double a = randFraction();
580
581 // Now 'a' ranges from 0..1; scale it to range from 0 to 8000 years
582 a *= 8000;
583
584 // Range from (4000-1970) BC to (8000-1970) AD
585 a -= 4000;
586
587 // Now scale up to ms
588 a *= 365.25 * 24 * 60 * 60 * 1000;
589
590 //return new Date((long)a);
591 return a;
592 }
593
594 #endif /* #if !UCONFIG_NO_FORMATTING */
595
596 //eof
597