1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 *******************************************************************************
5 * Copyright (C) 2011-2015, International Business Machines Corporation and
6 * others. All Rights Reserved.
7 *******************************************************************************
8 */
9 
10 #include "unicode/utypes.h"
11 
12 #if !UCONFIG_NO_FORMATTING
13 
14 #include "unicode/calendar.h"
15 #include "unicode/tzfmt.h"
16 #include "unicode/numsys.h"
17 #include "unicode/strenum.h"
18 #include "unicode/uchar.h"
19 #include "unicode/udat.h"
20 #include "unicode/ustring.h"
21 #include "unicode/utf16.h"
22 #include "tzgnames.h"
23 #include "cmemory.h"
24 #include "cstring.h"
25 #include "putilimp.h"
26 #include "uassert.h"
27 #include "ucln_in.h"
28 #include "umutex.h"
29 #include "uresimp.h"
30 #include "ureslocs.h"
31 #include "uvector.h"
32 #include "zonemeta.h"
33 #include "tznames_impl.h"   // TextTrieMap
34 #include "patternprops.h"
35 
36 U_NAMESPACE_BEGIN
37 
// Bit flags used by the parse method, one table entry per
// UTimeZoneFormatStyle value. The table is indexed by the enum value, so the
// entry order must match the UTimeZoneFormatStyle enum.
// All ISO 8601 styles map onto one of the two shared ISO_* flags below.
#define ISO_Z_STYLE_FLAG 0x0080
#define ISO_LOCAL_STYLE_FLAG 0x0100
static const int16_t STYLE_PARSE_FLAGS[] = {
    1 << 0,                 // UTZFMT_STYLE_GENERIC_LOCATION
    1 << 1,                 // UTZFMT_STYLE_GENERIC_LONG
    1 << 2,                 // UTZFMT_STYLE_GENERIC_SHORT
    1 << 3,                 // UTZFMT_STYLE_SPECIFIC_LONG
    1 << 4,                 // UTZFMT_STYLE_SPECIFIC_SHORT
    1 << 5,                 // UTZFMT_STYLE_LOCALIZED_GMT
    1 << 6,                 // UTZFMT_STYLE_LOCALIZED_GMT_SHORT
    ISO_Z_STYLE_FLAG,       // UTZFMT_STYLE_ISO_BASIC_SHORT
    ISO_LOCAL_STYLE_FLAG,   // UTZFMT_STYLE_ISO_BASIC_LOCAL_SHORT
    ISO_Z_STYLE_FLAG,       // UTZFMT_STYLE_ISO_BASIC_FIXED
    ISO_LOCAL_STYLE_FLAG,   // UTZFMT_STYLE_ISO_BASIC_LOCAL_FIXED
    ISO_Z_STYLE_FLAG,       // UTZFMT_STYLE_ISO_BASIC_FULL
    ISO_LOCAL_STYLE_FLAG,   // UTZFMT_STYLE_ISO_BASIC_LOCAL_FULL
    ISO_Z_STYLE_FLAG,       // UTZFMT_STYLE_ISO_EXTENDED_FIXED
    ISO_LOCAL_STYLE_FLAG,   // UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FIXED
    ISO_Z_STYLE_FLAG,       // UTZFMT_STYLE_ISO_EXTENDED_FULL
    ISO_LOCAL_STYLE_FLAG,   // UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FULL
    1 << 9,                 // UTZFMT_STYLE_ZONE_ID
    1 << 10,                // UTZFMT_STYLE_ZONE_ID_SHORT
    1 << 11                 // UTZFMT_STYLE_EXEMPLAR_LOCATION
};
64 
65 static const char gZoneStringsTag[] = "zoneStrings";
66 static const char gGmtFormatTag[]= "gmtFormat";
67 static const char gGmtZeroFormatTag[] = "gmtZeroFormat";
68 static const char gHourFormatTag[]= "hourFormat";
69 
70 static const UChar TZID_GMT[] = {0x0045, 0x0074, 0x0063, 0x002F, 0x0047, 0x004D, 0x0054, 0};    // Etc/GMT
71 static const UChar UNKNOWN_ZONE_ID[] = {
72     0x0045, 0x0074, 0x0063, 0x002F, 0x0055, 0x006E, 0x006B, 0x006E, 0x006F, 0x0077, 0x006E, 0}; // Etc/Unknown
73 static const UChar UNKNOWN_SHORT_ZONE_ID[] = {0x0075, 0x006E, 0x006B, 0};   // unk
74 static const UChar UNKNOWN_LOCATION[] = {0x0055, 0x006E, 0x006B, 0x006E, 0x006F, 0x0077, 0x006E, 0};    // Unknown
75 
76 static const UChar DEFAULT_GMT_PATTERN[] = {0x0047, 0x004D, 0x0054, 0x007B, 0x0030, 0x007D, 0}; // GMT{0}
77 //static const UChar DEFAULT_GMT_ZERO[] = {0x0047, 0x004D, 0x0054, 0}; // GMT
78 static const UChar DEFAULT_GMT_POSITIVE_HM[] = {0x002B, 0x0048, 0x003A, 0x006D, 0x006D, 0}; // +H:mm
79 static const UChar DEFAULT_GMT_POSITIVE_HMS[] = {0x002B, 0x0048, 0x003A, 0x006D, 0x006D, 0x003A, 0x0073, 0x0073, 0}; // +H:mm:ss
80 static const UChar DEFAULT_GMT_NEGATIVE_HM[] = {0x002D, 0x0048, 0x003A, 0x006D, 0x006D, 0}; // -H:mm
81 static const UChar DEFAULT_GMT_NEGATIVE_HMS[] = {0x002D, 0x0048, 0x003A, 0x006D, 0x006D, 0x003A, 0x0073, 0x0073, 0}; // -H:mm:ss
82 static const UChar DEFAULT_GMT_POSITIVE_H[] = {0x002B, 0x0048, 0}; // +H
83 static const UChar DEFAULT_GMT_NEGATIVE_H[] = {0x002D, 0x0048, 0}; // -H
84 
85 static const UChar32 DEFAULT_GMT_DIGITS[] = {
86     0x0030, 0x0031, 0x0032, 0x0033, 0x0034,
87     0x0035, 0x0036, 0x0037, 0x0038, 0x0039
88 };
89 
90 static const UChar DEFAULT_GMT_OFFSET_SEP = 0x003A; // ':'
91 
92 static const UChar ARG0[] = {0x007B, 0x0030, 0x007D};   // "{0}"
93 static const int32_t ARG0_LEN = 3;
94 
95 static const UChar DEFAULT_GMT_OFFSET_MINUTE_PATTERN[] = {0x006D, 0x006D, 0};   // "mm"
96 static const UChar DEFAULT_GMT_OFFSET_SECOND_PATTERN[] = {0x0073, 0x0073, 0};   // "ss"
97 
98 static const UChar ALT_GMT_STRINGS[][4] = {
99     {0x0047, 0x004D, 0x0054, 0},    // GMT
100     {0x0055, 0x0054, 0x0043, 0},    // UTC
101     {0x0055, 0x0054, 0, 0},         // UT
102     {0, 0, 0, 0}
103 };
104 
105 // Order of GMT offset pattern parsing, *_HMS must be evaluated first
106 // because *_HM is most likely a substring of *_HMS
107 static const int32_t PARSE_GMT_OFFSET_TYPES[] = {
108     UTZFMT_PAT_POSITIVE_HMS,
109     UTZFMT_PAT_NEGATIVE_HMS,
110     UTZFMT_PAT_POSITIVE_HM,
111     UTZFMT_PAT_NEGATIVE_HM,
112     UTZFMT_PAT_POSITIVE_H,
113     UTZFMT_PAT_NEGATIVE_H,
114     -1
115 };
116 
117 static const UChar SINGLEQUOTE  = 0x0027;
118 static const UChar PLUS         = 0x002B;
119 static const UChar MINUS        = 0x002D;
120 static const UChar ISO8601_UTC  = 0x005A;   // 'Z'
121 static const UChar ISO8601_SEP  = 0x003A;   // ':'
122 
// Time unit conversions, in milliseconds.
static const int32_t MILLIS_PER_HOUR = 60 * 60 * 1000;
static const int32_t MILLIS_PER_MINUTE = 60 * 1000;
static const int32_t MILLIS_PER_SECOND = 1000;

// Maximum offset (exclusive) in millisecond supported by offset formats.
// Declared const: this is a fixed limit and must never be modified at runtime.
static const int32_t MAX_OFFSET = 24 * MILLIS_PER_HOUR;

// Maximum values for GMT offset fields
static const int32_t MAX_OFFSET_HOUR = 23;
static const int32_t MAX_OFFSET_MINUTE = 59;
static const int32_t MAX_OFFSET_SECOND = 59;

// Sentinel meaning "no offset available" (largest int32_t value).
static const int32_t UNKNOWN_OFFSET = 0x7FFFFFFF;
136 
137 static const int32_t ALL_SIMPLE_NAME_TYPES = UTZNM_LONG_STANDARD | UTZNM_LONG_DAYLIGHT | UTZNM_SHORT_STANDARD | UTZNM_SHORT_DAYLIGHT | UTZNM_EXEMPLAR_LOCATION;
138 static const int32_t ALL_GENERIC_NAME_TYPES = UTZGNM_LOCATION | UTZGNM_LONG | UTZGNM_SHORT;
139 
// Maps an ASCII digit code point (U+0030..U+0039) to its value 0..9, or -1
// for anything else. The argument is evaluated more than once, so do not pass
// an expression with side effects.
#define DIGIT_VAL(c) (((c) >= 0x0030 && (c) <= 0x0039) ? ((c) - 0x0030) : -1)
#define MAX_OFFSET_DIGITS 6
142 
143 // Time Zone ID/Short ID trie
144 static TextTrieMap *gZoneIdTrie = NULL;
145 static icu::UInitOnce gZoneIdTrieInitOnce = U_INITONCE_INITIALIZER;
146 
147 static TextTrieMap *gShortZoneIdTrie = NULL;
148 static icu::UInitOnce gShortZoneIdTrieInitOnce = U_INITONCE_INITIALIZER;
149 
150 static UMutex gLock = U_MUTEX_INITIALIZER;
151 
152 U_CDECL_BEGIN
153 /**
154  * Cleanup callback func
155  */
tzfmt_cleanup(void)156 static UBool U_CALLCONV tzfmt_cleanup(void)
157 {
158     if (gZoneIdTrie != NULL) {
159         delete gZoneIdTrie;
160     }
161     gZoneIdTrie = NULL;
162     gZoneIdTrieInitOnce.reset();
163 
164     if (gShortZoneIdTrie != NULL) {
165         delete gShortZoneIdTrie;
166     }
167     gShortZoneIdTrie = NULL;
168     gShortZoneIdTrieInitOnce.reset();
169 
170     return TRUE;
171 }
172 U_CDECL_END
173 
174 // ------------------------------------------------------------------
175 // GMTOffsetField
176 //
177 // This class represents a localized GMT offset pattern
178 // item and used by TimeZoneFormat
179 // ------------------------------------------------------------------
180 class GMTOffsetField : public UMemory {
181 public:
182     enum FieldType {
183         TEXT = 0,
184         HOUR = 1,
185         MINUTE = 2,
186         SECOND = 4
187     };
188 
189     virtual ~GMTOffsetField();
190 
191     static GMTOffsetField* createText(const UnicodeString& text, UErrorCode& status);
192     static GMTOffsetField* createTimeField(FieldType type, uint8_t width, UErrorCode& status);
193     static UBool isValid(FieldType type, int32_t width);
194     static FieldType getTypeByLetter(UChar ch);
195 
196     FieldType getType() const;
197     uint8_t getWidth() const;
198     const UChar* getPatternText(void) const;
199 
200 private:
201     UChar* fText;
202     FieldType fType;
203     uint8_t fWidth;
204 
205     GMTOffsetField();
206 };
207 
GMTOffsetField()208 GMTOffsetField::GMTOffsetField()
209 : fText(NULL), fType(TEXT), fWidth(0) {
210 }
211 
~GMTOffsetField()212 GMTOffsetField::~GMTOffsetField() {
213     if (fText) {
214         uprv_free(fText);
215     }
216 }
217 
218 GMTOffsetField*
createText(const UnicodeString & text,UErrorCode & status)219 GMTOffsetField::createText(const UnicodeString& text, UErrorCode& status) {
220     if (U_FAILURE(status)) {
221         return NULL;
222     }
223     GMTOffsetField* result = new GMTOffsetField();
224     if (result == NULL) {
225         status = U_MEMORY_ALLOCATION_ERROR;
226         return NULL;
227     }
228 
229     int32_t len = text.length();
230     result->fText = (UChar*)uprv_malloc((len + 1) * sizeof(UChar));
231     if (result->fText == NULL) {
232         status = U_MEMORY_ALLOCATION_ERROR;
233         delete result;
234         return NULL;
235     }
236     u_strncpy(result->fText, text.getBuffer(), len);
237     result->fText[len] = 0;
238     result->fType = TEXT;
239 
240     return result;
241 }
242 
243 GMTOffsetField*
createTimeField(FieldType type,uint8_t width,UErrorCode & status)244 GMTOffsetField::createTimeField(FieldType type, uint8_t width, UErrorCode& status) {
245     U_ASSERT(type != TEXT);
246     if (U_FAILURE(status)) {
247         return NULL;
248     }
249     GMTOffsetField* result = new GMTOffsetField();
250     if (result == NULL) {
251         status = U_MEMORY_ALLOCATION_ERROR;
252         return NULL;
253     }
254 
255     result->fType = type;
256     result->fWidth = width;
257 
258     return result;
259 }
260 
261 UBool
isValid(FieldType type,int32_t width)262 GMTOffsetField::isValid(FieldType type, int32_t width) {
263     switch (type) {
264     case HOUR:
265         return (width == 1 || width == 2);
266     case MINUTE:
267     case SECOND:
268         return (width == 2);
269     default:
270         U_ASSERT(FALSE);
271     }
272     return (width > 0);
273 }
274 
275 GMTOffsetField::FieldType
getTypeByLetter(UChar ch)276 GMTOffsetField::getTypeByLetter(UChar ch) {
277     if (ch == 0x0048 /* H */) {
278         return HOUR;
279     } else if (ch == 0x006D /* m */) {
280         return MINUTE;
281     } else if (ch == 0x0073 /* s */) {
282         return SECOND;
283     }
284     return TEXT;
285 }
286 
287 inline GMTOffsetField::FieldType
getType() const288 GMTOffsetField::getType() const {
289      return fType;
290  }
291 
292 inline uint8_t
getWidth() const293 GMTOffsetField::getWidth() const {
294     return fWidth;
295 }
296 
297 inline const UChar*
getPatternText(void) const298 GMTOffsetField::getPatternText(void) const {
299     return fText;
300 }
301 
302 
303 U_CDECL_BEGIN
304 static void U_CALLCONV
deleteGMTOffsetField(void * obj)305 deleteGMTOffsetField(void *obj) {
306     delete static_cast<GMTOffsetField *>(obj);
307 }
308 U_CDECL_END
309 
310 
311 // ------------------------------------------------------------------
312 // TimeZoneFormat
313 // ------------------------------------------------------------------
UOBJECT_DEFINE_RTTI_IMPLEMENTATION(TimeZoneFormat)314 UOBJECT_DEFINE_RTTI_IMPLEMENTATION(TimeZoneFormat)
315 
316 TimeZoneFormat::TimeZoneFormat(const Locale& locale, UErrorCode& status)
317 : fLocale(locale), fTimeZoneNames(NULL), fTimeZoneGenericNames(NULL),
318   fDefParseOptionFlags(0), fTZDBTimeZoneNames(NULL) {
319 
320     for (int32_t i = 0; i < UTZFMT_PAT_COUNT; i++) {
321         fGMTOffsetPatternItems[i] = NULL;
322     }
323 
324     const char* region = fLocale.getCountry();
325     int32_t regionLen = static_cast<int32_t>(uprv_strlen(region));
326     if (regionLen == 0) {
327         char loc[ULOC_FULLNAME_CAPACITY];
328         uloc_addLikelySubtags(fLocale.getName(), loc, sizeof(loc), &status);
329 
330         regionLen = uloc_getCountry(loc, fTargetRegion, sizeof(fTargetRegion), &status);
331         if (U_SUCCESS(status)) {
332             fTargetRegion[regionLen] = 0;
333         } else {
334             return;
335         }
336     } else if (regionLen < (int32_t)sizeof(fTargetRegion)) {
337         uprv_strcpy(fTargetRegion, region);
338     } else {
339         fTargetRegion[0] = 0;
340     }
341 
342     fTimeZoneNames = TimeZoneNames::createInstance(locale, status);
343     // fTimeZoneGenericNames is lazily instantiated
344     if (U_FAILURE(status)) {
345         return;
346     }
347 
348     const UChar* gmtPattern = NULL;
349     const UChar* hourFormats = NULL;
350 
351     UResourceBundle *zoneBundle = ures_open(U_ICUDATA_ZONE, locale.getName(), &status);
352     UResourceBundle *zoneStringsArray = ures_getByKeyWithFallback(zoneBundle, gZoneStringsTag, NULL, &status);
353     if (U_SUCCESS(status)) {
354         const UChar* resStr;
355         int32_t len;
356         resStr = ures_getStringByKeyWithFallback(zoneStringsArray, gGmtFormatTag, &len, &status);
357         if (len > 0) {
358             gmtPattern = resStr;
359         }
360         resStr = ures_getStringByKeyWithFallback(zoneStringsArray, gGmtZeroFormatTag, &len, &status);
361         if (len > 0) {
362             fGMTZeroFormat.setTo(TRUE, resStr, len);
363         }
364         resStr = ures_getStringByKeyWithFallback(zoneStringsArray, gHourFormatTag, &len, &status);
365         if (len > 0) {
366             hourFormats = resStr;
367         }
368         ures_close(zoneStringsArray);
369         ures_close(zoneBundle);
370     }
371 
372     if (gmtPattern == NULL) {
373         gmtPattern = DEFAULT_GMT_PATTERN;
374     }
375     initGMTPattern(UnicodeString(TRUE, gmtPattern, -1), status);
376 
377     UBool useDefaultOffsetPatterns = TRUE;
378     if (hourFormats) {
379         UChar *sep = u_strchr(hourFormats, (UChar)0x003B /* ';' */);
380         if (sep != NULL) {
381             UErrorCode tmpStatus = U_ZERO_ERROR;
382             fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HM].setTo(FALSE, hourFormats, (int32_t)(sep - hourFormats));
383             fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HM].setTo(TRUE, sep + 1, -1);
384             expandOffsetPattern(fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HM], fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HMS], tmpStatus);
385             expandOffsetPattern(fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HM], fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HMS], tmpStatus);
386             truncateOffsetPattern(fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HM], fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_H], tmpStatus);
387             truncateOffsetPattern(fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HM], fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_H], tmpStatus);
388             if (U_SUCCESS(tmpStatus)) {
389                 useDefaultOffsetPatterns = FALSE;
390             }
391         }
392     }
393     if (useDefaultOffsetPatterns) {
394         fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_H].setTo(TRUE, DEFAULT_GMT_POSITIVE_H, -1);
395         fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HM].setTo(TRUE, DEFAULT_GMT_POSITIVE_HM, -1);
396         fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HMS].setTo(TRUE, DEFAULT_GMT_POSITIVE_HMS, -1);
397         fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_H].setTo(TRUE, DEFAULT_GMT_NEGATIVE_H, -1);
398         fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HM].setTo(TRUE, DEFAULT_GMT_NEGATIVE_HM, -1);
399         fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HMS].setTo(TRUE, DEFAULT_GMT_NEGATIVE_HMS, -1);
400     }
401     initGMTOffsetPatterns(status);
402 
403     NumberingSystem* ns = NumberingSystem::createInstance(locale, status);
404     UBool useDefDigits = TRUE;
405     if (ns && !ns->isAlgorithmic()) {
406         UnicodeString digits = ns->getDescription();
407         useDefDigits = !toCodePoints(digits, fGMTOffsetDigits, 10);
408     }
409     if (useDefDigits) {
410         uprv_memcpy(fGMTOffsetDigits, DEFAULT_GMT_DIGITS, sizeof(UChar32) * 10);
411     }
412     delete ns;
413 }
414 
/**
 * Copy constructor. Puts every owned pointer into a well-defined (NULL)
 * state and then delegates the actual copying to operator=.
 */
TimeZoneFormat::TimeZoneFormat(const TimeZoneFormat& other)
: Format(other), fTimeZoneNames(NULL), fTimeZoneGenericNames(NULL),
  fTZDBTimeZoneNames(NULL) {

    // operator= deletes the existing pattern items, so they must be NULL first.
    for (int32_t idx = 0; idx < UTZFMT_PAT_COUNT; ++idx) {
        fGMTOffsetPatternItems[idx] = NULL;
    }
    operator=(other);
}
424 
425 
~TimeZoneFormat()426 TimeZoneFormat::~TimeZoneFormat() {
427     delete fTimeZoneNames;
428     delete fTimeZoneGenericNames;
429     delete fTZDBTimeZoneNames;
430     for (int32_t i = 0; i < UTZFMT_PAT_COUNT; i++) {
431         delete fGMTOffsetPatternItems[i];
432     }
433 }
434 
435 TimeZoneFormat&
operator =(const TimeZoneFormat & other)436 TimeZoneFormat::operator=(const TimeZoneFormat& other) {
437     if (this == &other) {
438         return *this;
439     }
440 
441     delete fTimeZoneNames;
442     delete fTimeZoneGenericNames;
443     fTimeZoneGenericNames = NULL;
444     delete fTZDBTimeZoneNames;
445     fTZDBTimeZoneNames = NULL;
446 
447     fLocale = other.fLocale;
448     uprv_memcpy(fTargetRegion, other.fTargetRegion, sizeof(fTargetRegion));
449 
450     fTimeZoneNames = other.fTimeZoneNames->clone();
451     if (other.fTimeZoneGenericNames) {
452         // TODO: this test has dubious thread safety.
453         fTimeZoneGenericNames = other.fTimeZoneGenericNames->clone();
454     }
455 
456     fGMTPattern = other.fGMTPattern;
457     fGMTPatternPrefix = other.fGMTPatternPrefix;
458     fGMTPatternSuffix = other.fGMTPatternSuffix;
459 
460     UErrorCode status = U_ZERO_ERROR;
461     for (int32_t i = 0; i < UTZFMT_PAT_COUNT; i++) {
462         fGMTOffsetPatterns[i] = other.fGMTOffsetPatterns[i];
463         delete fGMTOffsetPatternItems[i];
464         fGMTOffsetPatternItems[i] = NULL;
465     }
466     initGMTOffsetPatterns(status);
467     U_ASSERT(U_SUCCESS(status));
468 
469     fGMTZeroFormat = other.fGMTZeroFormat;
470 
471     uprv_memcpy(fGMTOffsetDigits, other.fGMTOffsetDigits, sizeof(fGMTOffsetDigits));
472 
473     fDefParseOptionFlags = other.fDefParseOptionFlags;
474 
475     return *this;
476 }
477 
478 
479 UBool
operator ==(const Format & other) const480 TimeZoneFormat::operator==(const Format& other) const {
481     TimeZoneFormat* tzfmt = (TimeZoneFormat*)&other;
482 
483     UBool isEqual =
484             fLocale == tzfmt->fLocale
485             && fGMTPattern == tzfmt->fGMTPattern
486             && fGMTZeroFormat == tzfmt->fGMTZeroFormat
487             && *fTimeZoneNames == *tzfmt->fTimeZoneNames;
488 
489     for (int32_t i = 0; i < UTZFMT_PAT_COUNT && isEqual; i++) {
490         isEqual = fGMTOffsetPatterns[i] == tzfmt->fGMTOffsetPatterns[i];
491     }
492     for (int32_t i = 0; i < 10 && isEqual; i++) {
493         isEqual = fGMTOffsetDigits[i] == tzfmt->fGMTOffsetDigits[i];
494     }
495     // TODO
496     // Check fTimeZoneGenericNames. For now,
497     // if fTimeZoneNames is same, fTimeZoneGenericNames should
498     // be also equivalent.
499     return isEqual;
500 }
501 
502 Format*
clone() const503 TimeZoneFormat::clone() const {
504     return new TimeZoneFormat(*this);
505 }
506 
507 TimeZoneFormat* U_EXPORT2
createInstance(const Locale & locale,UErrorCode & status)508 TimeZoneFormat::createInstance(const Locale& locale, UErrorCode& status) {
509     TimeZoneFormat* tzfmt = new TimeZoneFormat(locale, status);
510     if (U_SUCCESS(status)) {
511         return tzfmt;
512     }
513     delete tzfmt;
514     return NULL;
515 }
516 
517 // ------------------------------------------------------------------
518 // Setter and Getter
519 
520 const TimeZoneNames*
getTimeZoneNames() const521 TimeZoneFormat::getTimeZoneNames() const {
522     return (const TimeZoneNames*)fTimeZoneNames;
523 }
524 
525 void
adoptTimeZoneNames(TimeZoneNames * tznames)526 TimeZoneFormat::adoptTimeZoneNames(TimeZoneNames *tznames) {
527     delete fTimeZoneNames;
528     fTimeZoneNames = tznames;
529 
530     // TODO - We should also update fTimeZoneGenericNames
531 }
532 
533 void
setTimeZoneNames(const TimeZoneNames & tznames)534 TimeZoneFormat::setTimeZoneNames(const TimeZoneNames &tznames) {
535     delete fTimeZoneNames;
536     fTimeZoneNames = tznames.clone();
537 
538     // TODO - We should also update fTimeZoneGenericNames
539 }
540 
541 void
setDefaultParseOptions(uint32_t flags)542 TimeZoneFormat::setDefaultParseOptions(uint32_t flags) {
543     fDefParseOptionFlags = flags;
544 }
545 
546 uint32_t
getDefaultParseOptions(void) const547 TimeZoneFormat::getDefaultParseOptions(void) const {
548     return fDefParseOptionFlags;
549 }
550 
551 
552 UnicodeString&
getGMTPattern(UnicodeString & pattern) const553 TimeZoneFormat::getGMTPattern(UnicodeString& pattern) const {
554     return pattern.setTo(fGMTPattern);
555 }
556 
557 void
setGMTPattern(const UnicodeString & pattern,UErrorCode & status)558 TimeZoneFormat::setGMTPattern(const UnicodeString& pattern, UErrorCode& status) {
559     initGMTPattern(pattern, status);
560 }
561 
562 UnicodeString&
getGMTOffsetPattern(UTimeZoneFormatGMTOffsetPatternType type,UnicodeString & pattern) const563 TimeZoneFormat::getGMTOffsetPattern(UTimeZoneFormatGMTOffsetPatternType type, UnicodeString& pattern) const {
564     return pattern.setTo(fGMTOffsetPatterns[type]);
565 }
566 
567 void
setGMTOffsetPattern(UTimeZoneFormatGMTOffsetPatternType type,const UnicodeString & pattern,UErrorCode & status)568 TimeZoneFormat::setGMTOffsetPattern(UTimeZoneFormatGMTOffsetPatternType type, const UnicodeString& pattern, UErrorCode& status) {
569     if (U_FAILURE(status)) {
570         return;
571     }
572     if (pattern == fGMTOffsetPatterns[type]) {
573         // No need to reset
574         return;
575     }
576 
577     OffsetFields required = FIELDS_HM;
578     switch (type) {
579     case UTZFMT_PAT_POSITIVE_H:
580     case UTZFMT_PAT_NEGATIVE_H:
581         required = FIELDS_H;
582         break;
583     case UTZFMT_PAT_POSITIVE_HM:
584     case UTZFMT_PAT_NEGATIVE_HM:
585         required = FIELDS_HM;
586         break;
587     case UTZFMT_PAT_POSITIVE_HMS:
588     case UTZFMT_PAT_NEGATIVE_HMS:
589         required = FIELDS_HMS;
590         break;
591     default:
592         U_ASSERT(FALSE);
593         break;
594     }
595 
596     UVector* patternItems = parseOffsetPattern(pattern, required, status);
597     if (patternItems == NULL) {
598         return;
599     }
600 
601     fGMTOffsetPatterns[type].setTo(pattern);
602     delete fGMTOffsetPatternItems[type];
603     fGMTOffsetPatternItems[type] = patternItems;
604     checkAbuttingHoursAndMinutes();
605 }
606 
607 UnicodeString&
getGMTOffsetDigits(UnicodeString & digits) const608 TimeZoneFormat::getGMTOffsetDigits(UnicodeString& digits) const {
609     digits.remove();
610     for (int32_t i = 0; i < 10; i++) {
611         digits.append(fGMTOffsetDigits[i]);
612     }
613     return digits;
614 }
615 
616 void
setGMTOffsetDigits(const UnicodeString & digits,UErrorCode & status)617 TimeZoneFormat::setGMTOffsetDigits(const UnicodeString& digits, UErrorCode& status) {
618     if (U_FAILURE(status)) {
619         return;
620     }
621     UChar32 digitArray[10];
622     if (!toCodePoints(digits, digitArray, 10)) {
623         status = U_ILLEGAL_ARGUMENT_ERROR;
624         return;
625     }
626     uprv_memcpy(fGMTOffsetDigits, digitArray, sizeof(UChar32)*10);
627 }
628 
629 UnicodeString&
getGMTZeroFormat(UnicodeString & gmtZeroFormat) const630 TimeZoneFormat::getGMTZeroFormat(UnicodeString& gmtZeroFormat) const {
631     return gmtZeroFormat.setTo(fGMTZeroFormat);
632 }
633 
634 void
setGMTZeroFormat(const UnicodeString & gmtZeroFormat,UErrorCode & status)635 TimeZoneFormat::setGMTZeroFormat(const UnicodeString& gmtZeroFormat, UErrorCode& status) {
636     if (U_SUCCESS(status)) {
637         if (gmtZeroFormat.isEmpty()) {
638             status = U_ILLEGAL_ARGUMENT_ERROR;
639         } else if (gmtZeroFormat != fGMTZeroFormat) {
640             fGMTZeroFormat.setTo(gmtZeroFormat);
641         }
642     }
643 }
644 
645 // ------------------------------------------------------------------
646 // Format and Parse
647 
648 UnicodeString&
format(UTimeZoneFormatStyle style,const TimeZone & tz,UDate date,UnicodeString & name,UTimeZoneFormatTimeType * timeType) const649 TimeZoneFormat::format(UTimeZoneFormatStyle style, const TimeZone& tz, UDate date,
650         UnicodeString& name, UTimeZoneFormatTimeType* timeType /* = NULL */) const {
651     if (timeType) {
652         *timeType = UTZFMT_TIME_TYPE_UNKNOWN;
653     }
654 
655     UBool noOffsetFormatFallback = FALSE;
656 
657     switch (style) {
658     case UTZFMT_STYLE_GENERIC_LOCATION:
659         formatGeneric(tz, UTZGNM_LOCATION, date, name);
660         break;
661     case UTZFMT_STYLE_GENERIC_LONG:
662         formatGeneric(tz, UTZGNM_LONG, date, name);
663         break;
664     case UTZFMT_STYLE_GENERIC_SHORT:
665         formatGeneric(tz, UTZGNM_SHORT, date, name);
666         break;
667     case UTZFMT_STYLE_SPECIFIC_LONG:
668         formatSpecific(tz, UTZNM_LONG_STANDARD, UTZNM_LONG_DAYLIGHT, date, name, timeType);
669         break;
670     case UTZFMT_STYLE_SPECIFIC_SHORT:
671         formatSpecific(tz, UTZNM_SHORT_STANDARD, UTZNM_SHORT_DAYLIGHT, date, name, timeType);
672         break;
673 
674     case UTZFMT_STYLE_ZONE_ID:
675         tz.getID(name);
676         noOffsetFormatFallback = TRUE;
677         break;
678     case UTZFMT_STYLE_ZONE_ID_SHORT:
679         {
680             const UChar* shortID = ZoneMeta::getShortID(tz);
681             if (shortID == NULL) {
682                 shortID = UNKNOWN_SHORT_ZONE_ID;
683             }
684             name.setTo(shortID, -1);
685         }
686         noOffsetFormatFallback = TRUE;
687         break;
688 
689     case UTZFMT_STYLE_EXEMPLAR_LOCATION:
690         formatExemplarLocation(tz, name);
691         noOffsetFormatFallback = TRUE;
692         break;
693 
694     default:
695         // will be handled below
696         break;
697     }
698 
699     if (name.isEmpty() && !noOffsetFormatFallback) {
700         UErrorCode status = U_ZERO_ERROR;
701         int32_t rawOffset, dstOffset;
702         tz.getOffset(date, FALSE, rawOffset, dstOffset, status);
703         int32_t offset = rawOffset + dstOffset;
704         if (U_SUCCESS(status)) {
705             switch (style) {
706             case UTZFMT_STYLE_GENERIC_LOCATION:
707             case UTZFMT_STYLE_GENERIC_LONG:
708             case UTZFMT_STYLE_SPECIFIC_LONG:
709             case UTZFMT_STYLE_LOCALIZED_GMT:
710                 formatOffsetLocalizedGMT(offset, name, status);
711                 break;
712 
713             case UTZFMT_STYLE_GENERIC_SHORT:
714             case UTZFMT_STYLE_SPECIFIC_SHORT:
715             case UTZFMT_STYLE_LOCALIZED_GMT_SHORT:
716                 formatOffsetShortLocalizedGMT(offset, name, status);
717                 break;
718 
719             case UTZFMT_STYLE_ISO_BASIC_SHORT:
720                 formatOffsetISO8601Basic(offset, TRUE, TRUE, TRUE, name, status);
721                 break;
722 
723             case UTZFMT_STYLE_ISO_BASIC_LOCAL_SHORT:
724                 formatOffsetISO8601Basic(offset, FALSE, TRUE, TRUE, name, status);
725                 break;
726 
727             case UTZFMT_STYLE_ISO_BASIC_FIXED:
728                 formatOffsetISO8601Basic(offset, TRUE, FALSE, TRUE, name, status);
729                 break;
730 
731             case UTZFMT_STYLE_ISO_BASIC_LOCAL_FIXED:
732                 formatOffsetISO8601Basic(offset, FALSE, FALSE, TRUE, name, status);
733                 break;
734 
735             case UTZFMT_STYLE_ISO_EXTENDED_FIXED:
736                 formatOffsetISO8601Extended(offset, TRUE, FALSE, TRUE, name, status);
737                 break;
738 
739             case UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FIXED:
740                 formatOffsetISO8601Extended(offset, FALSE, FALSE, TRUE, name, status);
741                 break;
742 
743             case UTZFMT_STYLE_ISO_BASIC_FULL:
744                 formatOffsetISO8601Basic(offset, TRUE, FALSE, FALSE, name, status);
745                 break;
746 
747             case UTZFMT_STYLE_ISO_BASIC_LOCAL_FULL:
748                 formatOffsetISO8601Basic(offset, FALSE, FALSE, FALSE, name, status);
749                 break;
750 
751             case UTZFMT_STYLE_ISO_EXTENDED_FULL:
752                 formatOffsetISO8601Extended(offset, TRUE, FALSE, FALSE, name, status);
753                 break;
754 
755             case UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FULL:
756                 formatOffsetISO8601Extended(offset, FALSE, FALSE, FALSE, name, status);
757                 break;
758 
759             default:
760               // UTZFMT_STYLE_ZONE_ID, UTZFMT_STYLE_ZONE_ID_SHORT, UTZFMT_STYLE_EXEMPLAR_LOCATION
761               break;
762             }
763 
764             if (timeType) {
765                 *timeType = (dstOffset != 0) ? UTZFMT_TIME_TYPE_DAYLIGHT : UTZFMT_TIME_TYPE_STANDARD;
766             }
767         }
768     }
769 
770     return name;
771 }
772 
773 UnicodeString&
format(const Formattable & obj,UnicodeString & appendTo,FieldPosition & pos,UErrorCode & status) const774 TimeZoneFormat::format(const Formattable& obj, UnicodeString& appendTo,
775         FieldPosition& pos, UErrorCode& status) const {
776     if (U_FAILURE(status)) {
777         return appendTo;
778     }
779     UDate date = Calendar::getNow();
780     if (obj.getType() == Formattable::kObject) {
781         const UObject* formatObj = obj.getObject();
782         const TimeZone* tz = dynamic_cast<const TimeZone*>(formatObj);
783         if (tz == NULL) {
784             const Calendar* cal = dynamic_cast<const Calendar*>(formatObj);
785             if (cal != NULL) {
786                 tz = &cal->getTimeZone();
787                 date = cal->getTime(status);
788             }
789         }
790         if (tz != NULL) {
791             int32_t rawOffset, dstOffset;
792             tz->getOffset(date, FALSE, rawOffset, dstOffset, status);
793             UChar buf[ZONE_NAME_U16_MAX];
794             UnicodeString result(buf, 0, UPRV_LENGTHOF(buf));
795             formatOffsetLocalizedGMT(rawOffset + dstOffset, result, status);
796             if (U_SUCCESS(status)) {
797                 appendTo.append(result);
798                 if (pos.getField() == UDAT_TIMEZONE_FIELD) {
799                     pos.setBeginIndex(0);
800                     pos.setEndIndex(result.length());
801                 }
802             }
803         }
804     }
805     return appendTo;
806 }
807 
808 TimeZone*
parse(UTimeZoneFormatStyle style,const UnicodeString & text,ParsePosition & pos,UTimeZoneFormatTimeType * timeType) const809 TimeZoneFormat::parse(UTimeZoneFormatStyle style, const UnicodeString& text, ParsePosition& pos,
810         UTimeZoneFormatTimeType* timeType /*= NULL*/) const {
811     return parse(style, text, pos, getDefaultParseOptions(), timeType);
812 }
813 
814 TimeZone*
parse(UTimeZoneFormatStyle style,const UnicodeString & text,ParsePosition & pos,int32_t parseOptions,UTimeZoneFormatTimeType * timeType) const815 TimeZoneFormat::parse(UTimeZoneFormatStyle style, const UnicodeString& text, ParsePosition& pos,
816         int32_t parseOptions, UTimeZoneFormatTimeType* timeType /* = NULL */) const {
817     if (timeType) {
818         *timeType = UTZFMT_TIME_TYPE_UNKNOWN;
819     }
820 
821     int32_t startIdx = pos.getIndex();
822     int32_t maxPos = text.length();
823     int32_t offset;
824 
825     // Styles using localized GMT format as fallback
826     UBool fallbackLocalizedGMT =
827         (style == UTZFMT_STYLE_SPECIFIC_LONG || style == UTZFMT_STYLE_GENERIC_LONG || style == UTZFMT_STYLE_GENERIC_LOCATION);
828     UBool fallbackShortLocalizedGMT =
829         (style == UTZFMT_STYLE_SPECIFIC_SHORT || style == UTZFMT_STYLE_GENERIC_SHORT);
830 
831     int32_t evaluated = 0;  // bit flags representing already evaluated styles
832     ParsePosition tmpPos(startIdx);
833 
834     int32_t parsedOffset = UNKNOWN_OFFSET;  // stores successfully parsed offset for later use
835     int32_t parsedPos = -1;                 // stores successfully parsed offset position for later use
836 
837     // Try localized GMT format first if necessary
838     if (fallbackLocalizedGMT || fallbackShortLocalizedGMT) {
839         UBool hasDigitOffset = FALSE;
840         offset = parseOffsetLocalizedGMT(text, tmpPos, fallbackShortLocalizedGMT, &hasDigitOffset);
841         if (tmpPos.getErrorIndex() == -1) {
842             // Even when the input text was successfully parsed as a localized GMT format text,
843             // we may still need to evaluate the specified style if -
844             //   1) GMT zero format was used, and
845             //   2) The input text was not completely processed
846             if (tmpPos.getIndex() == maxPos || hasDigitOffset) {
847                 pos.setIndex(tmpPos.getIndex());
848                 return createTimeZoneForOffset(offset);
849             }
850             parsedOffset = offset;
851             parsedPos = tmpPos.getIndex();
852         }
853         // Note: For now, no distinction between long/short localized GMT format in the parser.
854         // This might be changed in future.
855         // evaluated |= (fallbackLocalizedGMT ? STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT] : STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT_SHORT]);
856         evaluated |= STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT] | STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT_SHORT];
857     }
858 
859     UErrorCode status = U_ZERO_ERROR;
860     UChar tzIDBuf[32];
861     UnicodeString tzID(tzIDBuf, 0, UPRV_LENGTHOF(tzIDBuf));
862 
863     UBool parseTZDBAbbrev = ((parseOptions & UTZFMT_PARSE_OPTION_TZ_DATABASE_ABBREVIATIONS) != 0);
864 
865     // Try the specified style
866     switch (style) {
867     case UTZFMT_STYLE_LOCALIZED_GMT:
868         {
869             tmpPos.setIndex(startIdx);
870             tmpPos.setErrorIndex(-1);
871 
872             offset = parseOffsetLocalizedGMT(text, tmpPos);
873             if (tmpPos.getErrorIndex() == -1) {
874                 pos.setIndex(tmpPos.getIndex());
875                 return createTimeZoneForOffset(offset);
876             }
877 
878             // Note: For now, no distinction between long/short localized GMT format in the parser.
879             // This might be changed in future.
880             evaluated |= STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT_SHORT];
881 
882             break;
883         }
884     case UTZFMT_STYLE_LOCALIZED_GMT_SHORT:
885         {
886             tmpPos.setIndex(startIdx);
887             tmpPos.setErrorIndex(-1);
888 
889             offset = parseOffsetShortLocalizedGMT(text, tmpPos);
890             if (tmpPos.getErrorIndex() == -1) {
891                 pos.setIndex(tmpPos.getIndex());
892                 return createTimeZoneForOffset(offset);
893             }
894 
895             // Note: For now, no distinction between long/short localized GMT format in the parser.
896             // This might be changed in future.
897             evaluated |= STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT];
898 
899             break;
900         }
901     case UTZFMT_STYLE_ISO_BASIC_SHORT:
902     case UTZFMT_STYLE_ISO_BASIC_FIXED:
903     case UTZFMT_STYLE_ISO_BASIC_FULL:
904     case UTZFMT_STYLE_ISO_EXTENDED_FIXED:
905     case UTZFMT_STYLE_ISO_EXTENDED_FULL:
906         {
907             tmpPos.setIndex(startIdx);
908             tmpPos.setErrorIndex(-1);
909 
910             offset = parseOffsetISO8601(text, tmpPos);
911             if (tmpPos.getErrorIndex() == -1) {
912                 pos.setIndex(tmpPos.getIndex());
913                 return createTimeZoneForOffset(offset);
914             }
915 
916             break;
917         }
918 
919     case UTZFMT_STYLE_ISO_BASIC_LOCAL_SHORT:
920     case UTZFMT_STYLE_ISO_BASIC_LOCAL_FIXED:
921     case UTZFMT_STYLE_ISO_BASIC_LOCAL_FULL:
922     case UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FIXED:
923     case UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FULL:
924         {
925             tmpPos.setIndex(startIdx);
926             tmpPos.setErrorIndex(-1);
927 
928             // Exclude the case of UTC Indicator "Z" here
929             UBool hasDigitOffset = FALSE;
930             offset = parseOffsetISO8601(text, tmpPos, FALSE, &hasDigitOffset);
931             if (tmpPos.getErrorIndex() == -1 && hasDigitOffset) {
932                 pos.setIndex(tmpPos.getIndex());
933                 return createTimeZoneForOffset(offset);
934             }
935 
936             break;
937         }
938 
939     case UTZFMT_STYLE_SPECIFIC_LONG:
940     case UTZFMT_STYLE_SPECIFIC_SHORT:
941         {
942             // Specific styles
943             int32_t nameTypes = 0;
944             if (style == UTZFMT_STYLE_SPECIFIC_LONG) {
945                 nameTypes = (UTZNM_LONG_STANDARD | UTZNM_LONG_DAYLIGHT);
946             } else {
947                 U_ASSERT(style == UTZFMT_STYLE_SPECIFIC_SHORT);
948                 nameTypes = (UTZNM_SHORT_STANDARD | UTZNM_SHORT_DAYLIGHT);
949             }
950             LocalPointer<TimeZoneNames::MatchInfoCollection> specificMatches(fTimeZoneNames->find(text, startIdx, nameTypes, status));
951             if (U_FAILURE(status)) {
952                 pos.setErrorIndex(startIdx);
953                 return NULL;
954             }
955             if (!specificMatches.isNull()) {
956                 int32_t matchIdx = -1;
957                 int32_t matchPos = -1;
958                 for (int32_t i = 0; i < specificMatches->size(); i++) {
959                     matchPos  = startIdx + specificMatches->getMatchLengthAt(i);
960                     if (matchPos > parsedPos) {
961                         matchIdx = i;
962                         parsedPos = matchPos;
963                     }
964                 }
965                 if (matchIdx >= 0) {
966                     if (timeType) {
967                         *timeType = getTimeType(specificMatches->getNameTypeAt(matchIdx));
968                     }
969                     pos.setIndex(matchPos);
970                     getTimeZoneID(specificMatches.getAlias(), matchIdx, tzID);
971                     U_ASSERT(!tzID.isEmpty());
972                     return TimeZone::createTimeZone(tzID);
973                 }
974             }
975 
976             if (parseTZDBAbbrev && style == UTZFMT_STYLE_SPECIFIC_SHORT) {
977                 U_ASSERT((nameTypes & UTZNM_SHORT_STANDARD) != 0);
978                 U_ASSERT((nameTypes & UTZNM_SHORT_DAYLIGHT) != 0);
979 
980                 const TZDBTimeZoneNames *tzdbTimeZoneNames = getTZDBTimeZoneNames(status);
981                 if (U_SUCCESS(status)) {
982                     LocalPointer<TimeZoneNames::MatchInfoCollection> tzdbNameMatches(
983                         tzdbTimeZoneNames->find(text, startIdx, nameTypes, status));
984                     if (U_FAILURE(status)) {
985                         pos.setErrorIndex(startIdx);
986                         return NULL;
987                     }
988                     if (!tzdbNameMatches.isNull()) {
989                         int32_t matchIdx = -1;
990                         int32_t matchPos = -1;
991                         for (int32_t i = 0; i < tzdbNameMatches->size(); i++) {
992                             matchPos = startIdx + tzdbNameMatches->getMatchLengthAt(i);
993                             if (matchPos > parsedPos) {
994                                 matchIdx = i;
995                                 parsedPos = matchPos;
996                             }
997                         }
998                         if (matchIdx >= 0) {
999                             if (timeType) {
1000                                 *timeType = getTimeType(tzdbNameMatches->getNameTypeAt(matchIdx));
1001                             }
1002                             pos.setIndex(matchPos);
1003                             getTimeZoneID(tzdbNameMatches.getAlias(), matchIdx, tzID);
1004                             U_ASSERT(!tzID.isEmpty());
1005                             return TimeZone::createTimeZone(tzID);
1006                         }
1007                     }
1008                 }
1009             }
1010             break;
1011         }
1012     case UTZFMT_STYLE_GENERIC_LONG:
1013     case UTZFMT_STYLE_GENERIC_SHORT:
1014     case UTZFMT_STYLE_GENERIC_LOCATION:
1015         {
1016             int32_t genericNameTypes = 0;
1017             switch (style) {
1018             case UTZFMT_STYLE_GENERIC_LOCATION:
1019                 genericNameTypes = UTZGNM_LOCATION;
1020                 break;
1021 
1022             case UTZFMT_STYLE_GENERIC_LONG:
1023                 genericNameTypes = UTZGNM_LONG | UTZGNM_LOCATION;
1024                 break;
1025 
1026             case UTZFMT_STYLE_GENERIC_SHORT:
1027                 genericNameTypes = UTZGNM_SHORT | UTZGNM_LOCATION;
1028                 break;
1029 
1030             default:
1031                 U_ASSERT(FALSE);
1032             }
1033 
1034             int32_t len = 0;
1035             UTimeZoneFormatTimeType tt = UTZFMT_TIME_TYPE_UNKNOWN;
1036             const TimeZoneGenericNames *gnames = getTimeZoneGenericNames(status);
1037             if (U_SUCCESS(status)) {
1038                 len = gnames->findBestMatch(text, startIdx, genericNameTypes, tzID, tt, status);
1039             }
1040             if (U_FAILURE(status)) {
1041                 pos.setErrorIndex(startIdx);
1042                 return NULL;
1043             }
1044             if (len > 0) {
1045                 // Found a match
1046                 if (timeType) {
1047                     *timeType = tt;
1048                 }
1049                 pos.setIndex(startIdx + len);
1050                 U_ASSERT(!tzID.isEmpty());
1051                 return TimeZone::createTimeZone(tzID);
1052             }
1053 
1054             break;
1055         }
1056     case UTZFMT_STYLE_ZONE_ID:
1057         {
1058             tmpPos.setIndex(startIdx);
1059             tmpPos.setErrorIndex(-1);
1060 
1061             parseZoneID(text, tmpPos, tzID);
1062             if (tmpPos.getErrorIndex() == -1) {
1063                 pos.setIndex(tmpPos.getIndex());
1064                 return TimeZone::createTimeZone(tzID);
1065             }
1066             break;
1067         }
1068     case UTZFMT_STYLE_ZONE_ID_SHORT:
1069         {
1070             tmpPos.setIndex(startIdx);
1071             tmpPos.setErrorIndex(-1);
1072 
1073             parseShortZoneID(text, tmpPos, tzID);
1074             if (tmpPos.getErrorIndex() == -1) {
1075                 pos.setIndex(tmpPos.getIndex());
1076                 return TimeZone::createTimeZone(tzID);
1077             }
1078             break;
1079         }
1080     case UTZFMT_STYLE_EXEMPLAR_LOCATION:
1081         {
1082             tmpPos.setIndex(startIdx);
1083             tmpPos.setErrorIndex(-1);
1084 
1085             parseExemplarLocation(text, tmpPos, tzID);
1086             if (tmpPos.getErrorIndex() == -1) {
1087                 pos.setIndex(tmpPos.getIndex());
1088                 return TimeZone::createTimeZone(tzID);
1089             }
1090             break;
1091         }
1092     }
1093     evaluated |= STYLE_PARSE_FLAGS[style];
1094 
1095 
1096     if (parsedPos > startIdx) {
1097         // When the specified style is one of SPECIFIC_XXX or GENERIC_XXX, we tried to parse the input
1098         // as localized GMT format earlier. If parsedOffset is positive, it means it was successfully
1099         // parsed as localized GMT format, but offset digits were not detected (more specifically, GMT
1100         // zero format). Then, it tried to find a match within the set of display names, but could not
1101         // find a match. At this point, we can safely assume the input text contains the localized
1102         // GMT format.
1103         U_ASSERT(parsedOffset != UNKNOWN_OFFSET);
1104         pos.setIndex(parsedPos);
1105         return createTimeZoneForOffset(parsedOffset);
1106     }
1107 
1108     // Failed to parse the input text as the time zone format in the specified style.
1109     // Check the longest match among other styles below.
1110     UChar parsedIDBuf[32];
1111     UnicodeString parsedID(parsedIDBuf, 0, UPRV_LENGTHOF(parsedIDBuf));
1112     UTimeZoneFormatTimeType parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
1113 
1114     U_ASSERT(parsedPos < 0);
1115     U_ASSERT(parsedOffset == UNKNOWN_OFFSET);
1116 
1117     // ISO 8601
1118     if (parsedPos < maxPos &&
1119         ((evaluated & ISO_Z_STYLE_FLAG) == 0 || (evaluated & ISO_LOCAL_STYLE_FLAG) == 0)) {
1120         tmpPos.setIndex(startIdx);
1121         tmpPos.setErrorIndex(-1);
1122 
1123         UBool hasDigitOffset = FALSE;
1124         offset = parseOffsetISO8601(text, tmpPos, FALSE, &hasDigitOffset);
1125         if (tmpPos.getErrorIndex() == -1) {
1126             if (tmpPos.getIndex() == maxPos || hasDigitOffset) {
1127                 pos.setIndex(tmpPos.getIndex());
1128                 return createTimeZoneForOffset(offset);
1129             }
1130             // Note: When ISO 8601 format contains offset digits, it should not
1131             // collide with other formats. However, ISO 8601 UTC format "Z" (single letter)
1132             // may collide with other names. In this case, we need to evaluate other names.
1133             if (parsedPos < tmpPos.getIndex()) {
1134                 parsedOffset = offset;
1135                 parsedID.setToBogus();
1136                 parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
1137                 parsedPos = tmpPos.getIndex();
1138                 U_ASSERT(parsedPos == startIdx + 1);    // only when "Z" is used
1139             }
1140         }
1141     }
1142 
1143     // Localized GMT format
1144     if (parsedPos < maxPos &&
1145         (evaluated & STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT]) == 0) {
1146         tmpPos.setIndex(startIdx);
1147         tmpPos.setErrorIndex(-1);
1148 
1149         UBool hasDigitOffset = FALSE;
1150         offset = parseOffsetLocalizedGMT(text, tmpPos, FALSE, &hasDigitOffset);
1151         if (tmpPos.getErrorIndex() == -1) {
1152             if (tmpPos.getIndex() == maxPos || hasDigitOffset) {
1153                 pos.setIndex(tmpPos.getIndex());
1154                 return createTimeZoneForOffset(offset);
1155             }
1156             // Evaluate other names - see the comment earlier in this method.
1157             if (parsedPos < tmpPos.getIndex()) {
1158                 parsedOffset = offset;
1159                 parsedID.setToBogus();
1160                 parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
1161                 parsedPos = tmpPos.getIndex();
1162             }
1163         }
1164     }
1165 
1166     if (parsedPos < maxPos &&
1167         (evaluated & STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT_SHORT]) == 0) {
1168         tmpPos.setIndex(startIdx);
1169         tmpPos.setErrorIndex(-1);
1170 
1171         UBool hasDigitOffset = FALSE;
1172         offset = parseOffsetLocalizedGMT(text, tmpPos, TRUE, &hasDigitOffset);
1173         if (tmpPos.getErrorIndex() == -1) {
1174             if (tmpPos.getIndex() == maxPos || hasDigitOffset) {
1175                 pos.setIndex(tmpPos.getIndex());
1176                 return createTimeZoneForOffset(offset);
1177             }
1178             // Evaluate other names - see the comment earlier in this method.
1179             if (parsedPos < tmpPos.getIndex()) {
1180                 parsedOffset = offset;
1181                 parsedID.setToBogus();
1182                 parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
1183                 parsedPos = tmpPos.getIndex();
1184             }
1185         }
1186     }
1187 
1188     // When ParseOption.ALL_STYLES is available, we also try to look all possible display names and IDs.
1189     // For example, when style is GENERIC_LONG, "EST" (SPECIFIC_SHORT) is never
1190     // used for America/New_York. With parseAllStyles true, this code parses "EST"
1191     // as America/New_York.
1192 
1193     // Note: Adding all possible names into the trie used by the implementation is quite heavy operation,
1194     // which we want to avoid normally (note that we cache the trie, so this is applicable to the
1195     // first time only as long as the cache does not expire).
1196 
1197     if (parseOptions & UTZFMT_PARSE_OPTION_ALL_STYLES) {
1198         // Try all specific names and exemplar location names
1199         if (parsedPos < maxPos) {
1200             LocalPointer<TimeZoneNames::MatchInfoCollection> specificMatches(fTimeZoneNames->find(text, startIdx, ALL_SIMPLE_NAME_TYPES, status));
1201             if (U_FAILURE(status)) {
1202                 pos.setErrorIndex(startIdx);
1203                 return NULL;
1204             }
1205             int32_t specificMatchIdx = -1;
1206             int32_t matchPos = -1;
1207             if (!specificMatches.isNull()) {
1208                 for (int32_t i = 0; i < specificMatches->size(); i++) {
1209                     if (startIdx + specificMatches->getMatchLengthAt(i) > matchPos) {
1210                         specificMatchIdx = i;
1211                         matchPos = startIdx + specificMatches->getMatchLengthAt(i);
1212                     }
1213                 }
1214             }
1215             if (parsedPos < matchPos) {
1216                 U_ASSERT(specificMatchIdx >= 0);
1217                 parsedPos = matchPos;
1218                 getTimeZoneID(specificMatches.getAlias(), specificMatchIdx, parsedID);
1219                 parsedTimeType = getTimeType(specificMatches->getNameTypeAt(specificMatchIdx));
1220                 parsedOffset = UNKNOWN_OFFSET;
1221             }
1222         }
1223         if (parseTZDBAbbrev && parsedPos < maxPos && (evaluated & STYLE_PARSE_FLAGS[UTZFMT_STYLE_SPECIFIC_SHORT]) == 0) {
1224             const TZDBTimeZoneNames *tzdbTimeZoneNames = getTZDBTimeZoneNames(status);
1225             if (U_SUCCESS(status)) {
1226                 LocalPointer<TimeZoneNames::MatchInfoCollection> tzdbNameMatches(
1227                     tzdbTimeZoneNames->find(text, startIdx, ALL_SIMPLE_NAME_TYPES, status));
1228                 if (U_FAILURE(status)) {
1229                     pos.setErrorIndex(startIdx);
1230                     return NULL;
1231                 }
1232                 int32_t tzdbNameMatchIdx = -1;
1233                 int32_t matchPos = -1;
1234                 if (!tzdbNameMatches.isNull()) {
1235                     for (int32_t i = 0; i < tzdbNameMatches->size(); i++) {
1236                         if (startIdx + tzdbNameMatches->getMatchLengthAt(i) > matchPos) {
1237                             tzdbNameMatchIdx = i;
1238                             matchPos = startIdx + tzdbNameMatches->getMatchLengthAt(i);
1239                         }
1240                     }
1241                 }
1242                 if (parsedPos < matchPos) {
1243                     U_ASSERT(tzdbNameMatchIdx >= 0);
1244                     parsedPos = matchPos;
1245                     getTimeZoneID(tzdbNameMatches.getAlias(), tzdbNameMatchIdx, parsedID);
1246                     parsedTimeType = getTimeType(tzdbNameMatches->getNameTypeAt(tzdbNameMatchIdx));
1247                     parsedOffset = UNKNOWN_OFFSET;
1248                 }
1249             }
1250         }
1251         // Try generic names
1252         if (parsedPos < maxPos) {
1253             int32_t genMatchLen = -1;
1254             UTimeZoneFormatTimeType tt = UTZFMT_TIME_TYPE_UNKNOWN;
1255 
1256             const TimeZoneGenericNames *gnames = getTimeZoneGenericNames(status);
1257             if (U_SUCCESS(status)) {
1258                 genMatchLen = gnames->findBestMatch(text, startIdx, ALL_GENERIC_NAME_TYPES, tzID, tt, status);
1259             }
1260             if (U_FAILURE(status)) {
1261                 pos.setErrorIndex(startIdx);
1262                 return NULL;
1263             }
1264 
1265             if (genMatchLen > 0 && parsedPos < startIdx + genMatchLen) {
1266                 parsedPos = startIdx + genMatchLen;
1267                 parsedID.setTo(tzID);
1268                 parsedTimeType = tt;
1269                 parsedOffset = UNKNOWN_OFFSET;
1270             }
1271         }
1272 
1273         // Try time zone ID
1274         if (parsedPos < maxPos && (evaluated & STYLE_PARSE_FLAGS[UTZFMT_STYLE_ZONE_ID]) == 0) {
1275             tmpPos.setIndex(startIdx);
1276             tmpPos.setErrorIndex(-1);
1277 
1278             parseZoneID(text, tmpPos, tzID);
1279             if (tmpPos.getErrorIndex() == -1 && parsedPos < tmpPos.getIndex()) {
1280                 parsedPos = tmpPos.getIndex();
1281                 parsedID.setTo(tzID);
1282                 parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
1283                 parsedOffset = UNKNOWN_OFFSET;
1284             }
1285         }
1286         // Try short time zone ID
1287         if (parsedPos < maxPos && (evaluated & STYLE_PARSE_FLAGS[UTZFMT_STYLE_ZONE_ID]) == 0) {
1288             tmpPos.setIndex(startIdx);
1289             tmpPos.setErrorIndex(-1);
1290 
1291             parseShortZoneID(text, tmpPos, tzID);
1292             if (tmpPos.getErrorIndex() == -1 && parsedPos < tmpPos.getIndex()) {
1293                 parsedPos = tmpPos.getIndex();
1294                 parsedID.setTo(tzID);
1295                 parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
1296                 parsedOffset = UNKNOWN_OFFSET;
1297             }
1298         }
1299     }
1300 
1301     if (parsedPos > startIdx) {
1302         // Parsed successfully
1303         TimeZone* parsedTZ;
1304         if (parsedID.length() > 0) {
1305             parsedTZ = TimeZone::createTimeZone(parsedID);
1306         } else {
1307             U_ASSERT(parsedOffset != UNKNOWN_OFFSET);
1308             parsedTZ = createTimeZoneForOffset(parsedOffset);
1309         }
1310         if (timeType) {
1311             *timeType = parsedTimeType;
1312         }
1313         pos.setIndex(parsedPos);
1314         return parsedTZ;
1315     }
1316 
1317     pos.setErrorIndex(startIdx);
1318     return NULL;
1319 }
1320 
1321 void
parseObject(const UnicodeString & source,Formattable & result,ParsePosition & parse_pos) const1322 TimeZoneFormat::parseObject(const UnicodeString& source, Formattable& result,
1323         ParsePosition& parse_pos) const {
1324     result.adoptObject(parse(UTZFMT_STYLE_GENERIC_LOCATION, source, parse_pos, UTZFMT_PARSE_OPTION_ALL_STYLES));
1325 }
1326 
1327 
1328 // ------------------------------------------------------------------
1329 // Private zone name format/parse implementation
1330 
1331 UnicodeString&
formatGeneric(const TimeZone & tz,int32_t genType,UDate date,UnicodeString & name) const1332 TimeZoneFormat::formatGeneric(const TimeZone& tz, int32_t genType, UDate date, UnicodeString& name) const {
1333     UErrorCode status = U_ZERO_ERROR;
1334     const TimeZoneGenericNames* gnames = getTimeZoneGenericNames(status);
1335     if (U_FAILURE(status)) {
1336         name.setToBogus();
1337         return name;
1338     }
1339 
1340     if (genType == UTZGNM_LOCATION) {
1341         const UChar* canonicalID = ZoneMeta::getCanonicalCLDRID(tz);
1342         if (canonicalID == NULL) {
1343             name.setToBogus();
1344             return name;
1345         }
1346         return gnames->getGenericLocationName(UnicodeString(TRUE, canonicalID, -1), name);
1347     }
1348     return gnames->getDisplayName(tz, (UTimeZoneGenericNameType)genType, date, name);
1349 }
1350 
1351 UnicodeString&
formatSpecific(const TimeZone & tz,UTimeZoneNameType stdType,UTimeZoneNameType dstType,UDate date,UnicodeString & name,UTimeZoneFormatTimeType * timeType) const1352 TimeZoneFormat::formatSpecific(const TimeZone& tz, UTimeZoneNameType stdType, UTimeZoneNameType dstType,
1353         UDate date, UnicodeString& name, UTimeZoneFormatTimeType *timeType) const {
1354     if (fTimeZoneNames == NULL) {
1355         name.setToBogus();
1356         return name;
1357     }
1358 
1359     UErrorCode status = U_ZERO_ERROR;
1360     UBool isDaylight = tz.inDaylightTime(date, status);
1361     const UChar* canonicalID = ZoneMeta::getCanonicalCLDRID(tz);
1362 
1363     if (U_FAILURE(status) || canonicalID == NULL) {
1364         name.setToBogus();
1365         return name;
1366     }
1367 
1368     if (isDaylight) {
1369         fTimeZoneNames->getDisplayName(UnicodeString(TRUE, canonicalID, -1), dstType, date, name);
1370     } else {
1371         fTimeZoneNames->getDisplayName(UnicodeString(TRUE, canonicalID, -1), stdType, date, name);
1372     }
1373 
1374     if (timeType && !name.isEmpty()) {
1375         *timeType = isDaylight ? UTZFMT_TIME_TYPE_DAYLIGHT : UTZFMT_TIME_TYPE_STANDARD;
1376     }
1377     return name;
1378 }
1379 
1380 const TimeZoneGenericNames*
getTimeZoneGenericNames(UErrorCode & status) const1381 TimeZoneFormat::getTimeZoneGenericNames(UErrorCode& status) const {
1382     if (U_FAILURE(status)) {
1383         return NULL;
1384     }
1385 
1386     umtx_lock(&gLock);
1387     if (fTimeZoneGenericNames == NULL) {
1388         TimeZoneFormat *nonConstThis = const_cast<TimeZoneFormat *>(this);
1389         nonConstThis->fTimeZoneGenericNames = TimeZoneGenericNames::createInstance(fLocale, status);
1390     }
1391     umtx_unlock(&gLock);
1392 
1393     return fTimeZoneGenericNames;
1394 }
1395 
1396 const TZDBTimeZoneNames*
getTZDBTimeZoneNames(UErrorCode & status) const1397 TimeZoneFormat::getTZDBTimeZoneNames(UErrorCode& status) const {
1398     if (U_FAILURE(status)) {
1399         return NULL;
1400     }
1401 
1402     umtx_lock(&gLock);
1403     if (fTZDBTimeZoneNames == NULL) {
1404         TZDBTimeZoneNames *tzdbNames = new TZDBTimeZoneNames(fLocale);
1405         if (tzdbNames == NULL) {
1406             status = U_MEMORY_ALLOCATION_ERROR;
1407         } else {
1408             TimeZoneFormat *nonConstThis = const_cast<TimeZoneFormat *>(this);
1409             nonConstThis->fTZDBTimeZoneNames = tzdbNames;
1410         }
1411     }
1412     umtx_unlock(&gLock);
1413 
1414     return fTZDBTimeZoneNames;
1415 }
1416 
1417 UnicodeString&
formatExemplarLocation(const TimeZone & tz,UnicodeString & name) const1418 TimeZoneFormat::formatExemplarLocation(const TimeZone& tz, UnicodeString& name) const {
1419     UChar locationBuf[ZONE_NAME_U16_MAX];
1420     UnicodeString location(locationBuf, 0, UPRV_LENGTHOF(locationBuf));
1421     const UChar* canonicalID = ZoneMeta::getCanonicalCLDRID(tz);
1422 
1423     if (canonicalID) {
1424         fTimeZoneNames->getExemplarLocationName(UnicodeString(TRUE, canonicalID, -1), location);
1425     }
1426     if (location.length() > 0) {
1427         name.setTo(location);
1428     } else {
1429         // Use "unknown" location
1430         fTimeZoneNames->getExemplarLocationName(UnicodeString(TRUE, UNKNOWN_ZONE_ID, -1), location);
1431         if (location.length() > 0) {
1432             name.setTo(location);
1433         } else {
1434             // last resort
1435             name.setTo(UNKNOWN_LOCATION, -1);
1436         }
1437     }
1438     return name;
1439 }
1440 
1441 
1442 // ------------------------------------------------------------------
1443 // Zone offset format and parse
1444 
1445 UnicodeString&
formatOffsetISO8601Basic(int32_t offset,UBool useUtcIndicator,UBool isShort,UBool ignoreSeconds,UnicodeString & result,UErrorCode & status) const1446 TimeZoneFormat::formatOffsetISO8601Basic(int32_t offset, UBool useUtcIndicator, UBool isShort, UBool ignoreSeconds,
1447         UnicodeString& result, UErrorCode& status) const {
1448     return formatOffsetISO8601(offset, TRUE, useUtcIndicator, isShort, ignoreSeconds, result, status);
1449 }
1450 
1451 UnicodeString&
formatOffsetISO8601Extended(int32_t offset,UBool useUtcIndicator,UBool isShort,UBool ignoreSeconds,UnicodeString & result,UErrorCode & status) const1452 TimeZoneFormat::formatOffsetISO8601Extended(int32_t offset, UBool useUtcIndicator, UBool isShort, UBool ignoreSeconds,
1453         UnicodeString& result, UErrorCode& status) const {
1454     return formatOffsetISO8601(offset, FALSE, useUtcIndicator, isShort, ignoreSeconds, result, status);
1455 }
1456 
1457 UnicodeString&
formatOffsetLocalizedGMT(int32_t offset,UnicodeString & result,UErrorCode & status) const1458 TimeZoneFormat::formatOffsetLocalizedGMT(int32_t offset, UnicodeString& result, UErrorCode& status) const {
1459     return formatOffsetLocalizedGMT(offset, FALSE, result, status);
1460 }
1461 
1462 UnicodeString&
formatOffsetShortLocalizedGMT(int32_t offset,UnicodeString & result,UErrorCode & status) const1463 TimeZoneFormat::formatOffsetShortLocalizedGMT(int32_t offset, UnicodeString& result, UErrorCode& status) const {
1464     return formatOffsetLocalizedGMT(offset, TRUE, result, status);
1465 }
1466 
1467 int32_t
parseOffsetISO8601(const UnicodeString & text,ParsePosition & pos) const1468 TimeZoneFormat::parseOffsetISO8601(const UnicodeString& text, ParsePosition& pos) const {
1469     return parseOffsetISO8601(text, pos, FALSE);
1470 }
1471 
1472 int32_t
parseOffsetLocalizedGMT(const UnicodeString & text,ParsePosition & pos) const1473 TimeZoneFormat::parseOffsetLocalizedGMT(const UnicodeString& text, ParsePosition& pos) const {
1474     return parseOffsetLocalizedGMT(text, pos, FALSE, NULL);
1475 }
1476 
1477 int32_t
parseOffsetShortLocalizedGMT(const UnicodeString & text,ParsePosition & pos) const1478 TimeZoneFormat::parseOffsetShortLocalizedGMT(const UnicodeString& text, ParsePosition& pos) const {
1479     return parseOffsetLocalizedGMT(text, pos, TRUE, NULL);
1480 }
1481 
1482 // ------------------------------------------------------------------
1483 // Private zone offset format/parse implementation
1484 
1485 UnicodeString&
formatOffsetISO8601(int32_t offset,UBool isBasic,UBool useUtcIndicator,UBool isShort,UBool ignoreSeconds,UnicodeString & result,UErrorCode & status) const1486 TimeZoneFormat::formatOffsetISO8601(int32_t offset, UBool isBasic, UBool useUtcIndicator,
1487         UBool isShort, UBool ignoreSeconds, UnicodeString& result, UErrorCode& status) const {
1488     if (U_FAILURE(status)) {
1489         result.setToBogus();
1490         return result;
1491     }
1492     int32_t absOffset = offset < 0 ? -offset : offset;
1493     if (useUtcIndicator && (absOffset < MILLIS_PER_SECOND || (ignoreSeconds && absOffset < MILLIS_PER_MINUTE))) {
1494         result.setTo(ISO8601_UTC);
1495         return result;
1496     }
1497 
1498     OffsetFields minFields = isShort ? FIELDS_H : FIELDS_HM;
1499     OffsetFields maxFields = ignoreSeconds ? FIELDS_HM : FIELDS_HMS;
1500     UChar sep = isBasic ? 0 : ISO8601_SEP;
1501 
1502     // Note: FIELDS_HMS as maxFields is a CLDR/ICU extension. ISO 8601 specification does
1503     // not support seconds field.
1504 
1505     if (absOffset >= MAX_OFFSET) {
1506         result.setToBogus();
1507         status = U_ILLEGAL_ARGUMENT_ERROR;
1508         return result;
1509     }
1510 
1511     int fields[3];
1512     fields[0] = absOffset / MILLIS_PER_HOUR;
1513     absOffset = absOffset % MILLIS_PER_HOUR;
1514     fields[1] = absOffset / MILLIS_PER_MINUTE;
1515     absOffset = absOffset % MILLIS_PER_MINUTE;
1516     fields[2] = absOffset / MILLIS_PER_SECOND;
1517 
1518     U_ASSERT(fields[0] >= 0 && fields[0] <= MAX_OFFSET_HOUR);
1519     U_ASSERT(fields[1] >= 0 && fields[1] <= MAX_OFFSET_MINUTE);
1520     U_ASSERT(fields[2] >= 0 && fields[2] <= MAX_OFFSET_SECOND);
1521 
1522     int32_t lastIdx = maxFields;
1523     while (lastIdx > minFields) {
1524         if (fields[lastIdx] != 0) {
1525             break;
1526         }
1527         lastIdx--;
1528     }
1529 
1530     UChar sign = PLUS;
1531     if (offset < 0) {
1532         // if all output fields are 0s, do not use negative sign
1533         for (int32_t idx = 0; idx <= lastIdx; idx++) {
1534             if (fields[idx] != 0) {
1535                 sign = MINUS;
1536                 break;
1537             }
1538         }
1539     }
1540     result.setTo(sign);
1541 
1542     for (int32_t idx = 0; idx <= lastIdx; idx++) {
1543         if (sep && idx != 0) {
1544             result.append(sep);
1545         }
1546         result.append((UChar)(0x0030 + fields[idx]/10));
1547         result.append((UChar)(0x0030 + fields[idx]%10));
1548     }
1549 
1550     return result;
1551 }
1552 
1553 UnicodeString&
formatOffsetLocalizedGMT(int32_t offset,UBool isShort,UnicodeString & result,UErrorCode & status) const1554 TimeZoneFormat::formatOffsetLocalizedGMT(int32_t offset, UBool isShort, UnicodeString& result, UErrorCode& status) const {
1555     if (U_FAILURE(status)) {
1556         result.setToBogus();
1557         return result;
1558     }
1559     if (offset <= -MAX_OFFSET || offset >= MAX_OFFSET) {
1560         result.setToBogus();
1561         status = U_ILLEGAL_ARGUMENT_ERROR;
1562         return result;
1563     }
1564 
1565     if (offset == 0) {
1566         result.setTo(fGMTZeroFormat);
1567         return result;
1568     }
1569 
1570     UBool positive = TRUE;
1571     if (offset < 0) {
1572         offset = -offset;
1573         positive = FALSE;
1574     }
1575 
1576     int32_t offsetH = offset / MILLIS_PER_HOUR;
1577     offset = offset % MILLIS_PER_HOUR;
1578     int32_t offsetM = offset / MILLIS_PER_MINUTE;
1579     offset = offset % MILLIS_PER_MINUTE;
1580     int32_t offsetS = offset / MILLIS_PER_SECOND;
1581 
1582     U_ASSERT(offsetH <= MAX_OFFSET_HOUR && offsetM <= MAX_OFFSET_MINUTE && offsetS <= MAX_OFFSET_SECOND);
1583 
1584     const UVector* offsetPatternItems = NULL;
1585     if (positive) {
1586         if (offsetS != 0) {
1587             offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_POSITIVE_HMS];
1588         } else if (offsetM != 0 || !isShort) {
1589             offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_POSITIVE_HM];
1590         } else {
1591             offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_POSITIVE_H];
1592         }
1593     } else {
1594         if (offsetS != 0) {
1595             offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_NEGATIVE_HMS];
1596         } else if (offsetM != 0 || !isShort) {
1597             offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_NEGATIVE_HM];
1598         } else {
1599             offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_NEGATIVE_H];
1600         }
1601     }
1602 
1603     U_ASSERT(offsetPatternItems != NULL);
1604 
1605     // Building the GMT format string
1606     result.setTo(fGMTPatternPrefix);
1607 
1608     for (int32_t i = 0; i < offsetPatternItems->size(); i++) {
1609         const GMTOffsetField* item = (GMTOffsetField*)offsetPatternItems->elementAt(i);
1610         GMTOffsetField::FieldType type = item->getType();
1611 
1612         switch (type) {
1613         case GMTOffsetField::TEXT:
1614             result.append(item->getPatternText(), -1);
1615             break;
1616 
1617         case GMTOffsetField::HOUR:
1618             appendOffsetDigits(result, offsetH, (isShort ? 1 : 2));
1619             break;
1620 
1621         case GMTOffsetField::MINUTE:
1622             appendOffsetDigits(result, offsetM, 2);
1623             break;
1624 
1625         case GMTOffsetField::SECOND:
1626             appendOffsetDigits(result, offsetS, 2);
1627             break;
1628         }
1629     }
1630 
1631     result.append(fGMTPatternSuffix);
1632     return result;
1633 }
1634 
1635 int32_t
parseOffsetISO8601(const UnicodeString & text,ParsePosition & pos,UBool extendedOnly,UBool * hasDigitOffset) const1636 TimeZoneFormat::parseOffsetISO8601(const UnicodeString& text, ParsePosition& pos, UBool extendedOnly, UBool* hasDigitOffset /* = NULL */) const {
1637     if (hasDigitOffset) {
1638         *hasDigitOffset = FALSE;
1639     }
1640     int32_t start = pos.getIndex();
1641     if (start >= text.length()) {
1642         pos.setErrorIndex(start);
1643         return 0;
1644     }
1645 
1646     UChar firstChar = text.charAt(start);
1647     if (firstChar == ISO8601_UTC || firstChar == (UChar)(ISO8601_UTC + 0x20)) {
1648         // "Z" (or "z") - indicates UTC
1649         pos.setIndex(start + 1);
1650         return 0;
1651     }
1652 
1653     int32_t sign = 1;
1654     if (firstChar == PLUS) {
1655         sign = 1;
1656     } else if (firstChar == MINUS) {
1657         sign = -1;
1658     } else {
1659         // Not an ISO 8601 offset string
1660         pos.setErrorIndex(start);
1661         return 0;
1662     }
1663     ParsePosition posOffset(start + 1);
1664     int32_t offset = parseAsciiOffsetFields(text, posOffset, ISO8601_SEP, FIELDS_H, FIELDS_HMS);
1665     if (posOffset.getErrorIndex() == -1 && !extendedOnly && (posOffset.getIndex() - start <= 3)) {
1666         // If the text is successfully parsed as extended format with the options above, it can be also parsed
1667         // as basic format. For example, "0230" can be parsed as offset 2:00 (only first digits are valid for
1668         // extended format), but it can be parsed as offset 2:30 with basic format. We use longer result.
1669         ParsePosition posBasic(start + 1);
1670         int32_t tmpOffset = parseAbuttingAsciiOffsetFields(text, posBasic, FIELDS_H, FIELDS_HMS, FALSE);
1671         if (posBasic.getErrorIndex() == -1 && posBasic.getIndex() > posOffset.getIndex()) {
1672             offset = tmpOffset;
1673             posOffset.setIndex(posBasic.getIndex());
1674         }
1675     }
1676 
1677     if (posOffset.getErrorIndex() != -1) {
1678         pos.setErrorIndex(start);
1679         return 0;
1680     }
1681 
1682     pos.setIndex(posOffset.getIndex());
1683     if (hasDigitOffset) {
1684         *hasDigitOffset = TRUE;
1685     }
1686     return sign * offset;
1687 }
1688 
1689 int32_t
parseOffsetLocalizedGMT(const UnicodeString & text,ParsePosition & pos,UBool isShort,UBool * hasDigitOffset) const1690 TimeZoneFormat::parseOffsetLocalizedGMT(const UnicodeString& text, ParsePosition& pos, UBool isShort, UBool* hasDigitOffset) const {
1691     int32_t start = pos.getIndex();
1692     int32_t offset = 0;
1693     int32_t parsedLength = 0;
1694 
1695     if (hasDigitOffset) {
1696         *hasDigitOffset = FALSE;
1697     }
1698 
1699     offset = parseOffsetLocalizedGMTPattern(text, start, isShort, parsedLength);
1700 
1701     // For now, parseOffsetLocalizedGMTPattern handles both long and short
1702     // formats, no matter isShort is true or false. This might be changed in future
1703     // when strict parsing is necessary, or different set of patterns are used for
1704     // short/long formats.
1705 #if 0
1706     if (parsedLength == 0) {
1707         offset = parseOffsetLocalizedGMTPattern(text, start, !isShort, parsedLength);
1708     }
1709 #endif
1710 
1711     if (parsedLength > 0) {
1712         if (hasDigitOffset) {
1713             *hasDigitOffset = TRUE;
1714         }
1715         pos.setIndex(start + parsedLength);
1716         return offset;
1717     }
1718 
1719     // Try the default patterns
1720     offset = parseOffsetDefaultLocalizedGMT(text, start, parsedLength);
1721     if (parsedLength > 0) {
1722         if (hasDigitOffset) {
1723             *hasDigitOffset = TRUE;
1724         }
1725         pos.setIndex(start + parsedLength);
1726         return offset;
1727     }
1728 
1729     // Check if this is a GMT zero format
1730     if (text.caseCompare(start, fGMTZeroFormat.length(), fGMTZeroFormat, 0) == 0) {
1731         pos.setIndex(start + fGMTZeroFormat.length());
1732         return 0;
1733     }
1734 
1735     // Check if this is a default GMT zero format
1736     for (int32_t i = 0; ALT_GMT_STRINGS[i][0] != 0; i++) {
1737         const UChar* defGMTZero = ALT_GMT_STRINGS[i];
1738         int32_t defGMTZeroLen = u_strlen(defGMTZero);
1739         if (text.caseCompare(start, defGMTZeroLen, defGMTZero, 0) == 0) {
1740             pos.setIndex(start + defGMTZeroLen);
1741             return 0;
1742         }
1743     }
1744 
1745     // Nothing matched
1746     pos.setErrorIndex(start);
1747     return 0;
1748 }
1749 
1750 int32_t
parseOffsetLocalizedGMTPattern(const UnicodeString & text,int32_t start,UBool,int32_t & parsedLen) const1751 TimeZoneFormat::parseOffsetLocalizedGMTPattern(const UnicodeString& text, int32_t start, UBool /*isShort*/, int32_t& parsedLen) const {
1752     int32_t idx = start;
1753     int32_t offset = 0;
1754     UBool parsed = FALSE;
1755 
1756     do {
1757         // Prefix part
1758         int32_t len = fGMTPatternPrefix.length();
1759         if (len > 0 && text.caseCompare(idx, len, fGMTPatternPrefix, 0) != 0) {
1760             // prefix match failed
1761             break;
1762         }
1763         idx += len;
1764 
1765         // Offset part
1766         offset = parseOffsetFields(text, idx, FALSE, len);
1767         if (len == 0) {
1768             // offset field match failed
1769             break;
1770         }
1771         idx += len;
1772 
1773         len = fGMTPatternSuffix.length();
1774         if (len > 0 && text.caseCompare(idx, len, fGMTPatternSuffix, 0) != 0) {
1775             // no suffix match
1776             break;
1777         }
1778         idx += len;
1779         parsed = TRUE;
1780     } while (FALSE);
1781 
1782     parsedLen = parsed ? idx - start : 0;
1783     return offset;
1784 }
1785 
1786 int32_t
parseOffsetFields(const UnicodeString & text,int32_t start,UBool,int32_t & parsedLen) const1787 TimeZoneFormat::parseOffsetFields(const UnicodeString& text, int32_t start, UBool /*isShort*/, int32_t& parsedLen) const {
1788     int32_t outLen = 0;
1789     int32_t offset = 0;
1790     int32_t sign = 1;
1791 
1792     parsedLen = 0;
1793 
1794     int32_t offsetH, offsetM, offsetS;
1795     offsetH = offsetM = offsetS = 0;
1796 
1797     for (int32_t patidx = 0; PARSE_GMT_OFFSET_TYPES[patidx] >= 0; patidx++) {
1798         int32_t gmtPatType = PARSE_GMT_OFFSET_TYPES[patidx];
1799         UVector* items = fGMTOffsetPatternItems[gmtPatType];
1800         U_ASSERT(items != NULL);
1801 
1802         outLen = parseOffsetFieldsWithPattern(text, start, items, FALSE, offsetH, offsetM, offsetS);
1803         if (outLen > 0) {
1804             sign = (gmtPatType == UTZFMT_PAT_POSITIVE_H || gmtPatType == UTZFMT_PAT_POSITIVE_HM || gmtPatType == UTZFMT_PAT_POSITIVE_HMS) ?
1805                 1 : -1;
1806             break;
1807         }
1808     }
1809 
1810     if (outLen > 0 && fAbuttingOffsetHoursAndMinutes) {
1811         // When hours field is sabutting minutes field,
1812         // the parse result above may not be appropriate.
1813         // For example, "01020" is parsed as 01:02: above,
1814         // but it should be parsed as 00:10:20.
1815         int32_t tmpLen = 0;
1816         int32_t tmpSign = 1;
1817         int32_t tmpH = 0;
1818         int32_t tmpM = 0;
1819         int32_t tmpS = 0;
1820 
1821         for (int32_t patidx = 0; PARSE_GMT_OFFSET_TYPES[patidx] >= 0; patidx++) {
1822             int32_t gmtPatType = PARSE_GMT_OFFSET_TYPES[patidx];
1823             UVector* items = fGMTOffsetPatternItems[gmtPatType];
1824             U_ASSERT(items != NULL);
1825 
1826             // forcing parse to use single hour digit
1827             tmpLen = parseOffsetFieldsWithPattern(text, start, items, TRUE, tmpH, tmpM, tmpS);
1828             if (tmpLen > 0) {
1829                 tmpSign = (gmtPatType == UTZFMT_PAT_POSITIVE_H || gmtPatType == UTZFMT_PAT_POSITIVE_HM || gmtPatType == UTZFMT_PAT_POSITIVE_HMS) ?
1830                     1 : -1;
1831                 break;
1832             }
1833         }
1834         if (tmpLen > outLen) {
1835             // Better parse result with single hour digit
1836             outLen = tmpLen;
1837             sign = tmpSign;
1838             offsetH = tmpH;
1839             offsetM = tmpM;
1840             offsetS = tmpS;
1841         }
1842     }
1843 
1844     if (outLen > 0) {
1845         offset = ((((offsetH * 60) + offsetM) * 60) + offsetS) * 1000 * sign;
1846         parsedLen = outLen;
1847     }
1848 
1849     return offset;
1850 }
1851 
1852 int32_t
parseOffsetFieldsWithPattern(const UnicodeString & text,int32_t start,UVector * patternItems,UBool forceSingleHourDigit,int32_t & hour,int32_t & min,int32_t & sec) const1853 TimeZoneFormat::parseOffsetFieldsWithPattern(const UnicodeString& text, int32_t start,
1854         UVector* patternItems, UBool forceSingleHourDigit, int32_t& hour, int32_t& min, int32_t& sec) const {
1855     UBool failed = FALSE;
1856     int32_t offsetH, offsetM, offsetS;
1857     offsetH = offsetM = offsetS = 0;
1858     int32_t idx = start;
1859 
1860     for (int32_t i = 0; i < patternItems->size(); i++) {
1861         int32_t len = 0;
1862         const GMTOffsetField* field = (const GMTOffsetField*)patternItems->elementAt(i);
1863         GMTOffsetField::FieldType fieldType = field->getType();
1864         if (fieldType == GMTOffsetField::TEXT) {
1865             const UChar* patStr = field->getPatternText();
1866             len = u_strlen(patStr);
1867             if (i == 0) {
1868                 // When TimeZoneFormat parse() is called from SimpleDateFormat,
1869                 // leading space characters might be truncated. If the first pattern text
1870                 // starts with such character (e.g. Bidi control), then we need to
1871                 // skip the leading space charcters.
1872                 if (idx < text.length() && !PatternProps::isWhiteSpace(text.char32At(idx))) {
1873                     while (len > 0) {
1874                         UChar32 ch;
1875                         int32_t chLen;
1876                         U16_GET(patStr, 0, 0, len, ch)
1877                         if (PatternProps::isWhiteSpace(ch)) {
1878                             chLen = U16_LENGTH(ch);
1879                             len -= chLen;
1880                             patStr += chLen;
1881                         }
1882                         else {
1883                             break;
1884                         }
1885                     }
1886                 }
1887             }
1888             if (text.caseCompare(idx, len, patStr, 0) != 0) {
1889                 failed = TRUE;
1890                 break;
1891             }
1892             idx += len;
1893         } else {
1894             if (fieldType == GMTOffsetField::HOUR) {
1895                 uint8_t maxDigits = forceSingleHourDigit ? 1 : 2;
1896                 offsetH = parseOffsetFieldWithLocalizedDigits(text, idx, 1, maxDigits, 0, MAX_OFFSET_HOUR, len);
1897             } else if (fieldType == GMTOffsetField::MINUTE) {
1898                 offsetM = parseOffsetFieldWithLocalizedDigits(text, idx, 2, 2, 0, MAX_OFFSET_MINUTE, len);
1899             } else if (fieldType == GMTOffsetField::SECOND) {
1900                 offsetS = parseOffsetFieldWithLocalizedDigits(text, idx, 2, 2, 0, MAX_OFFSET_SECOND, len);
1901             }
1902 
1903             if (len == 0) {
1904                 failed = TRUE;
1905                 break;
1906             }
1907             idx += len;
1908         }
1909     }
1910 
1911     if (failed) {
1912         hour = min = sec = 0;
1913         return 0;
1914     }
1915 
1916     hour = offsetH;
1917     min = offsetM;
1918     sec = offsetS;
1919 
1920     return idx - start;
1921 }
1922 
1923 int32_t
parseAbuttingOffsetFields(const UnicodeString & text,int32_t start,int32_t & parsedLen) const1924 TimeZoneFormat::parseAbuttingOffsetFields(const UnicodeString& text, int32_t start, int32_t& parsedLen) const {
1925     int32_t digits[MAX_OFFSET_DIGITS];
1926     int32_t parsed[MAX_OFFSET_DIGITS];  // accumulative offsets
1927 
1928     // Parse digits into int[]
1929     int32_t idx = start;
1930     int32_t len = 0;
1931     int32_t numDigits = 0;
1932     for (int32_t i = 0; i < MAX_OFFSET_DIGITS; i++) {
1933         digits[i] = parseSingleLocalizedDigit(text, idx, len);
1934         if (digits[i] < 0) {
1935             break;
1936         }
1937         idx += len;
1938         parsed[i] = idx - start;
1939         numDigits++;
1940     }
1941 
1942     if (numDigits == 0) {
1943         parsedLen = 0;
1944         return 0;
1945     }
1946 
1947     int32_t offset = 0;
1948     while (numDigits > 0) {
1949         int32_t hour = 0;
1950         int32_t min = 0;
1951         int32_t sec = 0;
1952 
1953         U_ASSERT(numDigits > 0 && numDigits <= MAX_OFFSET_DIGITS);
1954         switch (numDigits) {
1955         case 1: // H
1956             hour = digits[0];
1957             break;
1958         case 2: // HH
1959             hour = digits[0] * 10 + digits[1];
1960             break;
1961         case 3: // Hmm
1962             hour = digits[0];
1963             min = digits[1] * 10 + digits[2];
1964             break;
1965         case 4: // HHmm
1966             hour = digits[0] * 10 + digits[1];
1967             min = digits[2] * 10 + digits[3];
1968             break;
1969         case 5: // Hmmss
1970             hour = digits[0];
1971             min = digits[1] * 10 + digits[2];
1972             sec = digits[3] * 10 + digits[4];
1973             break;
1974         case 6: // HHmmss
1975             hour = digits[0] * 10 + digits[1];
1976             min = digits[2] * 10 + digits[3];
1977             sec = digits[4] * 10 + digits[5];
1978             break;
1979         }
1980         if (hour <= MAX_OFFSET_HOUR && min <= MAX_OFFSET_MINUTE && sec <= MAX_OFFSET_SECOND) {
1981             // found a valid combination
1982             offset = hour * MILLIS_PER_HOUR + min * MILLIS_PER_MINUTE + sec * MILLIS_PER_SECOND;
1983             parsedLen = parsed[numDigits - 1];
1984             break;
1985         }
1986         numDigits--;
1987     }
1988     return offset;
1989 }
1990 
1991 int32_t
parseOffsetDefaultLocalizedGMT(const UnicodeString & text,int start,int32_t & parsedLen) const1992 TimeZoneFormat::parseOffsetDefaultLocalizedGMT(const UnicodeString& text, int start, int32_t& parsedLen) const {
1993     int32_t idx = start;
1994     int32_t offset = 0;
1995     int32_t parsed = 0;
1996 
1997     do {
1998         // check global default GMT alternatives
1999         int32_t gmtLen = 0;
2000 
2001         for (int32_t i = 0; ALT_GMT_STRINGS[i][0] != 0; i++) {
2002             const UChar* gmt = ALT_GMT_STRINGS[i];
2003             int32_t len = u_strlen(gmt);
2004             if (text.caseCompare(start, len, gmt, 0) == 0) {
2005                 gmtLen = len;
2006                 break;
2007             }
2008         }
2009         if (gmtLen == 0) {
2010             break;
2011         }
2012         idx += gmtLen;
2013 
2014         // offset needs a sign char and a digit at minimum
2015         if (idx + 1 >= text.length()) {
2016             break;
2017         }
2018 
2019         // parse sign
2020         int32_t sign = 1;
2021         UChar c = text.charAt(idx);
2022         if (c == PLUS) {
2023             sign = 1;
2024         } else if (c == MINUS) {
2025             sign = -1;
2026         } else {
2027             break;
2028         }
2029         idx++;
2030 
2031         // offset part
2032         // try the default pattern with the separator first
2033         int32_t lenWithSep = 0;
2034         int32_t offsetWithSep = parseDefaultOffsetFields(text, idx, DEFAULT_GMT_OFFSET_SEP, lenWithSep);
2035         if (lenWithSep == text.length() - idx) {
2036             // maximum match
2037             offset = offsetWithSep * sign;
2038             idx += lenWithSep;
2039         } else {
2040             // try abutting field pattern
2041             int32_t lenAbut = 0;
2042             int32_t offsetAbut = parseAbuttingOffsetFields(text, idx, lenAbut);
2043 
2044             if (lenWithSep > lenAbut) {
2045                 offset = offsetWithSep * sign;
2046                 idx += lenWithSep;
2047             } else {
2048                 offset = offsetAbut * sign;
2049                 idx += lenAbut;
2050             }
2051         }
2052         parsed = idx - start;
2053     } while (false);
2054 
2055     parsedLen = parsed;
2056     return offset;
2057 }
2058 
2059 int32_t
parseDefaultOffsetFields(const UnicodeString & text,int32_t start,UChar separator,int32_t & parsedLen) const2060 TimeZoneFormat::parseDefaultOffsetFields(const UnicodeString& text, int32_t start, UChar separator, int32_t& parsedLen) const {
2061     int32_t max = text.length();
2062     int32_t idx = start;
2063     int32_t len = 0;
2064     int32_t hour = 0, min = 0, sec = 0;
2065 
2066     parsedLen = 0;
2067 
2068     do {
2069         hour = parseOffsetFieldWithLocalizedDigits(text, idx, 1, 2, 0, MAX_OFFSET_HOUR, len);
2070         if (len == 0) {
2071             break;
2072         }
2073         idx += len;
2074 
2075         if (idx + 1 < max && text.charAt(idx) == separator) {
2076             min = parseOffsetFieldWithLocalizedDigits(text, idx + 1, 2, 2, 0, MAX_OFFSET_MINUTE, len);
2077             if (len == 0) {
2078                 break;
2079             }
2080             idx += (1 + len);
2081 
2082             if (idx + 1 < max && text.charAt(idx) == separator) {
2083                 sec = parseOffsetFieldWithLocalizedDigits(text, idx + 1, 2, 2, 0, MAX_OFFSET_SECOND, len);
2084                 if (len == 0) {
2085                     break;
2086                 }
2087                 idx += (1 + len);
2088             }
2089         }
2090     } while (FALSE);
2091 
2092     if (idx == start) {
2093         return 0;
2094     }
2095 
2096     parsedLen = idx - start;
2097     return hour * MILLIS_PER_HOUR + min * MILLIS_PER_MINUTE + sec * MILLIS_PER_SECOND;
2098 }
2099 
2100 int32_t
parseOffsetFieldWithLocalizedDigits(const UnicodeString & text,int32_t start,uint8_t minDigits,uint8_t maxDigits,uint16_t minVal,uint16_t maxVal,int32_t & parsedLen) const2101 TimeZoneFormat::parseOffsetFieldWithLocalizedDigits(const UnicodeString& text, int32_t start, uint8_t minDigits, uint8_t maxDigits, uint16_t minVal, uint16_t maxVal, int32_t& parsedLen) const {
2102     parsedLen = 0;
2103 
2104     int32_t decVal = 0;
2105     int32_t numDigits = 0;
2106     int32_t idx = start;
2107     int32_t digitLen = 0;
2108 
2109     while (idx < text.length() && numDigits < maxDigits) {
2110         int32_t digit = parseSingleLocalizedDigit(text, idx, digitLen);
2111         if (digit < 0) {
2112             break;
2113         }
2114         int32_t tmpVal = decVal * 10 + digit;
2115         if (tmpVal > maxVal) {
2116             break;
2117         }
2118         decVal = tmpVal;
2119         numDigits++;
2120         idx += digitLen;
2121     }
2122 
2123     // Note: maxVal is checked in the while loop
2124     if (numDigits < minDigits || decVal < minVal) {
2125         decVal = -1;
2126         numDigits = 0;
2127     } else {
2128         parsedLen = idx - start;
2129     }
2130 
2131     return decVal;
2132 }
2133 
2134 int32_t
parseSingleLocalizedDigit(const UnicodeString & text,int32_t start,int32_t & len) const2135 TimeZoneFormat::parseSingleLocalizedDigit(const UnicodeString& text, int32_t start, int32_t& len) const {
2136     int32_t digit = -1;
2137     len = 0;
2138     if (start < text.length()) {
2139         UChar32 cp = text.char32At(start);
2140 
2141         // First, try digits configured for this instance
2142         for (int32_t i = 0; i < 10; i++) {
2143             if (cp == fGMTOffsetDigits[i]) {
2144                 digit = i;
2145                 break;
2146             }
2147         }
2148         // If failed, check if this is a Unicode digit
2149         if (digit < 0) {
2150             int32_t tmp = u_charDigitValue(cp);
2151             digit = (tmp >= 0 && tmp <= 9) ? tmp : -1;
2152         }
2153 
2154         if (digit >= 0) {
2155             int32_t next = text.moveIndex32(start, 1);
2156             len = next - start;
2157         }
2158     }
2159     return digit;
2160 }
2161 
2162 UnicodeString&
formatOffsetWithAsciiDigits(int32_t offset,UChar sep,OffsetFields minFields,OffsetFields maxFields,UnicodeString & result)2163 TimeZoneFormat::formatOffsetWithAsciiDigits(int32_t offset, UChar sep, OffsetFields minFields, OffsetFields maxFields, UnicodeString& result) {
2164     U_ASSERT(maxFields >= minFields);
2165     U_ASSERT(offset > -MAX_OFFSET && offset < MAX_OFFSET);
2166 
2167     UChar sign = PLUS;
2168     if (offset < 0) {
2169         sign = MINUS;
2170         offset = -offset;
2171     }
2172     result.setTo(sign);
2173 
2174     int fields[3];
2175     fields[0] = offset / MILLIS_PER_HOUR;
2176     offset = offset % MILLIS_PER_HOUR;
2177     fields[1] = offset / MILLIS_PER_MINUTE;
2178     offset = offset % MILLIS_PER_MINUTE;
2179     fields[2] = offset / MILLIS_PER_SECOND;
2180 
2181     U_ASSERT(fields[0] >= 0 && fields[0] <= MAX_OFFSET_HOUR);
2182     U_ASSERT(fields[1] >= 0 && fields[1] <= MAX_OFFSET_MINUTE);
2183     U_ASSERT(fields[2] >= 0 && fields[2] <= MAX_OFFSET_SECOND);
2184 
2185     int32_t lastIdx = maxFields;
2186     while (lastIdx > minFields) {
2187         if (fields[lastIdx] != 0) {
2188             break;
2189         }
2190         lastIdx--;
2191     }
2192 
2193     for (int32_t idx = 0; idx <= lastIdx; idx++) {
2194         if (sep && idx != 0) {
2195             result.append(sep);
2196         }
2197         result.append((UChar)(0x0030 + fields[idx]/10));
2198         result.append((UChar)(0x0030 + fields[idx]%10));
2199     }
2200 
2201     return result;
2202 }
2203 
2204 int32_t
parseAbuttingAsciiOffsetFields(const UnicodeString & text,ParsePosition & pos,OffsetFields minFields,OffsetFields maxFields,UBool fixedHourWidth)2205 TimeZoneFormat::parseAbuttingAsciiOffsetFields(const UnicodeString& text, ParsePosition& pos, OffsetFields minFields, OffsetFields maxFields, UBool fixedHourWidth) {
2206     int32_t start = pos.getIndex();
2207 
2208     int32_t minDigits = 2 * (minFields + 1) - (fixedHourWidth ? 0 : 1);
2209     int32_t maxDigits = 2 * (maxFields + 1);
2210 
2211     U_ASSERT(maxDigits <= MAX_OFFSET_DIGITS);
2212 
2213     int32_t digits[MAX_OFFSET_DIGITS] = {};
2214     int32_t numDigits = 0;
2215     int32_t idx = start;
2216     while (numDigits < maxDigits && idx < text.length()) {
2217         UChar uch = text.charAt(idx);
2218         int32_t digit = DIGIT_VAL(uch);
2219         if (digit < 0) {
2220             break;
2221         }
2222         digits[numDigits] = digit;
2223         numDigits++;
2224         idx++;
2225     }
2226 
2227     if (fixedHourWidth && (numDigits & 1)) {
2228         // Fixed digits, so the number of digits must be even number. Truncating.
2229         numDigits--;
2230     }
2231 
2232     if (numDigits < minDigits) {
2233         pos.setErrorIndex(start);
2234         return 0;
2235     }
2236 
2237     int32_t hour = 0, min = 0, sec = 0;
2238     UBool bParsed = FALSE;
2239     while (numDigits >= minDigits) {
2240         switch (numDigits) {
2241         case 1: //H
2242             hour = digits[0];
2243             break;
2244         case 2: //HH
2245             hour = digits[0] * 10 + digits[1];
2246             break;
2247         case 3: //Hmm
2248             hour = digits[0];
2249             min = digits[1] * 10 + digits[2];
2250             break;
2251         case 4: //HHmm
2252             hour = digits[0] * 10 + digits[1];
2253             min = digits[2] * 10 + digits[3];
2254             break;
2255         case 5: //Hmmss
2256             hour = digits[0];
2257             min = digits[1] * 10 + digits[2];
2258             sec = digits[3] * 10 + digits[4];
2259             break;
2260         case 6: //HHmmss
2261             hour = digits[0] * 10 + digits[1];
2262             min = digits[2] * 10 + digits[3];
2263             sec = digits[4] * 10 + digits[5];
2264             break;
2265         }
2266 
2267         if (hour <= MAX_OFFSET_HOUR && min <= MAX_OFFSET_MINUTE && sec <= MAX_OFFSET_SECOND) {
2268             // Successfully parsed
2269             bParsed = true;
2270             break;
2271         }
2272 
2273         // Truncating
2274         numDigits -= (fixedHourWidth ? 2 : 1);
2275         hour = min = sec = 0;
2276     }
2277 
2278     if (!bParsed) {
2279         pos.setErrorIndex(start);
2280         return 0;
2281     }
2282     pos.setIndex(start + numDigits);
2283     return ((((hour * 60) + min) * 60) + sec) * 1000;
2284 }
2285 
2286 int32_t
parseAsciiOffsetFields(const UnicodeString & text,ParsePosition & pos,UChar sep,OffsetFields minFields,OffsetFields maxFields)2287 TimeZoneFormat::parseAsciiOffsetFields(const UnicodeString& text, ParsePosition& pos, UChar sep, OffsetFields minFields, OffsetFields maxFields) {
2288     int32_t start = pos.getIndex();
2289     int32_t fieldVal[] = {0, 0, 0};
2290     int32_t fieldLen[] = {0, -1, -1};
2291     for (int32_t idx = start, fieldIdx = 0; idx < text.length() && fieldIdx <= maxFields; idx++) {
2292         UChar c = text.charAt(idx);
2293         if (c == sep) {
2294             if (fieldIdx == 0) {
2295                 if (fieldLen[0] == 0) {
2296                     // no hours field
2297                     break;
2298                 }
2299                 // 1 digit hour, move to next field
2300             } else {
2301                 if (fieldLen[fieldIdx] != -1) {
2302                     // premature minute or seconds field
2303                     break;
2304                 }
2305                 fieldLen[fieldIdx] = 0;
2306             }
2307             continue;
2308         } else if (fieldLen[fieldIdx] == -1) {
2309             // no separator after 2 digit field
2310             break;
2311         }
2312         int32_t digit = DIGIT_VAL(c);
2313         if (digit < 0) {
2314             // not a digit
2315             break;
2316         }
2317         fieldVal[fieldIdx] = fieldVal[fieldIdx] * 10 + digit;
2318         fieldLen[fieldIdx]++;
2319         if (fieldLen[fieldIdx] >= 2) {
2320             // parsed 2 digits, move to next field
2321             fieldIdx++;
2322         }
2323     }
2324 
2325     int32_t offset = 0;
2326     int32_t parsedLen = 0;
2327     int32_t parsedFields = -1;
2328     do {
2329         // hour
2330         if (fieldLen[0] == 0) {
2331             break;
2332         }
2333         if (fieldVal[0] > MAX_OFFSET_HOUR) {
2334             offset = (fieldVal[0] / 10) * MILLIS_PER_HOUR;
2335             parsedFields = FIELDS_H;
2336             parsedLen = 1;
2337             break;
2338         }
2339         offset = fieldVal[0] * MILLIS_PER_HOUR;
2340         parsedLen = fieldLen[0];
2341         parsedFields = FIELDS_H;
2342 
2343         // minute
2344         if (fieldLen[1] != 2 || fieldVal[1] > MAX_OFFSET_MINUTE) {
2345             break;
2346         }
2347         offset += fieldVal[1] * MILLIS_PER_MINUTE;
2348         parsedLen += (1 + fieldLen[1]);
2349         parsedFields = FIELDS_HM;
2350 
2351         // second
2352         if (fieldLen[2] != 2 || fieldVal[2] > MAX_OFFSET_SECOND) {
2353             break;
2354         }
2355         offset += fieldVal[2] * MILLIS_PER_SECOND;
2356         parsedLen += (1 + fieldLen[2]);
2357         parsedFields = FIELDS_HMS;
2358     } while (false);
2359 
2360     if (parsedFields < minFields) {
2361         pos.setErrorIndex(start);
2362         return 0;
2363     }
2364 
2365     pos.setIndex(start + parsedLen);
2366     return offset;
2367 }
2368 
2369 void
appendOffsetDigits(UnicodeString & buf,int32_t n,uint8_t minDigits) const2370 TimeZoneFormat::appendOffsetDigits(UnicodeString& buf, int32_t n, uint8_t minDigits) const {
2371     U_ASSERT(n >= 0 && n < 60);
2372     int32_t numDigits = n >= 10 ? 2 : 1;
2373     for (int32_t i = 0; i < minDigits - numDigits; i++) {
2374         buf.append(fGMTOffsetDigits[0]);
2375     }
2376     if (numDigits == 2) {
2377         buf.append(fGMTOffsetDigits[n / 10]);
2378     }
2379     buf.append(fGMTOffsetDigits[n % 10]);
2380 }
2381 
2382 // ------------------------------------------------------------------
2383 // Private misc
2384 void
initGMTPattern(const UnicodeString & gmtPattern,UErrorCode & status)2385 TimeZoneFormat::initGMTPattern(const UnicodeString& gmtPattern, UErrorCode& status) {
2386     if (U_FAILURE(status)) {
2387         return;
2388     }
2389     // This implementation not perfect, but sufficient practically.
2390     int32_t idx = gmtPattern.indexOf(ARG0, ARG0_LEN, 0);
2391     if (idx < 0) {
2392         status = U_ILLEGAL_ARGUMENT_ERROR;
2393         return;
2394     }
2395     fGMTPattern.setTo(gmtPattern);
2396     unquote(gmtPattern.tempSubString(0, idx), fGMTPatternPrefix);
2397     unquote(gmtPattern.tempSubString(idx + ARG0_LEN), fGMTPatternSuffix);
2398 }
2399 
2400 UnicodeString&
unquote(const UnicodeString & pattern,UnicodeString & result)2401 TimeZoneFormat::unquote(const UnicodeString& pattern, UnicodeString& result) {
2402     if (pattern.indexOf(SINGLEQUOTE) < 0) {
2403         result.setTo(pattern);
2404         return result;
2405     }
2406     result.remove();
2407     UBool isPrevQuote = FALSE;
2408     UBool inQuote = FALSE;
2409     for (int32_t i = 0; i < pattern.length(); i++) {
2410         UChar c = pattern.charAt(i);
2411         if (c == SINGLEQUOTE) {
2412             if (isPrevQuote) {
2413                 result.append(c);
2414                 isPrevQuote = FALSE;
2415             } else {
2416                 isPrevQuote = TRUE;
2417             }
2418             inQuote = !inQuote;
2419         } else {
2420             isPrevQuote = FALSE;
2421             result.append(c);
2422         }
2423     }
2424     return result;
2425 }
2426 
2427 UVector*
parseOffsetPattern(const UnicodeString & pattern,OffsetFields required,UErrorCode & status)2428 TimeZoneFormat::parseOffsetPattern(const UnicodeString& pattern, OffsetFields required, UErrorCode& status) {
2429     if (U_FAILURE(status)) {
2430         return NULL;
2431     }
2432     UVector* result = new UVector(deleteGMTOffsetField, NULL, status);
2433     if (result == NULL) {
2434         status = U_MEMORY_ALLOCATION_ERROR;
2435         return NULL;
2436     }
2437 
2438     int32_t checkBits = 0;
2439     UBool isPrevQuote = FALSE;
2440     UBool inQuote = FALSE;
2441     UChar textBuf[32];
2442     UnicodeString text(textBuf, 0, UPRV_LENGTHOF(textBuf));
2443     GMTOffsetField::FieldType itemType = GMTOffsetField::TEXT;
2444     int32_t itemLength = 1;
2445 
2446     for (int32_t i = 0; i < pattern.length(); i++) {
2447         UChar ch = pattern.charAt(i);
2448         if (ch == SINGLEQUOTE) {
2449             if (isPrevQuote) {
2450                 text.append(SINGLEQUOTE);
2451                 isPrevQuote = FALSE;
2452             } else {
2453                 isPrevQuote = TRUE;
2454                 if (itemType != GMTOffsetField::TEXT) {
2455                     if (GMTOffsetField::isValid(itemType, itemLength)) {
2456                         GMTOffsetField* fld = GMTOffsetField::createTimeField(itemType, static_cast<uint8_t>(itemLength), status);
2457                         result->addElement(fld, status);
2458                         if (U_FAILURE(status)) {
2459                             break;
2460                         }
2461                     } else {
2462                         status = U_ILLEGAL_ARGUMENT_ERROR;
2463                         break;
2464                     }
2465                     itemType = GMTOffsetField::TEXT;
2466                 }
2467             }
2468             inQuote = !inQuote;
2469         } else {
2470             isPrevQuote = FALSE;
2471             if (inQuote) {
2472                 text.append(ch);
2473             } else {
2474                 GMTOffsetField::FieldType tmpType = GMTOffsetField::getTypeByLetter(ch);
2475                 if (tmpType != GMTOffsetField::TEXT) {
2476                     // an offset time pattern character
2477                     if (tmpType == itemType) {
2478                         itemLength++;
2479                     } else {
2480                         if (itemType == GMTOffsetField::TEXT) {
2481                             if (text.length() > 0) {
2482                                 GMTOffsetField* textfld = GMTOffsetField::createText(text, status);
2483                                 result->addElement(textfld, status);
2484                                 if (U_FAILURE(status)) {
2485                                     break;
2486                                 }
2487                                 text.remove();
2488                             }
2489                         } else {
2490                             if (GMTOffsetField::isValid(itemType, itemLength)) {
2491                                 GMTOffsetField* fld = GMTOffsetField::createTimeField(itemType, static_cast<uint8_t>(itemLength), status);
2492                                 result->addElement(fld, status);
2493                                 if (U_FAILURE(status)) {
2494                                     break;
2495                                 }
2496                             } else {
2497                                 status = U_ILLEGAL_ARGUMENT_ERROR;
2498                                 break;
2499                             }
2500                         }
2501                         itemType = tmpType;
2502                         itemLength = 1;
2503                         checkBits |= tmpType;
2504                     }
2505                 } else {
2506                     // a string literal
2507                     if (itemType != GMTOffsetField::TEXT) {
2508                         if (GMTOffsetField::isValid(itemType, itemLength)) {
2509                             GMTOffsetField* fld = GMTOffsetField::createTimeField(itemType, static_cast<uint8_t>(itemLength), status);
2510                             result->addElement(fld, status);
2511                             if (U_FAILURE(status)) {
2512                                 break;
2513                             }
2514                         } else {
2515                             status = U_ILLEGAL_ARGUMENT_ERROR;
2516                             break;
2517                         }
2518                         itemType = GMTOffsetField::TEXT;
2519                     }
2520                     text.append(ch);
2521                 }
2522             }
2523         }
2524     }
2525     // handle last item
2526     if (U_SUCCESS(status)) {
2527         if (itemType == GMTOffsetField::TEXT) {
2528             if (text.length() > 0) {
2529                 GMTOffsetField* tfld = GMTOffsetField::createText(text, status);
2530                 result->addElement(tfld, status);
2531             }
2532         } else {
2533             if (GMTOffsetField::isValid(itemType, itemLength)) {
2534                 GMTOffsetField* fld = GMTOffsetField::createTimeField(itemType, static_cast<uint8_t>(itemLength), status);
2535                 result->addElement(fld, status);
2536             } else {
2537                 status = U_ILLEGAL_ARGUMENT_ERROR;
2538             }
2539         }
2540 
2541         // Check all required fields are set
2542         if (U_SUCCESS(status)) {
2543             int32_t reqBits = 0;
2544             switch (required) {
2545             case FIELDS_H:
2546                 reqBits = GMTOffsetField::HOUR;
2547                 break;
2548             case FIELDS_HM:
2549                 reqBits = GMTOffsetField::HOUR | GMTOffsetField::MINUTE;
2550                 break;
2551             case FIELDS_HMS:
2552                 reqBits = GMTOffsetField::HOUR | GMTOffsetField::MINUTE | GMTOffsetField::SECOND;
2553                 break;
2554             }
2555             if (checkBits == reqBits) {
2556                 // all required fields are set, no extra fields
2557                 return result;
2558             }
2559         }
2560     }
2561 
2562     // error
2563     delete result;
2564     return NULL;
2565 }
2566 
2567 UnicodeString&
expandOffsetPattern(const UnicodeString & offsetHM,UnicodeString & result,UErrorCode & status)2568 TimeZoneFormat::expandOffsetPattern(const UnicodeString& offsetHM, UnicodeString& result, UErrorCode& status) {
2569     result.setToBogus();
2570     if (U_FAILURE(status)) {
2571         return result;
2572     }
2573     U_ASSERT(u_strlen(DEFAULT_GMT_OFFSET_MINUTE_PATTERN) == 2);
2574 
2575     int32_t idx_mm = offsetHM.indexOf(DEFAULT_GMT_OFFSET_MINUTE_PATTERN, 2, 0);
2576     if (idx_mm < 0) {
2577         // Bad time zone hour pattern data
2578         status = U_ILLEGAL_ARGUMENT_ERROR;
2579         return result;
2580     }
2581 
2582     UnicodeString sep;
2583     int32_t idx_H = offsetHM.tempSubString(0, idx_mm).lastIndexOf((UChar)0x0048 /* H */);
2584     if (idx_H >= 0) {
2585         sep = offsetHM.tempSubString(idx_H + 1, idx_mm - (idx_H + 1));
2586     }
2587     result.setTo(offsetHM.tempSubString(0, idx_mm + 2));
2588     result.append(sep);
2589     result.append(DEFAULT_GMT_OFFSET_SECOND_PATTERN, -1);
2590     result.append(offsetHM.tempSubString(idx_mm + 2));
2591     return result;
2592 }
2593 
2594 UnicodeString&
truncateOffsetPattern(const UnicodeString & offsetHM,UnicodeString & result,UErrorCode & status)2595 TimeZoneFormat::truncateOffsetPattern(const UnicodeString& offsetHM, UnicodeString& result, UErrorCode& status) {
2596     result.setToBogus();
2597     if (U_FAILURE(status)) {
2598         return result;
2599     }
2600     U_ASSERT(u_strlen(DEFAULT_GMT_OFFSET_MINUTE_PATTERN) == 2);
2601 
2602     int32_t idx_mm = offsetHM.indexOf(DEFAULT_GMT_OFFSET_MINUTE_PATTERN, 2, 0);
2603     if (idx_mm < 0) {
2604         // Bad time zone hour pattern data
2605         status = U_ILLEGAL_ARGUMENT_ERROR;
2606         return result;
2607     }
2608     UChar HH[] = {0x0048, 0x0048};
2609     int32_t idx_HH = offsetHM.tempSubString(0, idx_mm).lastIndexOf(HH, 2, 0);
2610     if (idx_HH >= 0) {
2611         return result.setTo(offsetHM.tempSubString(0, idx_HH + 2));
2612     }
2613     int32_t idx_H = offsetHM.tempSubString(0, idx_mm).lastIndexOf((UChar)0x0048, 0);
2614     if (idx_H >= 0) {
2615         return result.setTo(offsetHM.tempSubString(0, idx_H + 1));
2616     }
2617     // Bad time zone hour pattern data
2618     status = U_ILLEGAL_ARGUMENT_ERROR;
2619     return result;
2620 }
2621 
2622 void
initGMTOffsetPatterns(UErrorCode & status)2623 TimeZoneFormat::initGMTOffsetPatterns(UErrorCode& status) {
2624     for (int32_t type = 0; type < UTZFMT_PAT_COUNT; type++) {
2625         switch (type) {
2626         case UTZFMT_PAT_POSITIVE_H:
2627         case UTZFMT_PAT_NEGATIVE_H:
2628             fGMTOffsetPatternItems[type] = parseOffsetPattern(fGMTOffsetPatterns[type], FIELDS_H, status);
2629             break;
2630         case UTZFMT_PAT_POSITIVE_HM:
2631         case UTZFMT_PAT_NEGATIVE_HM:
2632             fGMTOffsetPatternItems[type] = parseOffsetPattern(fGMTOffsetPatterns[type], FIELDS_HM, status);
2633             break;
2634         case UTZFMT_PAT_POSITIVE_HMS:
2635         case UTZFMT_PAT_NEGATIVE_HMS:
2636             fGMTOffsetPatternItems[type] = parseOffsetPattern(fGMTOffsetPatterns[type], FIELDS_HMS, status);
2637             break;
2638         }
2639     }
2640     checkAbuttingHoursAndMinutes();
2641 }
2642 
2643 void
checkAbuttingHoursAndMinutes()2644 TimeZoneFormat::checkAbuttingHoursAndMinutes() {
2645     fAbuttingOffsetHoursAndMinutes= FALSE;
2646     for (int32_t type = 0; type < UTZFMT_PAT_COUNT; type++) {
2647         UBool afterH = FALSE;
2648         UVector *items = fGMTOffsetPatternItems[type];
2649         for (int32_t i = 0; i < items->size(); i++) {
2650             const GMTOffsetField* item = (GMTOffsetField*)items->elementAt(i);
2651             GMTOffsetField::FieldType fieldType = item->getType();
2652             if (fieldType != GMTOffsetField::TEXT) {
2653                 if (afterH) {
2654                     fAbuttingOffsetHoursAndMinutes = TRUE;
2655                     break;
2656                 } else if (fieldType == GMTOffsetField::HOUR) {
2657                     afterH = TRUE;
2658                 }
2659             } else if (afterH) {
2660                 break;
2661             }
2662         }
2663         if (fAbuttingOffsetHoursAndMinutes) {
2664             break;
2665         }
2666     }
2667 }
2668 
2669 UBool
toCodePoints(const UnicodeString & str,UChar32 * codeArray,int32_t size)2670 TimeZoneFormat::toCodePoints(const UnicodeString& str, UChar32* codeArray, int32_t size) {
2671     int32_t count = str.countChar32();
2672     if (count != size) {
2673         return FALSE;
2674     }
2675 
2676     for (int32_t idx = 0, start = 0; idx < size; idx++) {
2677         codeArray[idx] = str.char32At(start);
2678         start = str.moveIndex32(start, 1);
2679     }
2680 
2681     return TRUE;
2682 }
2683 
2684 TimeZone*
createTimeZoneForOffset(int32_t offset) const2685 TimeZoneFormat::createTimeZoneForOffset(int32_t offset) const {
2686     if (offset == 0) {
2687         // when offset is 0, we should use "Etc/GMT"
2688         return TimeZone::createTimeZone(UnicodeString(TRUE, TZID_GMT, -1));
2689     }
2690     return ZoneMeta::createCustomTimeZone(offset);
2691 }
2692 
2693 UTimeZoneFormatTimeType
getTimeType(UTimeZoneNameType nameType)2694 TimeZoneFormat::getTimeType(UTimeZoneNameType nameType) {
2695     switch (nameType) {
2696     case UTZNM_LONG_STANDARD:
2697     case UTZNM_SHORT_STANDARD:
2698         return UTZFMT_TIME_TYPE_STANDARD;
2699 
2700     case UTZNM_LONG_DAYLIGHT:
2701     case UTZNM_SHORT_DAYLIGHT:
2702         return UTZFMT_TIME_TYPE_DAYLIGHT;
2703 
2704     default:
2705         return UTZFMT_TIME_TYPE_UNKNOWN;
2706     }
2707 }
2708 
2709 UnicodeString&
getTimeZoneID(const TimeZoneNames::MatchInfoCollection * matches,int32_t idx,UnicodeString & tzID) const2710 TimeZoneFormat::getTimeZoneID(const TimeZoneNames::MatchInfoCollection* matches, int32_t idx, UnicodeString& tzID) const {
2711     if (!matches->getTimeZoneIDAt(idx, tzID)) {
2712         UChar mzIDBuf[32];
2713         UnicodeString mzID(mzIDBuf, 0, UPRV_LENGTHOF(mzIDBuf));
2714         if (matches->getMetaZoneIDAt(idx, mzID)) {
2715             fTimeZoneNames->getReferenceZoneID(mzID, fTargetRegion, tzID);
2716         }
2717     }
2718     return tzID;
2719 }
2720 
2721 
2722 class ZoneIdMatchHandler : public TextTrieMapSearchResultHandler {
2723 public:
2724     ZoneIdMatchHandler();
2725     virtual ~ZoneIdMatchHandler();
2726 
2727     UBool handleMatch(int32_t matchLength, const CharacterNode *node, UErrorCode &status);
2728     const UChar* getID();
2729     int32_t getMatchLen();
2730 private:
2731     int32_t fLen;
2732     const UChar* fID;
2733 };
2734 
ZoneIdMatchHandler()2735 ZoneIdMatchHandler::ZoneIdMatchHandler()
2736 : fLen(0), fID(NULL) {
2737 }
2738 
~ZoneIdMatchHandler()2739 ZoneIdMatchHandler::~ZoneIdMatchHandler() {
2740 }
2741 
2742 UBool
handleMatch(int32_t matchLength,const CharacterNode * node,UErrorCode & status)2743 ZoneIdMatchHandler::handleMatch(int32_t matchLength, const CharacterNode *node, UErrorCode &status) {
2744     if (U_FAILURE(status)) {
2745         return FALSE;
2746     }
2747     if (node->hasValues()) {
2748         const UChar* id = (const UChar*)node->getValue(0);
2749         if (id != NULL) {
2750             if (fLen < matchLength) {
2751                 fID = id;
2752                 fLen = matchLength;
2753             }
2754         }
2755     }
2756     return TRUE;
2757 }
2758 
2759 const UChar*
getID()2760 ZoneIdMatchHandler::getID() {
2761     return fID;
2762 }
2763 
2764 int32_t
getMatchLen()2765 ZoneIdMatchHandler::getMatchLen() {
2766     return fLen;
2767 }
2768 
2769 
initZoneIdTrie(UErrorCode & status)2770 static void U_CALLCONV initZoneIdTrie(UErrorCode &status) {
2771     U_ASSERT(gZoneIdTrie == NULL);
2772     ucln_i18n_registerCleanup(UCLN_I18N_TIMEZONEFORMAT, tzfmt_cleanup);
2773     gZoneIdTrie = new TextTrieMap(TRUE, NULL);    // No deleter, because values are pooled by ZoneMeta
2774     if (gZoneIdTrie == NULL) {
2775         status = U_MEMORY_ALLOCATION_ERROR;
2776         return;
2777     }
2778     StringEnumeration *tzenum = TimeZone::createEnumeration();
2779     const UnicodeString *id;
2780     while ((id = tzenum->snext(status)) != NULL) {
2781         const UChar* uid = ZoneMeta::findTimeZoneID(*id);
2782         if (uid) {
2783             gZoneIdTrie->put(uid, const_cast<UChar *>(uid), status);
2784         }
2785     }
2786     delete tzenum;
2787 }
2788 
2789 
2790 UnicodeString&
parseZoneID(const UnicodeString & text,ParsePosition & pos,UnicodeString & tzID) const2791 TimeZoneFormat::parseZoneID(const UnicodeString& text, ParsePosition& pos, UnicodeString& tzID) const {
2792     UErrorCode status = U_ZERO_ERROR;
2793     umtx_initOnce(gZoneIdTrieInitOnce, &initZoneIdTrie, status);
2794 
2795     int32_t start = pos.getIndex();
2796     int32_t len = 0;
2797     tzID.setToBogus();
2798 
2799     if (U_SUCCESS(status)) {
2800         LocalPointer<ZoneIdMatchHandler> handler(new ZoneIdMatchHandler());
2801         gZoneIdTrie->search(text, start, handler.getAlias(), status);
2802         len = handler->getMatchLen();
2803         if (len > 0) {
2804             tzID.setTo(handler->getID(), -1);
2805         }
2806     }
2807 
2808     if (len > 0) {
2809         pos.setIndex(start + len);
2810     } else {
2811         pos.setErrorIndex(start);
2812     }
2813 
2814     return tzID;
2815 }
2816 
initShortZoneIdTrie(UErrorCode & status)2817 static void U_CALLCONV initShortZoneIdTrie(UErrorCode &status) {
2818     U_ASSERT(gShortZoneIdTrie == NULL);
2819     ucln_i18n_registerCleanup(UCLN_I18N_TIMEZONEFORMAT, tzfmt_cleanup);
2820     StringEnumeration *tzenum = TimeZone::createTimeZoneIDEnumeration(UCAL_ZONE_TYPE_CANONICAL, NULL, NULL, status);
2821     if (U_SUCCESS(status)) {
2822         gShortZoneIdTrie = new TextTrieMap(TRUE, NULL);    // No deleter, because values are pooled by ZoneMeta
2823         if (gShortZoneIdTrie == NULL) {
2824             status = U_MEMORY_ALLOCATION_ERROR;
2825         } else {
2826             const UnicodeString *id;
2827             while ((id = tzenum->snext(status)) != NULL) {
2828                 const UChar* uID = ZoneMeta::findTimeZoneID(*id);
2829                 const UChar* shortID = ZoneMeta::getShortID(*id);
2830                 if (shortID && uID) {
2831                     gShortZoneIdTrie->put(shortID, const_cast<UChar *>(uID), status);
2832                 }
2833             }
2834         }
2835     }
2836     delete tzenum;
2837 }
2838 
2839 
2840 UnicodeString&
parseShortZoneID(const UnicodeString & text,ParsePosition & pos,UnicodeString & tzID) const2841 TimeZoneFormat::parseShortZoneID(const UnicodeString& text, ParsePosition& pos, UnicodeString& tzID) const {
2842     UErrorCode status = U_ZERO_ERROR;
2843     umtx_initOnce(gShortZoneIdTrieInitOnce, &initShortZoneIdTrie, status);
2844 
2845     int32_t start = pos.getIndex();
2846     int32_t len = 0;
2847     tzID.setToBogus();
2848 
2849     if (U_SUCCESS(status)) {
2850         LocalPointer<ZoneIdMatchHandler> handler(new ZoneIdMatchHandler());
2851         gShortZoneIdTrie->search(text, start, handler.getAlias(), status);
2852         len = handler->getMatchLen();
2853         if (len > 0) {
2854             tzID.setTo(handler->getID(), -1);
2855         }
2856     }
2857 
2858     if (len > 0) {
2859         pos.setIndex(start + len);
2860     } else {
2861         pos.setErrorIndex(start);
2862     }
2863 
2864     return tzID;
2865 }
2866 
2867 
2868 UnicodeString&
parseExemplarLocation(const UnicodeString & text,ParsePosition & pos,UnicodeString & tzID) const2869 TimeZoneFormat::parseExemplarLocation(const UnicodeString& text, ParsePosition& pos, UnicodeString& tzID) const {
2870     int32_t startIdx = pos.getIndex();
2871     int32_t parsedPos = -1;
2872     tzID.setToBogus();
2873 
2874     UErrorCode status = U_ZERO_ERROR;
2875     LocalPointer<TimeZoneNames::MatchInfoCollection> exemplarMatches(fTimeZoneNames->find(text, startIdx, UTZNM_EXEMPLAR_LOCATION, status));
2876     if (U_FAILURE(status)) {
2877         pos.setErrorIndex(startIdx);
2878         return tzID;
2879     }
2880     int32_t matchIdx = -1;
2881     if (!exemplarMatches.isNull()) {
2882         for (int32_t i = 0; i < exemplarMatches->size(); i++) {
2883             if (startIdx + exemplarMatches->getMatchLengthAt(i) > parsedPos) {
2884                 matchIdx = i;
2885                 parsedPos = startIdx + exemplarMatches->getMatchLengthAt(i);
2886             }
2887         }
2888         if (parsedPos > 0) {
2889             pos.setIndex(parsedPos);
2890             getTimeZoneID(exemplarMatches.getAlias(), matchIdx, tzID);
2891         }
2892     }
2893 
2894     if (tzID.length() == 0) {
2895         pos.setErrorIndex(startIdx);
2896     }
2897 
2898     return tzID;
2899 }
2900 
2901 U_NAMESPACE_END
2902 
2903 #endif
2904