1 package org.unicode.cldr.tool;
2 
3 import java.util.Arrays;
4 import java.util.Collections;
5 import java.util.HashMap;
6 import java.util.LinkedHashSet;
7 import java.util.Map;
8 import java.util.Map.Entry;
9 import java.util.Set;
10 import java.util.TreeMap;
11 import java.util.TreeSet;
12 
13 import org.unicode.cldr.util.Builder;
14 import org.unicode.cldr.util.CLDRConfig;
15 import org.unicode.cldr.util.CLDRFile;
16 import org.unicode.cldr.util.Containment;
17 import org.unicode.cldr.util.DateTimeCanonicalizer.DateTimePatternType;
18 import org.unicode.cldr.util.Factory;
19 import org.unicode.cldr.util.LanguageTagParser;
20 import org.unicode.cldr.util.PreferredAndAllowedHour;
21 import org.unicode.cldr.util.SupplementalDataInfo.OfficialStatus;
22 import org.unicode.cldr.util.SupplementalDataInfo.PopulationData;
23 import org.unicode.cldr.util.With;
24 
25 import com.ibm.icu.dev.util.CollectionUtilities;
26 import com.ibm.icu.impl.Relation;
27 import com.ibm.icu.text.DateTimePatternGenerator.FormatParser;
28 import com.ibm.icu.text.DateTimePatternGenerator.VariableField;
29 import com.ibm.icu.text.UnicodeSet;
30 
31 public class FindPreferredHours {
32     private static CLDRConfig INFO = ToolConfig.getToolInstance();
33     private static final CLDRFile ENGLISH = INFO.getEnglish();
34     private static final UnicodeSet DIGITS = new UnicodeSet("[0-9]").freeze();
35 
36     private static final Set<Character> ONLY24 = Collections.unmodifiableSet(new LinkedHashSet<Character>(Arrays
37         .asList('H')));
38 
39     private final static Map<String, Set<Character>> OVERRIDE_ALLOWED = Builder
40         .with(new HashMap<String, Set<Character>>())
41         .put("RU", ONLY24)
42         .put("IL", ONLY24)
43         .freeze();
44 
45     private final static Map<String, Character> CONFLICT_RESOLUTION = Builder.with(new HashMap<String, Character>())
46         .put("DJ", 'h')
47         .put("KM", 'H')
48         .put("MG", 'H')
49         .put("MU", 'H')
50         .put("MZ", 'H')
51         .put("SC", 'H')
52         .put("CM", 'H')
53         .put("TD", 'h')
54         .put("DZ", 'h')
55         .put("MA", 'h')
56         .put("TN", 'h')
57         .put("BW", 'h')
58         .put("LS", 'h')
59         .put("NA", 'h')
60         .put("SZ", 'h')
61         .put("ZA", 'h')
62         .put("GH", 'h')
63         .put("MR", 'h')
64         .put("NG", 'h')
65         .put("TG", 'H')
66         .put("CA", 'h')
67         .put("US", 'h')
68         .put("CN", 'h')
69         .put("MO", 'h')
70         .put("PH", 'H')
71         .put("IN", 'h')
72         .put("LK", 'H')
73         .put("CY", 'h')
74         .put("IL", 'H')
75         .put("SY", 'h')
76         .put("MK", 'H')
77         .put("VU", 'h')
78         .put("TO", 'H')
79         .put("001", 'H')
80         .freeze();
81 
82     static final class Hours implements Comparable<Hours> {
83         final DateTimePatternType type;
84         final char variable;
85 
Hours(DateTimePatternType type, String variable)86         public Hours(DateTimePatternType type, String variable) {
87             this.type = type;
88             this.variable = variable.charAt(0);
89         }
90 
91         @Override
compareTo(Hours arg0)92         public int compareTo(Hours arg0) {
93             // TODO Auto-generated method stub
94             int result = type.compareTo(arg0.type);
95             if (result != 0) return result;
96             return variable < arg0.variable ? -1 : variable > arg0.variable ? 1 : 0;
97         }
98 
99         @Override
toString()100         public String toString() {
101             // TODO Auto-generated method stub
102             return type + ":" + variable;
103         }
104 
105         @Override
equals(Object obj)106         public boolean equals(Object obj) {
107             return obj instanceof Hours && compareTo((Hours) obj) == 0;
108         }
109     }
110 
main(String[] args)111     public static void main(String[] args) {
112         final Relation<String, Hours> lang2Hours = Relation.of(new TreeMap<String, Set<Hours>>(), TreeSet.class);
113         final Factory factory = INFO.getCldrFactory();
114         final FormatParser formatDateParser = new FormatParser();
115         final LikelySubtags likely2Max = new LikelySubtags(INFO.getSupplementalDataInfo());
116 
117         for (final String locale : factory.getAvailable()) {
118             if (locale.equals("root")) {
119                 continue;
120             }
121             // if (locale.charAt(0) > 'b') {
122             // continue;
123             // }
124             final CLDRFile cldrFile = factory.make(locale, true);
125             for (String path : With.in(cldrFile)) {
126                 // if (path.contains("/timeFormats")) {
127                 // System.out.println(path);
128                 // }
129                 DateTimePatternType type = DateTimePatternType.fromPath(path);
130                 if (type == DateTimePatternType.NA || type == DateTimePatternType.GMT) {
131                     continue;
132                 }
133                 String value = cldrFile.getStringValue(path);
134                 formatDateParser.set(value);
135                 for (Object item : formatDateParser.getItems()) {
136                     if (item instanceof VariableField) {
137                         String itemString = item.toString();
138                         if (PreferredAndAllowedHour.HourStyle.isHourCharacter(itemString)) {
139                             lang2Hours.put(locale, new Hours(type, itemString));
140                         }
141                     }
142                 }
143             }
144             System.out.println(locale + "\t" + lang2Hours.get(locale));
145             // for (Entry<String, Set<String>> e : lang2Hours.keyValuesSet()) {
146             // System.out.println(e);
147             // }
148         }
149 
150         // gather data per region
151 
152         Map<String, Relation<Character, String>> region2Preferred2locales = new TreeMap<String, Relation<Character, String>>();
153         Relation<String, Character> region2Allowed = Relation.of(new TreeMap<String, Set<Character>>(), TreeSet.class);
154         final LanguageTagParser ltp = new LanguageTagParser();
155 
156         for (Entry<String, Set<Hours>> localeAndHours : lang2Hours.keyValuesSet()) {
157             String locale = localeAndHours.getKey();
158             String maxLocale = likely2Max.maximize(locale);
159             if (maxLocale == null) {
160                 System.out.println("*** Missing likely for " + locale);
161                 continue;
162             }
163             String region = ltp.set(maxLocale).getRegion();
164             if (region.isEmpty()) {
165                 System.out.println("*** Missing region for " + locale + ", " + maxLocale);
166                 continue;
167             }
168             if (DIGITS.containsSome(region) && !region.equals("001")) {
169                 System.out.println("*** Skipping multicountry region for " + locale + ", " + maxLocale);
170                 continue;
171             }
172             for (Hours hours : localeAndHours.getValue()) {
173                 region2Allowed.put(region, hours.variable);
174                 if (hours.type == DateTimePatternType.STOCK) {
175                     Relation<Character, String> items = region2Preferred2locales.get(region);
176                     if (items == null) {
177                         region2Preferred2locales.put(region,
178                             items = Relation.of(new TreeMap<Character, Set<String>>(), TreeSet.class));
179                     }
180                     items.put(hours.variable, locale);
181                 }
182             }
183         }
184 
185         // now invert
186         Relation<PreferredAndAllowedHour, String> preferred2Region = Relation.of(
187             new TreeMap<PreferredAndAllowedHour, Set<String>>(), TreeSet.class);
188         StringBuilder overrides = new StringBuilder("\n");
189 
190         for (Entry<String, Relation<Character, String>> e : region2Preferred2locales.entrySet()) {
191             String region = e.getKey();
192             Set<Character> allowed = region2Allowed.get(region);
193             Relation<Character, String> preferredSet = e.getValue();
194             Character resolvedValue = CONFLICT_RESOLUTION.get(region);
195             if (resolvedValue != null) {
196                 if (preferredSet.size() == 1) {
197                     overrides.append(region + " didn't need override!!\n");
198                 } else {
199                     LinkedHashSet<Entry<Character, String>> oldValues = new LinkedHashSet<Entry<Character, String>>();
200                     StringBuilder oldValuesString = new StringBuilder();
201                     for (Entry<Character, String> x : preferredSet.keyValueSet()) {
202                         if (!x.getKey().equals(resolvedValue)) {
203                             oldValues.add(x);
204                             oldValuesString.append(x.getKey() + "=" + x.getValue() + "; ");
205                         }
206                     }
207                     for (Entry<Character, String> x : oldValues) {
208                         preferredSet.remove(x.getKey(), x.getValue());
209                     }
210                     overrides.append(region + " has multiple values. Overriding with CONFLICT_RESOLUTION to "
211                         + resolvedValue + " and discarded values " + oldValuesString + "\n");
212                 }
213             }
214 
215             Set<Character> allAllowed = new TreeSet<Character>();
216             Character preferred = null;
217 
218             for (Entry<Character, Set<String>> pref : preferredSet.keyValuesSet()) {
219                 allAllowed.addAll(allowed);
220                 if (preferred == null) {
221                     preferred = pref.getKey();
222                 } else {
223                     overrides.append(region + " has multiple preferred values! " + preferredSet + "\n");
224                 }
225                 // else {
226                 // if (!haveFirst) {
227                 // System.out.print("*** Conflict in\t" + region + "\t" + ENGLISH.getName("territory", region) +
228                 // "\twith\t");
229                 // System.out.println(preferred + "\t" + locales);
230                 // haveFirst = true;
231                 // }
232                 // //System.out.println("\t" + pref.getKey() + "\t" + pref.getValue());
233                 // }
234             }
235             Set<Character> overrideAllowed = OVERRIDE_ALLOWED.get(region);
236             if (overrideAllowed != null) {
237                 allAllowed = overrideAllowed;
238                 overrides.append(region + " overriding allowed to " + overrideAllowed + "\n");
239             }
240             try {
241                 preferred2Region.put(new PreferredAndAllowedHour(preferred, allAllowed), region);
242             } catch (RuntimeException e1) {
243                 throw e1;
244             }
245             String subcontinent = Containment.getSubcontinent(region);
246             String continent = Containment.getContinent(region);
247             String tag = CollectionUtilities.join(preferredSet.keySet(), ",");
248             if (tag.equals("h")) {
249                 tag += "*";
250             }
251 
252             System.out.println(tag
253                 + "\t" + region
254                 + "\t" + ENGLISH.getName("territory", region)
255                 + "\t" + subcontinent
256                 + "\t" + ENGLISH.getName("territory", subcontinent)
257                 + "\t" + continent
258                 + "\t" + ENGLISH.getName("territory", continent)
259                 + "\t" + showInfo(preferredSet));
260         }
261 
262         // now present
263 
264         System.out.println("    <timeData>");
265         for (Entry<PreferredAndAllowedHour, Set<String>> e : preferred2Region.keyValuesSet()) {
266             PreferredAndAllowedHour preferredAndAllowedHour = e.getKey();
267             Set<String> regions = e.getValue();
268             System.out.println("        <hours "
269                 + "preferred=\""
270                 + preferredAndAllowedHour.preferred
271                 + "\""
272                 + " allowed=\""
273                 + CollectionUtilities.join(preferredAndAllowedHour.allowed, " ")
274                 + "\""
275                 + " regions=\"" + CollectionUtilities.join(regions, " ") + "\""
276                 + "/>");
277         }
278         System.out.println("    </timeData>");
279         System.out.println(overrides);
280     }
281 
showInfo(Relation<Character, String> preferredSet)282     private static String showInfo(Relation<Character, String> preferredSet) {
283         StringBuilder b = new StringBuilder();
284         for (Character key : Arrays.asList('H', 'h')) {
285             if (b.length() != 0) {
286                 b.append('\t');
287             }
288             b.append(key).append('\t');
289             Set<String> value = preferredSet.get(key);
290             if (value != null) {
291                 boolean needSpace = false;
292                 for (String locale : value) {
293                     if (needSpace) {
294                         b.append(" ");
295                     } else {
296                         needSpace = true;
297                     }
298                     b.append(locale);
299                     boolean isOfficial = false;
300                     isOfficial = isOfficial(locale, isOfficial);
301                     if (isOfficial) {
302                         b.append('°');
303                     }
304                 }
305             }
306         }
307         return b.toString();
308     }
309 
isOfficial(String locale, boolean isOfficial)310     private static boolean isOfficial(String locale, boolean isOfficial) {
311         LanguageTagParser ltp = new LanguageTagParser().set(locale);
312         PopulationData data = INFO.getSupplementalDataInfo().getLanguageAndTerritoryPopulationData(
313             ltp.getLanguageScript(), ltp.getRegion());
314         if (data == null) {
315             data = INFO.getSupplementalDataInfo().getLanguageAndTerritoryPopulationData(
316                 ltp.getLanguage(), ltp.getRegion());
317         }
318         if (data != null) {
319             OfficialStatus status = data.getOfficialStatus();
320             if (status == OfficialStatus.official || status == OfficialStatus.de_facto_official) {
321                 isOfficial = true;
322             }
323         }
324         return isOfficial;
325     }
326 }
327