1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 ********************************************************************************
5 *   Copyright (C) 1997-2013, International Business Machines
6 *   Corporation and others.  All Rights Reserved.
7 ********************************************************************************
8 *
9 * File CHOICFMT.H
10 *
11 * Modification History:
12 *
13 *   Date        Name        Description
14 *   02/19/97    aliu        Converted from java.
15 *   03/20/97    helena      Finished first cut of implementation and got rid
16 *                           of nextDouble/previousDouble and replaced with
17 *                           boolean array.
18 *   4/10/97     aliu        Clean up.  Modified to work on AIX.
19 *   8/6/97      nos         Removed overloaded constructor, member var 'buffer'.
20 *   07/22/98    stephen     Removed operator!= (implemented in Format)
21 ********************************************************************************
22 */
23 
24 #ifndef CHOICFMT_H
25 #define CHOICFMT_H
26 
27 #include "unicode/utypes.h"
28 
29 #if U_SHOW_CPLUSPLUS_API
30 
31 /**
32  * \file
33  * \brief C++ API: Choice Format.
34  */
35 
36 #if !UCONFIG_NO_FORMATTING
37 
38 #include "unicode/fieldpos.h"
39 #include "unicode/format.h"
40 #include "unicode/messagepattern.h"
41 #include "unicode/numfmt.h"
42 #include "unicode/unistr.h"
43 
44 #ifndef U_HIDE_DEPRECATED_API
45 
46 U_NAMESPACE_BEGIN
47 
48 class MessageFormat;
49 
50 /**
51  * ChoiceFormat converts between ranges of numeric values and strings for those ranges.
52  * The strings must conform to the MessageFormat pattern syntax.
53  *
54  * <p><em><code>ChoiceFormat</code> is probably not what you need.
55  * Please use <code>MessageFormat</code>
56  * with <code>plural</code> arguments for proper plural selection,
57  * and <code>select</code> arguments for simple selection among a fixed set of choices!</em></p>
58  *
59  * <p>A <code>ChoiceFormat</code> splits
60  * the real number line \htmlonly<code>-&#x221E;</code> to
61  * <code>+&#x221E;</code>\endhtmlonly into two
62  * or more contiguous ranges. Each range is mapped to a
63  * string.</p>
64  *
65  * <p><code>ChoiceFormat</code> was originally intended
66  * for displaying grammatically correct
67  * plurals such as &quot;There is one file.&quot; vs. &quot;There are 2 files.&quot;
68  * <em>However,</em> plural rules for many languages
69  * are too complex for the capabilities of ChoiceFormat,
70  * and its requirement of specifying the precise rules for each message
71  * is unmanageable for translators.</p>
72  *
73  * <p>There are two methods of defining a <code>ChoiceFormat</code>; both
74  * are equivalent.  The first is by using a string pattern. This is the
75  * preferred method in most cases.  The second method is through direct
76  * specification of the arrays that logically make up the
77  * <code>ChoiceFormat</code>.</p>
78  *
79  * <p>Note: Typically, choice formatting is done (if done at all) via <code>MessageFormat</code>
80  * with a <code>choice</code> argument type,
81  * rather than using a stand-alone <code>ChoiceFormat</code>.</p>
82  *
83  * <h5>Patterns and Their Interpretation</h5>
84  *
85  * <p>The pattern string defines the range boundaries and the strings for each number range.
86  * Syntax:
87  * <pre>
88  * choiceStyle = number separator message ('|' number separator message)*
89  * number = normal_number | ['-'] \htmlonly&#x221E;\endhtmlonly (U+221E, infinity)
90  * normal_number = double value (unlocalized ASCII string)
91  * separator = less_than | less_than_or_equal
92  * less_than = '<'
93  * less_than_or_equal = '#' | \htmlonly&#x2264;\endhtmlonly (U+2264)
94  * message: see {@link MessageFormat}
95  * </pre>
96  * Pattern_White_Space between syntax elements is ignored, except
97  * around each range's sub-message.</p>
98  *
99  * <p>Each numeric sub-range extends from the current range's number
100  * to the next range's number.
101  * The number itself is included in its range if a <code>less_than_or_equal</code> sign is used,
102  * and excluded from its range (and instead included in the previous range)
103  * if a <code>less_than</code> sign is used.</p>
104  *
105  * <p>When a <code>ChoiceFormat</code> is constructed from
106  * arrays of numbers, closure flags and strings,
107  * they are interpreted just like
108  * the sequence of <code>(number separator string)</code> in an equivalent pattern string.
109  * <code>closures[i]==true</code> corresponds to a <code>less_than</code> separator sign.
110  * The equivalent pattern string will be constructed automatically.</p>
111  *
112  * <p>During formatting, a number is mapped to the first range
113  * where the number is not greater than the range's upper limit.
114  * That range's message string is returned. A NaN maps to the very first range.</p>
115  *
116  * <p>During parsing, a range is selected for the longest match of
117  * any range's message. That range's number is returned, ignoring the separator/closure.
118  * Only a simple string match is performed, without parsing of arguments that
119  * might be specified in the message strings.</p>
120  *
121  * <p>Note that the first range's number is ignored in formatting
122  * but may be returned from parsing.</p>
123  *
124  * <h5>Examples</h5>
125  *
126  * <p>Here is an example of two arrays that map the number
127  * <code>1..7</code> to the English day of the week abbreviations
128  * <code>Sun..Sat</code>. No closures array is given; this is the same as
129  * specifying all closures to be <code>false</code>.</p>
130  *
131  * <pre>    {1,2,3,4,5,6,7},
132  *     {&quot;Sun&quot;,&quot;Mon&quot;,&quot;Tue&quot;,&quot;Wed&quot;,&quot;Thur&quot;,&quot;Fri&quot;,&quot;Sat&quot;}</pre>
133  *
134  * <p>Here is an example that maps the ranges [-Inf, 1), [1, 1], and (1,
135  * +Inf] to three strings. That is, the number line is split into three
136  * ranges: x &lt; 1.0, x = 1.0, and x &gt; 1.0.
137  * (The round parentheses in the notation above indicate an exclusive boundary,
138  * like the turned bracket in European notation: [-Inf, 1) == [-Inf, 1[  )</p>
139  *
140  * <pre>    {0, 1, 1},
141  *     {false, false, true},
142  *     {&quot;no files&quot;, &quot;one file&quot;, &quot;many files&quot;}</pre>
143  *
144  * <p>Here is an example that shows formatting and parsing: </p>
145  *
146  * \code
147  *   #include <unicode/choicfmt.h>
148  *   #include <unicode/unistr.h>
149  *   #include <iostream>
150  *
151  *   int main(int argc, char *argv[]) {
152  *       double limits[] = {1,2,3,4,5,6,7};
153  *       UnicodeString dayNames[] = {
154  *           "Sun","Mon","Tue","Wed","Thu","Fri","Sat"};
155  *       ChoiceFormat fmt(limits, dayNames, 7);
156  *       UnicodeString str;
157  *       char buf[256];
158  *       for (double x = 1.0; x <= 8.0; x += 1.0) {
159  *           fmt.format(x, str);
160  *           str.extract(0, str.length(), buf, 256, "");
161  *           str.truncate(0);
162  *           std::cout << x << " -> "
163  *                     << buf << std::endl;
164  *       }
165  *       std::cout << std::endl;
166  *       return 0;
167  *   }
168  * \endcode
169  *
170  * <p><em>User subclasses are not supported.</em> While clients may write
171  * subclasses, such code will not necessarily work and will not be
172  * guaranteed to work stably from release to release.
173  *
174  * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
175  */
176 class U_I18N_API ChoiceFormat: public NumberFormat {
177 public:
178     /**
179      * Constructs a new ChoiceFormat from the pattern string.
180      *
181      * @param pattern   Pattern used to construct object.
182      * @param status    Output param to receive success code.  If the
183      *                  pattern cannot be parsed, set to failure code.
184      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
185      */
186     ChoiceFormat(const UnicodeString& pattern,
187                  UErrorCode& status);
188 
189 
190     /**
191      * Constructs a new ChoiceFormat with the given limits and message strings.
192      * All closure flags default to <code>false</code>,
193      * equivalent to <code>less_than_or_equal</code> separators.
194      *
195      * Copies the limits and formats instead of adopting them.
196      *
197      * @param limits    Array of limit values.
198      * @param formats   Array of formats.
199      * @param count     Size of 'limits' and 'formats' arrays.
200      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
201      */
202     ChoiceFormat(const double* limits,
203                  const UnicodeString* formats,
204                  int32_t count );
205 
206     /**
207      * Constructs a new ChoiceFormat with the given limits, closure flags and message strings.
208      *
209      * Copies the limits and formats instead of adopting them.
210      *
211      * @param limits Array of limit values
212      * @param closures Array of booleans specifying whether each
213      * element of 'limits' is open or closed.  If false, then the
214      * corresponding limit number is a member of its range.
215      * If true, then the limit number belongs to the previous range.
216      * @param formats Array of formats
217      * @param count Size of 'limits', 'closures', and 'formats' arrays
218      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
219      */
220     ChoiceFormat(const double* limits,
221                  const UBool* closures,
222                  const UnicodeString* formats,
223                  int32_t count);
224 
225     /**
226      * Copy constructor.
227      *
228      * @param that   ChoiceFormat object to be copied from
229      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
230      */
231     ChoiceFormat(const ChoiceFormat& that);
232 
233     /**
234      * Assignment operator.
235      *
236      * @param that   ChoiceFormat object to be copied
237      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
238      */
239     const ChoiceFormat& operator=(const ChoiceFormat& that);
240 
241     /**
242      * Destructor.
243      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
244      */
245     virtual ~ChoiceFormat();
246 
247     /**
248      * Clones this Format object. The caller owns the
249      * result and must delete it when done.
250      *
251      * @return a copy of this object
252      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
253      */
254     virtual ChoiceFormat* clone() const;
255 
256     /**
257      * Returns true if the given Format objects are semantically equal.
258      * Objects of different subclasses are considered unequal.
259      *
260      * @param other    ChoiceFormat object to be compared
261      * @return         true if other is the same as this.
262      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
263      */
264     virtual UBool operator==(const Format& other) const;
265 
266     /**
267      * Sets the pattern.
268      * @param pattern   The pattern to be applied.
269      * @param status    Output param set to success/failure code on
270      *                  exit. If the pattern is invalid, this will be
271      *                  set to a failure result.
272      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
273      */
274     virtual void applyPattern(const UnicodeString& pattern,
275                               UErrorCode& status);
276 
277     /**
278      * Sets the pattern.
279      * @param pattern    The pattern to be applied.
280      * @param parseError Struct to receive information on position
281      *                   of error if an error is encountered
282      * @param status     Output param set to success/failure code on
283      *                   exit. If the pattern is invalid, this will be
284      *                   set to a failure result.
285      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
286      */
287     virtual void applyPattern(const UnicodeString& pattern,
288                              UParseError& parseError,
289                              UErrorCode& status);
290     /**
291      * Gets the pattern.
292      *
293      * @param pattern    Output param which will receive the pattern.
294      *                   Previous contents are deleted.
295      * @return    A reference to 'pattern'
296      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
297      */
298     virtual UnicodeString& toPattern(UnicodeString &pattern) const;
299 
300     /**
301      * Sets the choices to be used in formatting.
302      * For details see the constructor with the same parameter list.
303      *
304      * @param limitsToCopy      Contains the lower limit of each range,
305      *                          and should be in ascending sorted order.
306      *                          When formatting X, the choice will be
307      *                          the i where limitsToCopy[i]
308      *                          &lt;= X &lt; limitsToCopy[i+1].
309      * @param formatsToCopy     The format strings you want to use for each limit.
310      * @param count             The size of the above arrays.
311      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
312      */
313     virtual void setChoices(const double* limitsToCopy,
314                             const UnicodeString* formatsToCopy,
315                             int32_t count );
316 
317     /**
318      * Sets the choices to be used in formatting.
319      * For details see the constructor with the same parameter list.
320      *
321      * @param limits Array of limits
322      * @param closures Array of closure flags, one per limit
323      * @param formats Array of format strings
324      * @param count The size of the above arrays
325      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
326      */
327     virtual void setChoices(const double* limits,
328                             const UBool* closures,
329                             const UnicodeString* formats,
330                             int32_t count);
331 
332     /**
333      * Returns NULL and 0.
334      * Before ICU 4.8, this used to return the choice limits array.
335      *
336      * @param count Will be set to 0.
337      * @return NULL
338      * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
339      */
340     virtual const double* getLimits(int32_t& count) const;
341 
342     /**
343      * Returns NULL and 0.
344      * Before ICU 4.8, this used to return the limit booleans array.
345      *
346      * @param count Will be set to 0.
347      * @return NULL
348      * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
349      */
350     virtual const UBool* getClosures(int32_t& count) const;
351 
352     /**
353      * Returns NULL and 0.
354      * Before ICU 4.8, this used to return the array of choice strings.
355      *
356      * @param count Will be set to 0.
357      * @return NULL
358      * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
359      */
360     virtual const UnicodeString* getFormats(int32_t& count) const;
361 
362 
363     using NumberFormat::format;
364 
365     /**
366      * Formats a double number using this object's choices.
367      *
368      * @param number    The value to be formatted.
369      * @param appendTo  Output parameter to receive result.
370      *                  Result is appended to existing contents.
371      * @param pos       On input: an alignment field, if desired.
372      *                  On output: the offsets of the alignment field.
373      * @return          Reference to 'appendTo' parameter.
374      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
375      */
376     virtual UnicodeString& format(double number,
377                                   UnicodeString& appendTo,
378                                   FieldPosition& pos) const;
379     /**
380      * Formats an int32_t number using this object's choices.
381      *
382      * @param number    The value to be formatted.
383      * @param appendTo  Output parameter to receive result.
384      *                  Result is appended to existing contents.
385      * @param pos       On input: an alignment field, if desired.
386      *                  On output: the offsets of the alignment field.
387      * @return          Reference to 'appendTo' parameter.
388      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
389      */
390     virtual UnicodeString& format(int32_t number,
391                                   UnicodeString& appendTo,
392                                   FieldPosition& pos) const;
393 
394     /**
395      * Formats an int64_t number using this object's choices.
396      *
397      * @param number    The value to be formatted.
398      * @param appendTo  Output parameter to receive result.
399      *                  Result is appended to existing contents.
400      * @param pos       On input: an alignment field, if desired.
401      *                  On output: the offsets of the alignment field.
402      * @return          Reference to 'appendTo' parameter.
403      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
404      */
405     virtual UnicodeString& format(int64_t number,
406                                   UnicodeString& appendTo,
407                                   FieldPosition& pos) const;
408 
409     /**
410      * Formats an array of objects using this object's choices.
411      *
412      * @param objs      The array of objects to be formatted.
413      * @param cnt       The size of objs.
414      * @param appendTo  Output parameter to receive result.
415      *                  Result is appended to existing contents.
416      * @param pos       On input: an alignment field, if desired.
417      *                  On output: the offsets of the alignment field.
418      * @param success   Output param set to success/failure code on
419      *                  exit.
420      * @return          Reference to 'appendTo' parameter.
421      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
422      */
423     virtual UnicodeString& format(const Formattable* objs,
424                                   int32_t cnt,
425                                   UnicodeString& appendTo,
426                                   FieldPosition& pos,
427                                   UErrorCode& success) const;
428 
429    using NumberFormat::parse;
430 
431    /**
432     * Looks for the longest match of any message string on the input text and,
433     * if there is a match, sets the result object to the corresponding range's number.
434     *
435     * If no string matches, then the parsePosition is unchanged.
436     *
437     * @param text           The text to be parsed.
438     * @param result         Formattable to be set to the parse result.
439     *                       If parse fails, return contents are undefined.
440     * @param parsePosition  The position to start parsing at on input.
441     *                       On output, moved to after the last successfully
442     *                       parsed character. On parse failure, does not change.
443     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
444     */
445     virtual void parse(const UnicodeString& text,
446                        Formattable& result,
447                        ParsePosition& parsePosition) const;
448 
449     /**
450      * Returns a unique class ID POLYMORPHICALLY. Part of ICU's "poor man's RTTI".
451      *
452      * @return          The class ID for this object. All objects of a
453      *                  given class have the same class ID.  Objects of
454      *                  other classes have different class IDs.
455      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
456      */
457     virtual UClassID getDynamicClassID(void) const;
458 
459     /**
460      * Returns the class ID for this class.  This is useful only for
461      * comparing to a return value from getDynamicClassID().  For example:
462      * <pre>
463      * .       Base* polymorphic_pointer = createPolymorphicObject();
464      * .       if (polymorphic_pointer->getDynamicClassID() ==
465      * .           Derived::getStaticClassID()) ...
466      * </pre>
467      * @return          The class ID for all objects of this class.
468      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
469      */
470     static UClassID U_EXPORT2 getStaticClassID(void);
471 
472 private:
473     /**
474      * Converts a double value to a string.
475      * @param value the double number to be converted.
476      * @param string the result string.
477      * @return the converted string.
478      */
479     static UnicodeString& dtos(double value, UnicodeString& string);
480 
481     ChoiceFormat(); // default constructor not implemented
482 
483     /**
484      * Construct a new ChoiceFormat with the limits and the corresponding formats
485      * based on the pattern.
486      *
487      * @param newPattern   Pattern used to construct object.
488      * @param parseError   Struct to receive information on position
489      *                     of error if an error is encountered.
490      * @param status       Output param to receive success code.  If the
491      *                     pattern cannot be parsed, set to failure code.
492      */
493     ChoiceFormat(const UnicodeString& newPattern,
494                  UParseError& parseError,
495                  UErrorCode& status);
496 
497     friend class MessageFormat;
498 
499     virtual void setChoices(const double* limits,
500                             const UBool* closures,
501                             const UnicodeString* formats,
502                             int32_t count,
503                             UErrorCode &errorCode);
504 
505     /**
506      * Finds the ChoiceFormat sub-message for the given number.
507      * @param pattern A MessagePattern.
508      * @param partIndex the index of the first ChoiceFormat argument style part.
509      * @param number a number to be mapped to one of the ChoiceFormat argument's intervals
510      * @return the sub-message start part index.
511      */
512     static int32_t findSubMessage(const MessagePattern &pattern, int32_t partIndex, double number);
513 
514     static double parseArgument(
515             const MessagePattern &pattern, int32_t partIndex,
516             const UnicodeString &source, ParsePosition &pos);
517 
518     /**
519      * Matches the pattern string from the end of the partIndex to
520      * the beginning of the limitPartIndex,
521      * including all syntax except SKIP_SYNTAX,
522      * against the source string starting at sourceOffset.
523      * If they match, returns the length of the source string match.
524      * Otherwise returns -1.
525      */
526     static int32_t matchStringUntilLimitPart(
527             const MessagePattern &pattern, int32_t partIndex, int32_t limitPartIndex,
528             const UnicodeString &source, int32_t sourceOffset);
529 
530     /**
531      * Some of the ChoiceFormat constructors do not have a UErrorCode parameter.
532      * We need _some_ way to provide one for the MessagePattern constructor.
533      * Alternatively, the MessagePattern could be a pointer field, but that is
534      * not nice either.
535      */
536     UErrorCode constructorErrorCode;
537 
538     /**
539      * The MessagePattern which contains the parsed structure of the pattern string.
540      *
541      * Starting with ICU 4.8, the MessagePattern contains a sequence of
542      * numeric/selector/message parts corresponding to the parsed pattern.
543      * For details see the MessagePattern class API docs.
544      */
545     MessagePattern msgPattern;
546 
547     /**
548      * Docs & fields from before ICU 4.8, before MessagePattern was used.
549      * Commented out, and left only for explanation of semantics.
550      * --------
551      * Each ChoiceFormat divides the range -Inf..+Inf into fCount
552      * intervals.  The intervals are:
553      *
554      *         0: fChoiceLimits[0]..fChoiceLimits[1]
555      *         1: fChoiceLimits[1]..fChoiceLimits[2]
556      *        ...
557      *  fCount-2: fChoiceLimits[fCount-2]..fChoiceLimits[fCount-1]
558      *  fCount-1: fChoiceLimits[fCount-1]..+Inf
559      *
560      * Interval 0 is special; during formatting (mapping numbers to
561      * strings), it also contains all numbers less than
562      * fChoiceLimits[0], as well as NaN values.
563      *
564      * Interval i maps to and from string fChoiceFormats[i].  When
565      * parsing (mapping strings to numbers), then intervals map to
566      * their lower limit, that is, interval i maps to fChoiceLimits[i].
567      *
568      * The intervals may be closed, half open, or open.  This affects
569      * formatting but does not affect parsing.  Interval i is affected
570      * by fClosures[i] and fClosures[i+1].  If fClosures[i]
571      * is false, then the value fChoiceLimits[i] is in interval i.
572      * That is, intervals i-1 and i are:
573      *
574      *  i-1:                 ... x < fChoiceLimits[i]
575      *    i: fChoiceLimits[i] <= x ...
576      *
577      * If fClosures[i] is true, then the value fChoiceLimits[i] is
578      * in interval i-1.  That is, intervals i-1 and i are:
579      *
580      *  i-1:                ... x <= fChoiceLimits[i]
581      *    i: fChoiceLimits[i] < x ...
582      *
583      * Because of the nature of interval 0, fClosures[0] has no
584      * effect.
585      */
586     // double*         fChoiceLimits;
587     // UBool*          fClosures;
588     // UnicodeString*  fChoiceFormats;
589     // int32_t         fCount;
590 };
591 
592 
593 U_NAMESPACE_END
594 
595 #endif  // U_HIDE_DEPRECATED_API
596 #endif /* #if !UCONFIG_NO_FORMATTING */
597 
598 #endif /* U_SHOW_CPLUSPLUS_API */
599 
600 #endif // CHOICFMT_H
601 //eof
602