choicfmt.h revision c73f511526464f8e56c242df80552e9b0d94ae3d
1/*
2********************************************************************************
3*   Copyright (C) 1997-2013, International Business Machines
4*   Corporation and others.  All Rights Reserved.
5********************************************************************************
6*
7* File CHOICFMT.H
8*
9* Modification History:
10*
11*   Date        Name        Description
12*   02/19/97    aliu        Converted from java.
13*   03/20/97    helena      Finished first cut of implementation and got rid
14*                           of nextDouble/previousDouble and replaced with
15*                           boolean array.
16*   4/10/97     aliu        Clean up.  Modified to work on AIX.
17*   8/6/97      nos         Removed overloaded constructor, member var 'buffer'.
18*   07/22/98    stephen     Removed operator!= (implemented in Format)
19********************************************************************************
20*/
21
22#ifndef CHOICFMT_H
23#define CHOICFMT_H
24
25#include "unicode/utypes.h"
26
27/**
28 * \file
29 * \brief C++ API: Choice Format.
30 */
31
32#if !UCONFIG_NO_FORMATTING
33#ifndef U_HIDE_DEPRECATED_API
34
35#include "unicode/fieldpos.h"
36#include "unicode/format.h"
37#include "unicode/messagepattern.h"
38#include "unicode/numfmt.h"
39#include "unicode/unistr.h"
40
41U_NAMESPACE_BEGIN
42
43class MessageFormat;
44
45/**
46 * ChoiceFormat converts between ranges of numeric values and strings for those ranges.
47 * The strings must conform to the MessageFormat pattern syntax.
48 *
49 * <p><em><code>ChoiceFormat</code> is probably not what you need.
50 * Please use <code>MessageFormat</code>
51 * with <code>plural</code> arguments for proper plural selection,
52 * and <code>select</code> arguments for simple selection among a fixed set of choices!</em></p>
53 *
54 * <p>A <code>ChoiceFormat</code> splits
55 * the real number line \htmlonly<code>-&#x221E;</code> to
56 * <code>+&#x221E;</code>\endhtmlonly into two
57 * or more contiguous ranges. Each range is mapped to a
58 * string.</p>
59 *
60 * <p><code>ChoiceFormat</code> was originally intended
61 * for displaying grammatically correct
62 * plurals such as &quot;There is one file.&quot; vs. &quot;There are 2 files.&quot;
63 * <em>However,</em> plural rules for many languages
64 * are too complex for the capabilities of ChoiceFormat,
65 * and its requirement of specifying the precise rules for each message
66 * is unmanageable for translators.</p>
67 *
68 * <p>There are two methods of defining a <code>ChoiceFormat</code>; both
69 * are equivalent.  The first is by using a string pattern. This is the
70 * preferred method in most cases.  The second method is through direct
71 * specification of the arrays that logically make up the
72 * <code>ChoiceFormat</code>.</p>
73 *
74 * <p>Note: Typically, choice formatting is done (if done at all) via <code>MessageFormat</code>
75 * with a <code>choice</code> argument type,
76 * rather than using a stand-alone <code>ChoiceFormat</code>.</p>
77 *
78 * <h5>Patterns and Their Interpretation</h5>
79 *
80 * <p>The pattern string defines the range boundaries and the strings for each number range.
81 * Syntax:
82 * <pre>
83 * choiceStyle = number separator message ('|' number separator message)*
84 * number = normal_number | ['-'] \htmlonly&#x221E;\endhtmlonly (U+221E, infinity)
85 * normal_number = double value (unlocalized ASCII string)
86 * separator = less_than | less_than_or_equal
87 * less_than = '<'
88 * less_than_or_equal = '#' | \htmlonly&#x2264;\endhtmlonly (U+2264)
89 * message: see {@link MessageFormat}
90 * </pre>
91 * Pattern_White_Space between syntax elements is ignored, except
92 * around each range's sub-message.</p>
93 *
94 * <p>Each numeric sub-range extends from the current range's number
95 * to the next range's number.
96 * The number itself is included in its range if a <code>less_than_or_equal</code> sign is used,
97 * and excluded from its range (and instead included in the previous range)
98 * if a <code>less_than</code> sign is used.</p>
99 *
100 * <p>When a <code>ChoiceFormat</code> is constructed from
101 * arrays of numbers, closure flags and strings,
102 * they are interpreted just like
103 * the sequence of <code>(number separator string)</code> in an equivalent pattern string.
104 * <code>closures[i]==TRUE</code> corresponds to a <code>less_than</code> separator sign.
105 * The equivalent pattern string will be constructed automatically.</p>
106 *
107 * <p>During formatting, a number is mapped to the first range
108 * where the number is not greater than the range's upper limit.
109 * That range's message string is returned. A NaN maps to the very first range.</p>
110 *
111 * <p>During parsing, a range is selected for the longest match of
112 * any range's message. That range's number is returned, ignoring the separator/closure.
113 * Only a simple string match is performed, without parsing of arguments that
114 * might be specified in the message strings.</p>
115 *
116 * <p>Note that the first range's number is ignored in formatting
117 * but may be returned from parsing.</p>
118 *
119 * <h5>Examples</h5>
120 *
121 * <p>Here is an example of two arrays that map the number
122 * <code>1..7</code> to the English day of the week abbreviations
123 * <code>Sun..Sat</code>. No closures array is given; this is the same as
124 * specifying all closures to be <code>FALSE</code>.</p>
125 *
126 * <pre>    {1,2,3,4,5,6,7},
127 *     {&quot;Sun&quot;,&quot;Mon&quot;,&quot;Tue&quot;,&quot;Wed&quot;,&quot;Thur&quot;,&quot;Fri&quot;,&quot;Sat&quot;}</pre>
128 *
129 * <p>Here is an example that maps the ranges [-Inf, 1), [1, 1], and (1,
130 * +Inf] to three strings. That is, the number line is split into three
131 * ranges: x &lt; 1.0, x = 1.0, and x &gt; 1.0.
132 * (The round parentheses in the notation above indicate an exclusive boundary,
133 * like the turned bracket in European notation: [-Inf, 1) == [-Inf, 1[  )</p>
134 *
135 * <pre>    {0, 1, 1},
136 *     {FALSE, FALSE, TRUE},
137 *     {&quot;no files&quot;, &quot;one file&quot;, &quot;many files&quot;}</pre>
138 *
139 * <p>Here is an example that shows formatting and parsing: </p>
140 *
141 * \code
142 *   #include <unicode/choicfmt.h>
143 *   #include <unicode/unistr.h>
144 *   #include <iostream.h>
145 *
146 *   int main(int argc, char *argv[]) {
147 *       double limits[] = {1,2,3,4,5,6,7};
148 *       UnicodeString dayNames[] = {
149 *           "Sun","Mon","Tue","Wed","Thu","Fri","Sat"};
150 *       ChoiceFormat fmt(limits, dayNames, 7);
151 *       UnicodeString str;
152 *       char buf[256];
153 *       for (double x = 1.0; x <= 8.0; x += 1.0) {
154 *           fmt.format(x, str);
155 *           str.extract(0, str.length(), buf, 256, "");
156 *           str.truncate(0);
157 *           cout << x << " -> "
158 *                << buf << endl;
159 *       }
160 *       cout << endl;
161 *       return 0;
162 *   }
163 * \endcode
164 *
165 * <p><em>User subclasses are not supported.</em> While clients may write
166 * subclasses, such code will not necessarily work and will not be
167 * guaranteed to work stably from release to release.</p>
168 *
169 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
170 */
171class U_I18N_API ChoiceFormat: public NumberFormat {
172public:
173    /**
174     * Constructs a new ChoiceFormat from the pattern string.
175     *
176     * @param pattern   Pattern used to construct object.
177     * @param status    Output param to receive success code.  If the
178     *                  pattern cannot be parsed, set to failure code.
179     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
180     */
181    ChoiceFormat(const UnicodeString& pattern,
182                 UErrorCode& status);
183
184
185    /**
186     * Constructs a new ChoiceFormat with the given limits and message strings.
187     * All closure flags default to <code>FALSE</code>,
188     * equivalent to <code>less_than_or_equal</code> separators.
189     *
190     * Copies the limits and formats instead of adopting them.
191     *
192     * @param limits    Array of limit values.
193     * @param formats   Array of formats.
194     * @param count     Size of 'limits' and 'formats' arrays.
195     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
196     */
197    ChoiceFormat(const double* limits,
198                 const UnicodeString* formats,
199                 int32_t count );
200
201    /**
202     * Constructs a new ChoiceFormat with the given limits, closure flags and message strings.
203     *
204     * Copies the limits and formats instead of adopting them.
205     *
206     * @param limits Array of limit values
207     * @param closures Array of booleans specifying whether each
208     * element of 'limits' is open or closed.  If FALSE, then the
209     * corresponding limit number is a member of its range.
210     * If TRUE, then the limit number belongs to the previous range.
211     * @param formats Array of formats
212     * @param count Size of 'limits', 'closures', and 'formats' arrays
213     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
214     */
215    ChoiceFormat(const double* limits,
216                 const UBool* closures,
217                 const UnicodeString* formats,
218                 int32_t count);
219
220    /**
221     * Copy constructor.
222     *
223     * @param that   ChoiceFormat object to be copied from
224     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
225     */
226    ChoiceFormat(const ChoiceFormat& that);
227
228    /**
229     * Assignment operator.
230     *
231     * @param that   ChoiceFormat object to be copied
232     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
233     */
234    const ChoiceFormat& operator=(const ChoiceFormat& that);
235
236    /**
237     * Destructor.
238     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
239     */
240    virtual ~ChoiceFormat();
241
242    /**
243     * Clones this Format object. The caller owns the
244     * result and must delete it when done.
245     *
246     * @return a copy of this object
247     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
248     */
249    virtual Format* clone(void) const;
250
251    /**
252     * Returns true if the given Format objects are semantically equal.
253     * Objects of different subclasses are considered unequal.
254     *
255     * @param other    ChoiceFormat object to be compared
256     * @return         true if other is the same as this.
257     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
258     */
259    virtual UBool operator==(const Format& other) const;
260
261    /**
262     * Sets the pattern.
263     * @param pattern   The pattern to be applied.
264     * @param status    Output param set to success/failure code on
265     *                  exit. If the pattern is invalid, this will be
266     *                  set to a failure result.
267     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
268     */
269    virtual void applyPattern(const UnicodeString& pattern,
270                              UErrorCode& status);
271
272    /**
273     * Sets the pattern.
274     * @param pattern    The pattern to be applied.
275     * @param parseError Struct to receive information on position
276     *                   of error if an error is encountered
277     * @param status     Output param set to success/failure code on
278     *                   exit. If the pattern is invalid, this will be
279     *                   set to a failure result.
280     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
281     */
282    virtual void applyPattern(const UnicodeString& pattern,
283                             UParseError& parseError,
284                             UErrorCode& status);
285    /**
286     * Gets the pattern.
287     *
288     * @param pattern    Output param which will receive the pattern
289     *                   Previous contents are deleted.
290     * @return    A reference to 'pattern'
291     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
292     */
293    virtual UnicodeString& toPattern(UnicodeString &pattern) const;
294
295    /**
296     * Sets the choices to be used in formatting.
297     * For details see the constructor with the same parameter list.
298     *
299     * @param limitsToCopy      Contains the top value that you want
300     *                          parsed with that format, and should be in
301     *                          ascending sorted order. When formatting X,
302     *                          the choice will be the i, where limit[i]
303     *                          &lt;= X &lt; limit[i+1].
304     * @param formatsToCopy     The format strings you want to use for each limit.
305     * @param count             The size of the above arrays.
306     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
307     */
308    virtual void setChoices(const double* limitsToCopy,
309                            const UnicodeString* formatsToCopy,
310                            int32_t count );
311
312    /**
313     * Sets the choices to be used in formatting.
314     * For details see the constructor with the same parameter list.
315     *
316     * @param limits Array of limits
317     * @param closures Array of limit booleans
318     * @param formats Array of format strings
319     * @param count The size of the above arrays
320     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
321     */
322    virtual void setChoices(const double* limits,
323                            const UBool* closures,
324                            const UnicodeString* formats,
325                            int32_t count);
326
327    /**
328     * Returns NULL and 0.
329     * Before ICU 4.8, this used to return the choice limits array.
330     *
331     * @param count Will be set to 0.
332     * @return NULL
333     * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
334     */
335    virtual const double* getLimits(int32_t& count) const;
336
337    /**
338     * Returns NULL and 0.
339     * Before ICU 4.8, this used to return the limit booleans array.
340     *
341     * @param count Will be set to 0.
342     * @return NULL
343     * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
344     */
345    virtual const UBool* getClosures(int32_t& count) const;
346
347    /**
348     * Returns NULL and 0.
349     * Before ICU 4.8, this used to return the array of choice strings.
350     *
351     * @param count Will be set to 0.
352     * @return NULL
353     * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
354     */
355    virtual const UnicodeString* getFormats(int32_t& count) const;
356
357
    // Re-expose the format() overloads inherited from NumberFormat; the
    // format() declarations below would otherwise hide them in this class.
358    using NumberFormat::format;
359
360    /**
361     * Formats a double number using this object's choices.
362     *
363     * @param number    The value to be formatted.
364     * @param appendTo  Output parameter to receive result.
365     *                  Result is appended to existing contents.
366     * @param pos       On input: an alignment field, if desired.
367     *                  On output: the offsets of the alignment field.
368     * @return          Reference to 'appendTo' parameter.
369     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
370     */
371    virtual UnicodeString& format(double number,
372                                  UnicodeString& appendTo,
373                                  FieldPosition& pos) const;
374    /**
375     * Formats an int32_t number using this object's choices.
376     *
377     * @param number    The value to be formatted.
378     * @param appendTo  Output parameter to receive result.
379     *                  Result is appended to existing contents.
380     * @param pos       On input: an alignment field, if desired.
381     *                  On output: the offsets of the alignment field.
382     * @return          Reference to 'appendTo' parameter.
383     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
384     */
385    virtual UnicodeString& format(int32_t number,
386                                  UnicodeString& appendTo,
387                                  FieldPosition& pos) const;
388
389    /**
390     * Formats an int64_t number using this object's choices.
391     *
392     * @param number    The value to be formatted.
393     * @param appendTo  Output parameter to receive result.
394     *                  Result is appended to existing contents.
395     * @param pos       On input: an alignment field, if desired.
396     *                  On output: the offsets of the alignment field.
397     * @return          Reference to 'appendTo' parameter.
398     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
399     */
400    virtual UnicodeString& format(int64_t number,
401                                  UnicodeString& appendTo,
402                                  FieldPosition& pos) const;
403
404    /**
405     * Formats an array of objects using this object's choices.
406     *
407     * @param objs      The array of objects to be formatted.
408     * @param cnt       The size of objs.
409     * @param appendTo  Output parameter to receive result.
410     *                  Result is appended to existing contents.
411     * @param pos       On input: an alignment field, if desired.
412     *                  On output: the offsets of the alignment field.
413     * @param success   Output param set to success/failure code on
414     *                  exit.
415     * @return          Reference to 'appendTo' parameter.
416     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
417     */
418    virtual UnicodeString& format(const Formattable* objs,
419                                  int32_t cnt,
420                                  UnicodeString& appendTo,
421                                  FieldPosition& pos,
422                                  UErrorCode& success) const;
423
   // Re-expose the parse() overloads inherited from NumberFormat; the
   // parse() declaration below would otherwise hide them in this class.
424   using NumberFormat::parse;
425
426   /**
427    * Looks for the longest match of any message string on the input text and,
428    * if there is a match, sets the result object to the corresponding range's number.
429    *
430    * If no string matches, then the parsePosition is unchanged.
431    *
432    * @param text           The text to be parsed.
433    * @param result         Formattable to be set to the parse result.
434    *                       If parse fails, return contents are undefined.
435    * @param parsePosition  The position to start parsing at on input.
436    *                       On output, moved to after the last successfully
437    *                       parsed character. On parse failure, does not change.
438    * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
439    */
440    virtual void parse(const UnicodeString& text,
441                       Formattable& result,
442                       ParsePosition& parsePosition) const;
443
444    /**
445     * Returns a unique class ID POLYMORPHICALLY. Part of ICU's "poor man's RTTI".
446     *
447     * @return          The class ID for this object. All objects of a
448     *                  given class have the same class ID.  Objects of
449     *                  other classes have different class IDs.
450     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
451     */
452    virtual UClassID getDynamicClassID(void) const;
453
454    /**
455     * Returns the class ID for this class.  This is useful only for
456     * comparing to a return value from getDynamicClassID().  For example:
457     * <pre>
458     * .       Base* polymorphic_pointer = createPolymorphicObject();
459     * .       if (polymorphic_pointer->getDynamicClassID() ==
460     * .           Derived::getStaticClassID()) ...
461     * </pre>
462     * @return          The class ID for all objects of this class.
463     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
464     */
465    static UClassID U_EXPORT2 getStaticClassID(void);
466
467private:
468    /**
469     * Converts a double value to a string.
470     * @param value the double number to be converted.
471     * @param string the result string.
472     * @return the converted string.
473     */
474    static UnicodeString& dtos(double value, UnicodeString& string);
475
476    ChoiceFormat(); // default constructor not implemented
477
478    /**
479     * Construct a new ChoiceFormat with the limits and the corresponding formats
480     * based on the pattern.
481     *
482     * @param newPattern   Pattern used to construct object.
483     * @param parseError   Struct to receive information on position
484     *                     of error if an error is encountered.
485     * @param status       Output param to receive success code.  If the
486     *                     pattern cannot be parsed, set to failure code.
487     */
488    ChoiceFormat(const UnicodeString& newPattern,
489                 UParseError& parseError,
490                 UErrorCode& status);
491
    // Grants MessageFormat access to the private members declared in this class
    // (including the private constructor above and the static helpers below).
492    friend class MessageFormat;
493
    /**
     * Private overload of setChoices() that additionally takes a UErrorCode.
     * NOTE(review): presumably the shared implementation behind the public
     * setChoices() overloads and the array-based constructors, which have no
     * UErrorCode parameter of their own -- confirm against the implementation.
     *
     * @param limits    Array of limit values.
     * @param closures  Array of closure flags.
     * @param formats   Array of message strings.
     * @param count     Size of the above arrays.
     * @param errorCode Error code parameter; presumably set to a failure code
     *                  if the choices cannot be applied -- TODO confirm.
     */
494    virtual void setChoices(const double* limits,
495                            const UBool* closures,
496                            const UnicodeString* formats,
497                            int32_t count,
498                            UErrorCode &errorCode);
499
500    /**
501     * Finds the ChoiceFormat sub-message for the given number.
502     * @param pattern A MessagePattern.
503     * @param partIndex the index of the first ChoiceFormat argument style part.
504     * @param number a number to be mapped to one of the ChoiceFormat argument's intervals
505     * @return the sub-message start part index.
506     */
507    static int32_t findSubMessage(const MessagePattern &pattern, int32_t partIndex, double number);
508
    /**
     * NOTE(review): undocumented in the original header. Judging by the
     * signature, this presumably matches the text of 'source' at 'pos' against
     * the messages of the ChoiceFormat argument that starts at 'partIndex' in
     * 'pattern' and returns the number of the matching range -- confirm
     * against the implementation before relying on this description.
     */
509    static double parseArgument(
510            const MessagePattern &pattern, int32_t partIndex,
511            const UnicodeString &source, ParsePosition &pos);
512
513    /**
514     * Matches the pattern string from the end of the partIndex to
515     * the beginning of the limitPartIndex,
516     * including all syntax except SKIP_SYNTAX,
517     * against the source string starting at sourceOffset.
518     * If they match, returns the length of the source string match.
519     * Otherwise returns -1.
520     */
521    static int32_t matchStringUntilLimitPart(
522            const MessagePattern &pattern, int32_t partIndex, int32_t limitPartIndex,
523            const UnicodeString &source, int32_t sourceOffset);
524
525    /**
526     * Some of the ChoiceFormat constructors do not have a UErrorCode parameter.
527     * We need _some_ way to provide one for the MessagePattern constructor.
528     * Alternatively, the MessagePattern could be a pointer field, but that is
529     * not nice either.
530     */
531    UErrorCode constructorErrorCode;
532
533    /**
534     * The MessagePattern which contains the parsed structure of the pattern string.
535     *
536     * Starting with ICU 4.8, the MessagePattern contains a sequence of
537     * numeric/selector/message parts corresponding to the parsed pattern.
538     * For details see the MessagePattern class API docs.
539     */
540    MessagePattern msgPattern;
541
542    /**
543     * Docs & fields from before ICU 4.8, before MessagePattern was used.
544     * Commented out, and left only for explanation of semantics.
545     * --------
546     * Each ChoiceFormat divides the range -Inf..+Inf into fCount
547     * intervals.  The intervals are:
548     *
549     *         0: fChoiceLimits[0]..fChoiceLimits[1]
550     *         1: fChoiceLimits[1]..fChoiceLimits[2]
551     *        ...
552     *  fCount-2: fChoiceLimits[fCount-2]..fChoiceLimits[fCount-1]
553     *  fCount-1: fChoiceLimits[fCount-1]..+Inf
554     *
555     * Interval 0 is special; during formatting (mapping numbers to
556     * strings), it also contains all numbers less than
557     * fChoiceLimits[0], as well as NaN values.
558     *
559     * Interval i maps to and from string fChoiceFormats[i].  When
560     * parsing (mapping strings to numbers), then intervals map to
561     * their lower limit, that is, interval i maps to fChoiceLimits[i].
562     *
563     * The intervals may be closed, half open, or open.  This affects
564     * formatting but does not affect parsing.  Interval i is affected
565     * by fClosures[i] and fClosures[i+1].  If fClosures[i]
566     * is FALSE, then the value fChoiceLimits[i] is in interval i.
567     * That is, intervals i-1 and i are:
568     *
569     *  i-1:                 ... x < fChoiceLimits[i]
570     *    i: fChoiceLimits[i] <= x ...
571     *
572     * If fClosures[i] is TRUE, then the value fChoiceLimits[i] is
573     * in interval i-1.  That is, intervals i-1 and i are:
574     *
575     *  i-1:                ... x <= fChoiceLimits[i]
576     *    i: fChoiceLimits[i] < x ...
577     *
578     * Because of the nature of interval 0, fClosures[0] has no
579     * effect.
580     */
581    // double*         fChoiceLimits;
582    // UBool*          fClosures;
583    // UnicodeString*  fChoiceFormats;
584    // int32_t         fCount;
585};
586
587
588U_NAMESPACE_END
589
590#endif  // U_HIDE_DEPRECATED_API
591#endif /* #if !UCONFIG_NO_FORMATTING */
592
593#endif // CHOICFMT_H
594//eof
595