1// Copyright (C) 2016 and later: Unicode, Inc. and others.
2// License & terms of use: http://www.unicode.org/copyright.html
3/*
4********************************************************************************
5*   Copyright (C) 1997-2013, International Business Machines
6*   Corporation and others.  All Rights Reserved.
7********************************************************************************
8*
9* File CHOICFMT.H
10*
11* Modification History:
12*
13*   Date        Name        Description
14*   02/19/97    aliu        Converted from java.
15*   03/20/97    helena      Finished first cut of implementation and got rid
16*                           of nextDouble/previousDouble and replaced with
17*                           boolean array.
18*   4/10/97     aliu        Clean up.  Modified to work on AIX.
19*   8/6/97      nos         Removed overloaded constructor, member var 'buffer'.
20*   07/22/98    stephen     Removed operator!= (implemented in Format)
21********************************************************************************
22*/
23
24#ifndef CHOICFMT_H
25#define CHOICFMT_H
26
27#include "unicode/utypes.h"
28
29/**
30 * \file
31 * \brief C++ API: Choice Format.
32 */
33
34#if !UCONFIG_NO_FORMATTING
35#ifndef U_HIDE_DEPRECATED_API
36
37#include "unicode/fieldpos.h"
38#include "unicode/format.h"
39#include "unicode/messagepattern.h"
40#include "unicode/numfmt.h"
41#include "unicode/unistr.h"
42
43U_NAMESPACE_BEGIN
44
45class MessageFormat;
46
47/**
48 * ChoiceFormat converts between ranges of numeric values and strings for those ranges.
49 * The strings must conform to the MessageFormat pattern syntax.
50 *
51 * <p><em><code>ChoiceFormat</code> is probably not what you need.
52 * Please use <code>MessageFormat</code>
53 * with <code>plural</code> arguments for proper plural selection,
54 * and <code>select</code> arguments for simple selection among a fixed set of choices!</em></p>
55 *
56 * <p>A <code>ChoiceFormat</code> splits
57 * the real number line \htmlonly<code>-&#x221E;</code> to
58 * <code>+&#x221E;</code>\endhtmlonly into two
59 * or more contiguous ranges. Each range is mapped to a
60 * string.</p>
61 *
62 * <p><code>ChoiceFormat</code> was originally intended
63 * for displaying grammatically correct
64 * plurals such as &quot;There is one file.&quot; vs. &quot;There are 2 files.&quot;
65 * <em>However,</em> plural rules for many languages
66 * are too complex for the capabilities of ChoiceFormat,
67 * and its requirement of specifying the precise rules for each message
68 * is unmanageable for translators.</p>
69 *
70 * <p>There are two methods of defining a <code>ChoiceFormat</code>; both
71 * are equivalent.  The first is by using a string pattern. This is the
72 * preferred method in most cases.  The second method is through direct
73 * specification of the arrays that logically make up the
74 * <code>ChoiceFormat</code>.</p>
75 *
76 * <p>Note: Typically, choice formatting is done (if done at all) via <code>MessageFormat</code>
77 * with a <code>choice</code> argument type,
78 * rather than using a stand-alone <code>ChoiceFormat</code>.</p>
79 *
80 * <h5>Patterns and Their Interpretation</h5>
81 *
82 * <p>The pattern string defines the range boundaries and the strings for each number range.
83 * Syntax:
84 * <pre>
85 * choiceStyle = number separator message ('|' number separator message)*
86 * number = normal_number | ['-'] \htmlonly&#x221E;\endhtmlonly (U+221E, infinity)
87 * normal_number = double value (unlocalized ASCII string)
88 * separator = less_than | less_than_or_equal
89 * less_than = '<'
90 * less_than_or_equal = '#' | \htmlonly&#x2264;\endhtmlonly (U+2264)
91 * message: see {@link MessageFormat}
92 * </pre>
93 * Pattern_White_Space between syntax elements is ignored, except
94 * around each range's sub-message.</p>
95 *
96 * <p>Each numeric sub-range extends from the current range's number
97 * to the next range's number.
98 * The number itself is included in its range if a <code>less_than_or_equal</code> sign is used,
99 * and excluded from its range (and instead included in the previous range)
100 * if a <code>less_than</code> sign is used.</p>
101 *
102 * <p>When a <code>ChoiceFormat</code> is constructed from
103 * arrays of numbers, closure flags and strings,
104 * they are interpreted just like
105 * the sequence of <code>(number separator string)</code> in an equivalent pattern string.
106 * <code>closure[i]==TRUE</code> corresponds to a <code>less_than</code> separator sign.
107 * The equivalent pattern string will be constructed automatically.</p>
108 *
109 * <p>During formatting, a number is mapped to the first range
110 * where the number is not greater than the range's upper limit.
111 * That range's message string is returned. A NaN maps to the very first range.</p>
112 *
113 * <p>During parsing, a range is selected for the longest match of
114 * any range's message. That range's number is returned, ignoring the separator/closure.
115 * Only a simple string match is performed, without parsing of arguments that
116 * might be specified in the message strings.</p>
117 *
118 * <p>Note that the first range's number is ignored in formatting
119 * but may be returned from parsing.</p>
120 *
121 * <h5>Examples</h5>
122 *
123 * <p>Here is an example of two arrays that map the numbers
124 * <code>1..7</code> to the English day of the week abbreviations
125 * <code>Sun..Sat</code>. No closures array is given; this is the same as
126 * specifying all closures to be <code>FALSE</code>.</p>
127 *
128 * <pre>    {1,2,3,4,5,6,7},
129 *     {&quot;Sun&quot;,&quot;Mon&quot;,&quot;Tue&quot;,&quot;Wed&quot;,&quot;Thu&quot;,&quot;Fri&quot;,&quot;Sat&quot;}</pre>
130 *
131 * <p>Here is an example that maps the ranges [-Inf, 1), [1, 1], and (1,
132 * +Inf] to three strings. That is, the number line is split into three
133 * ranges: x &lt; 1.0, x = 1.0, and x &gt; 1.0.
134 * (The round parentheses in the notation above indicate an exclusive boundary,
135 * like the turned bracket in European notation: [-Inf, 1) == [-Inf, 1[  )</p>
136 *
137 * <pre>    {0, 1, 1},
138 *     {FALSE, FALSE, TRUE},
139 *     {&quot;no files&quot;, &quot;one file&quot;, &quot;many files&quot;}</pre>
140 *
141 * <p>Here is an example that shows formatting and parsing: </p>
142 *
143 * \code
144 *   #include <unicode/choicfmt.h>
145 *   #include <unicode/unistr.h>
146 *   #include <iostream>
147 *
148 *   int main(int argc, char *argv[]) {
149 *       double limits[] = {1,2,3,4,5,6,7};
150 *       UnicodeString dayNames[] = {
151 *           "Sun","Mon","Tue","Wed","Thu","Fri","Sat"};
152 *       ChoiceFormat fmt(limits, dayNames, 7);
153 *       UnicodeString str;
154 *       char buf[256];
155 *       for (double x = 1.0; x <= 8.0; x += 1.0) {
156 *           fmt.format(x, str);
157 *           str.extract(0, str.length(), buf, 256, "");
158 *           str.truncate(0);
159 *           std::cout << x << " -> "
160 *                << buf << std::endl;
161 *       }
162 *       std::cout << std::endl;
163 *       return 0;
164 *   }
165 * \endcode
166 *
167 * <p><em>User subclasses are not supported.</em> While clients may write
168 * subclasses, such code will not necessarily work and will not be
169 * guaranteed to work stably from release to release.</p>
170 *
171 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
172 */
173class U_I18N_API ChoiceFormat: public NumberFormat {
174public:
175    /**
176     * Constructs a new ChoiceFormat from the pattern string.
177     *
178     * @param pattern   Pattern used to construct object.
179     * @param status    Output param to receive success code.  If the
180     *                  pattern cannot be parsed, set to failure code.
181     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
182     */
183    ChoiceFormat(const UnicodeString& pattern,
184                 UErrorCode& status);
185
186
187    /**
188     * Constructs a new ChoiceFormat with the given limits and message strings.
189     * All closure flags default to <code>FALSE</code>,
190     * equivalent to <code>less_than_or_equal</code> separators.
191     *
192     * Copies the limits and formats instead of adopting them.
193     *
194     * @param limits    Array of limit values.
195     * @param formats   Array of formats.
196     * @param count     Size of 'limits' and 'formats' arrays.
197     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
198     */
199    ChoiceFormat(const double* limits,
200                 const UnicodeString* formats,
201                 int32_t count );
202
203    /**
204     * Constructs a new ChoiceFormat with the given limits, closure flags and message strings.
205     *
206     * Copies the limits and formats instead of adopting them.
207     *
208     * @param limits Array of limit values
209     * @param closures Array of booleans specifying whether each
210     * element of 'limits' is open or closed.  If FALSE, then the
211     * corresponding limit number is a member of its range.
212     * If TRUE, then the limit number belongs to the previous range.
213     * @param formats Array of formats
214     * @param count Size of 'limits', 'closures', and 'formats' arrays
215     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
216     */
217    ChoiceFormat(const double* limits,
218                 const UBool* closures,
219                 const UnicodeString* formats,
220                 int32_t count);
221
222    /**
223     * Copy constructor.
224     *
225     * @param that   ChoiceFormat object to be copied from
226     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
227     */
228    ChoiceFormat(const ChoiceFormat& that);
229
230    /**
231     * Assignment operator.
232     *
233     * @param that   ChoiceFormat object to be copied
234     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
235     */
236    const ChoiceFormat& operator=(const ChoiceFormat& that);
237
238    /**
239     * Destructor.
240     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
241     */
242    virtual ~ChoiceFormat();
243
244    /**
245     * Clones this Format object. The caller owns the
246     * result and must delete it when done.
247     *
248     * @return a copy of this object
249     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
250     */
251    virtual Format* clone(void) const;
252
253    /**
254     * Returns true if the given Format objects are semantically equal.
255     * Objects of different subclasses are considered unequal.
256     *
257     * @param other    ChoiceFormat object to be compared
258     * @return         true if other is the same as this.
259     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
260     */
261    virtual UBool operator==(const Format& other) const;
262
263    /**
264     * Sets the pattern.
265     * @param pattern   The pattern to be applied.
266     * @param status    Output param set to success/failure code on
267     *                  exit. If the pattern is invalid, this will be
268     *                  set to a failure result.
269     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
270     */
271    virtual void applyPattern(const UnicodeString& pattern,
272                              UErrorCode& status);
273
274    /**
275     * Sets the pattern.
276     * @param pattern    The pattern to be applied.
277     * @param parseError Struct to receive information on position
278     *                   of error if an error is encountered
279     * @param status     Output param set to success/failure code on
280     *                   exit. If the pattern is invalid, this will be
281     *                   set to a failure result.
282     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
283     */
284    virtual void applyPattern(const UnicodeString& pattern,
285                             UParseError& parseError,
286                             UErrorCode& status);
287    /**
288     * Gets the pattern.
289     *
290     * @param pattern    Output param which will receive the pattern.
291     *                   Previous contents are deleted.
292     * @return    A reference to 'pattern'
293     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
294     */
295    virtual UnicodeString& toPattern(UnicodeString &pattern) const;
296
297    /**
298     * Sets the choices to be used in formatting.
299     * For details see the constructor with the same parameter list.
300     *
301     * @param limitsToCopy      Contains the top value that you want
302     *                          parsed with that format, and should be in
303     *                          ascending sorted order. When formatting X,
304     *                          the choice will be the i, where limit[i]
305     *                          &lt;= X &lt; limit[i+1].
306     * @param formatsToCopy     The format strings you want to use for each limit.
307     * @param count             The size of the above arrays.
308     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
309     */
310    virtual void setChoices(const double* limitsToCopy,
311                            const UnicodeString* formatsToCopy,
312                            int32_t count );
313
314    /**
315     * Sets the choices to be used in formatting.
316     * For details see the constructor with the same parameter list.
317     *
318     * @param limits Array of limits
319     * @param closures Array of limit booleans
320     * @param formats Array of format strings
321     * @param count The size of the above arrays
322     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
323     */
324    virtual void setChoices(const double* limits,
325                            const UBool* closures,
326                            const UnicodeString* formats,
327                            int32_t count);
328
329    /**
330     * Returns NULL and 0.
331     * Before ICU 4.8, this used to return the choice limits array.
332     *
333     * @param count Will be set to 0.
334     * @return NULL
335     * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
336     */
337    virtual const double* getLimits(int32_t& count) const;
338
339    /**
340     * Returns NULL and 0.
341     * Before ICU 4.8, this used to return the limit booleans array.
342     *
343     * @param count Will be set to 0.
344     * @return NULL
345     * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
346     */
347    virtual const UBool* getClosures(int32_t& count) const;
348
349    /**
350     * Returns NULL and 0.
351     * Before ICU 4.8, this used to return the array of choice strings.
352     *
353     * @param count Will be set to 0.
354     * @return NULL
355     * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
356     */
357    virtual const UnicodeString* getFormats(int32_t& count) const;
358
359
    // Keep the inherited NumberFormat::format() overloads visible: the format()
    // declarations below would otherwise hide every base-class overload of that name.
360    using NumberFormat::format;
361
362    /**
363     * Formats a double number using this object's choices.
364     *
365     * @param number    The value to be formatted.
366     * @param appendTo  Output parameter to receive result.
367     *                  Result is appended to existing contents.
368     * @param pos       On input: an alignment field, if desired.
369     *                  On output: the offsets of the alignment field.
370     * @return          Reference to 'appendTo' parameter.
371     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
372     */
373    virtual UnicodeString& format(double number,
374                                  UnicodeString& appendTo,
375                                  FieldPosition& pos) const;
376    /**
377     * Formats an int32_t number using this object's choices.
378     *
379     * @param number    The value to be formatted.
380     * @param appendTo  Output parameter to receive result.
381     *                  Result is appended to existing contents.
382     * @param pos       On input: an alignment field, if desired.
383     *                  On output: the offsets of the alignment field.
384     * @return          Reference to 'appendTo' parameter.
385     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
386     */
387    virtual UnicodeString& format(int32_t number,
388                                  UnicodeString& appendTo,
389                                  FieldPosition& pos) const;
390
391    /**
392     * Formats an int64_t number using this object's choices.
393     *
394     * @param number    The value to be formatted.
395     * @param appendTo  Output parameter to receive result.
396     *                  Result is appended to existing contents.
397     * @param pos       On input: an alignment field, if desired.
398     *                  On output: the offsets of the alignment field.
399     * @return          Reference to 'appendTo' parameter.
400     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
401     */
402    virtual UnicodeString& format(int64_t number,
403                                  UnicodeString& appendTo,
404                                  FieldPosition& pos) const;
405
406    /**
407     * Formats an array of objects using this object's choices.
408     *
409     * @param objs      The array of objects to be formatted.
410     * @param cnt       The size of objs.
411     * @param appendTo  Output parameter to receive result.
412     *                  Result is appended to existing contents.
413     * @param pos       On input: an alignment field, if desired.
414     *                  On output: the offsets of the alignment field.
415     * @param success   Output param set to success/failure code on
416     *                  exit.
417     * @return          Reference to 'appendTo' parameter.
418     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
419     */
420    virtual UnicodeString& format(const Formattable* objs,
421                                  int32_t cnt,
422                                  UnicodeString& appendTo,
423                                  FieldPosition& pos,
424                                  UErrorCode& success) const;
425
   // Keep the inherited NumberFormat::parse() overloads visible: the parse()
   // declaration below would otherwise hide every base-class overload of that name.
426   using NumberFormat::parse;
427
428   /**
429    * Looks for the longest match of any message string on the input text and,
430    * if there is a match, sets the result object to the corresponding range's number.
431    *
432    * If no string matches, then the parsePosition is unchanged.
433    *
434    * @param text           The text to be parsed.
435    * @param result         Formattable to be set to the parse result.
436    *                       If parse fails, return contents are undefined.
437    * @param parsePosition  The position to start parsing at on input.
438    *                       On output, moved to after the last successfully
439    *                       parsed character. On parse failure, does not change.
440    * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
441    */
442    virtual void parse(const UnicodeString& text,
443                       Formattable& result,
444                       ParsePosition& parsePosition) const;
445
446    /**
447     * Returns a unique class ID POLYMORPHICALLY. Part of ICU's "poor man's RTTI".
448     *
449     * @return          The class ID for this object. All objects of a
450     *                  given class have the same class ID.  Objects of
451     *                  other classes have different class IDs.
452     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
453     */
454    virtual UClassID getDynamicClassID(void) const;
455
456    /**
457     * Returns the class ID for this class.  This is useful only for
458     * comparing to a return value from getDynamicClassID().  For example:
459     * <pre>
460     * .       Base* polymorphic_pointer = createPolymorphicObject();
461     * .       if (polymorphic_pointer->getDynamicClassID() ==
462     * .           Derived::getStaticClassID()) ...
463     * </pre>
464     * @return          The class ID for all objects of this class.
465     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
466     */
467    static UClassID U_EXPORT2 getStaticClassID(void);
468
469private:
470    /**
471     * Converts a double value to a string.
472     * @param value the double number to be converted.
473     * @param string the result string.
474     * @return the converted string.
475     */
476    static UnicodeString& dtos(double value, UnicodeString& string);
477
478    ChoiceFormat(); // default constructor not implemented
479
480    /**
481     * Construct a new ChoiceFormat with the limits and the corresponding formats
482     * based on the pattern.
483     *
484     * @param newPattern   Pattern used to construct object.
485     * @param parseError   Struct to receive information on position
486     *                     of error if an error is encountered.
487     * @param status       Output param to receive success code.  If the
488     *                     pattern cannot be parsed, set to failure code.
489     */
490    ChoiceFormat(const UnicodeString& newPattern,
491                 UParseError& parseError,
492                 UErrorCode& status);
493
    // Grants MessageFormat access to the private members of this class
    // (including the private constructor and static helpers declared here).
494    friend class MessageFormat;
495
    /**
     * Private overload of setChoices() that additionally takes a UErrorCode.
     * The limits, closures, formats and count parameters have the same names
     * and types as in the public four-argument setChoices() overload.
     *
     * NOTE(review): presumably this is the shared implementation behind the
     * public setChoices() overloads and the array-based constructors, with
     * failures reported through errorCode -- confirm against the
     * implementation file.
     */
496    virtual void setChoices(const double* limits,
497                            const UBool* closures,
498                            const UnicodeString* formats,
499                            int32_t count,
500                            UErrorCode &errorCode);
501
502    /**
503     * Finds the ChoiceFormat sub-message for the given number.
504     * @param pattern A MessagePattern.
505     * @param partIndex the index of the first ChoiceFormat argument style part.
506     * @param number a number to be mapped to one of the ChoiceFormat argument's intervals
507     * @return the sub-message start part index.
508     */
509    static int32_t findSubMessage(const MessagePattern &pattern, int32_t partIndex, double number);
510
    /**
     * NOTE(review): not documented in the original header. Judging by the
     * signature and by the public parse() documentation, this presumably
     * matches source (starting at pos) against the sub-messages of the choice
     * argument that begins at partIndex in pattern, and returns the number of
     * the matching range -- confirm against the implementation file.
     */
511    static double parseArgument(
512            const MessagePattern &pattern, int32_t partIndex,
513            const UnicodeString &source, ParsePosition &pos);
514
515    /**
516     * Matches the pattern string from the end of the partIndex to
517     * the beginning of the limitPartIndex,
518     * including all syntax except SKIP_SYNTAX,
519     * against the source string starting at sourceOffset.
520     * If they match, returns the length of the source string match.
521     * Otherwise returns -1.
522     */
523    static int32_t matchStringUntilLimitPart(
524            const MessagePattern &pattern, int32_t partIndex, int32_t limitPartIndex,
525            const UnicodeString &source, int32_t sourceOffset);
526
527    /**
528     * Some of the ChoiceFormat constructors do not have a UErrorCode parameter.
529     * We need _some_ way to provide one for the MessagePattern constructor.
530     * Alternatively, the MessagePattern could be a pointer field, but that is
531     * not nice either.
532     */
533    UErrorCode constructorErrorCode;
534
535    /**
536     * The MessagePattern which contains the parsed structure of the pattern string.
537     *
538     * Starting with ICU 4.8, the MessagePattern contains a sequence of
539     * numeric/selector/message parts corresponding to the parsed pattern.
540     * For details see the MessagePattern class API docs.
541     */
542    MessagePattern msgPattern;
543
544    /**
545     * Docs & fields from before ICU 4.8, before MessagePattern was used.
546     * Commented out, and left only for explanation of semantics.
547     * --------
548     * Each ChoiceFormat divides the range -Inf..+Inf into fCount
549     * intervals.  The intervals are:
550     *
551     *         0: fChoiceLimits[0]..fChoiceLimits[1]
552     *         1: fChoiceLimits[1]..fChoiceLimits[2]
553     *        ...
554     *  fCount-2: fChoiceLimits[fCount-2]..fChoiceLimits[fCount-1]
555     *  fCount-1: fChoiceLimits[fCount-1]..+Inf
556     *
557     * Interval 0 is special; during formatting (mapping numbers to
558     * strings), it also contains all numbers less than
559     * fChoiceLimits[0], as well as NaN values.
560     *
561     * Interval i maps to and from string fChoiceFormats[i].  When
562     * parsing (mapping strings to numbers), then intervals map to
563     * their lower limit, that is, interval i maps to fChoiceLimits[i].
564     *
565     * The intervals may be closed, half open, or open.  This affects
566     * formatting but does not affect parsing.  Interval i is affected
567     * by fClosures[i] and fClosures[i+1].  If fClosures[i]
568     * is FALSE, then the value fChoiceLimits[i] is in interval i.
569     * That is, intervals i-1 and i are:
570     *
571     *  i-1:                 ... x < fChoiceLimits[i]
572     *    i: fChoiceLimits[i] <= x ...
573     *
574     * If fClosures[i] is TRUE, then the value fChoiceLimits[i] is
575     * in interval i-1.  That is, intervals i-1 and i are:
576     *
577     *  i-1:                ... x <= fChoiceLimits[i]
578     *    i: fChoiceLimits[i] < x ...
579     *
580     * Because of the nature of interval 0, fClosures[0] has no
581     * effect.
582     */
583    // double*         fChoiceLimits;
584    // UBool*          fClosures;
585    // UnicodeString*  fChoiceFormats;
586    // int32_t         fCount;
587};
588
589
590U_NAMESPACE_END
591
592#endif  // U_HIDE_DEPRECATED_API
593#endif /* #if !UCONFIG_NO_FORMATTING */
594
595#endif // CHOICFMT_H
596//eof
597