lib/shared/include/unicode/choicfmt.h

   1 /*
   2 ********************************************************************************
   3 *   Copyright (C) 1997-2013, International Business Machines
   4 *   Corporation and others.  All Rights Reserved.
   5 ********************************************************************************
   6 *
   7 * File CHOICFMT.H
   8 *
   9 * Modification History:
  10 *
  11 *   Date        Name        Description
  12 *   02/19/97    aliu        Converted from java.
  13 *   03/20/97    helena      Finished first cut of implementation and got rid
  14 *                           of nextDouble/previousDouble and replaced with
  15 *                           boolean array.
  16 *   4/10/97     aliu        Clean up.  Modified to work on AIX.
  17 *   8/6/97      nos         Removed overloaded constructor, member var 'buffer'.
  18 *   07/22/98    stephen     Removed operator!= (implemented in Format)
  19 ********************************************************************************
  20 */
  21
  22 #ifndef CHOICFMT_H
  23 #define CHOICFMT_H
  24
  25 #include "unicode/utypes.h"
  26
  27 /**
  28  * \file
  29  * \brief C++ API: Choice Format.
  30  */
  31
  32 #if !UCONFIG_NO_FORMATTING
  33 #ifndef U_HIDE_DEPRECATED_API
  34
  35 #include "unicode/fieldpos.h"
  36 #include "unicode/format.h"
  37 #include "unicode/messagepattern.h"
  38 #include "unicode/numfmt.h"
  39 #include "unicode/unistr.h"
  40
  41 U_NAMESPACE_BEGIN
  42
  43 class MessageFormat;  // Forward declaration; named as a friend of ChoiceFormat below.
  44
  45 /**
  46  * ChoiceFormat converts between ranges of numeric values and strings for those ranges.
  47  * The strings must conform to the MessageFormat pattern syntax.
  48  *
  49  * <p><em><code>ChoiceFormat</code> is probably not what you need.
  50  * Please use <code>MessageFormat</code>
  51  * with <code>plural</code> arguments for proper plural selection,
  52  * and <code>select</code> arguments for simple selection among a fixed set of choices!</em></p>
  53  *
  54  * <p>A <code>ChoiceFormat</code> splits
  55  * the real number line \htmlonly<code>-&#x221E;</code> to
  56  * <code>+&#x221E;</code>\endhtmlonly into two
  57  * or more contiguous ranges. Each range is mapped to a
  58  * string.</p>
  59  *
  60  * <p><code>ChoiceFormat</code> was originally intended
  61  * for displaying grammatically correct
  62  * plurals such as &quot;There is one file.&quot; vs. &quot;There are 2 files.&quot;
  63  * <em>However,</em> plural rules for many languages
  64  * are too complex for the capabilities of ChoiceFormat,
  65  * and its requirement of specifying the precise rules for each message
  66  * is unmanageable for translators.</p>
  67  *
  68  * <p>There are two methods of defining a <code>ChoiceFormat</code>; both
  69  * are equivalent.  The first is by using a string pattern. This is the
  70  * preferred method in most cases.  The second method is through direct
  71  * specification of the arrays that logically make up the
  72  * <code>ChoiceFormat</code>.</p>
  73  *
  74  * <p>Note: Typically, choice formatting is done (if done at all) via <code>MessageFormat</code>
  75  * with a <code>choice</code> argument type,
  76  * rather than using a stand-alone <code>ChoiceFormat</code>.</p>
  77  *
  78  * <h5>Patterns and Their Interpretation</h5>
  79  *
  80  * <p>The pattern string defines the range boundaries and the strings for each number range.
  81  * Syntax:
  82  * <pre>
  83  * choiceStyle = number separator message ('|' number separator message)*
  84  * number = normal_number | ['-'] \htmlonly&#x221E;\endhtmlonly (U+221E, infinity)
  85  * normal_number = double value (unlocalized ASCII string)
  86  * separator = less_than | less_than_or_equal
  87  * less_than = '<'
  88  * less_than_or_equal = '#' | \htmlonly&#x2264;\endhtmlonly (U+2264)
  89  * message: see {@link MessageFormat}
  90  * </pre>
  91  * Pattern_White_Space between syntax elements is ignored, except
  92  * around each range's sub-message.</p>
  93  *
  94  * <p>Each numeric sub-range extends from the current range's number
  95  * to the next range's number.
  96  * The number itself is included in its range if a <code>less_than_or_equal</code> sign is used,
  97  * and excluded from its range (and instead included in the previous range)
  98  * if a <code>less_than</code> sign is used.</p>
  99  *
 100  * <p>When a <code>ChoiceFormat</code> is constructed from
 101  * arrays of numbers, closure flags and strings,
 102  * they are interpreted just like
 103  * the sequence of <code>(number separator string)</code> in an equivalent pattern string.
 104  * <code>closure[i]==TRUE</code> corresponds to a <code>less_than</code> separator sign.
 105  * The equivalent pattern string will be constructed automatically.</p>
 106  *
 107  * <p>During formatting, a number is mapped to the first range
 108  * where the number is not greater than the range's upper limit.
 109  * That range's message string is returned. A NaN maps to the very first range.</p>
 110  *
 111  * <p>During parsing, a range is selected for the longest match of
 112  * any range's message. That range's number is returned, ignoring the separator/closure.
 113  * Only a simple string match is performed, without parsing of arguments that
 114  * might be specified in the message strings.</p>
 115  *
 116  * <p>Note that the first range's number is ignored in formatting
 117  * but may be returned from parsing.</p>
 118  *
 119  * <h5>Examples</h5>
 120  *
 121  * <p>Here is an example of two arrays that map the number
 122  * <code>1..7</code> to the English day of the week abbreviations
 123  * <code>Sun..Sat</code>. No closures array is given; this is the same as
 124  * specifying all closures to be <code>FALSE</code>.</p>
 125  *
 126  * <pre>    {1,2,3,4,5,6,7},
 127  *     {&quot;Sun&quot;,&quot;Mon&quot;,&quot;Tue&quot;,&quot;Wed&quot;,&quot;Thu&quot;,&quot;Fri&quot;,&quot;Sat&quot;}</pre>
 128  *
 129  * <p>Here is an example that maps the ranges [-Inf, 1), [1, 1], and (1,
 130  * +Inf] to three strings. That is, the number line is split into three
 131  * ranges: x &lt; 1.0, x = 1.0, and x &gt; 1.0.
 132  * (The round parentheses in the notation above indicate an exclusive boundary,
 133  * like the turned bracket in European notation: [-Inf, 1) == [-Inf, 1[  )</p>
 134  *
 135  * <pre>    {0, 1, 1},
 136  *     {FALSE, FALSE, TRUE},
 137  *     {&quot;no files&quot;, &quot;one file&quot;, &quot;many files&quot;}</pre>
 138  *
 139  * <p>Here is an example that shows formatting and parsing: </p>
 140  *
 141  * \code
 142  *   #include <unicode/choicfmt.h>
 143  *   #include <unicode/unistr.h>
 144  *   #include <iostream.h>
 145  *
 146  *   int main(int argc, char *argv[]) {
 147  *       double limits[] = {1,2,3,4,5,6,7};
 148  *       UnicodeString dayNames[] = {
 149  *           "Sun","Mon","Tue","Wed","Thu","Fri","Sat"};
 150  *       ChoiceFormat fmt(limits, dayNames, 7);
 151  *       UnicodeString str;
 152  *       char buf[256];
 153  *       for (double x = 1.0; x <= 8.0; x += 1.0) {
 154  *           fmt.format(x, str);
 155  *           str.extract(0, str.length(), buf, 256, "");
 156  *           str.truncate(0);
 157  *           cout << x << " -> "
 158  *                << buf << endl;
 159  *       }
 160  *       cout << endl;
 161  *       return 0;
 162  *   }
 163  * \endcode
 164  *
 165  * <p><em>User subclasses are not supported.</em> While clients may write
 166  * subclasses, such code will not necessarily work and will not be
 167  * guaranteed to work stably from release to release.</p>
 168  *
 169  * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 170  */
 171 class U_I18N_API ChoiceFormat: public NumberFormat {
 172 public:
 173     /**
 174      * Constructs a new ChoiceFormat from the pattern string.
 175      *
 176      * @param pattern   Pattern used to construct object.
 177      * @param status    Output param to receive success code.  If the
 178      *                  pattern cannot be parsed, set to failure code.
 179      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 180      */
 181     ChoiceFormat(const UnicodeString& pattern,
 182                  UErrorCode& status);
 183
 184
 185     /**
 186      * Constructs a new ChoiceFormat with the given limits and message strings.
 187      * All closure flags default to <code>FALSE</code>,
 188      * equivalent to <code>less_than_or_equal</code> separators.
 189      *
 190      * Copies the limits and formats instead of adopting them.
 191      *
 192      * @param limits    Array of limit values.
 193      * @param formats   Array of formats.
 194      * @param count     Size of 'limits' and 'formats' arrays.
 195      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 196      */
 197     ChoiceFormat(const double* limits,
 198                  const UnicodeString* formats,
 199                  int32_t count );
 200
 201     /**
 202      * Constructs a new ChoiceFormat with the given limits, closure flags and message strings.
 203      *
 204      * Copies the limits and formats instead of adopting them.
 205      *
 206      * @param limits Array of limit values
 207      * @param closures Array of booleans specifying whether each
 208      * element of 'limits' is open or closed.  If FALSE, then the
 209      * corresponding limit number is a member of its range.
 210      * If TRUE, then the limit number belongs to the previous range.
 211      * @param formats Array of formats
 212      * @param count Size of 'limits', 'closures', and 'formats' arrays
 213      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 214      */
 215     ChoiceFormat(const double* limits,
 216                  const UBool* closures,
 217                  const UnicodeString* formats,
 218                  int32_t count);
 219
 220     /**
 221      * Copy constructor.
 222      *
 223      * @param that   ChoiceFormat object to be copied from
 224      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 225      */
 226     ChoiceFormat(const ChoiceFormat& that);
 227
 228     /**
 229      * Assignment operator.
 230      *
 231      * @param that   ChoiceFormat object to be copied
 232      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 233      */
 234     const ChoiceFormat& operator=(const ChoiceFormat& that);
 235
 236     /**
 237      * Destructor.
 238      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 239      */
 240     virtual ~ChoiceFormat();
 241
 242     /**
 243      * Clones this Format object. The caller owns the
 244      * result and must delete it when done.
 245      *
 246      * @return a copy of this object
 247      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 248      */
 249     virtual Format* clone(void) const;
 250
 251     /**
 252      * Returns true if the given Format objects are semantically equal.
 253      * Objects of different subclasses are considered unequal.
 254      *
 255      * @param other    ChoiceFormat object to be compared
 256      * @return         true if other is the same as this.
 257      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 258      */
 259     virtual UBool operator==(const Format& other) const;
 260
 261     /**
 262      * Sets the pattern.
 263      * @param pattern   The pattern to be applied.
 264      * @param status    Output param set to success/failure code on
 265      *                  exit. If the pattern is invalid, this will be
 266      *                  set to a failure result.
 267      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 268      */
 269     virtual void applyPattern(const UnicodeString& pattern,
 270                               UErrorCode& status);
 271
 272     /**
 273      * Sets the pattern.
 274      * @param pattern    The pattern to be applied.
 275      * @param parseError Struct to receive information on position
 276      *                   of error if an error is encountered
 277      * @param status     Output param set to success/failure code on
 278      *                   exit. If the pattern is invalid, this will be
 279      *                   set to a failure result.
 280      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 281      */
 282     virtual void applyPattern(const UnicodeString& pattern,
 283                              UParseError& parseError,
 284                              UErrorCode& status);
 285     /**
 286      * Gets the pattern.
 287      *
 288      * @param pattern    Output param which will receive the pattern.
 289      *                   Previous contents are deleted.
 290      * @return    A reference to 'pattern'
 291      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 292      */
 293     virtual UnicodeString& toPattern(UnicodeString &pattern) const;
 294
 295     /**
 296      * Sets the choices to be used in formatting.
 297      * For details see the constructor with the same parameter list.
 298      *
 299      * @param limitsToCopy      Contains the top value that you want
 300      *                          parsed with that format, and should be in
 301      *                          ascending sorted order. When formatting X,
 302      *                          the choice will be the i, where limit[i]
 303      *                          &lt;= X &lt; limit[i+1].
 304      * @param formatsToCopy     The format strings you want to use for each limit.
 305      * @param count             The size of the above arrays.
 306      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 307      */
 308     virtual void setChoices(const double* limitsToCopy,
 309                             const UnicodeString* formatsToCopy,
 310                             int32_t count );
 311
 312     /**
 313      * Sets the choices to be used in formatting.
 314      * For details see the constructor with the same parameter list.
 315      *
 316      * @param limits Array of limits
 317      * @param closures Array of limit booleans
 318      * @param formats Array of format strings
 319      * @param count The size of the above arrays
 320      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 321      */
 322     virtual void setChoices(const double* limits,
 323                             const UBool* closures,
 324                             const UnicodeString* formats,
 325                             int32_t count);
 326
 327     /**
 328      * Returns NULL and 0.
 329      * Before ICU 4.8, this used to return the choice limits array.
 330      *
 331      * @param count Will be set to 0.
 332      * @return NULL
 333      * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
 334      */
 335     virtual const double* getLimits(int32_t& count) const;
 336
 337     /**
 338      * Returns NULL and 0.
 339      * Before ICU 4.8, this used to return the limit booleans array.
 340      *
 341      * @param count Will be set to 0.
 342      * @return NULL
 343      * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
 344      */
 345     virtual const UBool* getClosures(int32_t& count) const;
 346
 347     /**
 348      * Returns NULL and 0.
 349      * Before ICU 4.8, this used to return the array of choice strings.
 350      *
 351      * @param count Will be set to 0.
 352      * @return NULL
 353      * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern.
 354      */
 355     virtual const UnicodeString* getFormats(int32_t& count) const;
 356
 357
 358     using NumberFormat::format;
 359
 360     /**
 361      * Formats a double number using this object's choices.
 362      *
 363      * @param number    The value to be formatted.
 364      * @param appendTo  Output parameter to receive result.
 365      *                  Result is appended to existing contents.
 366      * @param pos       On input: an alignment field, if desired.
 367      *                  On output: the offsets of the alignment field.
 368      * @return          Reference to 'appendTo' parameter.
 369      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 370      */
 371     virtual UnicodeString& format(double number,
 372                                   UnicodeString& appendTo,
 373                                   FieldPosition& pos) const;
 374     /**
 375      * Formats an int32_t number using this object's choices.
 376      *
 377      * @param number    The value to be formatted.
 378      * @param appendTo  Output parameter to receive result.
 379      *                  Result is appended to existing contents.
 380      * @param pos       On input: an alignment field, if desired.
 381      *                  On output: the offsets of the alignment field.
 382      * @return          Reference to 'appendTo' parameter.
 383      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 384      */
 385     virtual UnicodeString& format(int32_t number,
 386                                   UnicodeString& appendTo,
 387                                   FieldPosition& pos) const;
 388
 389     /**
 390      * Formats an int64_t number using this object's choices.
 391      *
 392      * @param number    The value to be formatted.
 393      * @param appendTo  Output parameter to receive result.
 394      *                  Result is appended to existing contents.
 395      * @param pos       On input: an alignment field, if desired.
 396      *                  On output: the offsets of the alignment field.
 397      * @return          Reference to 'appendTo' parameter.
 398      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 399      */
 400     virtual UnicodeString& format(int64_t number,
 401                                   UnicodeString& appendTo,
 402                                   FieldPosition& pos) const;
 403
 404     /**
 405      * Formats an array of objects using this object's choices.
 406      *
 407      * @param objs      The array of objects to be formatted.
 408      * @param cnt       The size of objs.
 409      * @param appendTo  Output parameter to receive result.
 410      *                  Result is appended to existing contents.
 411      * @param pos       On input: an alignment field, if desired.
 412      *                  On output: the offsets of the alignment field.
 413      * @param success   Output param set to success/failure code on
 414      *                  exit.
 415      * @return          Reference to 'appendTo' parameter.
 416      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 417      */
 418     virtual UnicodeString& format(const Formattable* objs,
 419                                   int32_t cnt,
 420                                   UnicodeString& appendTo,
 421                                   FieldPosition& pos,
 422                                   UErrorCode& success) const;
 423
 424    using NumberFormat::parse;
 425
 426    /**
 427     * Looks for the longest match of any message string on the input text and,
 428     * if there is a match, sets the result object to the corresponding range's number.
 429     *
 430     * If no string matches, then the parsePosition is unchanged.
 431     *
 432     * @param text           The text to be parsed.
 433     * @param result         Formattable to be set to the parse result.
 434     *                       If parse fails, return contents are undefined.
 435     * @param parsePosition  The position to start parsing at on input.
 436     *                       On output, moved to after the last successfully
 437     *                       parsed character. On parse failure, does not change.
 438     * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 439     */
 440     virtual void parse(const UnicodeString& text,
 441                        Formattable& result,
 442                        ParsePosition& parsePosition) const;
 443
 444     /**
 445      * Returns a unique class ID POLYMORPHICALLY. Part of ICU's "poor man's RTTI".
 446      *
 447      * @return          The class ID for this object. All objects of a
 448      *                  given class have the same class ID.  Objects of
 449      *                  other classes have different class IDs.
 450      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 451      */
 452     virtual UClassID getDynamicClassID(void) const;
 453
 454     /**
 455      * Returns the class ID for this class.  This is useful only for
 456      * comparing to a return value from getDynamicClassID().  For example:
 457      * <pre>
 458      * .       Base* polymorphic_pointer = createPolymorphicObject();
 459      * .       if (polymorphic_pointer->getDynamicClassID() ==
 460      * .           Derived::getStaticClassID()) ...
 461      * </pre>
 462      * @return          The class ID for all objects of this class.
 463      * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments.
 464      */
 465     static UClassID U_EXPORT2 getStaticClassID(void);
 466
 467 private:
 468     /**
 469      * Converts a double value to a string.
 470      * @param value the double number to be converted.
 471      * @param string the result string.
 472      * @return the converted string.
 473      */
 474     static UnicodeString& dtos(double value, UnicodeString& string);
 475
 476     ChoiceFormat(); // default constructor not implemented
 477
 478     /**
 479      * Construct a new ChoiceFormat with the limits and the corresponding formats
 480      * based on the pattern.
 481      *
 482      * @param newPattern   Pattern used to construct object.
 483      * @param parseError   Struct to receive information on position
 484      *                     of error if an error is encountered.
 485      * @param status       Output param to receive success code.  If the
 486      *                     pattern cannot be parsed, set to failure code.
 487      */
 488     ChoiceFormat(const UnicodeString& newPattern,
 489                  UParseError& parseError,
 490                  UErrorCode& status);
 491
 492     friend class MessageFormat;
 493
 494     virtual void setChoices(const double* limits,
 495                             const UBool* closures,
 496                             const UnicodeString* formats,
 497                             int32_t count,
 498                             UErrorCode &errorCode);
 499
 500     /**
 501      * Finds the ChoiceFormat sub-message for the given number.
 502      * @param pattern A MessagePattern.
 503      * @param partIndex the index of the first ChoiceFormat argument style part.
 504      * @param number a number to be mapped to one of the ChoiceFormat argument's intervals
 505      * @return the sub-message start part index.
 506      */
 507     static int32_t findSubMessage(const MessagePattern &pattern, int32_t partIndex, double number);
 508
 509     static double parseArgument(
 510             const MessagePattern &pattern, int32_t partIndex,
 511             const UnicodeString &source, ParsePosition &pos);
 512
 513     /**
 514      * Matches the pattern string from the end of the partIndex to
 515      * the beginning of the limitPartIndex,
 516      * including all syntax except SKIP_SYNTAX,
 517      * against the source string starting at sourceOffset.
 518      * If they match, returns the length of the source string match.
 519      * Otherwise returns -1.
 520      */
 521     static int32_t matchStringUntilLimitPart(
 522             const MessagePattern &pattern, int32_t partIndex, int32_t limitPartIndex,
 523             const UnicodeString &source, int32_t sourceOffset);
 524
 525     /**
 526      * Some of the ChoiceFormat constructors do not have a UErrorCode parameter.
 527      * We need _some_ way to provide one for the MessagePattern constructor.
 528      * Alternatively, the MessagePattern could be a pointer field, but that is
 529      * not nice either.
 530      */
 531     UErrorCode constructorErrorCode;
 532
 533     /**
 534      * The MessagePattern which contains the parsed structure of the pattern string.
 535      *
 536      * Starting with ICU 4.8, the MessagePattern contains a sequence of
 537      * numeric/selector/message parts corresponding to the parsed pattern.
 538      * For details see the MessagePattern class API docs.
 539      */
 540     MessagePattern msgPattern;
 541
 542     /**
 543      * Docs & fields from before ICU 4.8, before MessagePattern was used.
 544      * Commented out, and left only for explanation of semantics.
 545      * --------
 546      * Each ChoiceFormat divides the range -Inf..+Inf into fCount
 547      * intervals.  The intervals are:
 548      *
 549      *         0: fChoiceLimits[0]..fChoiceLimits[1]
 550      *         1: fChoiceLimits[1]..fChoiceLimits[2]
 551      *        ...
 552      *  fCount-2: fChoiceLimits[fCount-2]..fChoiceLimits[fCount-1]
 553      *  fCount-1: fChoiceLimits[fCount-1]..+Inf
 554      *
 555      * Interval 0 is special; during formatting (mapping numbers to
 556      * strings), it also contains all numbers less than
 557      * fChoiceLimits[0], as well as NaN values.
 558      *
 559      * Interval i maps to and from string fChoiceFormats[i].  When
 560      * parsing (mapping strings to numbers), then intervals map to
 561      * their lower limit, that is, interval i maps to fChoiceLimits[i].
 562      *
 563      * The intervals may be closed, half open, or open.  This affects
 564      * formatting but does not affect parsing.  Interval i is affected
 565      * by fClosures[i] and fClosures[i+1].  If fClosures[i]
 566      * is FALSE, then the value fChoiceLimits[i] is in interval i.
 567      * That is, intervals i-1 and i are:
 568      *
 569      *  i-1:                 ... x < fChoiceLimits[i]
 570      *    i: fChoiceLimits[i] <= x ...
 571      *
 572      * If fClosures[i] is TRUE, then the value fChoiceLimits[i] is
 573      * in interval i-1.  That is, intervals i-1 and i are:
 574      *
 575      *  i-1:                ... x <= fChoiceLimits[i]
 576      *    i: fChoiceLimits[i] < x ...
 577      *
 578      * Because of the nature of interval 0, fClosures[0] has no
 579      * effect.
 580      */
 581     // double*         fChoiceLimits;
 582     // UBool*          fClosures;
 583     // UnicodeString*  fChoiceFormats;
 584     // int32_t         fCount;
 585 };
 586
 587
 588 U_NAMESPACE_END
 589
 590 #endif  // U_HIDE_DEPRECATED_API
 591 #endif /* #if !UCONFIG_NO_FORMATTING */
 592
 593 #endif // CHOICFMT_H
 594 //eof