1 // Copyright (C) 2016 and later: Unicode, Inc. and others. 2 // License & terms of use: http://www.unicode.org/copyright.html 3 /* 4 ******************************************************************************** 5 * Copyright (C) 1997-2013, International Business Machines 6 * Corporation and others. All Rights Reserved. 7 ******************************************************************************** 8 * 9 * File CHOICFMT.H 10 * 11 * Modification History: 12 * 13 * Date Name Description 14 * 02/19/97 aliu Converted from java. 15 * 03/20/97 helena Finished first cut of implementation and got rid 16 * of nextDouble/previousDouble and replaced with 17 * boolean array. 18 * 4/10/97 aliu Clean up. Modified to work on AIX. 19 * 8/6/97 nos Removed overloaded constructor, member var 'buffer'. 20 * 07/22/98 stephen Removed operator!= (implemented in Format) 21 ******************************************************************************** 22 */ 23 24 #ifndef CHOICFMT_H 25 #define CHOICFMT_H 26 27 #include "unicode/utypes.h" 28 29 /** 30 * \file 31 * \brief C++ API: Choice Format. 32 */ 33 34 #if !UCONFIG_NO_FORMATTING 35 #ifndef U_HIDE_DEPRECATED_API 36 37 #include "unicode/fieldpos.h" 38 #include "unicode/format.h" 39 #include "unicode/messagepattern.h" 40 #include "unicode/numfmt.h" 41 #include "unicode/unistr.h" 42 43 U_NAMESPACE_BEGIN 44 45 class MessageFormat; 46 47 /** 48 * ChoiceFormat converts between ranges of numeric values and strings for those ranges. 49 * The strings must conform to the MessageFormat pattern syntax. 50 * 51 * <p><em><code>ChoiceFormat</code> is probably not what you need. 52 * Please use <code>MessageFormat</code> 53 * with <code>plural</code> arguments for proper plural selection, 54 * and <code>select</code> arguments for simple selection among a fixed set of choices!</em></p> 55 * 56 * <p>A <code>ChoiceFormat</code> splits 57 * the real number line \htmlonly<code>-∞</code> to 58 * <code>+∞</code>\endhtmlonly into two 59 * or more contiguous ranges. Each range is mapped to a 60 * string.</p> 61 * 62 * <p><code>ChoiceFormat</code> was originally intended 63 * for displaying grammatically correct 64 * plurals such as "There is one file." vs. "There are 2 files." 65 * <em>However,</em> plural rules for many languages 66 * are too complex for the capabilities of ChoiceFormat, 67 * and its requirement of specifying the precise rules for each message 68 * is unmanageable for translators.</p> 69 * 70 * <p>There are two methods of defining a <code>ChoiceFormat</code>; both 71 * are equivalent. The first is by using a string pattern. This is the 72 * preferred method in most cases. The second method is through direct 73 * specification of the arrays that logically make up the 74 * <code>ChoiceFormat</code>.</p> 75 * 76 * <p>Note: Typically, choice formatting is done (if done at all) via <code>MessageFormat</code> 77 * with a <code>choice</code> argument type, 78 * rather than using a stand-alone <code>ChoiceFormat</code>.</p> 79 * 80 * <h5>Patterns and Their Interpretation</h5> 81 * 82 * <p>The pattern string defines the range boundaries and the strings for each number range. 83 * Syntax: 84 * <pre> 85 * choiceStyle = number separator message ('|' number separator message)* 86 * number = normal_number | ['-'] \htmlonly∞\endhtmlonly (U+221E, infinity) 87 * normal_number = double value (unlocalized ASCII string) 88 * separator = less_than | less_than_or_equal 89 * less_than = '<' 90 * less_than_or_equal = '#' | \htmlonly≤\endhtmlonly (U+2264) 91 * message: see {@link MessageFormat} 92 * </pre> 93 * Pattern_White_Space between syntax elements is ignored, except 94 * around each range's sub-message.</p> 95 * 96 * <p>Each numeric sub-range extends from the current range's number 97 * to the next range's number. 98 * The number itself is included in its range if a <code>less_than_or_equal</code> sign is used, 99 * and excluded from its range (and instead included in the previous range) 100 * if a <code>less_than</code> sign is used.</p> 101 * 102 * <p>When a <code>ChoiceFormat</code> is constructed from 103 * arrays of numbers, closure flags and strings, 104 * they are interpreted just like 105 * the sequence of <code>(number separator string)</code> in an equivalent pattern string. 106 * <code>closure[i]==TRUE</code> corresponds to a <code>less_than</code> separator sign. 107 * The equivalent pattern string will be constructed automatically.</p> 108 * 109 * <p>During formatting, a number is mapped to the first range 110 * where the number is not greater than the range's upper limit. 111 * That range's message string is returned. A NaN maps to the very first range.</p> 112 * 113 * <p>During parsing, a range is selected for the longest match of 114 * any range's message. That range's number is returned, ignoring the separator/closure. 115 * Only a simple string match is performed, without parsing of arguments that 116 * might be specified in the message strings.</p> 117 * 118 * <p>Note that the first range's number is ignored in formatting 119 * but may be returned from parsing.</p> 120 * 121 * <h5>Examples</h5> 122 * 123 * <p>Here is an example of two arrays that map the number 124 * <code>1..7</code> to the English day of the week abbreviations 125 * <code>Sun..Sat</code>. No closures array is given; this is the same as 126 * specifying all closures to be <code>FALSE</code>.</p> 127 * 128 * <pre> {1,2,3,4,5,6,7}, 129 * {"Sun","Mon","Tue","Wed","Thur","Fri","Sat"}</pre> 130 * 131 * <p>Here is an example that maps the ranges [-Inf, 1), [1, 1], and (1, 132 * +Inf] to three strings. That is, the number line is split into three 133 * ranges: x < 1.0, x = 1.0, and x > 1.0. 134 * (The round parentheses in the notation above indicate an exclusive boundary, 135 * like the turned bracket in European notation: [-Inf, 1) == [-Inf, 1[ )</p> 136 * 137 * <pre> {0, 1, 1}, 138 * {FALSE, FALSE, TRUE}, 139 * {"no files", "one file", "many files"}</pre> 140 * 141 * <p>Here is an example that shows formatting and parsing: </p> 142 * 143 * \code 144 * #include <unicode/choicfmt.h> 145 * #include <unicode/unistr.h> 146 * #include <iostream.h> 147 * 148 * int main(int argc, char *argv[]) { 149 * double limits[] = {1,2,3,4,5,6,7}; 150 * UnicodeString monthNames[] = { 151 * "Sun","Mon","Tue","Wed","Thu","Fri","Sat"}; 152 * ChoiceFormat fmt(limits, monthNames, 7); 153 * UnicodeString str; 154 * char buf[256]; 155 * for (double x = 1.0; x <= 8.0; x += 1.0) { 156 * fmt.format(x, str); 157 * str.extract(0, str.length(), buf, 256, ""); 158 * str.truncate(0); 159 * cout << x << " -> " 160 * << buf << endl; 161 * } 162 * cout << endl; 163 * return 0; 164 * } 165 * \endcode 166 * 167 * <p><em>User subclasses are not supported.</em> While clients may write 168 * subclasses, such code will not necessarily work and will not be 169 * guaranteed to work stably from release to release. 170 * 171 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 172 */ 173 class U_I18N_API ChoiceFormat: public NumberFormat { 174 public: 175 /** 176 * Constructs a new ChoiceFormat from the pattern string. 177 * 178 * @param pattern Pattern used to construct object. 179 * @param status Output param to receive success code. If the 180 * pattern cannot be parsed, set to failure code. 181 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 182 */ 183 ChoiceFormat(const UnicodeString& pattern, 184 UErrorCode& status); 185 186 187 /** 188 * Constructs a new ChoiceFormat with the given limits and message strings. 189 * All closure flags default to <code>FALSE</code>, 190 * equivalent to <code>less_than_or_equal</code> separators. 191 * 192 * Copies the limits and formats instead of adopting them. 193 * 194 * @param limits Array of limit values. 195 * @param formats Array of formats. 196 * @param count Size of 'limits' and 'formats' arrays. 197 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 198 */ 199 ChoiceFormat(const double* limits, 200 const UnicodeString* formats, 201 int32_t count ); 202 203 /** 204 * Constructs a new ChoiceFormat with the given limits, closure flags and message strings. 205 * 206 * Copies the limits and formats instead of adopting them. 207 * 208 * @param limits Array of limit values 209 * @param closures Array of booleans specifying whether each 210 * element of 'limits' is open or closed. If FALSE, then the 211 * corresponding limit number is a member of its range. 212 * If TRUE, then the limit number belongs to the previous range it. 213 * @param formats Array of formats 214 * @param count Size of 'limits', 'closures', and 'formats' arrays 215 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 216 */ 217 ChoiceFormat(const double* limits, 218 const UBool* closures, 219 const UnicodeString* formats, 220 int32_t count); 221 222 /** 223 * Copy constructor. 224 * 225 * @param that ChoiceFormat object to be copied from 226 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 227 */ 228 ChoiceFormat(const ChoiceFormat& that); 229 230 /** 231 * Assignment operator. 232 * 233 * @param that ChoiceFormat object to be copied 234 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 235 */ 236 const ChoiceFormat& operator=(const ChoiceFormat& that); 237 238 /** 239 * Destructor. 240 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 241 */ 242 virtual ~ChoiceFormat(); 243 244 /** 245 * Clones this Format object. The caller owns the 246 * result and must delete it when done. 247 * 248 * @return a copy of this object 249 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 250 */ 251 virtual Format* clone(void) const; 252 253 /** 254 * Returns true if the given Format objects are semantically equal. 255 * Objects of different subclasses are considered unequal. 256 * 257 * @param other ChoiceFormat object to be compared 258 * @return true if other is the same as this. 259 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 260 */ 261 virtual UBool operator==(const Format& other) const; 262 263 /** 264 * Sets the pattern. 265 * @param pattern The pattern to be applied. 266 * @param status Output param set to success/failure code on 267 * exit. If the pattern is invalid, this will be 268 * set to a failure result. 269 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 270 */ 271 virtual void applyPattern(const UnicodeString& pattern, 272 UErrorCode& status); 273 274 /** 275 * Sets the pattern. 276 * @param pattern The pattern to be applied. 277 * @param parseError Struct to receive information on position 278 * of error if an error is encountered 279 * @param status Output param set to success/failure code on 280 * exit. If the pattern is invalid, this will be 281 * set to a failure result. 282 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 283 */ 284 virtual void applyPattern(const UnicodeString& pattern, 285 UParseError& parseError, 286 UErrorCode& status); 287 /** 288 * Gets the pattern. 289 * 290 * @param pattern Output param which will receive the pattern 291 * Previous contents are deleted. 292 * @return A reference to 'pattern' 293 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 294 */ 295 virtual UnicodeString& toPattern(UnicodeString &pattern) const; 296 297 /** 298 * Sets the choices to be used in formatting. 299 * For details see the constructor with the same parameter list. 300 * 301 * @param limitsToCopy Contains the top value that you want 302 * parsed with that format,and should be in 303 * ascending sorted order. When formatting X, 304 * the choice will be the i, where limit[i] 305 * <= X < limit[i+1]. 306 * @param formatsToCopy The format strings you want to use for each limit. 307 * @param count The size of the above arrays. 308 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 309 */ 310 virtual void setChoices(const double* limitsToCopy, 311 const UnicodeString* formatsToCopy, 312 int32_t count ); 313 314 /** 315 * Sets the choices to be used in formatting. 316 * For details see the constructor with the same parameter list. 317 * 318 * @param limits Array of limits 319 * @param closures Array of limit booleans 320 * @param formats Array of format string 321 * @param count The size of the above arrays 322 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 323 */ 324 virtual void setChoices(const double* limits, 325 const UBool* closures, 326 const UnicodeString* formats, 327 int32_t count); 328 329 /** 330 * Returns NULL and 0. 331 * Before ICU 4.8, this used to return the choice limits array. 332 * 333 * @param count Will be set to 0. 334 * @return NULL 335 * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern. 336 */ 337 virtual const double* getLimits(int32_t& count) const; 338 339 /** 340 * Returns NULL and 0. 341 * Before ICU 4.8, this used to return the limit booleans array. 342 * 343 * @param count Will be set to 0. 344 * @return NULL 345 * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern. 346 */ 347 virtual const UBool* getClosures(int32_t& count) const; 348 349 /** 350 * Returns NULL and 0. 351 * Before ICU 4.8, this used to return the array of choice strings. 352 * 353 * @param count Will be set to 0. 354 * @return NULL 355 * @deprecated ICU 4.8 Use the MessagePattern class to analyze a ChoiceFormat pattern. 356 */ 357 virtual const UnicodeString* getFormats(int32_t& count) const; 358 359 360 using NumberFormat::format; 361 362 /** 363 * Formats a double number using this object's choices. 364 * 365 * @param number The value to be formatted. 366 * @param appendTo Output parameter to receive result. 367 * Result is appended to existing contents. 368 * @param pos On input: an alignment field, if desired. 369 * On output: the offsets of the alignment field. 370 * @return Reference to 'appendTo' parameter. 371 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 372 */ 373 virtual UnicodeString& format(double number, 374 UnicodeString& appendTo, 375 FieldPosition& pos) const; 376 /** 377 * Formats an int32_t number using this object's choices. 378 * 379 * @param number The value to be formatted. 380 * @param appendTo Output parameter to receive result. 381 * Result is appended to existing contents. 382 * @param pos On input: an alignment field, if desired. 383 * On output: the offsets of the alignment field. 384 * @return Reference to 'appendTo' parameter. 385 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 386 */ 387 virtual UnicodeString& format(int32_t number, 388 UnicodeString& appendTo, 389 FieldPosition& pos) const; 390 391 /** 392 * Formats an int64_t number using this object's choices. 393 * 394 * @param number The value to be formatted. 395 * @param appendTo Output parameter to receive result. 396 * Result is appended to existing contents. 397 * @param pos On input: an alignment field, if desired. 398 * On output: the offsets of the alignment field. 399 * @return Reference to 'appendTo' parameter. 400 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 401 */ 402 virtual UnicodeString& format(int64_t number, 403 UnicodeString& appendTo, 404 FieldPosition& pos) const; 405 406 /** 407 * Formats an array of objects using this object's choices. 408 * 409 * @param objs The array of objects to be formatted. 410 * @param cnt The size of objs. 411 * @param appendTo Output parameter to receive result. 412 * Result is appended to existing contents. 413 * @param pos On input: an alignment field, if desired. 414 * On output: the offsets of the alignment field. 415 * @param success Output param set to success/failure code on 416 * exit. 417 * @return Reference to 'appendTo' parameter. 418 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 419 */ 420 virtual UnicodeString& format(const Formattable* objs, 421 int32_t cnt, 422 UnicodeString& appendTo, 423 FieldPosition& pos, 424 UErrorCode& success) const; 425 426 using NumberFormat::parse; 427 428 /** 429 * Looks for the longest match of any message string on the input text and, 430 * if there is a match, sets the result object to the corresponding range's number. 431 * 432 * If no string matches, then the parsePosition is unchanged. 433 * 434 * @param text The text to be parsed. 435 * @param result Formattable to be set to the parse result. 436 * If parse fails, return contents are undefined. 437 * @param parsePosition The position to start parsing at on input. 438 * On output, moved to after the last successfully 439 * parse character. On parse failure, does not change. 440 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 441 */ 442 virtual void parse(const UnicodeString& text, 443 Formattable& result, 444 ParsePosition& parsePosition) const; 445 446 /** 447 * Returns a unique class ID POLYMORPHICALLY. Part of ICU's "poor man's RTTI". 448 * 449 * @return The class ID for this object. All objects of a 450 * given class have the same class ID. Objects of 451 * other classes have different class IDs. 452 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 453 */ 454 virtual UClassID getDynamicClassID(void) const; 455 456 /** 457 * Returns the class ID for this class. This is useful only for 458 * comparing to a return value from getDynamicClassID(). For example: 459 * <pre> 460 * . Base* polymorphic_pointer = createPolymorphicObject(); 461 * . if (polymorphic_pointer->getDynamicClassID() == 462 * . Derived::getStaticClassID()) ... 463 * </pre> 464 * @return The class ID for all objects of this class. 465 * @deprecated ICU 49 Use MessageFormat instead, with plural and select arguments. 466 */ 467 static UClassID U_EXPORT2 getStaticClassID(void); 468 469 private: 470 /** 471 * Converts a double value to a string. 472 * @param value the double number to be converted. 473 * @param string the result string. 474 * @return the converted string. 475 */ 476 static UnicodeString& dtos(double value, UnicodeString& string); 477 478 ChoiceFormat(); // default constructor not implemented 479 480 /** 481 * Construct a new ChoiceFormat with the limits and the corresponding formats 482 * based on the pattern. 483 * 484 * @param newPattern Pattern used to construct object. 485 * @param parseError Struct to receive information on position 486 * of error if an error is encountered. 487 * @param status Output param to receive success code. If the 488 * pattern cannot be parsed, set to failure code. 489 */ 490 ChoiceFormat(const UnicodeString& newPattern, 491 UParseError& parseError, 492 UErrorCode& status); 493 494 friend class MessageFormat; 495 496 virtual void setChoices(const double* limits, 497 const UBool* closures, 498 const UnicodeString* formats, 499 int32_t count, 500 UErrorCode &errorCode); 501 502 /** 503 * Finds the ChoiceFormat sub-message for the given number. 504 * @param pattern A MessagePattern. 505 * @param partIndex the index of the first ChoiceFormat argument style part. 506 * @param number a number to be mapped to one of the ChoiceFormat argument's intervals 507 * @return the sub-message start part index. 508 */ 509 static int32_t findSubMessage(const MessagePattern &pattern, int32_t partIndex, double number); 510 511 static double parseArgument( 512 const MessagePattern &pattern, int32_t partIndex, 513 const UnicodeString &source, ParsePosition &pos); 514 515 /** 516 * Matches the pattern string from the end of the partIndex to 517 * the beginning of the limitPartIndex, 518 * including all syntax except SKIP_SYNTAX, 519 * against the source string starting at sourceOffset. 520 * If they match, returns the length of the source string match. 521 * Otherwise returns -1. 522 */ 523 static int32_t matchStringUntilLimitPart( 524 const MessagePattern &pattern, int32_t partIndex, int32_t limitPartIndex, 525 const UnicodeString &source, int32_t sourceOffset); 526 527 /** 528 * Some of the ChoiceFormat constructors do not have a UErrorCode paramater. 529 * We need _some_ way to provide one for the MessagePattern constructor. 530 * Alternatively, the MessagePattern could be a pointer field, but that is 531 * not nice either. 532 */ 533 UErrorCode constructorErrorCode; 534 535 /** 536 * The MessagePattern which contains the parsed structure of the pattern string. 537 * 538 * Starting with ICU 4.8, the MessagePattern contains a sequence of 539 * numeric/selector/message parts corresponding to the parsed pattern. 540 * For details see the MessagePattern class API docs. 541 */ 542 MessagePattern msgPattern; 543 544 /** 545 * Docs & fields from before ICU 4.8, before MessagePattern was used. 546 * Commented out, and left only for explanation of semantics. 547 * -------- 548 * Each ChoiceFormat divides the range -Inf..+Inf into fCount 549 * intervals. The intervals are: 550 * 551 * 0: fChoiceLimits[0]..fChoiceLimits[1] 552 * 1: fChoiceLimits[1]..fChoiceLimits[2] 553 * ... 554 * fCount-2: fChoiceLimits[fCount-2]..fChoiceLimits[fCount-1] 555 * fCount-1: fChoiceLimits[fCount-1]..+Inf 556 * 557 * Interval 0 is special; during formatting (mapping numbers to 558 * strings), it also contains all numbers less than 559 * fChoiceLimits[0], as well as NaN values. 560 * 561 * Interval i maps to and from string fChoiceFormats[i]. When 562 * parsing (mapping strings to numbers), then intervals map to 563 * their lower limit, that is, interval i maps to fChoiceLimit[i]. 564 * 565 * The intervals may be closed, half open, or open. This affects 566 * formatting but does not affect parsing. Interval i is affected 567 * by fClosures[i] and fClosures[i+1]. If fClosures[i] 568 * is FALSE, then the value fChoiceLimits[i] is in interval i. 569 * That is, intervals i and i are: 570 * 571 * i-1: ... x < fChoiceLimits[i] 572 * i: fChoiceLimits[i] <= x ... 573 * 574 * If fClosures[i] is TRUE, then the value fChoiceLimits[i] is 575 * in interval i-1. That is, intervals i-1 and i are: 576 * 577 * i-1: ... x <= fChoiceLimits[i] 578 * i: fChoiceLimits[i] < x ... 579 * 580 * Because of the nature of interval 0, fClosures[0] has no 581 * effect. 582 */ 583 // double* fChoiceLimits; 584 // UBool* fClosures; 585 // UnicodeString* fChoiceFormats; 586 // int32_t fCount; 587 }; 588 589 590 U_NAMESPACE_END 591 592 #endif // U_HIDE_DEPRECATED_API 593 #endif /* #if !UCONFIG_NO_FORMATTING */ 594 595 #endif // CHOICFMT_H 596 //eof 597