1 /* 2 * Copyright (C) 2007-2010, International Business Machines Corporation and 3 * others. All Rights Reserved. 4 ******************************************************************************** 5 * 6 * File MSGFMT.H 7 * 8 * Modification History: 9 * 10 * Date Name Description 11 * 02/19/97 aliu Converted from java. 12 * 03/20/97 helena Finished first cut of implementation. 13 * 07/22/98 stephen Removed operator!= (defined in Format) 14 * 08/19/2002 srl Removing Javaisms 15 *******************************************************************************/ 16 17 #ifndef MSGFMT_H 18 #define MSGFMT_H 19 20 #include "unicode/utypes.h" 21 22 /** 23 * \file 24 * \brief C++ API: Formats messages in a language-neutral way. 25 */ 26 27 #if !UCONFIG_NO_FORMATTING 28 29 #include "unicode/format.h" 30 #include "unicode/locid.h" 31 #include "unicode/parseerr.h" 32 #include "unicode/uchar.h" 33 34 U_NAMESPACE_BEGIN 35 36 class NumberFormat; 37 class DateFormat; 38 39 /** 40 * 41 * MessageFormat produces concatenated messages in a language-neutral 42 * way. Use this whenever concatenating strings that are displayed to 43 * end users. 44 * 45 * <P>A MessageFormat contains an array of <EM>subformats</EM> arranged 46 * within a <EM>template string</EM>. Together, the subformats and 47 * template string determine how the MessageFormat will operate during 48 * formatting and parsing. 49 * 50 * <P>Typically, both the subformats and the template string are 51 * specified at once in a <EM>pattern</EM>. By using different 52 * patterns for different locales, messages may be localized. 53 * 54 * <P>When formatting, MessageFormat takes an array of arguments 55 * and produces a user-readable string. Each argument is a 56 * Formattable object; they may be passed in in an array, or as a 57 * single Formattable object which itself contains an array. Each 58 * argument is matched up with its corresponding subformat, which then 59 * formats it into a string. 
The resulting strings are then assembled 60 * within the string template of the MessageFormat to produce the 61 * final output string. 62 * 63 * <p><strong>Note:</strong> 64 * In ICU 4.0 MessageFormat supports named arguments. If a named argument 65 * is used, all arguments must be named. Names start with a character in 66 * <code>UCHAR_ID_START</code> and continue with characters in 67 * <code>UCHAR_ID_CONTINUE</code>, in particular they do not start with a digit. 68 * If named arguments are used, {@link #usesNamedArguments()} will return true. 69 * 70 * <p>The other new methods supporting named arguments are 71 * {@link #getFormatNames(UErrorCode& status)}, 72 * {@link #getFormat(const UnicodeString& formatName, UErrorCode& status)}, 73 * {@link #setFormat(const UnicodeString& formatName, const Format& format, UErrorCode& status)}, 74 * {@link #adoptFormat(const UnicodeString& formatName, Format* formatToAdopt, UErrorCode& status)}, 75 * {@link #format(const UnicodeString* argumentNames, const Formattable* arguments, 76 * int32_t count, UnicodeString& appendTo,UErrorCode& status)}. 77 * These methods are all compatible with patterns that do not use named arguments-- 78 * in these cases the keys in the input or output use <code>UnicodeString</code>s 79 * that name the argument indices, e.g. "0", "1", "2"... etc. 80 * 81 * <p>If this format uses named arguments, certain methods that take or 82 * return arrays do not perform any action, since it is not possible to 83 * identify positions in an array using a name. Of these methods, 84 * UErrorCode is set to U_ILLEGAL_ARGUMENT_ERROR by format, and to 85 * U_ARGUMENT_TYPE_MISMATCH by parse. 
86 * These methods are 87 * {@link #adoptFormats(Format** formatsToAdopt, int32_t count)}, 88 * {@link #setFormats(const Format** newFormats,int32_t count)}, 89 * {@link #adoptFormat(int32_t n, Format *newFormat)}, 90 * {@link #setFormat(int32_t n, Format& newFormat)}, 91 * {@link #format(const Formattable* source, int32_t count, UnicodeString& appendTo, FieldPosition& ignore, UErrorCode& success)}, 92 * {@link #format(const UnicodeString& pattern,const Formattable* arguments,int32_t cnt,UnicodeString& appendTo,UErrorCode& success)}, 93 * {@link #format(const Formattable& source, UnicodeString& appendTo, FieldPosition& ignore, UErrorCode& success)}, 94 * {@link #format(const Formattable* arguments, int32_t cnt, UnicodeString& appendTo, FieldPosition& status, int32_t recursionProtection,UErrorCode& success)}, 95 * {@link #parse(const UnicodeString& source, ParsePosition& pos, int32_t& count)}, 96 * {@link #parse(const UnicodeString& source, int32_t& cnt, UErrorCode& status)} 97 * 98 * <P> 99 * During parsing, an input string is matched against the string 100 * template of the MessageFormat to produce an array of Formattable 101 * objects. Plain text of the template string is matched directly 102 * against input text. At each position in the template string where 103 * a subformat is located, the subformat is called to parse the 104 * corresponding segment of input text to produce an output argument. 105 * In this way, an array of arguments is created which together 106 * constitute the parse result. 107 * <P> 108 * Parsing may fail or produce unexpected results in a number of 109 * circumstances. 110 * <UL> 111 * <LI>If one of the arguments does not occur in the pattern, it 112 * will be returned as a default Formattable. 113 * <LI>If the format of an argument loses information, such as with 114 * a choice format where a large number formats to "many", then the 115 * parse may not correspond to the originally formatted argument. 
116 * <LI>MessageFormat does not handle ChoiceFormat recursion during 117 * parsing; such parses will fail. 118 * <LI>Parsing will not always find a match (or the correct match) if 119 * some part of the parse is ambiguous. For example, if the pattern 120 * "{1},{2}" is used with the string arguments {"a,b", "c"}, it will 121 * format as "a,b,c". When the result is parsed, it will return {"a", 122 * "b,c"}. 123 * <LI>If a single argument is formatted more than once in the string, 124 * then the rightmost subformat in the pattern string will produce the 125 * parse result; prior subformats with the same argument index will 126 * have no effect. 127 * </UL> 128 * Here are some examples of usage: 129 * <P> 130 * Example 1: 131 * <pre> 132 * \code 133 * UErrorCode success = U_ZERO_ERROR; 134 * GregorianCalendar cal(success); 135 * Formattable arguments[] = { 136 * 7L, 137 * Formattable( (Date) cal.getTime(success), Formattable::kIsDate), 138 * "a disturbance in the Force" 139 * }; 140 * 141 * UnicodeString result; 142 * MessageFormat::format( 143 * "At {1,time} on {1,date}, there was {2} on planet {0,number}.", 144 * arguments, 3, result, success ); 145 * 146 * cout << "result: " << result << endl; 147 * //<output>: At 4:34:20 PM on 23-Mar-98, there was a disturbance 148 * // in the Force on planet 7. 149 * \endcode 150 * </pre> 151 * Typically, the message format will come from resources, and the 152 * arguments will be dynamically set at runtime. 153 * <P> 154 * Example 2: 155 * <pre> 156 * \code 157 * success = U_ZERO_ERROR; 158 * Formattable testArgs[] = {3L, "MyDisk"}; 159 * 160 * MessageFormat form( 161 * "The disk \"{1}\" contains {0} file(s).", success ); 162 * 163 * UnicodeString string; 164 * FieldPosition fpos = 0; 165 * cout << "format: " << form.format(testArgs, 2, string, fpos, success ) << endl; 166 * 167 * // output, with different testArgs: 168 * // output: The disk "MyDisk" contains 0 file(s). 169 * // output: The disk "MyDisk" contains 1 file(s). 
170 * // output: The disk "MyDisk" contains 1,273 file(s). 171 * \endcode 172 * </pre> 173 * 174 * The pattern is of the following form. Legend: 175 * <pre> 176 * \code 177 * {optional item} 178 * (group that may be repeated)* 179 * \endcode 180 * </pre> 181 * Do not confuse optional items with items inside quoted braces, such 182 * as this: "{". Quoted braces are literals. 183 * <pre> 184 * \code 185 * messageFormatPattern := string ( "{" messageFormatElement "}" string )* 186 * 187 * messageFormatElement := argumentIndex | argumentName { "," elementFormat } 188 * 189 * elementFormat := "time" { "," datetimeStyle } 190 * | "date" { "," datetimeStyle } 191 * | "number" { "," numberStyle } 192 * | "choice" "," choiceStyle 193 * | "spellout" { "," spelloutStyle } 194 * | "ordinal" { "," spelloutStyle } 195 * | "duration" { "," spelloutStyle } 196 * | "plural" "," pluralStyle 197 * | "select" "," selectStyle 198 * 199 * datetimeStyle := "short" 200 * | "medium" 201 * | "long" 202 * | "full" 203 * | dateFormatPattern 204 * 205 * numberStyle := "currency" 206 * | "percent" 207 * | "integer" 208 * | numberFormatPattern 209 * 210 * choiceStyle := choiceFormatPattern 211 * 212 * pluralStyle := pluralFormatPattern 213 * 214 * selectStyle := selectFormatPattern 215 * 216 * spelloutStyle := ruleSetName 217 * \endcode 218 * </pre> 219 * If there is no elementFormat, then the argument must be a string, 220 * which is substituted. If there is no datetimeStyle or numberStyle, 221 * then the default format is used (e.g. NumberFormat::createInstance(), 222 * DateFormat::createTimeInstance(DateFormat::kDefault, ...) or 223 * DateFormat::createDateInstance(DateFormat::kDefault, ...)). For 224 * a RuleBasedNumberFormat, if there is no ruleSetName, the default 225 * rule set is used. For a ChoiceFormat, PluralFormat, or SelectFormat, the pattern 226 * must always be specified, since there is no default. 227 * <P> 228 * In strings, single quotes can be used to quote syntax characters. 
229 * A literal single quote is represented by '', both within and outside 230 * of single-quoted segments. Inside a 231 * messageFormatElement, quotes are <EM>not</EM> removed. For example, 232 * {1,number,$'#',##} will produce a number format with the pound-sign 233 * quoted, with a result such as: "$#31,45". 234 * <P> 235 * If a pattern is used, then unquoted braces in the pattern, if any, 236 * must match: that is, "ab {0} de" and "ab '}' de" are ok, but "ab 237 * {0'}' de" and "ab } de" are not. 238 * <p> 239 * <dl><dt><b>Warning:</b><dd>The rules for using quotes within message 240 * format patterns unfortunately have shown to be somewhat confusing. 241 * In particular, it isn't always obvious to localizers whether single 242 * quotes need to be doubled or not. Make sure to inform localizers about 243 * the rules, and tell them (for example, by using comments in resource 244 * bundle source files) which strings will be processed by MessageFormat. 245 * Note that localizers may need to use single quotes in translated 246 * strings where the original version doesn't have them. 247 * <br>Note also that the simplest way to avoid the problem is to 248 * use the real apostrophe (single quote) character U+2019 (') for 249 * human-readable text, and to use the ASCII apostrophe (U+0027 ' ) 250 * only in program syntax, like quoting in MessageFormat. 251 * See the annotations for U+0027 Apostrophe in The Unicode Standard.</p> 252 * </dl> 253 * <P> 254 * The argumentIndex is a non-negative integer, which corresponds to the 255 * index of the arguments presented in an array to be formatted. The 256 * first argument has argumentIndex 0. 257 * <P> 258 * It is acceptable to have unused arguments in the array. With missing 259 * arguments, or arguments that are not of the right class for the 260 * specified format, a failing UErrorCode result is set. 
261 * <P> 262 * <strong>When creating internationalized messages that include plural forms, you 263 * can use a PluralFormat:</strong> 264 * <pre> 265 * \code 266 * UErrorCode err = U_ZERO_ERROR; 267 * UnicodeString t1("{0, plural, one{C''est # fichier} other{Ce sont # fichiers}} dans la liste."); 268 * MessageFormat* msgFmt = new MessageFormat(t1, Locale("fr"), err); 269 * if (U_FAILURE(err)) { 270 * return err; 271 * } 272 * 273 * Formattable args1[] = {(int32_t)0}; 274 * Formattable args2[] = {(int32_t)3}; 275 * FieldPosition ignore(FieldPosition::DONT_CARE); 276 * UnicodeString result; 277 * msgFmt->format(args1, 1, result, ignore, err); 278 * cout << result << endl; 279 * result.remove(); 280 * msgFmt->format(args2, 1, result, ignore, err); 281 * cout << result << endl; 282 * 283 * // output, with different args 284 * // output: C'est 0,0 fichier dans la liste. 285 * // output: Ce sont 3 fichiers dans la liste. 286 * \endcode 287 * </pre> 288 * Please check PluralFormat and PluralRules for details. 289 * </P> 290 */ 291 class U_I18N_API MessageFormat : public Format { 292 public: 293 /** 294 * Enum type for kMaxFormat. 295 * @obsolete ICU 3.0. The 10-argument limit was removed as of ICU 2.6, 296 * rendering this enum type obsolete. 297 */ 298 enum EFormatNumber { 299 /** 300 * The maximum number of arguments. 301 * @obsolete ICU 3.0. The 10-argument limit was removed as of ICU 2.6, 302 * rendering this constant obsolete. 303 */ 304 kMaxFormat = 10 305 }; 306 307 /** 308 * Constructs a new MessageFormat using the given pattern and the 309 * default locale. 310 * 311 * @param pattern Pattern used to construct object. 312 * @param status Input/output error code. If the 313 * pattern cannot be parsed, set to failure code. 314 * @stable ICU 2.0 315 */ 316 MessageFormat(const UnicodeString& pattern, 317 UErrorCode &status); 318 319 /** 320 * Constructs a new MessageFormat using the given pattern and locale. 321 * @param pattern Pattern used to construct object. 
322 * @param newLocale The locale to use for formatting dates and numbers. 323 * @param status Input/output error code. If the 324 * pattern cannot be parsed, set to failure code. 325 * @stable ICU 2.0 326 */ 327 MessageFormat(const UnicodeString& pattern, 328 const Locale& newLocale, 329 UErrorCode& status); 330 /** 331 * Constructs a new MessageFormat using the given pattern and locale. 332 * @param pattern Pattern used to construct object. 333 * @param newLocale The locale to use for formatting dates and numbers. 334 * @param parseError Struct to receive information on position 335 * of error within the pattern. 336 * @param status Input/output error code. If the 337 * pattern cannot be parsed, set to failure code. 338 * @stable ICU 2.0 339 */ 340 MessageFormat(const UnicodeString& pattern, 341 const Locale& newLocale, 342 UParseError& parseError, 343 UErrorCode& status); 344 /** 345 * Constructs a new MessageFormat from an existing one. 346 * @stable ICU 2.0 347 */ 348 MessageFormat(const MessageFormat&); 349 350 /** 351 * Assignment operator. 352 * @stable ICU 2.0 353 */ 354 const MessageFormat& operator=(const MessageFormat&); 355 356 /** 357 * Destructor. 358 * @stable ICU 2.0 359 */ 360 virtual ~MessageFormat(); 361 362 /** 363 * Clones this Format object polymorphically. The caller owns the 364 * result and should delete it when done. 365 * @stable ICU 2.0 366 */ 367 virtual Format* clone(void) const; 368 369 /** 370 * Returns true if the given Format objects are semantically equal. 371 * Objects of different subclasses are considered unequal. 372 * @param other the object to be compared with. 373 * @return true if the given Format objects are semantically equal. 374 * @stable ICU 2.0 375 */ 376 virtual UBool operator==(const Format& other) const; 377 378 /** 379 * Sets the locale. This locale is used for fetching default number or date 380 * format information. 381 * @param theLocale the new locale value to be set. 
382 * @stable ICU 2.0 383 */ 384 virtual void setLocale(const Locale& theLocale); 385 386 /** 387 * Gets the locale. This locale is used for fetching default number or date 388 * format information. 389 * @return the locale of the object. 390 * @stable ICU 2.0 391 */ 392 virtual const Locale& getLocale(void) const; 393 394 /** 395 * Applies the given pattern string to this message format. 396 * 397 * @param pattern The pattern to be applied. 398 * @param status Input/output error code. If the 399 * pattern cannot be parsed, set to failure code. 400 * @stable ICU 2.0 401 */ 402 virtual void applyPattern(const UnicodeString& pattern, 403 UErrorCode& status); 404 /** 405 * Applies the given pattern string to this message format. 406 * 407 * @param pattern The pattern to be applied. 408 * @param parseError Struct to receive information on position 409 * of error within the pattern. 410 * @param status Input/output error code. If the 411 * pattern cannot be parsed, set to failure code. 412 * @stable ICU 2.0 413 */ 414 virtual void applyPattern(const UnicodeString& pattern, 415 UParseError& parseError, 416 UErrorCode& status); 417 418 /** 419 * Returns a pattern that can be used to recreate this object. 420 * 421 * @param appendTo Output parameter to receive the pattern. 422 * Result is appended to existing contents. 423 * @return Reference to 'appendTo' parameter. 424 * @stable ICU 2.0 425 */ 426 virtual UnicodeString& toPattern(UnicodeString& appendTo) const; 427 428 /** 429 * Sets subformats. 430 * See the class description about format numbering. 431 * The caller should not delete the Format objects after this call. 432 * <EM>The array formatsToAdopt is not itself adopted.</EM> Its 433 * ownership is retained by the caller. If the call fails because 434 * memory cannot be allocated, then the formats will be deleted 435 * by this method, and this object will remain unchanged. 
436 * 437 * <p>If this format uses named arguments, the new formats are discarded 438 * and this format remains unchanged. 439 * 440 * @stable ICU 2.0 441 * @param formatsToAdopt the format to be adopted. 442 * @param count the size of the array. 443 */ 444 virtual void adoptFormats(Format** formatsToAdopt, int32_t count); 445 446 /** 447 * Sets subformats. 448 * See the class description about format numbering. 449 * Each item in the array is cloned into the internal array. 450 * If the call fails because memory cannot be allocated, then this 451 * object will remain unchanged. 452 * 453 * <p>If this format uses named arguments, the new formats are discarded 454 * and this format remains unchanged. 455 * 456 * @stable ICU 2.0 457 * @param newFormats the new format to be set. 458 * @param cnt the size of the array. 459 */ 460 virtual void setFormats(const Format** newFormats, int32_t cnt); 461 462 463 /** 464 * Sets one subformat. 465 * See the class description about format numbering. 466 * The caller should not delete the Format object after this call. 467 * If the number is over the number of formats already set, 468 * the item will be deleted and ignored. 469 * 470 * <p>If this format uses named arguments, the new format is discarded 471 * and this format remains unchanged. 472 * 473 * @stable ICU 2.0 474 * @param formatNumber index of the subformat. 475 * @param formatToAdopt the format to be adopted. 476 */ 477 virtual void adoptFormat(int32_t formatNumber, Format* formatToAdopt); 478 479 /** 480 * Sets one subformat. 481 * See the class description about format numbering. 482 * If the number is over the number of formats already set, 483 * the item will be ignored. 484 * @param formatNumber index of the subformat. 485 * @param format the format to be set. 486 * @stable ICU 2.0 487 */ 488 virtual void setFormat(int32_t formatNumber, const Format& format); 489 490 /** 491 * Gets format names. 
This function returns formatNames in StringEnumerations 492 * which can be used with getFormat() and setFormat() to export formattable 493 * array from current MessageFormat to another. It is the caller's responsibility 494 * to delete the returned formatNames. 495 * @param status output param set to success/failure code. 496 * @stable ICU 4.0 497 */ 498 virtual StringEnumeration* getFormatNames(UErrorCode& status); 499 500 /** 501 * Gets subformat pointer for given format name. 502 * This function supports both named and numbered 503 * arguments-- if numbered, the formatName is the 504 * corresponding UnicodeStrings (e.g. "0", "1", "2"...). 505 * The returned Format object should not be deleted by the caller, 506 * nor should the pointer of other object. The pointer and its 507 * contents remain valid only until the next call to any method 508 * of this class is made with this object. 509 * @param formatName the name or number specifying a format 510 * @param status output param set to success/failure code. 511 * @stable ICU 4.0 512 */ 513 virtual Format* getFormat(const UnicodeString& formatName, UErrorCode& status); 514 515 /** 516 * Sets one subformat for given format name. 517 * See the class description about format name. 518 * This function supports both named and numbered 519 * arguments-- if numbered, the formatName is the 520 * corresponding UnicodeStrings (e.g. "0", "1", "2"...). 521 * If there is no matched formatName or wrong type, 522 * the item will be ignored. 523 * @param formatName Name of the subformat. 524 * @param format the format to be set. 525 * @param status output param set to success/failure code. 526 * @stable ICU 4.0 527 */ 528 virtual void setFormat(const UnicodeString& formatName, const Format& format, UErrorCode& status); 529 530 /** 531 * Sets one subformat for given format name. 532 * See the class description about format name. 
533 * This function supports both named and numbered 534 * arguments-- if numbered, the formatName is the 535 * corresponding UnicodeStrings (e.g. "0", "1", "2"...). 536 * If there is no matched formatName or wrong type, 537 * the item will be ignored. 538 * The caller should not delete the Format object after this call. 539 * @param formatName Name of the subformat. 540 * @param formatToAdopt Format to be adopted. 541 * @param status output param set to success/failure code. 542 * @stable ICU 4.0 543 */ 544 virtual void adoptFormat(const UnicodeString& formatName, Format* formatToAdopt, UErrorCode& status); 545 546 /** 547 * Gets an array of subformats of this object. The returned array 548 * should not be deleted by the caller, nor should the pointers 549 * within the array. The array and its contents remain valid only 550 * until the next call to this format. See the class description 551 * about format numbering. 552 * 553 * @param count output parameter to receive the size of the array 554 * @return an array of count Format* objects, or NULL if out of 555 * memory. Any or all of the array elements may be NULL. 556 * @stable ICU 2.0 557 */ 558 virtual const Format** getFormats(int32_t& count) const; 559 560 561 using Format::format; 562 563 /** 564 * Formats the given array of arguments into a user-readable string. 565 * Does not take ownership of the Formattable* array or its contents. 566 * 567 * <p>If this format uses named arguments, appendTo is unchanged and 568 * status is set to U_ILLEGAL_ARGUMENT_ERROR. 569 * 570 * @param source An array of objects to be formatted. 571 * @param count The number of elements of 'source'. 572 * @param appendTo Output parameter to receive result. 573 * Result is appended to existing contents. 574 * @param ignore Not used; inherited from base class API. 575 * @param status Input/output error code. If the 576 * pattern cannot be parsed, set to failure code. 577 * @return Reference to 'appendTo' parameter. 
578 * @stable ICU 2.0 579 */ 580 UnicodeString& format(const Formattable* source, 581 int32_t count, 582 UnicodeString& appendTo, 583 FieldPosition& ignore, 584 UErrorCode& status) const; 585 586 /** 587 * Formats the given array of arguments into a user-readable string 588 * using the given pattern. 589 * 590 * <p>If this format uses named arguments, appendTo is unchanged and 591 * status is set to U_ILLEGAL_ARGUMENT_ERROR. 592 * 593 * @param pattern The pattern. 594 * @param arguments An array of objects to be formatted. 595 * @param count The number of elements of 'source'. 596 * @param appendTo Output parameter to receive result. 597 * Result is appended to existing contents. 598 * @param status Input/output error code. If the 599 * pattern cannot be parsed, set to failure code. 600 * @return Reference to 'appendTo' parameter. 601 * @stable ICU 2.0 602 */ 603 static UnicodeString& format(const UnicodeString& pattern, 604 const Formattable* arguments, 605 int32_t count, 606 UnicodeString& appendTo, 607 UErrorCode& status); 608 609 /** 610 * Formats the given array of arguments into a user-readable 611 * string. The array must be stored within a single Formattable 612 * object of type kArray. If the Formattable object type is not of 613 * type kArray, then returns a failing UErrorCode. 614 * 615 * <p>If this format uses named arguments, appendTo is unchanged and 616 * status is set to U_ILLEGAL_ARGUMENT_ERROR. 617 * 618 * @param obj A Formattable of type kArray containing 619 * arguments to be formatted. 620 * @param appendTo Output parameter to receive result. 621 * Result is appended to existing contents. 622 * @param pos On input: an alignment field, if desired. 623 * On output: the offsets of the alignment field. 624 * @param status Input/output error code. If the 625 * pattern cannot be parsed, set to failure code. 626 * @return Reference to 'appendTo' parameter. 
627 * @stable ICU 2.0 628 */ 629 virtual UnicodeString& format(const Formattable& obj, 630 UnicodeString& appendTo, 631 FieldPosition& pos, 632 UErrorCode& status) const; 633 634 /** 635 * Formats the given array of arguments into a user-readable 636 * string. The array must be stored within a single Formattable 637 * object of type kArray. If the Formattable object type is not of 638 * type kArray, then returns a failing UErrorCode. 639 * 640 * @param obj The object to format 641 * @param appendTo Output parameter to receive result. 642 * Result is appended to existing contents. 643 * @param status Input/output error code. If the 644 * pattern cannot be parsed, set to failure code. 645 * @return Reference to 'appendTo' parameter. 646 * @stable ICU 2.0 647 */ 648 UnicodeString& format(const Formattable& obj, 649 UnicodeString& appendTo, 650 UErrorCode& status) const; 651 652 653 /** 654 * Formats the given array of arguments into a user-defined argument name 655 * array. This function supports both named and numbered 656 * arguments-- if numbered, the formatName is the 657 * corresponding UnicodeStrings (e.g. "0", "1", "2"...). 658 * 659 * @param argumentNames argument name array 660 * @param arguments An array of objects to be formatted. 661 * @param count The number of elements of 'argumentNames' and 662 * arguments. The number of argumentNames and arguments 663 * must be the same. 664 * @param appendTo Output parameter to receive result. 665 * Result is appended to existing contents. 666 * @param status Input/output error code. If the 667 * pattern cannot be parsed, set to failure code. 668 * @return Reference to 'appendTo' parameter. 669 * @stable ICU 4.0 670 */ 671 UnicodeString& format(const UnicodeString* argumentNames, 672 const Formattable* arguments, 673 int32_t count, 674 UnicodeString& appendTo, 675 UErrorCode& status) const; 676 /** 677 * Parses the given string into an array of output arguments. 678 * 679 * @param source String to be parsed. 
680 * @param pos On input, starting position for parse. On output, 681 * final position after parse. Unchanged if parse 682 * fails. 683 * @param count Output parameter to receive the number of arguments 684 * parsed. 685 * @return an array of parsed arguments. The caller owns both 686 * the array and its contents. 687 * @stable ICU 2.0 688 */ 689 virtual Formattable* parse(const UnicodeString& source, 690 ParsePosition& pos, 691 int32_t& count) const; 692 693 /** 694 * Parses the given string into an array of output arguments. 695 * 696 * <p>If this format uses named arguments, status is set to 697 * U_ARGUMENT_TYPE_MISMATCH. 698 * 699 * @param source String to be parsed. 700 * @param count Output param to receive size of returned array. 701 * @param status Input/output error code. If the 702 * pattern cannot be parsed, set to failure code. 703 * @return an array of parsed arguments. The caller owns both 704 * the array and its contents. Returns NULL if status is not U_ZERO_ERROR. 705 * 706 * @stable ICU 2.0 707 */ 708 virtual Formattable* parse(const UnicodeString& source, 709 int32_t& count, 710 UErrorCode& status) const; 711 712 /** 713 * Parses the given string into an array of output arguments 714 * stored within a single Formattable of type kArray. 715 * 716 * @param source The string to be parsed into an object. 717 * @param result Formattable to be set to the parse result. 718 * If parse fails, return contents are undefined. 719 * @param pos On input, starting position for parse. On output, 720 * final position after parse. Unchanged if parse 721 * fails. 722 * @stable ICU 2.0 723 */ 724 virtual void parseObject(const UnicodeString& source, 725 Formattable& result, 726 ParsePosition& pos) const; 727 728 /** 729 * Convert an 'apostrophe-friendly' pattern into a standard 730 * pattern. Standard patterns treat all apostrophes as 731 * quotes, which is problematic in some languages, e.g. 732 * French, where apostrophe is commonly used. 
This utility 733 * assumes that only an unpaired apostrophe immediately before 734 * a brace is a true quote. Other unpaired apostrophes are paired, 735 * and the resulting standard pattern string is returned. 736 * 737 * <p><b>Note</b> it is not guaranteed that the returned pattern 738 * is indeed a valid pattern. The only effect is to convert 739 * between patterns having different quoting semantics. 740 * 741 * @param pattern the 'apostrophe-friendly' pattern to convert 742 * @param status Input/output error code. If the pattern 743 * cannot be parsed, the failure code is set. 744 * @return the standard equivalent of the original pattern 745 * @stable ICU 3.4 746 */ 747 static UnicodeString autoQuoteApostrophe(const UnicodeString& pattern, 748 UErrorCode& status); 749 750 /** 751 * Returns true if this MessageFormat uses named arguments, 752 * and false otherwise. See class description. 753 * 754 * @return true if named arguments are used. 755 * @stable ICU 4.0 756 */ 757 UBool usesNamedArguments() const; 758 759 760 /** 761 * This API is for ICU internal use only. 762 * Please do not use it. 763 * 764 * Returns argument types count in the parsed pattern. 765 * Used to distinguish pattern "{0} d" and "d". 766 * 767 * @return The number of formattable types in the pattern 768 * @internal 769 */ 770 int32_t getArgTypeCount() const; 771 772 /** 773 * Returns a unique class ID POLYMORPHICALLY. Pure virtual override. 774 * This method is to implement a simple version of RTTI, since not all 775 * C++ compilers support genuine RTTI. Polymorphic operator==() and 776 * clone() methods call this method. 777 * 778 * @return The class ID for this object. All objects of a 779 * given class have the same class ID. Objects of 780 * other classes have different class IDs. 781 * @stable ICU 2.0 782 */ 783 virtual UClassID getDynamicClassID(void) const; 784 785 /** 786 * Return the class ID for this class. 
This is useful only for 787 * comparing to a return value from getDynamicClassID(). For example: 788 * <pre> 789 * . Base* polymorphic_pointer = createPolymorphicObject(); 790 * . if (polymorphic_pointer->getDynamicClassID() == 791 * . Derived::getStaticClassID()) ... 792 * </pre> 793 * @return The class ID for all objects of this class. 794 * @stable ICU 2.0 795 */ 796 static UClassID U_EXPORT2 getStaticClassID(void); 797 798 private: 799 800 Locale fLocale; 801 UnicodeString fPattern; 802 Format** formatAliases; // see getFormats 803 int32_t formatAliasesCapacity; 804 UProperty idStart; 805 UProperty idContinue; 806 807 MessageFormat(); // default constructor not implemented 808 809 /* 810 * A structure representing one subformat of this MessageFormat. 811 * Each subformat has a Format object, an offset into the plain 812 * pattern text fPattern, and an argument number. The argument 813 * number corresponds to the array of arguments to be formatted. 814 * @internal 815 */ 816 class Subformat; 817 818 /** 819 * A MessageFormat contains an array of subformats. This array 820 * needs to grow dynamically if the MessageFormat is modified. 821 */ 822 Subformat* subformats; 823 int32_t subformatCount; 824 int32_t subformatCapacity; 825 826 /** 827 * A MessageFormat formats an array of arguments. Each argument 828 * has an expected type, based on the pattern. For example, if 829 * the pattern contains the subformat "{3,number,integer}", then 830 * we expect argument 3 to have type Formattable::kLong. This 831 * array needs to grow dynamically if the MessageFormat is 832 * modified. 833 */ 834 Formattable::Type* argTypes; 835 int32_t argTypeCount; 836 int32_t argTypeCapacity; 837 838 /** 839 * Is true iff all argument names are non-negative numbers. 
840 * 841 */ 842 UBool isArgNumeric; 843 844 // Variable-size array management 845 UBool allocateSubformats(int32_t capacity); 846 UBool allocateArgTypes(int32_t capacity); 847 848 /** 849 * Default Format objects used when no format is specified and a 850 * numeric or date argument is formatted. These are volatile 851 * cache objects maintained only for performance. They do not 852 * participate in operator=(), copy constructor(), nor 853 * operator==(). 854 */ 855 NumberFormat* defaultNumberFormat; 856 DateFormat* defaultDateFormat; 857 858 /** 859 * Method to retrieve default formats (or NULL on failure). 860 * These are semantically const, but may modify *this. 861 */ 862 const NumberFormat* getDefaultNumberFormat(UErrorCode&) const; 863 const DateFormat* getDefaultDateFormat(UErrorCode&) const; 864 865 /** 866 * Finds the word s, in the keyword list and returns the located index. 867 * @param s the keyword to be searched for. 868 * @param list the list of keywords to be searched with. 869 * @return the index of the list which matches the keyword s. 870 */ 871 static int32_t findKeyword( const UnicodeString& s, 872 const UChar * const *list); 873 874 /** 875 * Formats the array of arguments and copies the result into the 876 * result buffer, updates the field position. 877 * 878 * @param arguments The formattable objects array. 879 * @param cnt The array count. 880 * @param appendTo Output parameter to receive result. 881 * Result is appended to existing contents. 882 * @param status Field position status. 883 * @param recursionProtection 884 * Initially zero. Bits 0..9 are used to indicate 885 * that a parameter has already been seen, to 886 * avoid recursion. Currently unused. 887 * @param success The error code status. 888 * @return Reference to 'appendTo' parameter. 
889 */ 890 UnicodeString& format( const Formattable* arguments, 891 int32_t cnt, 892 UnicodeString& appendTo, 893 FieldPosition& status, 894 int32_t recursionProtection, 895 UErrorCode& success) const; 896 897 UnicodeString& format( const Formattable* arguments, 898 const UnicodeString *argumentNames, 899 int32_t cnt, 900 UnicodeString& appendTo, 901 FieldPosition& status, 902 int32_t recursionProtection, 903 UErrorCode& success) const; 904 905 void makeFormat(int32_t offsetNumber, 906 UnicodeString* segments, 907 UParseError& parseError, 908 UErrorCode& success); 909 910 /** 911 * Convenience method that ought to be in NumberFormat 912 */ 913 NumberFormat* createIntegerFormat(const Locale& locale, UErrorCode& status) const; 914 915 /** 916 * Checks the range of the source text to quote the special 917 * characters, { and ' and copy to target buffer. 918 * @param source 919 * @param start the text offset to start the process of in the source string 920 * @param end the text offset to end the process of in the source string 921 * @param appendTo Output parameter to receive result. 922 * Result is appended to existing contents. 923 */ 924 static void copyAndFixQuotes(const UnicodeString& appendTo, int32_t start, int32_t end, UnicodeString& target); 925 926 /** 927 * Returns array of argument types in the parsed pattern 928 * for use in C API. Only for the use of umsg_vformat(). Not 929 * for public consumption. 930 * @param listCount Output parameter to receive the size of array 931 * @return The array of formattable types in the pattern 932 * @internal 933 */ 934 const Formattable::Type* getArgTypeList(int32_t& listCount) const { 935 listCount = argTypeCount; 936 return argTypes; 937 } 938 939 /** 940 * Returns FALSE if the argument name is not legal. 941 * @param argName argument name. 942 * @return TRUE if the argument name is legal, otherwise return FALSE. 
943 */ 944 UBool isLegalArgName(const UnicodeString& argName) const; 945 946 friend class MessageFormatAdapter; // getFormatTypeList() access 947 }; 948 949 inline UnicodeString& 950 MessageFormat::format(const Formattable& obj, 951 UnicodeString& appendTo, 952 UErrorCode& status) const { 953 return Format::format(obj, appendTo, status); 954 } 955 956 U_NAMESPACE_END 957 958 #endif /* #if !UCONFIG_NO_FORMATTING */ 959 960 #endif // _MSGFMT 961 //eof 962