Home | History | Annotate | Download | only in unicode
      1 //  2016 and later: Unicode, Inc. and others.
      2 // License & terms of use: http://www.unicode.org/copyright.html
      3 /*
      4 ********************************************************************************
      5 *   Copyright (C) 1997-2016, International Business Machines
      6 *   Corporation and others.  All Rights Reserved.
      7 ********************************************************************************
      8 *
      9 * File DCFMTSYM.H
     10 *
     11 * Modification History:
     12 *
     13 *   Date        Name        Description
     14 *   02/19/97    aliu        Converted from java.
     15 *   03/18/97    clhuang     Updated per C++ implementation.
     16 *   03/27/97    helena      Updated to pass the simple test after code review.
     17 *   08/26/97    aliu        Added currency/intl currency symbol support.
     18 *   07/22/98    stephen     Changed to match C++ style
     19 *                            currencySymbol -> fCurrencySymbol
     20 *                            Constants changed from CAPS to kCaps
     21 *   06/24/99    helena      Integrated Alan's NF enhancements and Java2 bug fixes
     22 *   09/22/00    grhoten     Marked deprecation tags with a pointer to replacement
     23 *                            functions.
     24 ********************************************************************************
     25 */
     26 
     27 #ifndef DCFMTSYM_H
     28 #define DCFMTSYM_H
     29 
     30 #include "unicode/utypes.h"
     31 #include "unicode/uchar.h"
     32 
     33 #if !UCONFIG_NO_FORMATTING
     34 
     35 #include "unicode/uobject.h"
     36 #include "unicode/locid.h"
     37 #include "unicode/numsys.h"
     38 #include "unicode/unum.h"
     39 #include "unicode/unistr.h"
     40 
     41 /**
     42  * \file
     43  * \brief C++ API: Symbols for formatting numbers.
     44  */
     45 
     46 
     47 U_NAMESPACE_BEGIN
     48 
     49 /**
     50  * This class represents the set of symbols needed by DecimalFormat
     51  * to format numbers. DecimalFormat creates for itself an instance of
     52  * DecimalFormatSymbols from its locale data.  If you need to change any
     53  * of these symbols, you can get the DecimalFormatSymbols object from
     54  * your DecimalFormat and modify it.
     55  * <P>
     56  * Here are the special characters used in the parts of the
     57  * subpattern, with notes on their usage.
     58  * <pre>
     59  * \code
     60  *        Symbol   Meaning
     61  *          0      a digit
     62  *          #      a digit, zero shows as absent
     63  *          .      placeholder for decimal separator
     64  *          ,      placeholder for grouping separator.
     65  *          ;      separates formats.
     66  *          -      default negative prefix.
     67  *          %      divide by 100 and show as percentage
     68  *          X      any other characters can be used in the prefix or suffix
     69  *          '      used to quote special characters in a prefix or suffix.
     70  * \endcode
     71  *  </pre>
     72  * [Notes]
     73  * <P>
     74  * If there is no explicit negative subpattern, - is prefixed to the
     75  * positive form. That is, "0.00" alone is equivalent to "0.00;-0.00".
     76  * <P>
     77  * The grouping separator is commonly used for thousands, but in some
     78  * countries for ten-thousands. The interval is a constant number of
     79  * digits between the grouping characters, such as 100,000,000 or 1,0000,0000.
     80  * If you supply a pattern with multiple grouping characters, the interval
     81  * between the last one and the end of the integer is the one that is
     82  * used. So "#,##,###,####" == "######,####" == "##,####,####".
     83  */
     84 class U_I18N_API DecimalFormatSymbols : public UObject {
     85 public:
     86     /**
     87      * Constants for specifying a number format symbol.
     88      * @stable ICU 2.0
     89      */
     90     enum ENumberFormatSymbol {
     91         /** The decimal separator */
     92         kDecimalSeparatorSymbol,
     93         /** The grouping separator */
     94         kGroupingSeparatorSymbol,
     95         /** The pattern separator */
     96         kPatternSeparatorSymbol,
     97         /** The percent sign */
     98         kPercentSymbol,
     99         /** Zero*/
    100         kZeroDigitSymbol,
    101         /** Character representing a digit in the pattern */
    102         kDigitSymbol,
    103         /** The minus sign */
    104         kMinusSignSymbol,
    105         /** The plus sign */
    106         kPlusSignSymbol,
    107         /** The currency symbol */
    108         kCurrencySymbol,
    109         /** The international currency symbol */
    110         kIntlCurrencySymbol,
    111         /** The monetary separator */
    112         kMonetarySeparatorSymbol,
    113         /** The exponential symbol */
    114         kExponentialSymbol,
    115         /** Per mill symbol - replaces kPermillSymbol */
    116         kPerMillSymbol,
    117         /** Escape padding character */
    118         kPadEscapeSymbol,
    119         /** Infinity symbol */
    120         kInfinitySymbol,
    121         /** Nan symbol */
    122         kNaNSymbol,
    123         /** Significant digit symbol
    124          * @stable ICU 3.0 */
    125         kSignificantDigitSymbol,
    126         /** The monetary grouping separator
    127          * @stable ICU 3.6
    128          */
    129         kMonetaryGroupingSeparatorSymbol,
    130         /** One
    131          * @stable ICU 4.6
    132          */
    133         kOneDigitSymbol,
    134         /** Two
    135          * @stable ICU 4.6
    136          */
    137         kTwoDigitSymbol,
    138         /** Three
    139          * @stable ICU 4.6
    140          */
    141         kThreeDigitSymbol,
    142         /** Four
    143          * @stable ICU 4.6
    144          */
    145         kFourDigitSymbol,
    146         /** Five
    147          * @stable ICU 4.6
    148          */
    149         kFiveDigitSymbol,
    150         /** Six
    151          * @stable ICU 4.6
    152          */
    153         kSixDigitSymbol,
    154         /** Seven
    155          * @stable ICU 4.6
    156          */
    157         kSevenDigitSymbol,
    158         /** Eight
    159          * @stable ICU 4.6
    160          */
    161         kEightDigitSymbol,
    162         /** Nine
    163          * @stable ICU 4.6
    164          */
    165         kNineDigitSymbol,
    166         /** Multiplication sign.
    167          * @stable ICU 54
    168          */
    169         kExponentMultiplicationSymbol,
    170         /** count symbol constants */
    171         kFormatSymbolCount = kNineDigitSymbol + 2
    172     };
    173 
    174     /**
    175      * Create a DecimalFormatSymbols object for the given locale.
    176      *
    177      * @param locale    The locale to get symbols for.
    178      * @param status    Input/output parameter, set to success or
    179      *                  failure code upon return.
    180      * @stable ICU 2.0
    181      */
    182     DecimalFormatSymbols(const Locale& locale, UErrorCode& status);
    183 
    184     /**
    185      * Creates a DecimalFormatSymbols instance for the given locale with digits and symbols
    186      * corresponding to the given NumberingSystem.
    187      *
    188      * This constructor behaves equivalently to the normal constructor called with a locale having a
    189      * "numbers=xxxx" keyword specifying the numbering system by name.
    190      *
    191      * In this constructor, the NumberingSystem argument will be used even if the locale has its own
    192      * "numbers=xxxx" keyword.
    193      *
    194      * @param locale    The locale to get symbols for.
    195      * @param ns        The numbering system.
    196      * @param status    Input/output parameter, set to success or
    197      *                  failure code upon return.
    198      * @stable ICU 60
    199      */
    200     DecimalFormatSymbols(const Locale& locale, const NumberingSystem& ns, UErrorCode& status);
    201 
    202     /**
    203      * Create a DecimalFormatSymbols object for the default locale.
    204      * This constructor will not fail.  If the resource file data is
    205      * not available, it will use hard-coded last-resort data and
    206      * set status to U_USING_FALLBACK_ERROR.
    207      *
    208      * @param status    Input/output parameter, set to success or
    209      *                  failure code upon return.
    210      * @stable ICU 2.0
    211      */
    212     DecimalFormatSymbols(UErrorCode& status);
    213 
    214     /**
    215      * Creates a DecimalFormatSymbols object with last-resort data.
    216      * Intended for callers who cache the symbols data and
    217      * set all symbols on the resulting object.
    218      *
    219      * The last-resort symbols are similar to those for the root data,
    220      * except that the grouping separators are empty,
    221      * the NaN symbol is U+FFFD rather than "NaN",
    222      * and the CurrencySpacing patterns are empty.
    223      *
    224      * @param status    Input/output parameter, set to success or
    225      *                  failure code upon return.
    226      * @return last-resort symbols
    227      * @stable ICU 52
    228      */
    229     static DecimalFormatSymbols* createWithLastResortData(UErrorCode& status);
    230 
    231     /**
    232      * Copy constructor.
    233      * @stable ICU 2.0
    234      */
    235     DecimalFormatSymbols(const DecimalFormatSymbols&);
    236 
    237     /**
    238      * Assignment operator.
    239      * @stable ICU 2.0
    240      */
    241     DecimalFormatSymbols& operator=(const DecimalFormatSymbols&);
    242 
    243     /**
    244      * Destructor.
    245      * @stable ICU 2.0
    246      */
    247     virtual ~DecimalFormatSymbols();
    248 
    249     /**
    250      * Return true if another object is semantically equal to this one.
    251      *
    252      * @param other    the object to be compared with.
    253      * @return         true if another object is semantically equal to this one.
    254      * @stable ICU 2.0
    255      */
    256     UBool operator==(const DecimalFormatSymbols& other) const;
    257 
    258     /**
    259      * Return true if another object is semantically unequal to this one.
    260      *
    261      * @param other    the object to be compared with.
    262      * @return         true if another object is semantically unequal to this one.
    263      * @stable ICU 2.0
    264      */
    265     UBool operator!=(const DecimalFormatSymbols& other) const { return !operator==(other); }
    266 
    267     /**
    268      * Get one of the format symbols by its enum constant.
    269      * Each symbol is stored as a string so that graphemes
    270      * (characters with modifier letters) can be used.
    271      *
    272      * @param symbol    Constant to indicate a number format symbol.
    273      * @return    the format symbols by the param 'symbol'
    274      * @stable ICU 2.0
    275      */
    276     inline UnicodeString getSymbol(ENumberFormatSymbol symbol) const;
    277 
    278     /**
    279      * Set one of the format symbols by its enum constant.
    280      * Each symbol is stored as a string so that graphemes
    281      * (characters with modifier letters) can be used.
    282      *
    283      * @param symbol    Constant to indicate a number format symbol.
    284      * @param value     value of the format symbol
    285      * @param propogateDigits If false, setting the zero digit will not automatically set 1-9.
    286      *     The default behavior is to automatically set 1-9 if zero is being set and the value
    287      *     it is being set to corresponds to a known Unicode zero digit.
    288      * @stable ICU 2.0
    289      */
    290     void setSymbol(ENumberFormatSymbol symbol, const UnicodeString &value, const UBool propogateDigits);
    291 
    292     /**
    293      * Returns the locale for which this object was constructed.
    294      * @stable ICU 2.6
    295      */
    296     inline Locale getLocale() const;
    297 
    298     /**
    299      * Returns the locale for this object. Two flavors are available:
    300      * valid and actual locale.
    301      * @stable ICU 2.8
    302      */
    303     Locale getLocale(ULocDataLocaleType type, UErrorCode& status) const;
    304 
    305     /**
    306       * Get pattern string for 'CurrencySpacing' that can be applied to
    307       * currency format.
    308       * This API gets the CurrencySpacing data from ResourceBundle. The pattern can
    309       * be empty if there is no data from current locale and its parent locales.
    310       *
    311       * @param type :  UNUM_CURRENCY_MATCH, UNUM_CURRENCY_SURROUNDING_MATCH or UNUM_CURRENCY_INSERT.
    312       * @param beforeCurrency : true if the pattern is for before currency symbol.
    313       *                         false if the pattern is for after currency symbol.
    314       * @param status: Input/output parameter, set to success or
    315       *                  failure code upon return.
    316       * @return pattern string for currencyMatch, surroundingMatch or spaceInsert.
    317       *     Return empty string if there is no data for this locale and its parent
    318       *     locales.
    319       * @stable ICU 4.8
    320       */
    321      const UnicodeString& getPatternForCurrencySpacing(UCurrencySpacing type,
    322                                                  UBool beforeCurrency,
    323                                                  UErrorCode& status) const;
    324      /**
    325        * Set pattern string for 'CurrencySpacing' that can be applied to
    326        * currency format.
    327        *
    328        * @param type : UNUM_CURRENCY_MATCH, UNUM_CURRENCY_SURROUNDING_MATCH or UNUM_CURRENCY_INSERT.
    329        * @param beforeCurrency : true if the pattern is for before currency symbol.
    330        *                         false if the pattern is for after currency symbol.
    331        * @param pattern : pattern string to override current setting.
    332        * @stable ICU 4.8
    333        */
    334      void setPatternForCurrencySpacing(UCurrencySpacing type,
    335                                        UBool beforeCurrency,
    336                                        const UnicodeString& pattern);
    337 
    338     /**
    339      * ICU "poor man's RTTI", returns a UClassID for the actual class.
    340      *
    341      * @stable ICU 2.2
    342      */
    343     virtual UClassID getDynamicClassID() const;
    344 
    345     /**
    346      * ICU "poor man's RTTI", returns a UClassID for this class.
    347      *
    348      * @stable ICU 2.2
    349      */
    350     static UClassID U_EXPORT2 getStaticClassID();
    351 
    352 private:
    353     DecimalFormatSymbols();
    354 
    355     /**
    356      * Initializes the symbols from the LocaleElements resource bundle.
    357      * Note: The organization of LocaleElements badly needs to be
    358      * cleaned up.
    359      *
    360      * @param locale               The locale to get symbols for.
    361      * @param success              Input/output parameter, set to success or
    362      *                             failure code upon return.
    363      * @param useLastResortData    determine if use last resort data
    364      * @param ns                   The NumberingSystem to use; otherwise, fall
    365      *                             back to the locale.
    366      */
    367     void initialize(const Locale& locale, UErrorCode& success,
    368         UBool useLastResortData = FALSE, const NumberingSystem* ns = nullptr);
    369 
    370     /**
    371      * Initialize the symbols with default values.
    372      */
    373     void initialize();
    374 
    375     void setCurrencyForSymbols();
    376 
    377 public:
    378 
    379 #ifndef U_HIDE_INTERNAL_API
    380     /**
    381      * @internal For ICU use only
    382      */
    383     inline UBool isCustomCurrencySymbol() const {
    384         return fIsCustomCurrencySymbol;
    385     }
    386 
    387     /**
    388      * @internal For ICU use only
    389      */
    390     inline UBool isCustomIntlCurrencySymbol() const {
    391         return fIsCustomIntlCurrencySymbol;
    392     }
    393 
    394     /**
    395      * @internal For ICU use only
    396      */
    397     inline UChar32 getCodePointZero() const {
    398         return fCodePointZero;
    399     }
    400 #endif  /* U_HIDE_INTERNAL_API */
    401 
    402     /**
    403      * _Internal_ function - more efficient version of getSymbol,
    404      * returning a const reference to one of the symbol strings.
    405      * The returned reference becomes invalid when the symbol is changed
    406      * or when the DecimalFormatSymbols are destroyed.
    407      * Note: moved \#ifndef U_HIDE_INTERNAL_API after this, since this is needed for inline in DecimalFormat
    408      *
    409      * This is not currently stable API, but if you think it should be stable,
    410      * post a comment on the following ticket and the ICU team will take a look:
    411      * http://bugs.icu-project.org/trac/ticket/13580
    412      *
    413      * @param symbol Constant to indicate a number format symbol.
    414      * @return the format symbol by the param 'symbol'
    415      * @internal
    416      */
    417     inline const UnicodeString& getConstSymbol(ENumberFormatSymbol symbol) const;
    418 
    419 #ifndef U_HIDE_INTERNAL_API
    420     /**
    421      * Returns the const UnicodeString reference, like getConstSymbol,
    422      * corresponding to the digit with the given value.  This is equivalent
    423      * to accessing the symbol from getConstSymbol with the corresponding
    424      * key, such as kZeroDigitSymbol or kOneDigitSymbol.
    425      *
    426      * This is not currently stable API, but if you think it should be stable,
    427      * post a comment on the following ticket and the ICU team will take a look:
    428      * http://bugs.icu-project.org/trac/ticket/13580
    429      *
    430      * @param digit The digit, an integer between 0 and 9 inclusive.
    431      *              If outside the range 0 to 9, the zero digit is returned.
    432      * @return the format symbol for the given digit.
    433      * @internal This API is currently for ICU use only.
    434      */
    435     inline const UnicodeString& getConstDigitSymbol(int32_t digit) const;
    436 
    437     /**
    438      * Returns that pattern stored in currecy info. Internal API for use by NumberFormat API.
    439      * @internal
    440      */
    441     inline const char16_t* getCurrencyPattern(void) const;
    442 #endif  /* U_HIDE_INTERNAL_API */
    443 
    444 private:
    445     /**
    446      * Private symbol strings.
    447      * They are either loaded from a resource bundle or otherwise owned.
    448      * setSymbol() clones the symbol string.
    449      * Readonly aliases can only come from a resource bundle, so that we can always
    450      * use fastCopyFrom() with them.
    451      *
    452      * If DecimalFormatSymbols becomes subclassable and the status of fSymbols changes
    453      * from private to protected,
    454      * or when fSymbols can be set any other way that allows them to be readonly aliases
    455      * to non-resource bundle strings,
    456      * then regular UnicodeString copies must be used instead of fastCopyFrom().
    457      *
    458      * @internal
    459      */
    460     UnicodeString fSymbols[kFormatSymbolCount];
    461 
    462     /**
    463      * Non-symbol variable for getConstSymbol(). Always empty.
    464      * @internal
    465      */
    466     UnicodeString fNoSymbol;
    467 
    468     /**
    469      * Dealing with code points is faster than dealing with strings when formatting. Because of
    470      * this, we maintain a value containing the zero code point that is used whenever digitStrings
    471      * represents a sequence of ten code points in order.
    472      *
    473      * <p>If the value stored here is positive, it means that the code point stored in this value
    474      * corresponds to the digitStrings array, and codePointZero can be used instead of the
    475      * digitStrings array for the purposes of efficient formatting; if -1, then digitStrings does
    476      * *not* contain a sequence of code points, and it must be used directly.
    477      *
    478      * <p>It is assumed that codePointZero always shadows the value in digitStrings. codePointZero
    479      * should never be set directly; rather, it should be updated only when digitStrings mutates.
    480      * That is, the flow of information is digitStrings -> codePointZero, not the other way.
    481      */
    482     UChar32 fCodePointZero;
    483 
    484     Locale locale;
    485 
    486     char actualLocale[ULOC_FULLNAME_CAPACITY];
    487     char validLocale[ULOC_FULLNAME_CAPACITY];
    488     const char16_t* currPattern;
    489 
    490     UnicodeString currencySpcBeforeSym[UNUM_CURRENCY_SPACING_COUNT];
    491     UnicodeString currencySpcAfterSym[UNUM_CURRENCY_SPACING_COUNT];
    492     UBool fIsCustomCurrencySymbol;
    493     UBool fIsCustomIntlCurrencySymbol;
    494 };
    495 
    496 // -------------------------------------
    497 
    498 inline UnicodeString
    499 DecimalFormatSymbols::getSymbol(ENumberFormatSymbol symbol) const {
    500     const UnicodeString *strPtr;
    501     if(symbol < kFormatSymbolCount) {
    502         strPtr = &fSymbols[symbol];
    503     } else {
    504         strPtr = &fNoSymbol;
    505     }
    506     return *strPtr;
    507 }
    508 
    509 // See comments above for this function. Not hidden with #ifdef U_HIDE_INTERNAL_API
    510 inline const UnicodeString &
    511 DecimalFormatSymbols::getConstSymbol(ENumberFormatSymbol symbol) const {
    512     const UnicodeString *strPtr;
    513     if(symbol < kFormatSymbolCount) {
    514         strPtr = &fSymbols[symbol];
    515     } else {
    516         strPtr = &fNoSymbol;
    517     }
    518     return *strPtr;
    519 }
    520 
    521 #ifndef U_HIDE_INTERNAL_API
    522 inline const UnicodeString& DecimalFormatSymbols::getConstDigitSymbol(int32_t digit) const {
    523     if (digit < 0 || digit > 9) {
    524         digit = 0;
    525     }
    526     if (digit == 0) {
    527         return fSymbols[kZeroDigitSymbol];
    528     }
    529     ENumberFormatSymbol key = static_cast<ENumberFormatSymbol>(kOneDigitSymbol + digit - 1);
    530     return fSymbols[key];
    531 }
    532 #endif /* U_HIDE_INTERNAL_API */
    533 
    534 // -------------------------------------
    535 
    536 inline void
    537 DecimalFormatSymbols::setSymbol(ENumberFormatSymbol symbol, const UnicodeString &value, const UBool propogateDigits = TRUE) {
    538     if (symbol == kCurrencySymbol) {
    539         fIsCustomCurrencySymbol = TRUE;
    540     }
    541     else if (symbol == kIntlCurrencySymbol) {
    542         fIsCustomIntlCurrencySymbol = TRUE;
    543     }
    544     if(symbol<kFormatSymbolCount) {
    545         fSymbols[symbol]=value;
    546     }
    547 
    548     // If the zero digit is being set to a known zero digit according to Unicode,
    549     // then we automatically set the corresponding 1-9 digits
    550     // Also record updates to fCodePointZero. Be conservative if in doubt.
    551     if (symbol == kZeroDigitSymbol) {
    552         UChar32 sym = value.char32At(0);
    553         if ( propogateDigits && u_charDigitValue(sym) == 0 && value.countChar32() == 1 ) {
    554             fCodePointZero = sym;
    555             for ( int8_t i = 1 ; i<= 9 ; i++ ) {
    556                 sym++;
    557                 fSymbols[(int)kOneDigitSymbol+i-1] = UnicodeString(sym);
    558             }
    559         } else {
    560             fCodePointZero = -1;
    561         }
    562     } else if (symbol >= kOneDigitSymbol && symbol <= kNineDigitSymbol) {
    563         fCodePointZero = -1;
    564     }
    565 }
    566 
    567 // -------------------------------------
    568 
    569 inline Locale
    570 DecimalFormatSymbols::getLocale() const {
    571     return locale;
    572 }
    573 
    574 #ifndef U_HIDE_INTERNAL_API
    575 inline const char16_t*
    576 DecimalFormatSymbols::getCurrencyPattern() const {
    577     return currPattern;
    578 }
    579 #endif /* U_HIDE_INTERNAL_API */
    580 
    581 U_NAMESPACE_END
    582 
    583 #endif /* #if !UCONFIG_NO_FORMATTING */
    584 
#endif // DCFMTSYM_H
    586 //eof
    587