• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 ********************************************************************************
5 *   Copyright (C) 1997-2016, International Business Machines
6 *   Corporation and others.  All Rights Reserved.
7 ********************************************************************************
8 *
9 * File DCFMTSYM.H
10 *
11 * Modification History:
12 *
13 *   Date        Name        Description
14 *   02/19/97    aliu        Converted from java.
15 *   03/18/97    clhuang     Updated per C++ implementation.
16 *   03/27/97    helena      Updated to pass the simple test after code review.
17 *   08/26/97    aliu        Added currency/intl currency symbol support.
18 *   07/22/98    stephen     Changed to match C++ style
19 *                            currencySymbol -> fCurrencySymbol
20 *                            Constants changed from CAPS to kCaps
21 *   06/24/99    helena      Integrated Alan's NF enhancements and Java2 bug fixes
22 *   09/22/00    grhoten     Marked deprecation tags with a pointer to replacement
23 *                            functions.
24 ********************************************************************************
25 */
26 
27 #ifndef DCFMTSYM_H
28 #define DCFMTSYM_H
29 
30 #include "unicode/utypes.h"
31 
32 #if U_SHOW_CPLUSPLUS_API
33 
34 #if !UCONFIG_NO_FORMATTING
35 
36 #include "unicode/uchar.h"
37 #include "unicode/uobject.h"
38 #include "unicode/locid.h"
39 #include "unicode/numsys.h"
40 #include "unicode/unum.h"
41 #include "unicode/unistr.h"
42 
43 /**
44  * \file
45  * \brief C++ API: Symbols for formatting numbers.
46  */
47 
48 
49 U_NAMESPACE_BEGIN
50 
51 /**
52  * This class represents the set of symbols needed by DecimalFormat
53  * to format numbers. DecimalFormat creates for itself an instance of
54  * DecimalFormatSymbols from its locale data.  If you need to change any
55  * of these symbols, you can get the DecimalFormatSymbols object from
56  * your DecimalFormat and modify it.
57  * <P>
58  * Here are the special characters used in the parts of the
59  * subpattern, with notes on their usage.
60  * <pre>
61  * \code
62  *        Symbol   Meaning
63  *          0      a digit
64  *          #      a digit, zero shows as absent
65  *          .      placeholder for decimal separator
66  *          ,      placeholder for grouping separator.
67  *          ;      separates formats.
68  *          -      default negative prefix.
69  *          %      divide by 100 and show as percentage
70  *          X      any other characters can be used in the prefix or suffix
71  *          '      used to quote special characters in a prefix or suffix.
72  * \endcode
73  *  </pre>
74  * [Notes]
75  * <P>
76  * If there is no explicit negative subpattern, - is prefixed to the
77  * positive form. That is, "0.00" alone is equivalent to "0.00;-0.00".
78  * <P>
79  * The grouping separator is commonly used for thousands, but in some
80  * countries for ten-thousands. The interval is a constant number of
81  * digits between the grouping characters, such as 100,000,000 or 1,0000,0000.
82  * If you supply a pattern with multiple grouping characters, the interval
83  * between the last one and the end of the integer is the one that is
84  * used. So "#,##,###,####" == "######,####" == "##,####,####".
85  */
86 class U_I18N_API DecimalFormatSymbols : public UObject {
87 public:
88     /**
89      * Constants for specifying a number format symbol.
90      * @stable ICU 2.0
91      */
92     enum ENumberFormatSymbol {
93         /** The decimal separator */
94         kDecimalSeparatorSymbol,
95         /** The grouping separator */
96         kGroupingSeparatorSymbol,
97         /** The pattern separator */
98         kPatternSeparatorSymbol,
99         /** The percent sign */
100         kPercentSymbol,
101         /** Zero*/
102         kZeroDigitSymbol,
103         /** Character representing a digit in the pattern */
104         kDigitSymbol,
105         /** The minus sign */
106         kMinusSignSymbol,
107         /** The plus sign */
108         kPlusSignSymbol,
109         /** The currency symbol */
110         kCurrencySymbol,
111         /** The international currency symbol */
112         kIntlCurrencySymbol,
113         /** The monetary separator */
114         kMonetarySeparatorSymbol,
115         /** The exponential symbol */
116         kExponentialSymbol,
117         /** Per mill symbol - replaces kPermillSymbol */
118         kPerMillSymbol,
119         /** Escape padding character */
120         kPadEscapeSymbol,
121         /** Infinity symbol */
122         kInfinitySymbol,
123         /** Nan symbol */
124         kNaNSymbol,
125         /** Significant digit symbol
126          * @stable ICU 3.0 */
127         kSignificantDigitSymbol,
128         /** The monetary grouping separator
129          * @stable ICU 3.6
130          */
131         kMonetaryGroupingSeparatorSymbol,
132         /** One
133          * @stable ICU 4.6
134          */
135         kOneDigitSymbol,
136         /** Two
137          * @stable ICU 4.6
138          */
139         kTwoDigitSymbol,
140         /** Three
141          * @stable ICU 4.6
142          */
143         kThreeDigitSymbol,
144         /** Four
145          * @stable ICU 4.6
146          */
147         kFourDigitSymbol,
148         /** Five
149          * @stable ICU 4.6
150          */
151         kFiveDigitSymbol,
152         /** Six
153          * @stable ICU 4.6
154          */
155         kSixDigitSymbol,
156         /** Seven
157          * @stable ICU 4.6
158          */
159         kSevenDigitSymbol,
160         /** Eight
161          * @stable ICU 4.6
162          */
163         kEightDigitSymbol,
164         /** Nine
165          * @stable ICU 4.6
166          */
167         kNineDigitSymbol,
168         /** Multiplication sign.
169          * @stable ICU 54
170          */
171         kExponentMultiplicationSymbol,
172         /** count symbol constants */
173         kFormatSymbolCount = kNineDigitSymbol + 2
174     };
175 
176     /**
177      * Create a DecimalFormatSymbols object for the given locale.
178      *
179      * @param locale    The locale to get symbols for.
180      * @param status    Input/output parameter, set to success or
181      *                  failure code upon return.
182      * @stable ICU 2.0
183      */
184     DecimalFormatSymbols(const Locale& locale, UErrorCode& status);
185 
186     /**
187      * Creates a DecimalFormatSymbols instance for the given locale with digits and symbols
188      * corresponding to the given NumberingSystem.
189      *
190      * This constructor behaves equivalently to the normal constructor called with a locale having a
191      * "numbers=xxxx" keyword specifying the numbering system by name.
192      *
193      * In this constructor, the NumberingSystem argument will be used even if the locale has its own
194      * "numbers=xxxx" keyword.
195      *
196      * @param locale    The locale to get symbols for.
197      * @param ns        The numbering system.
198      * @param status    Input/output parameter, set to success or
199      *                  failure code upon return.
200      * @stable ICU 60
201      */
202     DecimalFormatSymbols(const Locale& locale, const NumberingSystem& ns, UErrorCode& status);
203 
204     /**
205      * Create a DecimalFormatSymbols object for the default locale.
206      * This constructor will not fail.  If the resource file data is
207      * not available, it will use hard-coded last-resort data and
208      * set status to U_USING_FALLBACK_ERROR.
209      *
210      * @param status    Input/output parameter, set to success or
211      *                  failure code upon return.
212      * @stable ICU 2.0
213      */
214     DecimalFormatSymbols(UErrorCode& status);
215 
216     /**
217      * Creates a DecimalFormatSymbols object with last-resort data.
218      * Intended for callers who cache the symbols data and
219      * set all symbols on the resulting object.
220      *
221      * The last-resort symbols are similar to those for the root data,
222      * except that the grouping separators are empty,
223      * the NaN symbol is U+FFFD rather than "NaN",
224      * and the CurrencySpacing patterns are empty.
225      *
226      * @param status    Input/output parameter, set to success or
227      *                  failure code upon return.
228      * @return last-resort symbols
229      * @stable ICU 52
230      */
231     static DecimalFormatSymbols* createWithLastResortData(UErrorCode& status);
232 
233     /**
234      * Copy constructor.
235      * @stable ICU 2.0
236      */
237     DecimalFormatSymbols(const DecimalFormatSymbols&);
238 
239     /**
240      * Assignment operator.
241      * @stable ICU 2.0
242      */
243     DecimalFormatSymbols& operator=(const DecimalFormatSymbols&);
244 
245     /**
246      * Destructor.
247      * @stable ICU 2.0
248      */
249     virtual ~DecimalFormatSymbols();
250 
251     /**
252      * Return true if another object is semantically equal to this one.
253      *
254      * @param other    the object to be compared with.
255      * @return         true if another object is semantically equal to this one.
256      * @stable ICU 2.0
257      */
258     UBool operator==(const DecimalFormatSymbols& other) const;
259 
260     /**
261      * Return true if another object is semantically unequal to this one.
262      *
263      * @param other    the object to be compared with.
264      * @return         true if another object is semantically unequal to this one.
265      * @stable ICU 2.0
266      */
267     UBool operator!=(const DecimalFormatSymbols& other) const { return !operator==(other); }
268 
269     /**
270      * Get one of the format symbols by its enum constant.
271      * Each symbol is stored as a string so that graphemes
272      * (characters with modifier letters) can be used.
273      *
274      * @param symbol    Constant to indicate a number format symbol.
275      * @return    the format symbols by the param 'symbol'
276      * @stable ICU 2.0
277      */
278     inline UnicodeString getSymbol(ENumberFormatSymbol symbol) const;
279 
280     /**
281      * Set one of the format symbols by its enum constant.
282      * Each symbol is stored as a string so that graphemes
283      * (characters with modifier letters) can be used.
284      *
285      * @param symbol    Constant to indicate a number format symbol.
286      * @param value     value of the format symbol
287      * @param propogateDigits If false, setting the zero digit will not automatically set 1-9.
288      *     The default behavior is to automatically set 1-9 if zero is being set and the value
289      *     it is being set to corresponds to a known Unicode zero digit.
290      * @stable ICU 2.0
291      */
292     void setSymbol(ENumberFormatSymbol symbol, const UnicodeString &value, const UBool propogateDigits);
293 
294     /**
295      * Returns the locale for which this object was constructed.
296      * @stable ICU 2.6
297      */
298     inline Locale getLocale() const;
299 
300     /**
301      * Returns the locale for this object. Two flavors are available:
302      * valid and actual locale.
303      * @stable ICU 2.8
304      */
305     Locale getLocale(ULocDataLocaleType type, UErrorCode& status) const;
306 
307     /**
308       * Get pattern string for 'CurrencySpacing' that can be applied to
309       * currency format.
310       * This API gets the CurrencySpacing data from ResourceBundle. The pattern can
311       * be empty if there is no data from current locale and its parent locales.
312       *
313       * @param type :  UNUM_CURRENCY_MATCH, UNUM_CURRENCY_SURROUNDING_MATCH or UNUM_CURRENCY_INSERT.
314       * @param beforeCurrency : true if the pattern is for before currency symbol.
315       *                         false if the pattern is for after currency symbol.
316       * @param status: Input/output parameter, set to success or
317       *                  failure code upon return.
318       * @return pattern string for currencyMatch, surroundingMatch or spaceInsert.
319       *     Return empty string if there is no data for this locale and its parent
320       *     locales.
321       * @stable ICU 4.8
322       */
323      const UnicodeString& getPatternForCurrencySpacing(UCurrencySpacing type,
324                                                  UBool beforeCurrency,
325                                                  UErrorCode& status) const;
326      /**
327        * Set pattern string for 'CurrencySpacing' that can be applied to
328        * currency format.
329        *
330        * @param type : UNUM_CURRENCY_MATCH, UNUM_CURRENCY_SURROUNDING_MATCH or UNUM_CURRENCY_INSERT.
331        * @param beforeCurrency : true if the pattern is for before currency symbol.
332        *                         false if the pattern is for after currency symbol.
333        * @param pattern : pattern string to override current setting.
334        * @stable ICU 4.8
335        */
336      void setPatternForCurrencySpacing(UCurrencySpacing type,
337                                        UBool beforeCurrency,
338                                        const UnicodeString& pattern);
339 
340     /**
341      * ICU "poor man's RTTI", returns a UClassID for the actual class.
342      *
343      * @stable ICU 2.2
344      */
345     virtual UClassID getDynamicClassID() const;
346 
347     /**
348      * ICU "poor man's RTTI", returns a UClassID for this class.
349      *
350      * @stable ICU 2.2
351      */
352     static UClassID U_EXPORT2 getStaticClassID();
353 
354 private:
355     DecimalFormatSymbols();
356 
357     /**
358      * Initializes the symbols from the LocaleElements resource bundle.
359      * Note: The organization of LocaleElements badly needs to be
360      * cleaned up.
361      *
362      * @param locale               The locale to get symbols for.
363      * @param success              Input/output parameter, set to success or
364      *                             failure code upon return.
365      * @param useLastResortData    determine if use last resort data
366      * @param ns                   The NumberingSystem to use; otherwise, fall
367      *                             back to the locale.
368      */
369     void initialize(const Locale& locale, UErrorCode& success,
370         UBool useLastResortData = FALSE, const NumberingSystem* ns = nullptr);
371 
372     /**
373      * Initialize the symbols with default values.
374      */
375     void initialize();
376 
377     void setCurrencyForSymbols();
378 
379 public:
380 
381 #ifndef U_HIDE_INTERNAL_API
382     /**
383      * @internal For ICU use only
384      */
isCustomCurrencySymbol()385     inline UBool isCustomCurrencySymbol() const {
386         return fIsCustomCurrencySymbol;
387     }
388 
389     /**
390      * @internal For ICU use only
391      */
isCustomIntlCurrencySymbol()392     inline UBool isCustomIntlCurrencySymbol() const {
393         return fIsCustomIntlCurrencySymbol;
394     }
395 
396     /**
397      * @internal For ICU use only
398      */
getCodePointZero()399     inline UChar32 getCodePointZero() const {
400         return fCodePointZero;
401     }
402 #endif  /* U_HIDE_INTERNAL_API */
403 
404     /**
405      * _Internal_ function - more efficient version of getSymbol,
406      * returning a const reference to one of the symbol strings.
407      * The returned reference becomes invalid when the symbol is changed
408      * or when the DecimalFormatSymbols are destroyed.
409      * Note: moved \#ifndef U_HIDE_INTERNAL_API after this, since this is needed for inline in DecimalFormat
410      *
411      * This is not currently stable API, but if you think it should be stable,
412      * post a comment on the following ticket and the ICU team will take a look:
413      * http://bugs.icu-project.org/trac/ticket/13580
414      *
415      * @param symbol Constant to indicate a number format symbol.
416      * @return the format symbol by the param 'symbol'
417      * @internal
418      */
419     inline const UnicodeString& getConstSymbol(ENumberFormatSymbol symbol) const;
420 
421 #ifndef U_HIDE_INTERNAL_API
422     /**
423      * Returns the const UnicodeString reference, like getConstSymbol,
424      * corresponding to the digit with the given value.  This is equivalent
425      * to accessing the symbol from getConstSymbol with the corresponding
426      * key, such as kZeroDigitSymbol or kOneDigitSymbol.
427      *
428      * This is not currently stable API, but if you think it should be stable,
429      * post a comment on the following ticket and the ICU team will take a look:
430      * http://bugs.icu-project.org/trac/ticket/13580
431      *
432      * @param digit The digit, an integer between 0 and 9 inclusive.
433      *              If outside the range 0 to 9, the zero digit is returned.
434      * @return the format symbol for the given digit.
435      * @internal This API is currently for ICU use only.
436      */
437     inline const UnicodeString& getConstDigitSymbol(int32_t digit) const;
438 
439     /**
440      * Returns that pattern stored in currecy info. Internal API for use by NumberFormat API.
441      * @internal
442      */
443     inline const char16_t* getCurrencyPattern(void) const;
444 #endif  /* U_HIDE_INTERNAL_API */
445 
446 private:
447     /**
448      * Private symbol strings.
449      * They are either loaded from a resource bundle or otherwise owned.
450      * setSymbol() clones the symbol string.
451      * Readonly aliases can only come from a resource bundle, so that we can always
452      * use fastCopyFrom() with them.
453      *
454      * If DecimalFormatSymbols becomes subclassable and the status of fSymbols changes
455      * from private to protected,
456      * or when fSymbols can be set any other way that allows them to be readonly aliases
457      * to non-resource bundle strings,
458      * then regular UnicodeString copies must be used instead of fastCopyFrom().
459      *
460      */
461     UnicodeString fSymbols[kFormatSymbolCount];
462 
463     /**
464      * Non-symbol variable for getConstSymbol(). Always empty.
465      */
466     UnicodeString fNoSymbol;
467 
468     /**
469      * Dealing with code points is faster than dealing with strings when formatting. Because of
470      * this, we maintain a value containing the zero code point that is used whenever digitStrings
471      * represents a sequence of ten code points in order.
472      *
473      * <p>If the value stored here is positive, it means that the code point stored in this value
474      * corresponds to the digitStrings array, and codePointZero can be used instead of the
475      * digitStrings array for the purposes of efficient formatting; if -1, then digitStrings does
476      * *not* contain a sequence of code points, and it must be used directly.
477      *
478      * <p>It is assumed that codePointZero always shadows the value in digitStrings. codePointZero
479      * should never be set directly; rather, it should be updated only when digitStrings mutates.
480      * That is, the flow of information is digitStrings -> codePointZero, not the other way.
481      */
482     UChar32 fCodePointZero;
483 
484     Locale locale;
485 
486     char actualLocale[ULOC_FULLNAME_CAPACITY];
487     char validLocale[ULOC_FULLNAME_CAPACITY];
488     const char16_t* currPattern;
489 
490     UnicodeString currencySpcBeforeSym[UNUM_CURRENCY_SPACING_COUNT];
491     UnicodeString currencySpcAfterSym[UNUM_CURRENCY_SPACING_COUNT];
492     UBool fIsCustomCurrencySymbol;
493     UBool fIsCustomIntlCurrencySymbol;
494 };
495 
496 // -------------------------------------
497 
498 inline UnicodeString
getSymbol(ENumberFormatSymbol symbol)499 DecimalFormatSymbols::getSymbol(ENumberFormatSymbol symbol) const {
500     const UnicodeString *strPtr;
501     if(symbol < kFormatSymbolCount) {
502         strPtr = &fSymbols[symbol];
503     } else {
504         strPtr = &fNoSymbol;
505     }
506     return *strPtr;
507 }
508 
509 // See comments above for this function. Not hidden with #ifdef U_HIDE_INTERNAL_API
510 inline const UnicodeString &
getConstSymbol(ENumberFormatSymbol symbol)511 DecimalFormatSymbols::getConstSymbol(ENumberFormatSymbol symbol) const {
512     const UnicodeString *strPtr;
513     if(symbol < kFormatSymbolCount) {
514         strPtr = &fSymbols[symbol];
515     } else {
516         strPtr = &fNoSymbol;
517     }
518     return *strPtr;
519 }
520 
521 #ifndef U_HIDE_INTERNAL_API
getConstDigitSymbol(int32_t digit)522 inline const UnicodeString& DecimalFormatSymbols::getConstDigitSymbol(int32_t digit) const {
523     if (digit < 0 || digit > 9) {
524         digit = 0;
525     }
526     if (digit == 0) {
527         return fSymbols[kZeroDigitSymbol];
528     }
529     ENumberFormatSymbol key = static_cast<ENumberFormatSymbol>(kOneDigitSymbol + digit - 1);
530     return fSymbols[key];
531 }
532 #endif /* U_HIDE_INTERNAL_API */
533 
534 // -------------------------------------
535 
536 inline void
537 DecimalFormatSymbols::setSymbol(ENumberFormatSymbol symbol, const UnicodeString &value, const UBool propogateDigits = TRUE) {
538     if (symbol == kCurrencySymbol) {
539         fIsCustomCurrencySymbol = TRUE;
540     }
541     else if (symbol == kIntlCurrencySymbol) {
542         fIsCustomIntlCurrencySymbol = TRUE;
543     }
544     if(symbol<kFormatSymbolCount) {
545         fSymbols[symbol]=value;
546     }
547 
548     // If the zero digit is being set to a known zero digit according to Unicode,
549     // then we automatically set the corresponding 1-9 digits
550     // Also record updates to fCodePointZero. Be conservative if in doubt.
551     if (symbol == kZeroDigitSymbol) {
552         UChar32 sym = value.char32At(0);
553         if ( propogateDigits && u_charDigitValue(sym) == 0 && value.countChar32() == 1 ) {
554             fCodePointZero = sym;
555             for ( int8_t i = 1 ; i<= 9 ; i++ ) {
556                 sym++;
557                 fSymbols[(int)kOneDigitSymbol+i-1] = UnicodeString(sym);
558             }
559         } else {
560             fCodePointZero = -1;
561         }
562     } else if (symbol >= kOneDigitSymbol && symbol <= kNineDigitSymbol) {
563         fCodePointZero = -1;
564     }
565 }
566 
567 // -------------------------------------
568 
569 inline Locale
getLocale()570 DecimalFormatSymbols::getLocale() const {
571     return locale;
572 }
573 
574 #ifndef U_HIDE_INTERNAL_API
575 inline const char16_t*
getCurrencyPattern()576 DecimalFormatSymbols::getCurrencyPattern() const {
577     return currPattern;
578 }
579 #endif /* U_HIDE_INTERNAL_API */
580 
581 U_NAMESPACE_END
582 
583 #endif /* #if !UCONFIG_NO_FORMATTING */
584 
585 #endif /* U_SHOW_CPLUSPLUS_API */
586 
587 #endif // DCFMTSYM_H
588 //eof
589