1 | // © 2016 and later: Unicode, Inc. and others. |
2 | // License & terms of use: http://www.unicode.org/copyright.html |
3 | /* |
4 | ******************************************************************************** |
5 | * Copyright (C) 1997-2016, International Business Machines |
6 | * Corporation and others. All Rights Reserved. |
7 | ******************************************************************************** |
8 | * |
9 | * File DCFMTSYM.H |
10 | * |
11 | * Modification History: |
12 | * |
13 | * Date Name Description |
14 | * 02/19/97 aliu Converted from java. |
15 | * 03/18/97 clhuang Updated per C++ implementation. |
16 | * 03/27/97 helena Updated to pass the simple test after code review. |
17 | * 08/26/97 aliu Added currency/intl currency symbol support. |
18 | * 07/22/98 stephen Changed to match C++ style |
19 | * currencySymbol -> fCurrencySymbol |
20 | * Constants changed from CAPS to kCaps |
21 | * 06/24/99 helena Integrated Alan's NF enhancements and Java2 bug fixes |
22 | * 09/22/00 grhoten Marked deprecation tags with a pointer to replacement |
23 | * functions. |
24 | ******************************************************************************** |
25 | */ |
26 | |
27 | #ifndef DCFMTSYM_H |
28 | #define DCFMTSYM_H |
29 | |
30 | #include "unicode/utypes.h" |
31 | |
32 | #if U_SHOW_CPLUSPLUS_API |
33 | |
34 | #if !UCONFIG_NO_FORMATTING |
35 | |
36 | #include "unicode/uchar.h" |
37 | #include "unicode/uobject.h" |
38 | #include "unicode/locid.h" |
39 | #include "unicode/numsys.h" |
40 | #include "unicode/unum.h" |
41 | #include "unicode/unistr.h" |
42 | |
43 | /** |
44 | * \file |
45 | * \brief C++ API: Symbols for formatting numbers. |
46 | */ |
47 | |
48 | |
49 | U_NAMESPACE_BEGIN |
50 | |
51 | /** |
52 | * This class represents the set of symbols needed by DecimalFormat |
53 | * to format numbers. DecimalFormat creates for itself an instance of |
54 | * DecimalFormatSymbols from its locale data. If you need to change any |
55 | * of these symbols, you can get the DecimalFormatSymbols object from |
56 | * your DecimalFormat and modify it. |
57 | * <P> |
58 | * Here are the special characters used in the parts of the |
59 | * subpattern, with notes on their usage. |
60 | * <pre> |
61 | * \code |
62 | * Symbol Meaning |
63 | * 0 a digit |
64 | * # a digit, zero shows as absent |
65 | * . placeholder for decimal separator |
66 | * , placeholder for grouping separator. |
67 | * ; separates formats. |
68 | * - default negative prefix. |
69 | * % divide by 100 and show as percentage |
70 | * X any other characters can be used in the prefix or suffix |
71 | * ' used to quote special characters in a prefix or suffix. |
72 | * \endcode |
73 | * </pre> |
74 | * [Notes] |
75 | * <P> |
76 | * If there is no explicit negative subpattern, - is prefixed to the |
77 | * positive form. That is, "0.00" alone is equivalent to "0.00;-0.00". |
78 | * <P> |
79 | * The grouping separator is commonly used for thousands, but in some |
80 | * countries for ten-thousands. The interval is a constant number of |
81 | * digits between the grouping characters, such as 100,000,000 or 1,0000,0000. |
82 | * If you supply a pattern with multiple grouping characters, the interval |
83 | * between the last one and the end of the integer is the one that is |
84 | * used. So "#,##,###,####" == "######,####" == "##,####,####". |
85 | */ |
86 | class U_I18N_API DecimalFormatSymbols : public UObject { |
87 | public: |
88 | /** |
89 | * Constants for specifying a number format symbol. |
90 | * @stable ICU 2.0 |
91 | */ |
92 | enum ENumberFormatSymbol { |
93 | /** The decimal separator */ |
94 | kDecimalSeparatorSymbol, |
95 | /** The grouping separator */ |
96 | kGroupingSeparatorSymbol, |
97 | /** The pattern separator */ |
98 | kPatternSeparatorSymbol, |
99 | /** The percent sign */ |
100 | kPercentSymbol, |
101 | /** Zero*/ |
102 | kZeroDigitSymbol, |
103 | /** Character representing a digit in the pattern */ |
104 | kDigitSymbol, |
105 | /** The minus sign */ |
106 | kMinusSignSymbol, |
107 | /** The plus sign */ |
108 | kPlusSignSymbol, |
109 | /** The currency symbol */ |
110 | kCurrencySymbol, |
111 | /** The international currency symbol */ |
112 | kIntlCurrencySymbol, |
113 | /** The monetary separator */ |
114 | kMonetarySeparatorSymbol, |
115 | /** The exponential symbol */ |
116 | kExponentialSymbol, |
117 | /** Per mill symbol - replaces kPermillSymbol */ |
118 | kPerMillSymbol, |
119 | /** Escape padding character */ |
120 | kPadEscapeSymbol, |
121 | /** Infinity symbol */ |
122 | kInfinitySymbol, |
123 | /** Nan symbol */ |
124 | kNaNSymbol, |
125 | /** Significant digit symbol |
126 | * @stable ICU 3.0 */ |
127 | kSignificantDigitSymbol, |
128 | /** The monetary grouping separator |
129 | * @stable ICU 3.6 |
130 | */ |
131 | kMonetaryGroupingSeparatorSymbol, |
132 | /** One |
133 | * @stable ICU 4.6 |
134 | */ |
135 | kOneDigitSymbol, |
136 | /** Two |
137 | * @stable ICU 4.6 |
138 | */ |
139 | kTwoDigitSymbol, |
140 | /** Three |
141 | * @stable ICU 4.6 |
142 | */ |
143 | kThreeDigitSymbol, |
144 | /** Four |
145 | * @stable ICU 4.6 |
146 | */ |
147 | kFourDigitSymbol, |
148 | /** Five |
149 | * @stable ICU 4.6 |
150 | */ |
151 | kFiveDigitSymbol, |
152 | /** Six |
153 | * @stable ICU 4.6 |
154 | */ |
155 | kSixDigitSymbol, |
156 | /** Seven |
157 | * @stable ICU 4.6 |
158 | */ |
159 | kSevenDigitSymbol, |
160 | /** Eight |
161 | * @stable ICU 4.6 |
162 | */ |
163 | kEightDigitSymbol, |
164 | /** Nine |
165 | * @stable ICU 4.6 |
166 | */ |
167 | kNineDigitSymbol, |
168 | /** Multiplication sign. |
169 | * @stable ICU 54 |
170 | */ |
171 | kExponentMultiplicationSymbol, |
172 | /** count symbol constants */ |
173 | kFormatSymbolCount = kNineDigitSymbol + 2 |
174 | }; |
175 | |
176 | /** |
177 | * Create a DecimalFormatSymbols object for the given locale. |
178 | * |
179 | * @param locale The locale to get symbols for. |
180 | * @param status Input/output parameter, set to success or |
181 | * failure code upon return. |
182 | * @stable ICU 2.0 |
183 | */ |
184 | DecimalFormatSymbols(const Locale& locale, UErrorCode& status); |
185 | |
186 | /** |
187 | * Creates a DecimalFormatSymbols instance for the given locale with digits and symbols |
188 | * corresponding to the given NumberingSystem. |
189 | * |
190 | * This constructor behaves equivalently to the normal constructor called with a locale having a |
191 | * "numbers=xxxx" keyword specifying the numbering system by name. |
192 | * |
193 | * In this constructor, the NumberingSystem argument will be used even if the locale has its own |
194 | * "numbers=xxxx" keyword. |
195 | * |
196 | * @param locale The locale to get symbols for. |
197 | * @param ns The numbering system. |
198 | * @param status Input/output parameter, set to success or |
199 | * failure code upon return. |
200 | * @stable ICU 60 |
201 | */ |
202 | DecimalFormatSymbols(const Locale& locale, const NumberingSystem& ns, UErrorCode& status); |
203 | |
204 | /** |
205 | * Create a DecimalFormatSymbols object for the default locale. |
206 | * This constructor will not fail. If the resource file data is |
207 | * not available, it will use hard-coded last-resort data and |
208 | * set status to U_USING_FALLBACK_ERROR. |
209 | * |
210 | * @param status Input/output parameter, set to success or |
211 | * failure code upon return. |
212 | * @stable ICU 2.0 |
213 | */ |
214 | DecimalFormatSymbols(UErrorCode& status); |
215 | |
216 | /** |
217 | * Creates a DecimalFormatSymbols object with last-resort data. |
218 | * Intended for callers who cache the symbols data and |
219 | * set all symbols on the resulting object. |
220 | * |
221 | * The last-resort symbols are similar to those for the root data, |
222 | * except that the grouping separators are empty, |
223 | * the NaN symbol is U+FFFD rather than "NaN", |
224 | * and the CurrencySpacing patterns are empty. |
225 | * |
226 | * @param status Input/output parameter, set to success or |
227 | * failure code upon return. |
228 | * @return last-resort symbols |
229 | * @stable ICU 52 |
230 | */ |
231 | static DecimalFormatSymbols* createWithLastResortData(UErrorCode& status); |
232 | |
233 | /** |
234 | * Copy constructor. |
235 | * @stable ICU 2.0 |
236 | */ |
237 | DecimalFormatSymbols(const DecimalFormatSymbols&); |
238 | |
239 | /** |
240 | * Assignment operator. |
241 | * @stable ICU 2.0 |
242 | */ |
243 | DecimalFormatSymbols& operator=(const DecimalFormatSymbols&); |
244 | |
245 | /** |
246 | * Destructor. |
247 | * @stable ICU 2.0 |
248 | */ |
249 | virtual ~DecimalFormatSymbols(); |
250 | |
251 | /** |
252 | * Return true if another object is semantically equal to this one. |
253 | * |
254 | * @param other the object to be compared with. |
255 | * @return true if another object is semantically equal to this one. |
256 | * @stable ICU 2.0 |
257 | */ |
258 | UBool operator==(const DecimalFormatSymbols& other) const; |
259 | |
260 | /** |
261 | * Return true if another object is semantically unequal to this one. |
262 | * |
263 | * @param other the object to be compared with. |
264 | * @return true if another object is semantically unequal to this one. |
265 | * @stable ICU 2.0 |
266 | */ |
267 | UBool operator!=(const DecimalFormatSymbols& other) const { return !operator==(other); } |
268 | |
269 | /** |
270 | * Get one of the format symbols by its enum constant. |
271 | * Each symbol is stored as a string so that graphemes |
272 | * (characters with modifier letters) can be used. |
273 | * |
274 | * @param symbol Constant to indicate a number format symbol. |
275 | * @return the format symbols by the param 'symbol' |
276 | * @stable ICU 2.0 |
277 | */ |
278 | inline UnicodeString getSymbol(ENumberFormatSymbol symbol) const; |
279 | |
280 | /** |
281 | * Set one of the format symbols by its enum constant. |
282 | * Each symbol is stored as a string so that graphemes |
283 | * (characters with modifier letters) can be used. |
284 | * |
285 | * @param symbol Constant to indicate a number format symbol. |
286 | * @param value value of the format symbol |
287 | * @param propogateDigits If false, setting the zero digit will not automatically set 1-9. |
288 | * The default behavior is to automatically set 1-9 if zero is being set and the value |
289 | * it is being set to corresponds to a known Unicode zero digit. |
290 | * @stable ICU 2.0 |
291 | */ |
292 | void setSymbol(ENumberFormatSymbol symbol, const UnicodeString &value, const UBool propogateDigits); |
293 | |
294 | /** |
295 | * Returns the locale for which this object was constructed. |
296 | * @stable ICU 2.6 |
297 | */ |
298 | inline Locale getLocale() const; |
299 | |
300 | /** |
301 | * Returns the locale for this object. Two flavors are available: |
302 | * valid and actual locale. |
303 | * @stable ICU 2.8 |
304 | */ |
305 | Locale getLocale(ULocDataLocaleType type, UErrorCode& status) const; |
306 | |
307 | /** |
308 | * Get pattern string for 'CurrencySpacing' that can be applied to |
309 | * currency format. |
310 | * This API gets the CurrencySpacing data from ResourceBundle. The pattern can |
311 | * be empty if there is no data from current locale and its parent locales. |
312 | * |
313 | * @param type : UNUM_CURRENCY_MATCH, UNUM_CURRENCY_SURROUNDING_MATCH or UNUM_CURRENCY_INSERT. |
314 | * @param beforeCurrency : true if the pattern is for before currency symbol. |
315 | * false if the pattern is for after currency symbol. |
316 | * @param status: Input/output parameter, set to success or |
317 | * failure code upon return. |
318 | * @return pattern string for currencyMatch, surroundingMatch or spaceInsert. |
319 | * Return empty string if there is no data for this locale and its parent |
320 | * locales. |
321 | * @stable ICU 4.8 |
322 | */ |
323 | const UnicodeString& getPatternForCurrencySpacing(UCurrencySpacing type, |
324 | UBool beforeCurrency, |
325 | UErrorCode& status) const; |
326 | /** |
327 | * Set pattern string for 'CurrencySpacing' that can be applied to |
328 | * currency format. |
329 | * |
330 | * @param type : UNUM_CURRENCY_MATCH, UNUM_CURRENCY_SURROUNDING_MATCH or UNUM_CURRENCY_INSERT. |
331 | * @param beforeCurrency : true if the pattern is for before currency symbol. |
332 | * false if the pattern is for after currency symbol. |
333 | * @param pattern : pattern string to override current setting. |
334 | * @stable ICU 4.8 |
335 | */ |
336 | void setPatternForCurrencySpacing(UCurrencySpacing type, |
337 | UBool beforeCurrency, |
338 | const UnicodeString& pattern); |
339 | |
340 | /** |
341 | * ICU "poor man's RTTI", returns a UClassID for the actual class. |
342 | * |
343 | * @stable ICU 2.2 |
344 | */ |
345 | virtual UClassID getDynamicClassID() const; |
346 | |
347 | /** |
348 | * ICU "poor man's RTTI", returns a UClassID for this class. |
349 | * |
350 | * @stable ICU 2.2 |
351 | */ |
352 | static UClassID U_EXPORT2 getStaticClassID(); |
353 | |
354 | private: |
355 | DecimalFormatSymbols(); |
356 | |
357 | /** |
358 | * Initializes the symbols from the LocaleElements resource bundle. |
359 | * Note: The organization of LocaleElements badly needs to be |
360 | * cleaned up. |
361 | * |
362 | * @param locale The locale to get symbols for. |
363 | * @param success Input/output parameter, set to success or |
364 | * failure code upon return. |
365 | * @param useLastResortData determine if use last resort data |
366 | * @param ns The NumberingSystem to use; otherwise, fall |
367 | * back to the locale. |
368 | */ |
369 | void initialize(const Locale& locale, UErrorCode& success, |
370 | UBool useLastResortData = FALSE, const NumberingSystem* ns = nullptr); |
371 | |
372 | /** |
373 | * Initialize the symbols with default values. |
374 | */ |
375 | void initialize(); |
376 | |
377 | void setCurrencyForSymbols(); |
378 | |
379 | public: |
380 | |
381 | #ifndef U_HIDE_INTERNAL_API |
382 | /** |
383 | * @internal For ICU use only |
384 | */ |
385 | inline UBool isCustomCurrencySymbol() const { |
386 | return fIsCustomCurrencySymbol; |
387 | } |
388 | |
389 | /** |
390 | * @internal For ICU use only |
391 | */ |
392 | inline UBool isCustomIntlCurrencySymbol() const { |
393 | return fIsCustomIntlCurrencySymbol; |
394 | } |
395 | |
396 | /** |
397 | * @internal For ICU use only |
398 | */ |
399 | inline UChar32 getCodePointZero() const { |
400 | return fCodePointZero; |
401 | } |
402 | #endif /* U_HIDE_INTERNAL_API */ |
403 | |
404 | /** |
405 | * _Internal_ function - more efficient version of getSymbol, |
406 | * returning a const reference to one of the symbol strings. |
407 | * The returned reference becomes invalid when the symbol is changed |
408 | * or when the DecimalFormatSymbols are destroyed. |
409 | * Note: moved \#ifndef U_HIDE_INTERNAL_API after this, since this is needed for inline in DecimalFormat |
410 | * |
411 | * This is not currently stable API, but if you think it should be stable, |
412 | * post a comment on the following ticket and the ICU team will take a look: |
413 | * http://bugs.icu-project.org/trac/ticket/13580 |
414 | * |
415 | * @param symbol Constant to indicate a number format symbol. |
416 | * @return the format symbol by the param 'symbol' |
417 | * @internal |
418 | */ |
419 | inline const UnicodeString& getConstSymbol(ENumberFormatSymbol symbol) const; |
420 | |
421 | #ifndef U_HIDE_INTERNAL_API |
422 | /** |
423 | * Returns the const UnicodeString reference, like getConstSymbol, |
424 | * corresponding to the digit with the given value. This is equivalent |
425 | * to accessing the symbol from getConstSymbol with the corresponding |
426 | * key, such as kZeroDigitSymbol or kOneDigitSymbol. |
427 | * |
428 | * This is not currently stable API, but if you think it should be stable, |
429 | * post a comment on the following ticket and the ICU team will take a look: |
430 | * http://bugs.icu-project.org/trac/ticket/13580 |
431 | * |
432 | * @param digit The digit, an integer between 0 and 9 inclusive. |
433 | * If outside the range 0 to 9, the zero digit is returned. |
434 | * @return the format symbol for the given digit. |
435 | * @internal This API is currently for ICU use only. |
436 | */ |
437 | inline const UnicodeString& getConstDigitSymbol(int32_t digit) const; |
438 | |
439 | /** |
440 | * Returns that pattern stored in currecy info. Internal API for use by NumberFormat API. |
441 | * @internal |
442 | */ |
443 | inline const char16_t* getCurrencyPattern(void) const; |
444 | #endif /* U_HIDE_INTERNAL_API */ |
445 | |
446 | private: |
447 | /** |
448 | * Private symbol strings. |
449 | * They are either loaded from a resource bundle or otherwise owned. |
450 | * setSymbol() clones the symbol string. |
451 | * Readonly aliases can only come from a resource bundle, so that we can always |
452 | * use fastCopyFrom() with them. |
453 | * |
454 | * If DecimalFormatSymbols becomes subclassable and the status of fSymbols changes |
455 | * from private to protected, |
456 | * or when fSymbols can be set any other way that allows them to be readonly aliases |
457 | * to non-resource bundle strings, |
458 | * then regular UnicodeString copies must be used instead of fastCopyFrom(). |
459 | * |
460 | */ |
461 | UnicodeString fSymbols[kFormatSymbolCount]; |
462 | |
463 | /** |
464 | * Non-symbol variable for getConstSymbol(). Always empty. |
465 | */ |
466 | UnicodeString fNoSymbol; |
467 | |
468 | /** |
469 | * Dealing with code points is faster than dealing with strings when formatting. Because of |
470 | * this, we maintain a value containing the zero code point that is used whenever digitStrings |
471 | * represents a sequence of ten code points in order. |
472 | * |
473 | * <p>If the value stored here is positive, it means that the code point stored in this value |
474 | * corresponds to the digitStrings array, and codePointZero can be used instead of the |
475 | * digitStrings array for the purposes of efficient formatting; if -1, then digitStrings does |
476 | * *not* contain a sequence of code points, and it must be used directly. |
477 | * |
478 | * <p>It is assumed that codePointZero always shadows the value in digitStrings. codePointZero |
479 | * should never be set directly; rather, it should be updated only when digitStrings mutates. |
480 | * That is, the flow of information is digitStrings -> codePointZero, not the other way. |
481 | */ |
482 | UChar32 fCodePointZero; |
483 | |
484 | Locale locale; |
485 | |
486 | char actualLocale[ULOC_FULLNAME_CAPACITY]; |
487 | char validLocale[ULOC_FULLNAME_CAPACITY]; |
488 | const char16_t* currPattern; |
489 | |
490 | UnicodeString currencySpcBeforeSym[UNUM_CURRENCY_SPACING_COUNT]; |
491 | UnicodeString currencySpcAfterSym[UNUM_CURRENCY_SPACING_COUNT]; |
492 | UBool fIsCustomCurrencySymbol; |
493 | UBool fIsCustomIntlCurrencySymbol; |
494 | }; |
495 | |
496 | // ------------------------------------- |
497 | |
498 | inline UnicodeString |
499 | DecimalFormatSymbols::getSymbol(ENumberFormatSymbol symbol) const { |
500 | const UnicodeString *strPtr; |
501 | if(symbol < kFormatSymbolCount) { |
502 | strPtr = &fSymbols[symbol]; |
503 | } else { |
504 | strPtr = &fNoSymbol; |
505 | } |
506 | return *strPtr; |
507 | } |
508 | |
509 | // See comments above for this function. Not hidden with #ifdef U_HIDE_INTERNAL_API |
510 | inline const UnicodeString & |
511 | DecimalFormatSymbols::getConstSymbol(ENumberFormatSymbol symbol) const { |
512 | const UnicodeString *strPtr; |
513 | if(symbol < kFormatSymbolCount) { |
514 | strPtr = &fSymbols[symbol]; |
515 | } else { |
516 | strPtr = &fNoSymbol; |
517 | } |
518 | return *strPtr; |
519 | } |
520 | |
521 | #ifndef U_HIDE_INTERNAL_API |
522 | inline const UnicodeString& DecimalFormatSymbols::getConstDigitSymbol(int32_t digit) const { |
523 | if (digit < 0 || digit > 9) { |
524 | digit = 0; |
525 | } |
526 | if (digit == 0) { |
527 | return fSymbols[kZeroDigitSymbol]; |
528 | } |
529 | ENumberFormatSymbol key = static_cast<ENumberFormatSymbol>(kOneDigitSymbol + digit - 1); |
530 | return fSymbols[key]; |
531 | } |
532 | #endif /* U_HIDE_INTERNAL_API */ |
533 | |
534 | // ------------------------------------- |
535 | |
536 | inline void |
537 | DecimalFormatSymbols::setSymbol(ENumberFormatSymbol symbol, const UnicodeString &value, const UBool propogateDigits = TRUE) { |
538 | if (symbol == kCurrencySymbol) { |
539 | fIsCustomCurrencySymbol = TRUE; |
540 | } |
541 | else if (symbol == kIntlCurrencySymbol) { |
542 | fIsCustomIntlCurrencySymbol = TRUE; |
543 | } |
544 | if(symbol<kFormatSymbolCount) { |
545 | fSymbols[symbol]=value; |
546 | } |
547 | |
548 | // If the zero digit is being set to a known zero digit according to Unicode, |
549 | // then we automatically set the corresponding 1-9 digits |
550 | // Also record updates to fCodePointZero. Be conservative if in doubt. |
551 | if (symbol == kZeroDigitSymbol) { |
552 | UChar32 sym = value.char32At(0); |
553 | if ( propogateDigits && u_charDigitValue(sym) == 0 && value.countChar32() == 1 ) { |
554 | fCodePointZero = sym; |
555 | for ( int8_t i = 1 ; i<= 9 ; i++ ) { |
556 | sym++; |
557 | fSymbols[(int)kOneDigitSymbol+i-1] = UnicodeString(sym); |
558 | } |
559 | } else { |
560 | fCodePointZero = -1; |
561 | } |
562 | } else if (symbol >= kOneDigitSymbol && symbol <= kNineDigitSymbol) { |
563 | fCodePointZero = -1; |
564 | } |
565 | } |
566 | |
567 | // ------------------------------------- |
568 | |
569 | inline Locale |
570 | DecimalFormatSymbols::getLocale() const { |
571 | return locale; |
572 | } |
573 | |
574 | #ifndef U_HIDE_INTERNAL_API |
575 | inline const char16_t* |
576 | DecimalFormatSymbols::getCurrencyPattern() const { |
577 | return currPattern; |
578 | } |
579 | #endif /* U_HIDE_INTERNAL_API */ |
580 | |
581 | U_NAMESPACE_END |
582 | |
583 | #endif /* #if !UCONFIG_NO_FORMATTING */ |
584 | |
585 | #endif /* U_SHOW_CPLUSPLUS_API */ |
586 | |
#endif // DCFMTSYM_H
588 | //eof |
589 | |