1 | // © 2016 and later: Unicode, Inc. and others. |
2 | // License & terms of use: http://www.unicode.org/copyright.html |
3 | /* |
4 | ******************************************************************************* |
5 | * Copyright (C) 2008-2015, International Business Machines Corporation and |
6 | * others. All Rights Reserved. |
7 | ******************************************************************************* |
8 | * |
9 | * |
10 | * File PLURRULE.H |
11 | * |
12 | * Modification History:* |
13 | * Date Name Description |
14 | * |
15 | ******************************************************************************** |
16 | */ |
17 | |
18 | #ifndef PLURRULE |
19 | #define PLURRULE |
20 | |
21 | #include "unicode/utypes.h" |
22 | |
23 | #if U_SHOW_CPLUSPLUS_API |
24 | |
25 | /** |
26 | * \file |
27 | * \brief C++ API: PluralRules object |
28 | */ |
29 | |
30 | #if !UCONFIG_NO_FORMATTING |
31 | |
32 | #include "unicode/format.h" |
33 | #include "unicode/upluralrules.h" |
34 | #ifndef U_HIDE_INTERNAL_API |
35 | #include "unicode/numfmt.h" |
36 | #endif /* U_HIDE_INTERNAL_API */ |
37 | |
38 | /** |
39 | * Value returned by PluralRules::getUniqueKeywordValue() when there is no |
40 | * unique value to return. That function is deprecated and is documented as a stub that always returns this value. |
41 | * @stable ICU 4.8 |
42 | */ |
43 | #define UPLRULES_NO_UNIQUE_VALUE ((double)-0.00123456777) |
44 | |
45 | U_NAMESPACE_BEGIN |
46 | |
47 | class Hashtable; /* forward declaration only; no declaration in this header uses it */ |
48 | class IFixedDecimal; /* parameter type of the internal PluralRules::select(const IFixedDecimal&) overload */ |
49 | class RuleChain; /* type of PluralRules::mRules and return type of PluralRules::rulesForKeyword() */ |
50 | class PluralRuleParser; /* declared a friend of PluralRules */ |
51 | class PluralKeywordEnumeration; /* forward declaration only; no declaration in this header uses it */ |
52 | class AndConstraint; /* forward declaration only; no declaration in this header uses it */ |
53 | class SharedPluralRules; /* return type of the internal PluralRules::createSharedInstance() */ |
54 | |
55 | namespace number { |
56 | class FormattedNumber; /* parameter type of the draft PluralRules::select(const number::FormattedNumber&, UErrorCode&) overload */ |
57 | } |
58 | |
59 | /** |
60 | * Defines rules for mapping non-negative numeric values onto a small set of |
61 | * keywords. Rules are constructed from a text description, consisting |
62 | * of a series of keywords and conditions. The {@link #select} method |
63 | * examines each condition in order and returns the keyword for the |
64 | * first condition that matches the number. If none match, |
65 | * the keyword of the default rule, "other", is returned. |
66 | * |
67 | * For more information, details, and tips for writing rules, see the |
68 | * LDML spec, C.11 Language Plural Rules: |
69 | * http://www.unicode.org/draft/reports/tr35/tr35.html#Language_Plural_Rules |
70 | * |
71 | * Examples:<pre> |
72 | * "one: n is 1; few: n in 2..4"</pre> |
73 | * This defines two rules, for 'one' and 'few'. The condition for |
74 | * 'one' is "n is 1" which means that the number must be equal to |
75 | * 1 for this condition to pass. The condition for 'few' is |
76 | * "n in 2..4" which means that the number must be between 2 and |
77 | * 4 inclusive for this condition to pass. All other numbers |
78 | * are assigned the keyword "other" by the default rule. |
79 | * </p><pre> |
80 | * "zero: n is 0; one: n is 1; zero: n mod 100 in 1..19"</pre> |
81 | * This illustrates that the same keyword can be defined multiple times. |
82 | * Each rule is examined in order, and the first keyword whose condition |
83 | * passes is the one returned. Also note that a modulus is applied |
84 | * to n in the last rule. Thus its condition holds for 119, 219, 319... |
85 | * </p><pre> |
86 | * "one: n is 1; few: n mod 10 in 2..4 and n mod 100 not in 12..14"</pre> |
87 | * This illustrates conjunction and negation. The condition for 'few' |
88 | * has two parts, both of which must be met: "n mod 10 in 2..4" and |
89 | * "n mod 100 not in 12..14". The first part applies a modulus to n |
90 | * before the test as in the previous example. The second part applies |
91 | * a different modulus and also uses negation, thus it matches all |
92 | * numbers _not_ in 12, 13, 14, 112, 113, 114, 212, 213, 214... |
93 | * </p> |
94 | * <p> |
95 | * Syntax:<pre> |
96 | * \code |
97 | * rules = rule (';' rule)* |
98 | * rule = keyword ':' condition |
99 | * keyword = <identifier> |
100 | * condition = and_condition ('or' and_condition)* |
101 | * and_condition = relation ('and' relation)* |
102 | * relation = is_relation | in_relation | within_relation | 'n' <EOL> |
103 | * is_relation = expr 'is' ('not')? value |
104 | * in_relation = expr ('not')? 'in' range_list |
105 | * within_relation = expr ('not')? 'within' range |
106 | * expr = ('n' | 'i' | 'f' | 'v' | 'j') ('mod' value)? |
107 | * range_list = (range | value) (',' range_list)* |
108 | * value = digit+ ('.' digit+)? |
109 | * digit = 0|1|2|3|4|5|6|7|8|9 |
110 | * range = value'..'value |
111 | * \endcode |
112 | * </pre></p> |
113 | * |
114 | * <p> |
115 | * The i, f, v, and j values are defined as follows: |
116 | * </p> |
117 | * <ul> |
118 | * <li>i to be the integer digits.</li> |
119 | * <li>f to be the visible fractional digits, as an integer.</li> |
120 | * <li>v to be the number of visible fraction digits.</li> |
121 | * <li>j is defined to only match integers. That is, "j is 3" fails if v != 0 (e.g. for 3.1 or 3.0).</li> |
122 | * </ul> |
123 | * <p> |
124 | * Examples are in the following table: |
125 | * </p> |
126 | * <table border='1' style="border-collapse:collapse"> |
127 | * <tr> |
128 | * <th>n</th> |
129 | * <th>i</th> |
130 | * <th>f</th> |
131 | * <th>v</th> |
132 | * </tr> |
133 | * <tr> |
134 | * <td>1.0</td> |
135 | * <td>1</td> |
136 | * <td align="right">0</td> |
137 | * <td>1</td> |
138 | * </tr> |
139 | * <tr> |
140 | * <td>1.00</td> |
141 | * <td>1</td> |
142 | * <td align="right">0</td> |
143 | * <td>2</td> |
144 | * </tr> |
145 | * <tr> |
146 | * <td>1.3</td> |
147 | * <td>1</td> |
148 | * <td align="right">3</td> |
149 | * <td>1</td> |
150 | * </tr> |
151 | * <tr> |
152 | * <td>1.03</td> |
153 | * <td>1</td> |
154 | * <td align="right">3</td> |
155 | * <td>2</td> |
156 | * </tr> |
157 | * <tr> |
158 | * <td>1.23</td> |
159 | * <td>1</td> |
160 | * <td align="right">23</td> |
161 | * <td>2</td> |
162 | * </tr> |
163 | * </table> |
164 | * <p> |
165 | * The difference between 'in' and 'within' is that 'in' only includes integers in the specified range, while 'within' |
166 | * includes all values. Using 'within' with a range_list consisting entirely of values is the same as using 'in' (it's |
167 | * not an error). |
168 | * </p> |
169 | * <p> |
170 | * An "identifier" is a sequence of characters that do not have the |
171 | * Unicode Pattern_Syntax or Pattern_White_Space properties. |
172 | * </p> |
178 | * <p> |
179 | * Keywords |
180 | * can be defined by users or come from ICU locale data. There are 6 |
181 | * predefined values in ICU - 'zero', 'one', 'two', 'few', 'many' and |
182 | * 'other'. Callers need to check the value of the keyword returned by |
183 | * the {@link #select} method. |
184 | * </p> |
185 | * |
186 | * Examples:<pre> |
187 | * UnicodeString keyword = pl->select(number); |
188 | * if (keyword == UnicodeString("one")) { |
189 | * ... |
190 | * } |
191 | * else if ( ... ) |
192 | * </pre> |
193 | * <strong>Note:</strong><br> |
194 | * <p> |
195 | * ICU defines plural rules for many locales based on CLDR <i>Language Plural Rules</i>. |
196 | * For these predefined rules, see CLDR page at |
197 | * http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html |
198 | * </p> |
199 | */ |
200 | class U_I18N_API PluralRules : public UObject { |
201 | public: |
202 | |
203 | /** |
204 | * Constructor. |
205 | * @param status Output param set to success/failure code on exit, which |
206 | * must not indicate a failure before the function call. |
207 | * |
208 | * @stable ICU 4.0 |
209 | */ |
210 | PluralRules(UErrorCode& status); |
211 | |
212 | /** |
213 | * Copy constructor. |
214 | * @stable ICU 4.0 |
215 | */ |
216 | PluralRules(const PluralRules& other); |
217 | |
218 | /** |
219 | * Destructor. |
220 | * @stable ICU 4.0 |
221 | */ |
222 | virtual ~PluralRules(); |
223 | |
224 | /** |
225 | * Clone. Returns a pointer to a copy of this object (presumably caller-owned; confirm against the implementation). |
226 | * @stable ICU 4.0 |
227 | */ |
228 | PluralRules* clone() const; |
229 | |
230 | /** |
231 | * Assignment operator. |
232 | * @stable ICU 4.0 |
233 | */ |
234 | PluralRules& operator=(const PluralRules&); |
235 | |
236 | /** |
237 | * Creates a PluralRules from a description if it is parsable, otherwise |
238 | * returns NULL. |
239 | * |
240 | * @param description rule description |
241 | * @param status Output param set to success/failure code on exit, which |
242 | * must not indicate a failure before the function call. |
243 | * @return new PluralRules pointer. NULL if there is an error. |
244 | * @stable ICU 4.0 |
245 | */ |
246 | static PluralRules* U_EXPORT2 createRules(const UnicodeString& description, |
247 | UErrorCode& status); |
248 | |
249 | /** |
250 | * The default rules that accept any number. |
251 | * |
252 | * @param status Output param set to success/failure code on exit, which |
253 | * must not indicate a failure before the function call. |
254 | * @return new PluralRules pointer. NULL if there is an error. |
255 | * @stable ICU 4.0 |
256 | */ |
257 | static PluralRules* U_EXPORT2 createDefaultRules(UErrorCode& status); |
258 | |
259 | /** |
260 | * Provides access to the predefined cardinal-number <code>PluralRules</code> for a given |
261 | * locale. |
262 | * Same as forLocale(locale, UPLURAL_TYPE_CARDINAL, status). |
263 | * |
264 | * @param locale The locale for which a <code>PluralRules</code> object is |
265 | * returned. |
266 | * @param status Output param set to success/failure code on exit, which |
267 | * must not indicate a failure before the function call. |
268 | * @return The predefined <code>PluralRules</code> object pointer for |
269 | * this locale. If there's no predefined rules for this locale, |
270 | * the rules for the closest parent in the locale hierarchy |
271 | * that has one will be returned. The final fallback always |
272 | * returns the default 'other' rules. |
273 | * @stable ICU 4.0 |
274 | */ |
275 | static PluralRules* U_EXPORT2 forLocale(const Locale& locale, UErrorCode& status); |
276 | |
277 | /** |
278 | * Provides access to the predefined <code>PluralRules</code> for a given |
279 | * locale and the plural type. |
280 | * |
281 | * @param locale The locale for which a <code>PluralRules</code> object is |
282 | * returned. |
283 | * @param type The plural type (e.g., cardinal or ordinal). |
284 | * @param status Output param set to success/failure code on exit, which |
285 | * must not indicate a failure before the function call. |
286 | * @return The predefined <code>PluralRules</code> object pointer for |
287 | * this locale. If there's no predefined rules for this locale, |
288 | * the rules for the closest parent in the locale hierarchy |
289 | * that has one will be returned. The final fallback always |
290 | * returns the default 'other' rules. |
291 | * @stable ICU 50 |
292 | */ |
293 | static PluralRules* U_EXPORT2 forLocale(const Locale& locale, UPluralType type, UErrorCode& status); |
294 | |
295 | #ifndef U_HIDE_INTERNAL_API |
296 | /** |
297 | * Return a StringEnumeration over the locales for which there is plurals data. |
298 | * @return a StringEnumeration over the locales available. |
299 | * @internal |
300 | */ |
301 | static StringEnumeration* U_EXPORT2 getAvailableLocales(UErrorCode &status); |
302 | |
303 | /** |
304 | * Returns whether or not there are overrides. |
305 | * @param locale the locale to check. |
306 | * @return whether there are overrides for the given locale. |
307 | * @internal |
308 | */ |
309 | static UBool hasOverride(const Locale &locale); |
310 | |
311 | /** |
312 | * For ICU use only. |
313 | * Described as creating a SharedPluralRules object; NOTE(review): the declared return type is PluralRules*, so this description may be stale - confirm. |
314 | * @internal |
315 | */ |
316 | static PluralRules* U_EXPORT2 internalForLocale(const Locale& locale, UPluralType type, UErrorCode& status); |
317 | |
318 | /** |
319 | * For ICU use only. |
320 | * Returns handle to the shared, cached PluralRules instance. |
321 | * Caller must call removeRef() on returned value once it is done with |
322 | * the shared instance. |
323 | * @internal |
324 | */ |
325 | static const SharedPluralRules* U_EXPORT2 createSharedInstance( |
326 | const Locale& locale, UPluralType type, UErrorCode& status); |
327 | |
328 | |
329 | #endif /* U_HIDE_INTERNAL_API */ |
330 | |
331 | /** |
332 | * Given an integer, returns the keyword of the first rule |
333 | * that applies to the number. This function can be used with |
334 | * isKeyword* functions to determine the keyword for default plural rules. |
335 | * |
336 | * @param number The number for which the rule has to be determined. |
337 | * @return The keyword of the selected rule. |
338 | * @stable ICU 4.0 |
339 | */ |
340 | UnicodeString select(int32_t number) const; |
341 | |
342 | /** |
343 | * Given a floating-point number, returns the keyword of the first rule |
344 | * that applies to the number. This function can be used with |
345 | * isKeyword* functions to determine the keyword for default plural rules. |
346 | * |
347 | * @param number The number for which the rule has to be determined. |
348 | * @return The keyword of the selected rule. |
349 | * @stable ICU 4.0 |
350 | */ |
351 | UnicodeString select(double number) const; |
352 | |
353 | #ifndef U_HIDE_DRAFT_API |
354 | /** |
355 | * Given a formatted number, returns the keyword of the first rule |
356 | * that applies to the number. This function can be used with |
357 | * isKeyword* functions to determine the keyword for default plural rules. |
358 | * |
359 | * A FormattedNumber allows you to specify an exponent or trailing zeros, |
360 | * which can affect the plural category. To get a FormattedNumber, see |
361 | * NumberFormatter. |
362 | * |
363 | * @param number The number for which the rule has to be determined. |
364 | * @param status Set if an error occurs while selecting plural keyword. |
365 | * This could happen if the FormattedNumber is invalid. |
366 | * @return The keyword of the selected rule. |
367 | * @draft ICU 64 |
368 | */ |
369 | UnicodeString select(const number::FormattedNumber& number, UErrorCode& status) const; |
370 | #endif /* U_HIDE_DRAFT_API */ |
371 | |
372 | #ifndef U_HIDE_INTERNAL_API |
373 | /** |
374 | * Overload of select() taking the number as an IFixedDecimal; NOTE(review): presumably follows the same first-matching-rule contract as the other overloads - confirm. @internal |
375 | */ |
376 | UnicodeString select(const IFixedDecimal &number) const; |
377 | #endif /* U_HIDE_INTERNAL_API */ |
378 | |
379 | /** |
380 | * Returns a list of all rule keywords used in this <code>PluralRules</code> |
381 | * object. The rule 'other' is always present by default. |
382 | * |
383 | * @param status Output param set to success/failure code on exit, which |
384 | * must not indicate a failure before the function call. |
385 | * @return StringEnumeration with the keywords. |
386 | * The caller must delete the object. |
387 | * @stable ICU 4.0 |
388 | */ |
389 | StringEnumeration* getKeywords(UErrorCode& status) const; |
390 | |
391 | #ifndef U_HIDE_DEPRECATED_API |
392 | /** |
393 | * Deprecated Function, does not return useful results. |
394 | * |
395 | * Originally intended to return a unique value for this keyword if it exists, |
396 | * else the constant UPLRULES_NO_UNIQUE_VALUE. |
397 | * |
398 | * @param keyword The keyword. |
399 | * @return Stub deprecated function returns UPLRULES_NO_UNIQUE_VALUE always. |
400 | * @deprecated ICU 55 |
401 | */ |
402 | double getUniqueKeywordValue(const UnicodeString& keyword); |
403 | |
404 | /** |
405 | * Deprecated Function, does not produce useful results. |
406 | * |
407 | * Originally intended to return all the values for which select() would return the keyword. |
408 | * If the keyword is unknown, returns no values, but this is not an error. If |
409 | * the number of values is unlimited, returns no values and -1 as the |
410 | * count. |
411 | * |
412 | * The number of returned values is typically small. |
413 | * |
414 | * @param keyword The keyword. |
415 | * @param dest Array into which to put the returned values. May |
416 | * be NULL if destCapacity is 0. |
417 | * @param destCapacity The capacity of the array, must be at least 0. |
418 | * @param status The error code. Deprecated function, always sets U_UNSUPPORTED_ERROR. |
419 | * @return The count of values available, or -1. This count |
420 | * can be larger than destCapacity, but no more than |
421 | * destCapacity values will be written. |
422 | * @deprecated ICU 55 |
423 | */ |
424 | int32_t getAllKeywordValues(const UnicodeString &keyword, |
425 | double *dest, int32_t destCapacity, |
426 | UErrorCode& status); |
427 | #endif /* U_HIDE_DEPRECATED_API */ |
428 | |
429 | /** |
430 | * Returns sample values for which select() would return the keyword. If |
431 | * the keyword is unknown, returns no values, but this is not an error. |
432 | * |
433 | * The number of returned values is typically small. |
434 | * |
435 | * @param keyword The keyword. |
436 | * @param dest Array into which to put the returned values. May |
437 | * be NULL if destCapacity is 0. |
438 | * @param destCapacity The capacity of the array, must be at least 0. |
439 | * @param status The error code. |
440 | * @return The count of values written. |
441 | * If more than destCapacity samples are available, then |
442 | * only destCapacity are written, and destCapacity is returned as the count, |
443 | * rather than setting a U_BUFFER_OVERFLOW_ERROR. |
444 | * (The actual number of keyword values could be unlimited.) |
445 | * @stable ICU 4.8 |
446 | */ |
447 | int32_t getSamples(const UnicodeString &keyword, |
448 | double *dest, int32_t destCapacity, |
449 | UErrorCode& status); |
450 | |
451 | /** |
452 | * Returns TRUE if the given keyword is defined in this |
453 | * <code>PluralRules</code> object. |
454 | * |
455 | * @param keyword the input keyword. |
456 | * @return TRUE if the input keyword is defined. |
457 | * Otherwise, return FALSE. |
458 | * @stable ICU 4.0 |
459 | */ |
460 | UBool isKeyword(const UnicodeString& keyword) const; |
461 | |
462 | |
463 | /** |
464 | * Returns keyword for default plural form. |
465 | * |
466 | * @return keyword for default plural form. |
467 | * @stable ICU 4.0 |
468 | */ |
469 | UnicodeString getKeywordOther() const; |
470 | |
471 | #ifndef U_HIDE_INTERNAL_API |
472 | /** |
473 | * Returns the rules of this object as a UnicodeString; NOTE(review): presumably in the textual rule-description form - confirm. |
474 | * @internal |
475 | */ |
476 | UnicodeString getRules() const; |
477 | #endif /* U_HIDE_INTERNAL_API */ |
478 | |
479 | /** |
480 | * Compares the equality of two PluralRules objects. |
481 | * |
482 | * @param other The other PluralRules object to be compared with. |
483 | * @return True if the given PluralRules is the same as this |
484 | * PluralRules; false otherwise. |
485 | * @stable ICU 4.0 |
486 | */ |
487 | virtual UBool operator==(const PluralRules& other) const; |
488 | |
489 | /** |
490 | * Compares the inequality of two PluralRules objects. |
491 | * |
492 | * @param other The PluralRules object to be compared with. |
493 | * @return True if the given PluralRules is not the same as this |
494 | * PluralRules; false otherwise. |
495 | * @stable ICU 4.0 |
496 | */ |
497 | UBool operator!=(const PluralRules& other) const {return !operator==(other);} |
498 | |
499 | |
500 | /** |
501 | * ICU "poor man's RTTI", returns a UClassID for this class. |
502 | * |
503 | * @stable ICU 4.0 |
504 | * |
505 | */ |
506 | static UClassID U_EXPORT2 getStaticClassID(void); |
507 | |
508 | /** |
509 | * ICU "poor man's RTTI", returns a UClassID for the actual class. |
510 | * |
511 | * @stable ICU 4.0 |
512 | */ |
513 | virtual UClassID getDynamicClassID() const; |
514 | |
515 | |
516 | private: |
517 | RuleChain *mRules; /* NOTE(review): presumably the parsed rule chain consulted by select() - confirm */ |
518 | |
519 | PluralRules(); // default constructor not implemented |
520 | void parseDescription(const UnicodeString& ruleData, UErrorCode &status); /* NOTE(review): presumably parses ruleData into mRules - confirm */ |
521 | int32_t getNumberValue(const UnicodeString& token) const; /* NOTE(review): presumably converts a numeric token to its integer value - confirm */ |
522 | UnicodeString getRuleFromResource(const Locale& locale, UPluralType type, UErrorCode& status); /* NOTE(review): presumably fetches the rule text for locale/type from resource data - confirm */ |
523 | RuleChain *rulesForKeyword(const UnicodeString &keyword) const; /* NOTE(review): presumably locates the rule chain entry for keyword - confirm */ |
524 | |
525 | /** |
526 | * An internal status variable used to indicate that the object is in an 'invalid' state. |
527 | * Used by copy constructor, the assignment operator and the clone method. |
528 | */ |
529 | UErrorCode mInternalStatus; |
530 | |
531 | friend class PluralRuleParser; |
532 | }; |
533 | |
534 | U_NAMESPACE_END |
535 | |
536 | #endif /* #if !UCONFIG_NO_FORMATTING */ |
537 | |
538 | #endif /* U_SHOW_CPLUSPLUS_API */ |
539 | |
540 | #endif // PLURRULE |
541 | //eof |
542 | |