// © 2016 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
/*
*******************************************************************************
* Copyright (C) 2008-2015, International Business Machines Corporation and
* others. All Rights Reserved.
*******************************************************************************
*
*
* File PLURRULE.H
*
* Modification History:*
*   Date        Name        Description
*
********************************************************************************
*/

#ifndef PLURRULE
#define PLURRULE

#include "unicode/utypes.h"

#if U_SHOW_CPLUSPLUS_API

/**
 * \file
 * \brief C++ API: PluralRules object
 */

#if !UCONFIG_NO_FORMATTING

#include "unicode/format.h"
#include "unicode/upluralrules.h"
#ifndef U_HIDE_INTERNAL_API
#include "unicode/numfmt.h"
#endif  /* U_HIDE_INTERNAL_API */

/**
 * Value returned by PluralRules::getUniqueKeywordValue() when there is no
 * unique value to return.
 * @stable ICU 4.8
 */
#define UPLRULES_NO_UNIQUE_VALUE ((double)-0.00123456777)

U_NAMESPACE_BEGIN

class Hashtable;
class IFixedDecimal;
class RuleChain;
class PluralRuleParser;
class PluralKeywordEnumeration;
class AndConstraint;
class SharedPluralRules;

namespace number {
class FormattedNumber;
}

/**
 * Defines rules for mapping non-negative numeric values onto a small set of
 * keywords. Rules are constructed from a text description, consisting
 * of a series of keywords and conditions.  The {@link #select} method
 * examines each condition in order and returns the keyword for the
 * first condition that matches the number.  If none match,
 * the default rule (other) is returned.
 *
 * For more information, details, and tips for writing rules, see the
 * LDML spec, C.11 Language Plural Rules:
 * http://www.unicode.org/draft/reports/tr35/tr35.html#Language_Plural_Rules
 *
 * Examples:<pre>
 *   "one: n is 1; few: n in 2..4"</pre>
 *  This defines two rules, for 'one' and 'few'.  The condition for
 *  'one' is "n is 1" which means that the number must be equal to
 *  1 for this condition to pass.  The condition for 'few' is
 *  "n in 2..4" which means that the number must be between 2 and
 *  4 inclusive for this condition to pass.  All other numbers
 *  are assigned the keyword "other" by the default rule.
 *  </p><pre>
 *    "zero: n is 0; one: n is 1; zero: n mod 100 in 1..19"</pre>
 *  This illustrates that the same keyword can be defined multiple times.
 *  Each rule is examined in order, and the first keyword whose condition
 *  passes is the one returned.  Also note that a modulus is applied
 *  to n in the last rule.  Thus its condition holds for 119, 219, 319...
 *  </p><pre>
 *    "one: n is 1; few: n mod 10 in 2..4 and n mod 100 not in 12..14"</pre>
 *  This illustrates conjunction and negation.  The condition for 'few'
 *  has two parts, both of which must be met: "n mod 10 in 2..4" and
 *  "n mod 100 not in 12..14".  The first part applies a modulus to n
 *  before the test as in the previous example.  The second part applies
 *  a different modulus and also uses negation, thus it matches all
 *  numbers _not_ in 12, 13, 14, 112, 113, 114, 212, 213, 214...
 *  </p>
 *  <p>
 * Syntax:<pre>
 * \code
 * rules         = rule (';' rule)*
 * rule          = keyword ':' condition
 * keyword       = <identifier>
 * condition     = and_condition ('or' and_condition)*
 * and_condition = relation ('and' relation)*
 * relation      = is_relation | in_relation | within_relation | 'n' <EOL>
 * is_relation   = expr 'is' ('not')? value
 * in_relation   = expr ('not')? 'in' range_list
 * within_relation = expr ('not')? 'within' range
 * expr          = ('n' | 'i' | 'f' | 'v' | 'j') ('mod' value)?
 * range_list    = (range | value) (',' range_list)*
 * value         = digit+  ('.' digit+)?
 * digit         = 0|1|2|3|4|5|6|7|8|9
 * range         = value'..'value
 * \endcode
 * </pre></p>
 * <p>
 *  The i, f, v, and j values are defined as follows:
 * </p>
 * <ul>
 * <li>i to be the integer digits.</li>
 * <li>f to be the visible fractional digits, as an integer.</li>
 * <li>v to be the number of visible fraction digits.</li>
 * <li>j is defined to only match integers. That is j is 3 fails if v != 0 (eg for 3.1 or 3.0).</li>
 * </ul>
 * <p>
 * Examples are in the following table:
 * </p>
 * <table border='1' style="border-collapse:collapse">
 * <tr>
 * <th>n</th>
 * <th>i</th>
 * <th>f</th>
 * <th>v</th>
 * </tr>
 * <tr>
 * <td>1.0</td>
 * <td>1</td>
 * <td align="right">0</td>
 * <td>1</td>
 * </tr>
 * <tr>
 * <td>1.00</td>
 * <td>1</td>
 * <td align="right">0</td>
 * <td>2</td>
 * </tr>
 * <tr>
 * <td>1.3</td>
 * <td>1</td>
 * <td align="right">3</td>
 * <td>1</td>
 * </tr>
 * <tr>
 * <td>1.03</td>
 * <td>1</td>
 * <td align="right">3</td>
 * <td>2</td>
 * </tr>
 * <tr>
 * <td>1.23</td>
 * <td>1</td>
 * <td align="right">23</td>
 * <td>2</td>
 * </tr>
 * </table>
 * <p>
 * The difference between 'in' and 'within' is that 'in' only includes integers in the specified range, while 'within'
 * includes all values. Using 'within' with a range_list consisting entirely of values is the same as using 'in' (it's
 * not an error).
 * </p>
 *
 * An "identifier" is a sequence of characters that do not have the
 * Unicode Pattern_Syntax or Pattern_White_Space properties.
 * <p>
 *  Keywords
 *  could be defined by users or from ICU locale data. There are 6
 *  predefined values in ICU - 'zero', 'one', 'two', 'few', 'many' and
 *  'other'. Callers need to check the value of keyword returned by
 *  {@link #select} method.
 *  </p>
 *
 * Examples:<pre>
 * UnicodeString keyword = pl->select(number);
 * if (keyword == UnicodeString("one")) {
 *     ...
 * }
 * else if ( ... )
 * </pre>
 * <strong>Note:</strong><br>
 *  <p>
 *   ICU defines plural rules for many locales based on CLDR <i>Language Plural Rules</i>.
 *   For these predefined rules, see CLDR page at
 *    http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html
 * </p>
 */
class U_I18N_API PluralRules : public UObject {
public:

    /**
     * Constructor.
     * @param status  Output param set to success/failure code on exit, which
     *                must not indicate a failure before the function call.
     *
     * @stable ICU 4.0
     */
    PluralRules(UErrorCode& status);

    /**
     * Copy constructor.
     * @stable ICU 4.0
     */
    PluralRules(const PluralRules& other);

    /**
     * Destructor.
     * @stable ICU 4.0
     */
    virtual ~PluralRules();

    /**
     * Clone.
     * NOTE(review): presumably returns a newly allocated copy of this object
     * that the caller must delete; ownership is not stated in this header -
     * confirm against the implementation.
     * @return a PluralRules pointer.
     * @stable ICU 4.0
     */
    PluralRules* clone() const;

    /**
      * Assignment operator.
      * @stable ICU 4.0
      */
    PluralRules& operator=(const PluralRules&);

    /**
     * Creates a PluralRules from a description if it is parsable, otherwise
     * returns NULL.
     *
     * @param description rule description
     * @param status      Output param set to success/failure code on exit, which
     *                    must not indicate a failure before the function call.
     * @return            new PluralRules pointer. NULL if there is an error.
     * @stable ICU 4.0
     */
    static PluralRules* U_EXPORT2 createRules(const UnicodeString& description,
                                              UErrorCode& status);

    /**
     * The default rules that accept any number.
     *
     * @param status  Output param set to success/failure code on exit, which
     *                must not indicate a failure before the function call.
     * @return        new PluralRules pointer. NULL if there is an error.
     * @stable ICU 4.0
     */
    static PluralRules* U_EXPORT2 createDefaultRules(UErrorCode& status);

    /**
     * Provides access to the predefined cardinal-number <code>PluralRules</code> for a given
     * locale.
     * Same as forLocale(locale, UPLURAL_TYPE_CARDINAL, status).
     *
     * @param locale  The locale for which a <code>PluralRules</code> object is
     *                returned.
     * @param status  Output param set to success/failure code on exit, which
     *                must not indicate a failure before the function call.
     * @return        The predefined <code>PluralRules</code> object pointer for
     *                this locale. If there's no predefined rules for this locale,
     *                the rules for the closest parent in the locale hierarchy
     *                that has one will  be returned.  The final fallback always
     *                returns the default 'other' rules.
     * @stable ICU 4.0
     */
    static PluralRules* U_EXPORT2 forLocale(const Locale& locale, UErrorCode& status);

    /**
     * Provides access to the predefined <code>PluralRules</code> for a given
     * locale and the plural type.
     *
     * @param locale  The locale for which a <code>PluralRules</code> object is
     *                returned.
     * @param type    The plural type (e.g., cardinal or ordinal).
     * @param status  Output param set to success/failure code on exit, which
     *                must not indicate a failure before the function call.
     * @return        The predefined <code>PluralRules</code> object pointer for
     *                this locale. If there's no predefined rules for this locale,
     *                the rules for the closest parent in the locale hierarchy
     *                that has one will  be returned.  The final fallback always
     *                returns the default 'other' rules.
     * @stable ICU 50
     */
    static PluralRules* U_EXPORT2 forLocale(const Locale& locale, UPluralType type, UErrorCode& status);

#ifndef U_HIDE_INTERNAL_API
    /**
     * Return a StringEnumeration over the locales for which there is plurals data.
     * @return a StringEnumeration over the locales available.
     * @internal
     */
    static StringEnumeration* U_EXPORT2 getAvailableLocales(UErrorCode &status);

    /**
     * Returns whether or not there are overrides.
     * @param locale       the locale to check.
     * @return             whether or not there are overrides for the given locale.
     * @internal
     */
    static UBool hasOverride(const Locale &locale);

    /**
     * For ICU use only.
     * creates a  SharedPluralRules object
     * NOTE(review): the description above mentions SharedPluralRules, but the
     * declared return type is PluralRules* - confirm which is intended.
     * @internal
     */
    static PluralRules* U_EXPORT2 internalForLocale(const Locale& locale, UPluralType type, UErrorCode& status);

    /**
     * For ICU use only.
     * Returns handle to the shared, cached PluralRules instance.
     * Caller must call removeRef() on returned value once it is done with
     * the shared instance.
     * @internal
     */
    static const SharedPluralRules* U_EXPORT2 createSharedInstance(
            const Locale& locale, UPluralType type, UErrorCode& status);


#endif  /* U_HIDE_INTERNAL_API */

    /**
     * Given an integer, returns the keyword of the first rule
     * that applies to the number.  This function can be used with
     * isKeyword* functions to determine the keyword for default plural rules.
     *
     * @param number  The number for which the rule has to be determined.
     * @return        The keyword of the selected rule.
     * @stable ICU 4.0
     */
    UnicodeString select(int32_t number) const;

    /**
     * Given a floating-point number, returns the keyword of the first rule
     * that applies to the number.  This function can be used with
     * isKeyword* functions to determine the keyword for default plural rules.
     *
     * @param number  The number for which the rule has to be determined.
     * @return        The keyword of the selected rule.
     * @stable ICU 4.0
     */
    UnicodeString select(double number) const;

#ifndef U_HIDE_DRAFT_API
    /**
     * Given a formatted number, returns the keyword of the first rule
     * that applies to the number.  This function can be used with
     * isKeyword* functions to determine the keyword for default plural rules.
     *
     * A FormattedNumber allows you to specify an exponent or trailing zeros,
     * which can affect the plural category. To get a FormattedNumber, see
     * NumberFormatter.
     *
     * @param number  The number for which the rule has to be determined.
     * @param status  Set if an error occurs while selecting plural keyword.
     *                This could happen if the FormattedNumber is invalid.
     * @return        The keyword of the selected rule.
     * @draft ICU 64
     */
    UnicodeString select(const number::FormattedNumber& number, UErrorCode& status) const;
#endif  /* U_HIDE_DRAFT_API */

#ifndef U_HIDE_INTERNAL_API
    /**
      * Overload of select() taking an IFixedDecimal.
      * NOTE(review): presumably follows the same contract as the other
      * select() overloads (keyword of the first matching rule) - confirm
      * against the implementation.
      *
      * @param number  The number for which the rule has to be determined.
      * @return        A UnicodeString; presumably the keyword of the selected rule.
      * @internal
      */
    UnicodeString select(const IFixedDecimal &number) const;
#endif  /* U_HIDE_INTERNAL_API */

    /**
     * Returns a list of all rule keywords used in this <code>PluralRules</code>
     * object.  The rule 'other' is always present by default.
     *
     * @param status Output param set to success/failure code on exit, which
     *               must not indicate a failure before the function call.
     * @return       StringEnumeration with the keywords.
     *               The caller must delete the object.
     * @stable ICU 4.0
     */
    StringEnumeration* getKeywords(UErrorCode& status) const;

#ifndef U_HIDE_DEPRECATED_API
    /**
     * Deprecated Function, does not return useful results.
     *
     * Originally intended to return a unique value for this keyword if it exists,
     * else the constant UPLRULES_NO_UNIQUE_VALUE.
     *
     * @param keyword The keyword.
     * @return        Stub deprecated function returns UPLRULES_NO_UNIQUE_VALUE always.
     * @deprecated ICU 55
     */
    double getUniqueKeywordValue(const UnicodeString& keyword);

    /**
     * Deprecated Function, does not produce useful results.
     *
     * Originally intended to return all the values for which select() would return the keyword.
     * If the keyword is unknown, returns no values, but this is not an error.  If
     * the number of values is unlimited, returns no values and -1 as the
     * count.
     *
     * The number of returned values is typically small.
     *
     * @param keyword      The keyword.
     * @param dest         Array into which to put the returned values.  May
     *                     be NULL if destCapacity is 0.
     * @param destCapacity The capacity of the array, must be at least 0.
     * @param status       The error code. Deprecated function, always sets U_UNSUPPORTED_ERROR.
     * @return             The count of values available, or -1.  This count
     *                     can be larger than destCapacity, but no more than
     *                     destCapacity values will be written.
     * @deprecated ICU 55
     */
    int32_t getAllKeywordValues(const UnicodeString &keyword,
                                double *dest, int32_t destCapacity,
                                UErrorCode& status);
#endif  /* U_HIDE_DEPRECATED_API */

    /**
     * Returns sample values for which select() would return the keyword.  If
     * the keyword is unknown, returns no values, but this is not an error.
     *
     * The number of returned values is typically small.
     *
     * @param keyword      The keyword.
     * @param dest         Array into which to put the returned values.  May
     *                     be NULL if destCapacity is 0.
     * @param destCapacity The capacity of the array, must be at least 0.
     * @param status       The error code.
     * @return             The count of values written.
     *                     If more than destCapacity samples are available, then
     *                     only destCapacity are written, and destCapacity is returned as the count,
     *                     rather than setting a U_BUFFER_OVERFLOW_ERROR.
     *                     (The actual number of keyword values could be unlimited.)
     * @stable ICU 4.8
     */
    int32_t getSamples(const UnicodeString &keyword,
                       double *dest, int32_t destCapacity,
                       UErrorCode& status);

    /**
     * Returns TRUE if the given keyword is defined in this
     * <code>PluralRules</code> object.
     *
     * @param keyword  the input keyword.
     * @return         TRUE if the input keyword is defined.
     *                 Otherwise, return FALSE.
     * @stable ICU 4.0
     */
    UBool isKeyword(const UnicodeString& keyword) const;


    /**
     * Returns keyword for default plural form.
     *
     * @return         keyword for default plural form.
     * @stable ICU 4.0
     */
    UnicodeString getKeywordOther() const;

#ifndef U_HIDE_INTERNAL_API
    /**
     * Returns the rules of this object as a UnicodeString.
     * NOTE(review): the exact format of the returned text is not visible in
     * this header - presumably a textual rule description; confirm against
     * the implementation.
     *
     * @return a UnicodeString.
     * @internal
     */
    UnicodeString getRules() const;
#endif  /* U_HIDE_INTERNAL_API */

    /**
     * Compares the equality of two PluralRules objects.
     *
     * @param other The other PluralRules object to be compared with.
     * @return      True if the given PluralRules is the same as this
     *              PluralRules; false otherwise.
     * @stable ICU 4.0
     */
    virtual UBool operator==(const PluralRules& other) const;

    /**
     * Compares the inequality of two PluralRules objects.
     * Implemented as the negation of operator==.
     *
     * @param other The PluralRules object to be compared with.
     * @return      True if the given PluralRules is not the same as this
     *              PluralRules; false otherwise.
     * @stable ICU 4.0
     */
    UBool operator!=(const PluralRules& other) const  {return !operator==(other);}


    /**
     * ICU "poor man's RTTI", returns a UClassID for this class.
     *
     * @stable ICU 4.0
     *
    */
    static UClassID U_EXPORT2 getStaticClassID(void);

    /**
     * ICU "poor man's RTTI", returns a UClassID for the actual class.
     *
     * @stable ICU 4.0
     */
    virtual UClassID getDynamicClassID() const;


private:
    // NOTE(review): presumably the parsed rule chain consulted by select();
    // ownership is not visible in this header - confirm.
    RuleChain  *mRules;

    PluralRules();   // default constructor not implemented

    // Private helpers, declared here and defined outside this header.
    void            parseDescription(const UnicodeString& ruleData, UErrorCode &status);
    int32_t         getNumberValue(const UnicodeString& token) const;
    UnicodeString   getRuleFromResource(const Locale& locale, UPluralType type, UErrorCode& status);
    RuleChain      *rulesForKeyword(const UnicodeString &keyword) const;

    /**
    * An internal status variable used to indicate that the object is in an 'invalid' state.
    * Used by copy constructor, the assignment operator and the clone method.
    */
    UErrorCode mInternalStatus;

    friend class PluralRuleParser;
};

U_NAMESPACE_END

#endif /* #if !UCONFIG_NO_FORMATTING */

#endif /* U_SHOW_CPLUSPLUS_API */

#endif // PLURRULE
//eof