blob: 04bf3970ba08257d4ac4dfca0c1c5d258c46f904 [file] [log] [blame]
ross.kirsling@sony.com35a79bf2020-04-06 23:15:45 +00001// © 2016 and later: Unicode, Inc. and others.
2// License & terms of use: http://www.unicode.org/copyright.html
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +00003/*
4*******************************************************************************
5* Copyright (C) 2008-2015, International Business Machines Corporation and
6* others. All Rights Reserved.
7*******************************************************************************
8*
9*
10* File PLURRULE.H
11*
12* Modification History:*
13* Date Name Description
14*
15********************************************************************************
16*/
17
18#ifndef PLURRULE
19#define PLURRULE
20
21#include "unicode/utypes.h"
22
23/**
24 * \file
25 * \brief C++ API: PluralRules object
26 */
27
28#if !UCONFIG_NO_FORMATTING
29
30#include "unicode/format.h"
31#include "unicode/upluralrules.h"
ross.kirsling@sony.com35a79bf2020-04-06 23:15:45 +000032#ifndef U_HIDE_INTERNAL_API
33#include "unicode/numfmt.h"
34#endif /* U_HIDE_INTERNAL_API */
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +000035
36/**
37 * Value returned by PluralRules::getUniqueKeywordValue() when there is no
38 * unique value to return.
 * Note that PluralRules::getUniqueKeywordValue() is deprecated (ICU 55) and is
 * documented as a stub that always returns this constant.
39 * @stable ICU 4.8
40 */
41#define UPLRULES_NO_UNIQUE_VALUE ((double)-0.00123456777)
42
43U_NAMESPACE_BEGIN
44
// Forward declarations: this header only needs these names, not the full
// definitions. NOTE(review): the definitions presumably live in ICU-internal
// headers/sources — confirm.
45class Hashtable;
ross.kirsling@sony.com35a79bf2020-04-06 23:15:45 +000046class IFixedDecimal;
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +000047class RuleChain;
48class PluralRuleParser;
49class PluralKeywordEnumeration;
50class AndConstraint;
51class SharedPluralRules;
52
// Forward declaration of number::FormattedNumber, taken by reference in
// PluralRules::select(const number::FormattedNumber&, UErrorCode&).
ysuzuki@apple.com900fa162021-10-02 04:38:45 +000053namespace number {
54class FormattedNumber;
55}
56
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +000057/**
58 * Defines rules for mapping non-negative numeric values onto a small set of
59 * keywords. Rules are constructed from a text description, consisting
60 * of a series of keywords and conditions. The {@link #select} method
61 * examines each condition in order and returns the keyword for the
62 * first condition that matches the number. If none match,
63 * the default rule ("other") is returned.
64 *
65 * For more information, details, and tips for writing rules, see the
66 * LDML spec, C.11 Language Plural Rules:
67 * http://www.unicode.org/draft/reports/tr35/tr35.html#Language_Plural_Rules
68 *
69 * Examples:<pre>
70 * "one: n is 1; few: n in 2..4"</pre>
71 * This defines two rules, for 'one' and 'few'. The condition for
72 * 'one' is "n is 1" which means that the number must be equal to
73 * 1 for this condition to pass. The condition for 'few' is
74 * "n in 2..4" which means that the number must be between 2 and
75 * 4 inclusive for this condition to pass. All other numbers
76 * are assigned the keyword "other" by the default rule.
77 * </p><pre>
78 * "zero: n is 0; one: n is 1; zero: n mod 100 in 1..19"</pre>
79 * This illustrates that the same keyword can be defined multiple times.
80 * Each rule is examined in order, and the first keyword whose condition
81 * passes is the one returned. Also note that a modulus is applied
82 * to n in the last rule. Thus its condition holds for 119, 219, 319...
83 * </p><pre>
84 * "one: n is 1; few: n mod 10 in 2..4 and n mod 100 not in 12..14"</pre>
85 * This illustrates conjunction and negation. The condition for 'few'
86 * has two parts, both of which must be met: "n mod 10 in 2..4" and
87 * "n mod 100 not in 12..14". The first part applies a modulus to n
88 * before the test as in the previous example. The second part applies
89 * a different modulus and also uses negation, thus it matches all
90 * numbers _not_ in 12, 13, 14, 112, 113, 114, 212, 213, 214...
91 * </p>
92 * <p>
93 * Syntax:<pre>
94 * \code
95 * rules = rule (';' rule)*
96 * rule = keyword ':' condition
97 * keyword = <identifier>
98 * condition = and_condition ('or' and_condition)*
99 * and_condition = relation ('and' relation)*
100 * relation = is_relation | in_relation | within_relation | 'n' <EOL>
101 * is_relation = expr 'is' ('not')? value
102 * in_relation = expr ('not')? 'in' range_list
103 * within_relation = expr ('not')? 'within' range
104 * expr = ('n' | 'i' | 'f' | 'v' | 'j') ('mod' value)?
105 * range_list = (range | value) (',' range_list)*
106 * value = digit+ ('.' digit+)?
107 * digit = 0|1|2|3|4|5|6|7|8|9
108 * range = value'..'value
109 * \endcode
110 * </pre></p>
111 *
112 * <p>
113 * The i, f, and v values are defined as follows:
114 * </p>
115 * <ul>
116 * <li>i to be the integer digits.</li>
117 * <li>f to be the visible fractional digits, as an integer.</li>
118 * <li>v to be the number of visible fraction digits.</li>
119 * <li>j is defined to only match integers. That is, "j is 3" fails if v != 0 (e.g., for 3.1 or 3.0).</li>
120 * </ul>
121 * <p>
122 * Examples are in the following table:
123 * </p>
124 * <table border='1' style="border-collapse:collapse">
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +0000125 * <tr>
126 * <th>n</th>
127 * <th>i</th>
128 * <th>f</th>
129 * <th>v</th>
130 * </tr>
131 * <tr>
132 * <td>1.0</td>
133 * <td>1</td>
134 * <td align="right">0</td>
135 * <td>1</td>
136 * </tr>
137 * <tr>
138 * <td>1.00</td>
139 * <td>1</td>
140 * <td align="right">0</td>
141 * <td>2</td>
142 * </tr>
143 * <tr>
144 * <td>1.3</td>
145 * <td>1</td>
146 * <td align="right">3</td>
147 * <td>1</td>
148 * </tr>
149 * <tr>
150 * <td>1.03</td>
151 * <td>1</td>
152 * <td align="right">3</td>
153 * <td>2</td>
154 * </tr>
155 * <tr>
156 * <td>1.23</td>
157 * <td>1</td>
158 * <td align="right">23</td>
159 * <td>2</td>
160 * </tr>
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +0000161 * </table>
162 * <p>
163 * The difference between 'in' and 'within' is that 'in' only includes integers in the specified range, while 'within'
164 * includes all values. Using 'within' with a range_list consisting entirely of values is the same as using 'in' (it's
165 * not an error).
166 * </p>
167
168 * An "identifier" is a sequence of characters that do not have the
169 * Unicode Pattern_Syntax or Pattern_White_Space properties.
170 * <p>
171 * The difference between 'in' and 'within' is that 'in' only includes
172 * integers in the specified range, while 'within' includes all values.
173 * Using 'within' with a range_list consisting entirely of values is the
174 * same as using 'in' (it's not an error).
175 *</p>
176 * <p>
177 * Keywords
178 * could be defined by users or from ICU locale data. There are 6
179 * predefined values in ICU - 'zero', 'one', 'two', 'few', 'many' and
180 * 'other'. Callers need to check the value of keyword returned by
181 * {@link #select} method.
182 * </p>
183 *
184 * Examples:<pre>
185 * UnicodeString keyword = pl->select(number);
186 * if (keyword == UnicodeString("one")) {
187 * ...
188 * }
189 * else if ( ... )
190 * </pre>
191 * <strong>Note:</strong><br>
192 * <p>
193 * ICU defines plural rules for many locales based on CLDR <i>Language Plural Rules</i>.
194 * For these predefined rules, see CLDR page at
195 * http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html
196 * </p>
197 */
198class U_I18N_API PluralRules : public UObject {
199public:
200
201 /**
202 * Constructor.
203 * @param status Output param set to success/failure code on exit, which
204 * must not indicate a failure before the function call.
205 *
206 * @stable ICU 4.0
207 */
208 PluralRules(UErrorCode& status);
209
210 /**
211 * Copy constructor.
212 * @stable ICU 4.0
213 */
214 PluralRules(const PluralRules& other);
215
216 /**
217 * Destructor.
218 * @stable ICU 4.0
219 */
220 virtual ~PluralRules();
221
222 /**
223 * Clone: returns a pointer to a copy of this object.
 * NOTE(review): presumably the caller owns (and must delete) the returned
 * object — confirm against the implementation.
224 * @stable ICU 4.0
225 */
226 PluralRules* clone() const;
227
228 /**
229 * Assignment operator.
230 * @stable ICU 4.0
231 */
232 PluralRules& operator=(const PluralRules&);
233
234 /**
235 * Creates a PluralRules from a description if it is parsable, otherwise
236 * returns NULL.
237 *
238 * @param description rule description
239 * @param status Output param set to success/failure code on exit, which
240 * must not indicate a failure before the function call.
241 * @return new PluralRules pointer. NULL if there is an error.
242 * @stable ICU 4.0
243 */
244 static PluralRules* U_EXPORT2 createRules(const UnicodeString& description,
245 UErrorCode& status);
246
247 /**
248 * The default rules that accept any number.
249 *
250 * @param status Output param set to success/failure code on exit, which
251 * must not indicate a failure before the function call.
252 * @return new PluralRules pointer. NULL if there is an error.
253 * @stable ICU 4.0
254 */
255 static PluralRules* U_EXPORT2 createDefaultRules(UErrorCode& status);
256
257 /**
258 * Provides access to the predefined cardinal-number <code>PluralRules</code> for a given
259 * locale.
260 * Same as forLocale(locale, UPLURAL_TYPE_CARDINAL, status).
261 *
262 * @param locale The locale for which a <code>PluralRules</code> object is
263 * returned.
264 * @param status Output param set to success/failure code on exit, which
265 * must not indicate a failure before the function call.
266 * @return The predefined <code>PluralRules</code> object pointer for
267 * this locale. If there's no predefined rules for this locale,
268 * the rules for the closest parent in the locale hierarchy
269 * that has one will be returned. The final fallback always
270 * returns the default 'other' rules.
271 * @stable ICU 4.0
272 */
273 static PluralRules* U_EXPORT2 forLocale(const Locale& locale, UErrorCode& status);
274
275 /**
276 * Provides access to the predefined <code>PluralRules</code> for a given
277 * locale and the plural type.
278 *
279 * @param locale The locale for which a <code>PluralRules</code> object is
280 * returned.
281 * @param type The plural type (e.g., cardinal or ordinal).
282 * @param status Output param set to success/failure code on exit, which
283 * must not indicate a failure before the function call.
284 * @return The predefined <code>PluralRules</code> object pointer for
285 * this locale. If there's no predefined rules for this locale,
286 * the rules for the closest parent in the locale hierarchy
287 * that has one will be returned. The final fallback always
288 * returns the default 'other' rules.
289 * @stable ICU 50
290 */
291 static PluralRules* U_EXPORT2 forLocale(const Locale& locale, UPluralType type, UErrorCode& status);
292
293#ifndef U_HIDE_INTERNAL_API
294 /**
295 * Return a StringEnumeration over the locales for which there is plurals data.
 * @param status Output param set to success/failure code on exit.
296 * @return a StringEnumeration over the locales available.
297 * @internal
298 */
299 static StringEnumeration* U_EXPORT2 getAvailableLocales(UErrorCode &status);
300
301 /**
302 * Returns whether or not there are overrides.
303 * @param locale the locale to check.
304 * @return whether or not there are overrides for the given locale.
305 * @internal
306 */
307 static UBool hasOverride(const Locale &locale);
308
309 /**
310 * For ICU use only.
311 * creates a SharedPluralRules object
 * NOTE(review): the declared return type is PluralRules*, not
 * SharedPluralRules* — confirm which of the two this comment should describe.
312 * @internal
313 */
314 static PluralRules* U_EXPORT2 internalForLocale(const Locale& locale, UPluralType type, UErrorCode& status);
315
316 /**
317 * For ICU use only.
318 * Returns handle to the shared, cached PluralRules instance.
319 * Caller must call removeRef() on returned value once it is done with
320 * the shared instance.
321 * @internal
322 */
323 static const SharedPluralRules* U_EXPORT2 createSharedInstance(
324 const Locale& locale, UPluralType type, UErrorCode& status);
325
326
327#endif /* U_HIDE_INTERNAL_API */
328
329 /**
ysuzuki@apple.com900fa162021-10-02 04:38:45 +0000330 * Given an integer, returns the keyword of the first rule
331 * that applies to the number. This function can be used with
332 * isKeyword* functions to determine the keyword for default plural rules.
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +0000333 *
334 * @param number The number for which the rule has to be determined.
335 * @return The keyword of the selected rule.
336 * @stable ICU 4.0
337 */
338 UnicodeString select(int32_t number) const;
339
340 /**
ysuzuki@apple.com900fa162021-10-02 04:38:45 +0000341 * Given a floating-point number, returns the keyword of the first rule
342 * that applies to the number. This function can be used with
343 * isKeyword* functions to determine the keyword for default plural rules.
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +0000344 *
345 * @param number The number for which the rule has to be determined.
346 * @return The keyword of the selected rule.
347 * @stable ICU 4.0
348 */
349 UnicodeString select(double number) const;
350
ysuzuki@apple.com900fa162021-10-02 04:38:45 +0000351#ifndef U_HIDE_DRAFT_API
352 /**
353 * Given a formatted number, returns the keyword of the first rule
354 * that applies to the number. This function can be used with
355 * isKeyword* functions to determine the keyword for default plural rules.
356 *
357 * A FormattedNumber allows you to specify an exponent or trailing zeros,
358 * which can affect the plural category. To get a FormattedNumber, see
359 * NumberFormatter.
360 *
361 * @param number The number for which the rule has to be determined.
362 * @param status Set if an error occurs while selecting plural keyword.
363 * This could happen if the FormattedNumber is invalid.
364 * @return The keyword of the selected rule.
365 * @draft ICU 64
366 */
367 UnicodeString select(const number::FormattedNumber& number, UErrorCode& status) const;
368#endif /* U_HIDE_DRAFT_API */
369
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +0000370#ifndef U_HIDE_INTERNAL_API
371 /**
 * Overload of select() that takes the number as an IFixedDecimal.
 * NOTE(review): presumably returns the keyword of the first matching rule,
 * like the public select() overloads — confirm against the implementation.
372 * @internal
373 */
ross.kirsling@sony.com35a79bf2020-04-06 23:15:45 +0000374 UnicodeString select(const IFixedDecimal &number) const;
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +0000375#endif /* U_HIDE_INTERNAL_API */
376
377 /**
378 * Returns a list of all rule keywords used in this <code>PluralRules</code>
379 * object. The rule 'other' is always present by default.
380 *
381 * @param status Output param set to success/failure code on exit, which
382 * must not indicate a failure before the function call.
383 * @return StringEnumeration with the keywords.
384 * The caller must delete the object.
385 * @stable ICU 4.0
386 */
387 StringEnumeration* getKeywords(UErrorCode& status) const;
388
389#ifndef U_HIDE_DEPRECATED_API
390 /**
391 * Deprecated Function, does not return useful results.
392 *
393 * Originally intended to return a unique value for this keyword if it exists,
394 * else the constant UPLRULES_NO_UNIQUE_VALUE.
395 *
396 * @param keyword The keyword.
397 * @return Stub deprecated function returns UPLRULES_NO_UNIQUE_VALUE always.
398 * @deprecated ICU 55
399 */
400 double getUniqueKeywordValue(const UnicodeString& keyword);
401
402 /**
403 * Deprecated Function, does not produce useful results.
404 *
ross.kirsling@sony.com35a79bf2020-04-06 23:15:45 +0000405 * Originally intended to return all the values for which select() would return the keyword.
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +0000406 * If the keyword is unknown, returns no values, but this is not an error. If
407 * the number of values is unlimited, returns no values and -1 as the
408 * count.
409 *
410 * The number of returned values is typically small.
411 *
412 * @param keyword The keyword.
413 * @param dest Array into which to put the returned values. May
414 * be NULL if destCapacity is 0.
415 * @param destCapacity The capacity of the array, must be at least 0.
416 * @param status The error code. Deprecated function, always sets U_UNSUPPORTED_ERROR.
417 * @return The count of values available, or -1. This count
418 * can be larger than destCapacity, but no more than
419 * destCapacity values will be written.
420 * @deprecated ICU 55
421 */
422 int32_t getAllKeywordValues(const UnicodeString &keyword,
423 double *dest, int32_t destCapacity,
424 UErrorCode& status);
425#endif /* U_HIDE_DEPRECATED_API */
426
427 /**
428 * Returns sample values for which select() would return the keyword. If
429 * the keyword is unknown, returns no values, but this is not an error.
430 *
431 * The number of returned values is typically small.
432 *
433 * @param keyword The keyword.
434 * @param dest Array into which to put the returned values. May
435 * be NULL if destCapacity is 0.
436 * @param destCapacity The capacity of the array, must be at least 0.
437 * @param status The error code.
438 * @return The count of values written.
439 * If more than destCapacity samples are available, then
440 * only destCapacity are written, and destCapacity is returned as the count,
441 * rather than setting a U_BUFFER_OVERFLOW_ERROR.
442 * (The actual number of keyword values could be unlimited.)
443 * @stable ICU 4.8
444 */
445 int32_t getSamples(const UnicodeString &keyword,
446 double *dest, int32_t destCapacity,
447 UErrorCode& status);
448
449 /**
450 * Returns TRUE if the given keyword is defined in this
451 * <code>PluralRules</code> object.
452 *
453 * @param keyword the input keyword.
454 * @return TRUE if the input keyword is defined.
455 * Otherwise, return FALSE.
456 * @stable ICU 4.0
457 */
458 UBool isKeyword(const UnicodeString& keyword) const;
459
460
461 /**
462 * Returns keyword for default plural form.
463 *
464 * @return keyword for default plural form.
465 * @stable ICU 4.0
466 */
467 UnicodeString getKeywordOther() const;
468
469#ifndef U_HIDE_INTERNAL_API
470 /**
471 * Returns the rules of this object as a UnicodeString.
 * NOTE(review): presumably in the rule-description syntax accepted by
 * createRules() — confirm against the implementation.
472 * @internal
473 */
474 UnicodeString getRules() const;
475#endif /* U_HIDE_INTERNAL_API */
476
477 /**
478 * Compares the equality of two PluralRules objects.
479 *
480 * @param other The other PluralRules object to be compared with.
481 * @return True if the given PluralRules is the same as this
482 * PluralRules; false otherwise.
483 * @stable ICU 4.0
484 */
485 virtual UBool operator==(const PluralRules& other) const;
486
487 /**
488 * Compares the inequality of two PluralRules objects.
 * Implemented inline as the negation of operator==.
489 *
490 * @param other The PluralRules object to be compared with.
491 * @return True if the given PluralRules is not the same as this
492 * PluralRules; false otherwise.
493 * @stable ICU 4.0
494 */
495 UBool operator!=(const PluralRules& other) const {return !operator==(other);}
496
497
498 /**
499 * ICU "poor man's RTTI", returns a UClassID for this class.
500 *
501 * @stable ICU 4.0
502 *
503 */
504 static UClassID U_EXPORT2 getStaticClassID(void);
505
506 /**
507 * ICU "poor man's RTTI", returns a UClassID for the actual class.
508 *
509 * @stable ICU 4.0
510 */
511 virtual UClassID getDynamicClassID() const;
512
513
514private:
 // NOTE(review): presumably the parsed rule chain that backs this object — confirm.
515 RuleChain *mRules;
516
517 PluralRules(); // default constructor not implemented
 // Private helpers; their behavior is defined in the implementation file,
 // which is not visible from this header.
518 void parseDescription(const UnicodeString& ruleData, UErrorCode &status);
519 int32_t getNumberValue(const UnicodeString& token) const;
520 UnicodeString getRuleFromResource(const Locale& locale, UPluralType type, UErrorCode& status);
521 RuleChain *rulesForKeyword(const UnicodeString &keyword) const;
522
ysuzuki@apple.com900fa162021-10-02 04:38:45 +0000523 /**
524 * An internal status variable used to indicate that the object is in an 'invalid' state.
525 * Used by copy constructor, the assignment operator and the clone method.
526 */
527 UErrorCode mInternalStatus;
528
 // PluralRuleParser is granted access to the private members above.
mmaxfield@apple.comfa99daa2017-07-05 21:13:19 +0000529 friend class PluralRuleParser;
530};
531
532U_NAMESPACE_END
533
534#endif /* #if !UCONFIG_NO_FORMATTING */
535
536#endif // PLURRULE
537//eof