]>
Commit | Line | Data |
---|---|---|
46f4442e A |
1 | /* |
2 | ******************************************************************************* | |
51004dcb | 3 | * Copyright (C) 2008-2013, International Business Machines Corporation and |
46f4442e A |
4 | * others. All Rights Reserved. |
5 | ******************************************************************************* | |
6 | * | |
7 | * | |
8 | * File PLURRULE.H | |
9 | * | |
10 | * Modification History:* | |
11 | * Date Name Description | |
12 | * | |
13 | ******************************************************************************** | |
14 | */ | |
15 | ||
16 | #ifndef PLURRULE | |
17 | #define PLURRULE | |
18 | ||
19 | #include "unicode/utypes.h" | |
20 | ||
21 | /** | |
22 | * \file | |
23 | * \brief C++ API: PluralRules object | |
24 | */ | |
25 | ||
26 | #if !UCONFIG_NO_FORMATTING | |
27 | ||
28 | #include "unicode/format.h" | |
51004dcb | 29 | #include "unicode/upluralrules.h" |
46f4442e | 30 | |
4388f060 A |
31 | /** |
32 | * Value returned by PluralRules::getUniqueKeywordValue() when there is no | |
33 | * unique value to return. | |
34 | * @stable ICU 4.8 | |
35 | */ | |
36 | #define UPLRULES_NO_UNIQUE_VALUE ((double)-0.00123456777) | |
37 | ||
46f4442e A |
38 | U_NAMESPACE_BEGIN |
39 | ||
40 | class Hashtable; | |
41 | class RuleChain; | |
42 | class RuleParser; | |
4388f060 | 43 | class PluralKeywordEnumeration; |
46f4442e A |
44 | |
45 | /** | |
4388f060 | 46 | * Defines rules for mapping non-negative numeric values onto a small set of |
46f4442e A |
47 | * keywords. Rules are constructed from a text description, consisting |
48 | * of a series of keywords and conditions. The {@link #select} method | |
49 | * examines each condition in order and returns the keyword for the | |
50 | * first condition that matches the number. If none match, | |
51 | * default rule(other) is returned. | |
52 | * | |
4388f060 A |
53 | * For more information, details, and tips for writing rules, see the |
54 | * LDML spec, C.11 Language Plural Rules: | |
55 | * http://www.unicode.org/draft/reports/tr35/tr35.html#Language_Plural_Rules | |
56 | * | |
46f4442e A |
57 | * Examples:<pre> |
58 | * "one: n is 1; few: n in 2..4"</pre> | |
59 | * This defines two rules, for 'one' and 'few'. The condition for | |
60 | * 'one' is "n is 1" which means that the number must be equal to | |
61 | * 1 for this condition to pass. The condition for 'few' is | |
62 | * "n in 2..4" which means that the number must be between 2 and | |
63 | * 4 inclusive for this condition to pass. All other numbers | |
64 | * are assigned the keyword "other" by the default rule. | |
65 | * </p><pre> | |
66 | * "zero: n is 0; one: n is 1; zero: n mod 100 in 1..19"</pre> | |
67 | * This illustrates that the same keyword can be defined multiple times. | |
68 | * Each rule is examined in order, and the first keyword whose condition | |
69 | * passes is the one returned. Also notes that a modulus is applied | |
70 | * to n in the last rule. Thus its condition holds for 119, 219, 319... | |
71 | * </p><pre> | |
72 | * "one: n is 1; few: n mod 10 in 2..4 and n mod 100 not in 12..14"</pre> | |
73 | * This illustrates conjunction and negation. The condition for 'few' | |
74 | * has two parts, both of which must be met: "n mod 10 in 2..4" and | |
75 | * "n mod 100 not in 12..14". The first part applies a modulus to n | |
76 | * before the test as in the previous example. The second part applies | |
77 | * a different modulus and also uses negation, thus it matches all | |
78 | * numbers _not_ in 12, 13, 14, 112, 113, 114, 212, 213, 214... | |
79 | * </p> | |
80 | * <p> | |
81 | * Syntax:<pre> | |
729e4ab9 | 82 | * \code |
46f4442e A |
83 | * rules = rule (';' rule)* |
84 | * rule = keyword ':' condition | |
85 | * keyword = <identifier> | |
86 | * condition = and_condition ('or' and_condition)* | |
87 | * and_condition = relation ('and' relation)* | |
88 | * relation = is_relation | in_relation | within_relation | 'n' <EOL> | |
89 | * is_relation = expr 'is' ('not')? value | |
4388f060 | 90 | * in_relation = expr ('not')? 'in' range_list |
46f4442e A |
91 | * within_relation = expr ('not')? 'within' range |
92 | * expr = 'n' ('mod' value)? | |
4388f060 | 93 | * range_list = (range | value) (',' range_list)* |
46f4442e A |
94 | * value = digit+ |
95 | * digit = 0|1|2|3|4|5|6|7|8|9 | |
96 | * range = value'..'value | |
729e4ab9 | 97 | * \endcode |
46f4442e A |
98 | * </pre></p> |
99 | * <p> | |
4388f060 A |
100 | * An "identifier" is a sequence of characters that do not have the |
101 | * Unicode Pattern_Syntax or Pattern_White_Space properties. | |
102 | * <p> | |
103 | * The difference between 'in' and 'within' is that 'in' only includes | |
104 | * integers in the specified range, while 'within' includes all values.</p> | |
105 | * <p> | |
106 | * Keywords | |
107 | * could be defined by users or from ICU locale data. There are 6 | |
108 | * predefined values in ICU - 'zero', 'one', 'two', 'few', 'many' and | |
109 | * 'other'. Callers need to check the value of keyword returned by | |
110 | * {@link #select} method. | |
111 | * </p> | |
46f4442e A |
112 | * |
113 | * Examples:<pre> | |
114 | * UnicodeString keyword = pl->select(number); | |
115 | * if (keyword== UnicodeString("one") { | |
116 | * ... | |
117 | * } | |
118 | * else if ( ... ) | |
119 | * </pre> | |
729e4ab9 A |
120 | * <strong>Note:</strong><br> |
121 | * <p> | |
122 | * ICU defines plural rules for many locales based on CLDR <i>Language Plural Rules</i>. | |
4388f060 | 123 | * For these predefined rules, see CLDR page at |
729e4ab9 A |
124 | * http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html |
125 | * </p> | |
46f4442e A |
126 | */ |
127 | class U_I18N_API PluralRules : public UObject { | |
128 | public: | |
129 | ||
130 | /** | |
131 | * Constructor. | |
132 | * @param status Output param set to success/failure code on exit, which | |
133 | * must not indicate a failure before the function call. | |
134 | * | |
729e4ab9 | 135 | * @stable ICU 4.0 |
46f4442e A |
136 | */ |
137 | PluralRules(UErrorCode& status); | |
138 | ||
139 | /** | |
140 | * Copy constructor. | |
729e4ab9 | 141 | * @stable ICU 4.0 |
46f4442e A |
142 | */ |
143 | PluralRules(const PluralRules& other); | |
144 | ||
145 | /** | |
146 | * Destructor. | |
729e4ab9 | 147 | * @stable ICU 4.0 |
46f4442e A |
148 | */ |
149 | virtual ~PluralRules(); | |
150 | ||
151 | /** | |
152 | * Clone | |
729e4ab9 | 153 | * @stable ICU 4.0 |
46f4442e A |
154 | */ |
155 | PluralRules* clone() const; | |
156 | ||
157 | /** | |
158 | * Assignment operator. | |
729e4ab9 | 159 | * @stable ICU 4.0 |
46f4442e A |
160 | */ |
161 | PluralRules& operator=(const PluralRules&); | |
162 | ||
163 | /** | |
164 | * Creates a PluralRules from a description if it is parsable, otherwise | |
4388f060 | 165 | * returns NULL. |
46f4442e A |
166 | * |
167 | * @param description rule description | |
168 | * @param status Output param set to success/failure code on exit, which | |
169 | * must not indicate a failure before the function call. | |
170 | * @return new PluralRules pointer. NULL if there is an error. | |
729e4ab9 | 171 | * @stable ICU 4.0 |
46f4442e A |
172 | */ |
173 | static PluralRules* U_EXPORT2 createRules(const UnicodeString& description, | |
174 | UErrorCode& status); | |
175 | ||
176 | /** | |
177 | * The default rules that accept any number. | |
178 | * | |
179 | * @param status Output param set to success/failure code on exit, which | |
180 | * must not indicate a failure before the function call. | |
181 | * @return new PluralRules pointer. NULL if there is an error. | |
729e4ab9 | 182 | * @stable ICU 4.0 |
46f4442e A |
183 | */ |
184 | static PluralRules* U_EXPORT2 createDefaultRules(UErrorCode& status); | |
185 | ||
186 | /** | |
51004dcb | 187 | * Provides access to the predefined cardinal-number <code>PluralRules</code> for a given |
46f4442e | 188 | * locale. |
51004dcb | 189 | * Same as forLocale(locale, UPLURAL_TYPE_CARDINAL, status). |
46f4442e A |
190 | * |
191 | * @param locale The locale for which a <code>PluralRules</code> object is | |
192 | * returned. | |
193 | * @param status Output param set to success/failure code on exit, which | |
194 | * must not indicate a failure before the function call. | |
195 | * @return The predefined <code>PluralRules</code> object pointer for | |
196 | * this locale. If there's no predefined rules for this locale, | |
197 | * the rules for the closest parent in the locale hierarchy | |
198 | * that has one will be returned. The final fallback always | |
199 | * returns the default 'other' rules. | |
729e4ab9 | 200 | * @stable ICU 4.0 |
46f4442e A |
201 | */ |
202 | static PluralRules* U_EXPORT2 forLocale(const Locale& locale, UErrorCode& status); | |
4388f060 | 203 | |
51004dcb A |
204 | #ifndef U_HIDE_DRAFT_API |
205 | /** | |
206 | * Provides access to the predefined <code>PluralRules</code> for a given | |
207 | * locale and the plural type. | |
208 | * | |
209 | * @param locale The locale for which a <code>PluralRules</code> object is | |
210 | * returned. | |
211 | * @param type The plural type (e.g., cardinal or ordinal). | |
212 | * @param status Output param set to success/failure code on exit, which | |
213 | * must not indicate a failure before the function call. | |
214 | * @return The predefined <code>PluralRules</code> object pointer for | |
215 | * this locale. If there's no predefined rules for this locale, | |
216 | * the rules for the closest parent in the locale hierarchy | |
217 | * that has one will be returned. The final fallback always | |
218 | * returns the default 'other' rules. | |
219 | * @draft ICU 50 | |
220 | */ | |
221 | static PluralRules* U_EXPORT2 forLocale(const Locale& locale, UPluralType type, UErrorCode& status); | |
222 | #endif /* U_HIDE_DRAFT_API */ | |
223 | ||
46f4442e A |
224 | /** |
225 | * Given a number, returns the keyword of the first rule that applies to | |
226 | * the number. This function can be used with isKeyword* functions to | |
227 | * determine the keyword for default plural rules. | |
228 | * | |
229 | * @param number The number for which the rule has to be determined. | |
230 | * @return The keyword of the selected rule. | |
729e4ab9 | 231 | * @stable ICU 4.0 |
46f4442e A |
232 | */ |
233 | UnicodeString select(int32_t number) const; | |
4388f060 | 234 | |
46f4442e A |
235 | /** |
236 | * Given a number, returns the keyword of the first rule that applies to | |
237 | * the number. This function can be used with isKeyword* functions to | |
238 | * determine the keyword for default plural rules. | |
239 | * | |
240 | * @param number The number for which the rule has to be determined. | |
241 | * @return The keyword of the selected rule. | |
729e4ab9 | 242 | * @stable ICU 4.0 |
46f4442e A |
243 | */ |
244 | UnicodeString select(double number) const; | |
245 | ||
246 | /** | |
247 | * Returns a list of all rule keywords used in this <code>PluralRules</code> | |
248 | * object. The rule 'other' is always present by default. | |
249 | * | |
250 | * @param status Output param set to success/failure code on exit, which | |
251 | * must not indicate a failure before the function call. | |
252 | * @return StringEnumeration with the keywords. | |
253 | * The caller must delete the object. | |
729e4ab9 | 254 | * @stable ICU 4.0 |
46f4442e A |
255 | */ |
256 | StringEnumeration* getKeywords(UErrorCode& status) const; | |
257 | ||
4388f060 A |
258 | /** |
259 | * Returns a unique value for this keyword if it exists, else the constant | |
260 | * UPLRULES_NO_UNIQUE_VALUE. | |
261 | * | |
262 | * @param keyword The keyword. | |
263 | * @return The unique value that generates the keyword, or | |
264 | * UPLRULES_NO_UNIQUE_VALUE if the keyword is undefined or there is no | |
265 | * unique value that generates this keyword. | |
266 | * @stable ICU 4.8 | |
267 | */ | |
268 | double getUniqueKeywordValue(const UnicodeString& keyword); | |
269 | ||
270 | /** | |
271 | * Returns all the values for which select() would return the keyword. If | |
272 | * the keyword is unknown, returns no values, but this is not an error. If | |
273 | * the number of values is unlimited, returns no values and -1 as the | |
274 | * count. | |
275 | * | |
276 | * The number of returned values is typically small. | |
277 | * | |
278 | * @param keyword The keyword. | |
279 | * @param dest Array into which to put the returned values. May | |
280 | * be NULL if destCapacity is 0. | |
281 | * @param destCapacity The capacity of the array, must be at least 0. | |
282 | * @param status The error code. | |
283 | * @return The count of values available, or -1. This count | |
284 | * can be larger than destCapacity, but no more than | |
285 | * destCapacity values will be written. | |
286 | * @stable ICU 4.8 | |
287 | */ | |
288 | int32_t getAllKeywordValues(const UnicodeString &keyword, | |
289 | double *dest, int32_t destCapacity, | |
290 | UErrorCode& status); | |
291 | ||
292 | /** | |
293 | * Returns sample values for which select() would return the keyword. If | |
294 | * the keyword is unknown, returns no values, but this is not an error. | |
295 | * | |
296 | * The number of returned values is typically small. | |
297 | * | |
298 | * @param keyword The keyword. | |
299 | * @param dest Array into which to put the returned values. May | |
300 | * be NULL if destCapacity is 0. | |
301 | * @param destCapacity The capacity of the array, must be at least 0. | |
302 | * @param status The error code. | |
303 | * @return The count of values written. | |
304 | * If more than destCapacity samples are available, then | |
305 | * only destCapacity are written, and destCapacity is returned as the count, | |
306 | * rather than setting a U_BUFFER_OVERFLOW_ERROR. | |
307 | * (The actual number of keyword values could be unlimited.) | |
308 | * @stable ICU 4.8 | |
309 | */ | |
310 | int32_t getSamples(const UnicodeString &keyword, | |
311 | double *dest, int32_t destCapacity, | |
312 | UErrorCode& status); | |
313 | ||
46f4442e A |
314 | /** |
315 | * Returns TRUE if the given keyword is defined in this | |
316 | * <code>PluralRules</code> object. | |
317 | * | |
318 | * @param keyword the input keyword. | |
319 | * @return TRUE if the input keyword is defined. | |
320 | * Otherwise, return FALSE. | |
729e4ab9 | 321 | * @stable ICU 4.0 |
46f4442e A |
322 | */ |
323 | UBool isKeyword(const UnicodeString& keyword) const; | |
324 | ||
325 | ||
326 | /** | |
327 | * Returns keyword for default plural form. | |
328 | * | |
329 | * @return keyword for default plural form. | |
729e4ab9 | 330 | * @stable ICU 4.0 |
46f4442e A |
331 | */ |
332 | UnicodeString getKeywordOther() const; | |
333 | ||
334 | /** | |
335 | * Compares the equality of two PluralRules objects. | |
336 | * | |
337 | * @param other The other PluralRules object to be compared with. | |
338 | * @return True if the given PluralRules is the same as this | |
339 | * PluralRules; false otherwise. | |
729e4ab9 | 340 | * @stable ICU 4.0 |
46f4442e A |
341 | */ |
342 | virtual UBool operator==(const PluralRules& other) const; | |
343 | ||
344 | /** | |
345 | * Compares the inequality of two PluralRules objects. | |
346 | * | |
347 | * @param other The PluralRules object to be compared with. | |
348 | * @return True if the given PluralRules is not the same as this | |
349 | * PluralRules; false otherwise. | |
729e4ab9 | 350 | * @stable ICU 4.0 |
46f4442e A |
351 | */ |
352 | UBool operator!=(const PluralRules& other) const {return !operator==(other);} | |
353 | ||
354 | ||
355 | /** | |
356 | * ICU "poor man's RTTI", returns a UClassID for this class. | |
357 | * | |
729e4ab9 | 358 | * @stable ICU 4.0 |
46f4442e A |
359 | * |
360 | */ | |
361 | static UClassID U_EXPORT2 getStaticClassID(void); | |
362 | ||
363 | /** | |
364 | * ICU "poor man's RTTI", returns a UClassID for the actual class. | |
365 | * | |
729e4ab9 | 366 | * @stable ICU 4.0 |
46f4442e A |
367 | */ |
368 | virtual UClassID getDynamicClassID() const; | |
369 | ||
370 | ||
371 | private: | |
4388f060 A |
372 | RuleChain *mRules; |
373 | RuleParser *mParser; | |
374 | double *mSamples; | |
375 | int32_t *mSampleInfo; | |
376 | int32_t mSampleInfoCount; | |
46f4442e A |
377 | |
378 | PluralRules(); // default constructor not implemented | |
379 | int32_t getRepeatLimit() const; | |
380 | void parseDescription(UnicodeString& ruleData, RuleChain& rules, UErrorCode &status); | |
381 | void getNextLocale(const UnicodeString& localeData, int32_t* curIndex, UnicodeString& localeName); | |
382 | void addRules(RuleChain& rules); | |
383 | int32_t getNumberValue(const UnicodeString& token) const; | |
51004dcb | 384 | UnicodeString getRuleFromResource(const Locale& locale, UPluralType type, UErrorCode& status); |
46f4442e | 385 | |
4388f060 A |
386 | static const int32_t MAX_SAMPLES = 3; |
387 | ||
388 | int32_t getSamplesInternal(const UnicodeString &keyword, double *dest, | |
389 | int32_t destCapacity, UBool includeUnlimited, | |
390 | UErrorCode& status); | |
391 | int32_t getKeywordIndex(const UnicodeString& keyword, | |
392 | UErrorCode& status) const; | |
393 | void initSamples(UErrorCode& status); | |
394 | ||
46f4442e A |
395 | }; |
396 | ||
397 | U_NAMESPACE_END | |
398 | ||
399 | #endif /* #if !UCONFIG_NO_FORMATTING */ | |
400 | ||
401 | #endif // _PLURRULE | |
402 | //eof |