]> git.saurik.com Git - apple/icu.git/blob - icuSources/i18n/nfsubs.cpp
ICU-8.11.4.tar.gz
[apple/icu.git] / icuSources / i18n / nfsubs.cpp
1 /*
2 ******************************************************************************
3 * Copyright (C) 1997-2005, International Business Machines
4 * Corporation and others. All Rights Reserved.
5 ******************************************************************************
6 * file name: nfsubs.cpp
7 * encoding: US-ASCII
8 * tab size: 8 (not used)
9 * indentation:4
10 *
11 * Modification history
12 * Date Name Comments
13 * 10/11/2001 Doug Ported from ICU4J
14 */
15
16 #include "nfsubs.h"
17 #include "digitlst.h"
18
19 #include <stdio.h>
20
21 #if U_HAVE_RBNF
22
23 static const UChar gLessThan = 0x003c;
24 static const UChar gEquals = 0x003d;
25 static const UChar gGreaterThan = 0x003e;
26 static const UChar gPercent = 0x0025;
27 static const UChar gPound = 0x0023;
28 static const UChar gZero = 0x0030;
29 static const UChar gSpace = 0x0020;
30
31 static const UChar gEqualsEquals[] =
32 {
33 0x3D, 0x3D, 0
34 }; /* "==" */
35 static const UChar gGreaterGreaterGreaterThan[] =
36 {
37 0x3E, 0x3E, 0x3E, 0
38 }; /* ">>>" */
39 static const UChar gGreaterGreaterThan[] =
40 {
41 0x3E, 0x3E, 0
42 }; /* ">>" */
43
44 NFSubstitution*
45 NFSubstitution::makeSubstitution(int32_t pos,
46 const NFRule* rule,
47 const NFRule* predecessor,
48 const NFRuleSet* ruleSet,
49 const RuleBasedNumberFormat* formatter,
50 const UnicodeString& description,
51 UErrorCode& status)
52 {
53 // if the description is empty, return a NullSubstitution
54 if (description.length() == 0) {
55 return new NullSubstitution(pos, ruleSet, formatter, description, status);
56 }
57
58 switch (description.charAt(0)) {
59 // if the description begins with '<'...
60 case gLessThan:
61 // throw an exception if the rule is a negative number
62 // rule
63 if (rule->getBaseValue() == NFRule::kNegativeNumberRule) {
64 // throw new IllegalArgumentException("<< not allowed in negative-number rule");
65 status = U_PARSE_ERROR;
66 return NULL;
67 }
68
69 // if the rule is a fraction rule, return an
70 // IntegralPartSubstitution
71 else if (rule->getBaseValue() == NFRule::kImproperFractionRule
72 || rule->getBaseValue() == NFRule::kProperFractionRule
73 || rule->getBaseValue() == NFRule::kMasterRule) {
74 return new IntegralPartSubstitution(pos, ruleSet, formatter, description, status);
75 }
76
77 // if the rule set containing the rule is a fraction
78 // rule set, return a NumeratorSubstitution
79 else if (ruleSet->isFractionRuleSet()) {
80 return new NumeratorSubstitution(pos, (double)rule->getBaseValue(),
81 formatter->getDefaultRuleSet(), formatter, description, status);
82 }
83
84 // otherwise, return a MultiplierSubstitution
85 else {
86 return new MultiplierSubstitution(pos, rule->getDivisor(), ruleSet,
87 formatter, description, status);
88 }
89
90 // if the description begins with '>'...
91 case gGreaterThan:
92 // if the rule is a negative-number rule, return
93 // an AbsoluteValueSubstitution
94 if (rule->getBaseValue() == NFRule::kNegativeNumberRule) {
95 return new AbsoluteValueSubstitution(pos, ruleSet, formatter, description, status);
96 }
97
98 // if the rule is a fraction rule, return a
99 // FractionalPartSubstitution
100 else if (rule->getBaseValue() == NFRule::kImproperFractionRule
101 || rule->getBaseValue() == NFRule::kProperFractionRule
102 || rule->getBaseValue() == NFRule::kMasterRule) {
103 return new FractionalPartSubstitution(pos, ruleSet, formatter, description, status);
104 }
105
106 // if the rule set owning the rule is a fraction rule set,
107 // throw an exception
108 else if (ruleSet->isFractionRuleSet()) {
109 // throw new IllegalArgumentException(">> not allowed in fraction rule set");
110 status = U_PARSE_ERROR;
111 return NULL;
112 }
113
114 // otherwise, return a ModulusSubstitution
115 else {
116 return new ModulusSubstitution(pos, rule->getDivisor(), predecessor,
117 ruleSet, formatter, description, status);
118 }
119
120 // if the description begins with '=', always return a
121 // SameValueSubstitution
122 case gEquals:
123 return new SameValueSubstitution(pos, ruleSet, formatter, description, status);
124
125 // and if it's anything else, throw an exception
126 default:
127 // throw new IllegalArgumentException("Illegal substitution character");
128 status = U_PARSE_ERROR;
129 }
130 return NULL;
131 }
132
133 NFSubstitution::NFSubstitution(int32_t _pos,
134 const NFRuleSet* _ruleSet,
135 const RuleBasedNumberFormat* formatter,
136 const UnicodeString& description,
137 UErrorCode& status)
138 : pos(_pos), ruleSet(NULL), numberFormat(NULL)
139 {
140 // the description should begin and end with the same character.
141 // If it doesn't that's a syntax error. Otherwise,
142 // makeSubstitution() was the only thing that needed to know
143 // about these characters, so strip them off
144 UnicodeString workingDescription(description);
145 if (description.length() >= 2
146 && description.charAt(0) == description.charAt(description.length() - 1))
147 {
148 workingDescription.remove(description.length() - 1, 1);
149 workingDescription.remove(0, 1);
150 }
151 else if (description.length() != 0) {
152 // throw new IllegalArgumentException("Illegal substitution syntax");
153 status = U_PARSE_ERROR;
154 return;
155 }
156
157 // if the description was just two paired token characters
158 // (i.e., "<<" or ">>"), it uses the rule set it belongs to to
159 // format its result
160 if (workingDescription.length() == 0) {
161 this->ruleSet = _ruleSet;
162 }
163 // if the description contains a rule set name, that's the rule
164 // set we use to format the result: get a reference to the
165 // names rule set
166 else if (workingDescription.charAt(0) == gPercent) {
167 this->ruleSet = formatter->findRuleSet(workingDescription, status);
168 }
169 // if the description begins with 0 or #, treat it as a
170 // DecimalFormat pattern, and initialize a DecimalFormat with
171 // that pattern (then set it to use the DecimalFormatSymbols
172 // belonging to our formatter)
173 else if (workingDescription.charAt(0) == gPound || workingDescription.charAt(0) ==gZero) {
174 DecimalFormatSymbols* sym = formatter->getDecimalFormatSymbols();
175 if (!sym) {
176 status = U_MISSING_RESOURCE_ERROR;
177 return;
178 }
179 this->numberFormat = new DecimalFormat(workingDescription, *sym, status);
180 /* test for NULL */
181 if (this->numberFormat == 0) {
182 status = U_MEMORY_ALLOCATION_ERROR;
183 return;
184 }
185 if (U_FAILURE(status)) {
186 delete (DecimalFormat*)this->numberFormat;
187 this->numberFormat = NULL;
188 return;
189 }
190 // this->numberFormat->setDecimalFormatSymbols(formatter->getDecimalFormatSymbols());
191 }
192 // if the description is ">>>", this substitution bypasses the
193 // usual rule-search process and always uses the rule that precedes
194 // it in its own rule set's rule list (this is used for place-value
195 // notations: formats where you want to see a particular part of
196 // a number even when it's 0)
197 else if (workingDescription.charAt(0) == gGreaterThan) {
198 // this causes problems when >>> is used in a frationalPartSubstitution
199 // this->ruleSet = NULL;
200 this->ruleSet = _ruleSet;
201 this->numberFormat = NULL;
202 }
203 // and of the description is none of these things, it's a syntax error
204 else {
205 // throw new IllegalArgumentException("Illegal substitution syntax");
206 status = U_PARSE_ERROR;
207 }
208 }
209
210 NFSubstitution::~NFSubstitution()
211 {
212 // cast away const
213 delete (NumberFormat*)numberFormat; numberFormat = NULL;
214 }
215
216 /**
217 * Set's the substitution's divisor. Used by NFRule.setBaseValue().
218 * A no-op for all substitutions except multiplier and modulus
219 * substitutions.
220 * @param radix The radix of the divisor
221 * @param exponent The exponent of the divisor
222 */
223 void
224 NFSubstitution::setDivisor(int32_t /*radix*/, int32_t /*exponent*/, UErrorCode& /*status*/) {
225 // a no-op for all substitutions except multiplier and modulus substitutions
226 }
227
228
229 //-----------------------------------------------------------------------
230 // boilerplate
231 //-----------------------------------------------------------------------
232
233 const char NFSubstitution::fgClassID = 0;
234
235 UClassID
236 NFSubstitution::getDynamicClassID() const {
237 return getStaticClassID();
238 }
239
240 /**
241 * Compares two substitutions for equality
242 * @param The substitution to compare this one to
243 * @return true if the two substitutions are functionally equivalent
244 */
245 UBool
246 NFSubstitution::operator==(const NFSubstitution& rhs) const
247 {
248 // compare class and all of the fields all substitutions have
249 // in common
250 // this should be called by subclasses before their own equality tests
251 return getDynamicClassID() == rhs.getDynamicClassID()
252 && pos == rhs.pos
253 && (ruleSet == NULL) == (rhs.ruleSet == NULL)
254 // && ruleSet == rhs.ruleSet causes circularity, other checks to make instead?
255 && (numberFormat == NULL
256 ? (rhs.numberFormat == NULL)
257 : (*numberFormat == *rhs.numberFormat));
258 }
259
260 /**
261 * Returns a textual description of the substitution
262 * @return A textual description of the substitution. This might
263 * not be identical to the description it was created from, but
264 * it'll produce the same result.
265 */
266 void
267 NFSubstitution::toString(UnicodeString& text) const
268 {
269 // use tokenChar() to get the character at the beginning and
270 // end of the substitutin token. In between them will go
271 // either the name of the rule set it uses, or the pattern of
272 // the DecimalFormat it uses
273 text.remove();
274 text.append(tokenChar());
275
276 UnicodeString temp;
277 if (ruleSet != NULL) {
278 ruleSet->getName(temp);
279 } else if (numberFormat != NULL) {
280 numberFormat->toPattern(temp);
281 }
282 text.append(temp);
283 text.append(tokenChar());
284 }
285
286 //-----------------------------------------------------------------------
287 // formatting
288 //-----------------------------------------------------------------------
289
290 /**
291 * Performs a mathematical operation on the number, formats it using
292 * either ruleSet or decimalFormat, and inserts the result into
293 * toInsertInto.
294 * @param number The number being formatted.
295 * @param toInsertInto The string we insert the result into
296 * @param pos The position in toInsertInto where the owning rule's
297 * rule text begins (this value is added to this substitution's
298 * position to determine exactly where to insert the new text)
299 */
300 void
301 NFSubstitution::doSubstitution(int64_t number, UnicodeString& toInsertInto, int32_t _pos) const
302 {
303 if (ruleSet != NULL) {
304 // perform a transformation on the number that is dependent
305 // on the type of substitution this is, then just call its
306 // rule set's format() method to format the result
307 ruleSet->format(transformNumber(number), toInsertInto, _pos + this->pos);
308 } else if (numberFormat != NULL) {
309 // or perform the transformation on the number (preserving
310 // the result's fractional part if the formatter it set
311 // to show it), then use that formatter's format() method
312 // to format the result
313 double numberToFormat = transformNumber((double)number);
314 if (numberFormat->getMaximumFractionDigits() == 0) {
315 numberToFormat = uprv_floor(numberToFormat);
316 }
317
318 UnicodeString temp;
319 numberFormat->format(numberToFormat, temp);
320 toInsertInto.insert(_pos + this->pos, temp);
321 }
322 }
323
324 /**
325 * Performs a mathematical operation on the number, formats it using
326 * either ruleSet or decimalFormat, and inserts the result into
327 * toInsertInto.
328 * @param number The number being formatted.
329 * @param toInsertInto The string we insert the result into
330 * @param pos The position in toInsertInto where the owning rule's
331 * rule text begins (this value is added to this substitution's
332 * position to determine exactly where to insert the new text)
333 */
334 void
335 NFSubstitution::doSubstitution(double number, UnicodeString& toInsertInto, int32_t _pos) const {
336 // perform a transformation on the number being formatted that
337 // is dependent on the type of substitution this is
338 double numberToFormat = transformNumber(number);
339
340 // if the result is an integer, from here on out we work in integer
341 // space (saving time and memory and preserving accuracy)
342 if (numberToFormat == uprv_floor(numberToFormat) && ruleSet != NULL) {
343 ruleSet->format(util64_fromDouble(numberToFormat), toInsertInto, _pos + this->pos);
344
345 // if the result isn't an integer, then call either our rule set's
346 // format() method or our DecimalFormat's format() method to
347 // format the result
348 } else {
349 if (ruleSet != NULL) {
350 ruleSet->format(numberToFormat, toInsertInto, _pos + this->pos);
351 } else if (numberFormat != NULL) {
352 UnicodeString temp;
353 numberFormat->format(numberToFormat, temp);
354 toInsertInto.insert(_pos + this->pos, temp);
355 }
356 }
357 }
358
359
360 //-----------------------------------------------------------------------
361 // parsing
362 //-----------------------------------------------------------------------
363
364 #ifdef RBNF_DEBUG
365 #include <stdio.h>
366 #endif
367
368 /**
369 * Parses a string using the rule set or DecimalFormat belonging
370 * to this substitution. If there's a match, a mathematical
371 * operation (the inverse of the one used in formatting) is
372 * performed on the result of the parse and the value passed in
373 * and returned as the result. The parse position is updated to
374 * point to the first unmatched character in the string.
375 * @param text The string to parse
376 * @param parsePosition On entry, ignored, but assumed to be 0.
377 * On exit, this is updated to point to the first unmatched
378 * character (or 0 if the substitution didn't match)
379 * @param baseValue A partial parse result that should be
380 * combined with the result of this parse
381 * @param upperBound When searching the rule set for a rule
382 * matching the string passed in, only rules with base values
383 * lower than this are considered
384 * @param lenientParse If true and matching against rules fails,
385 * the substitution will also try matching the text against
386 * numerals using a default-costructed NumberFormat. If false,
387 * no extra work is done. (This value is false whenever the
388 * formatter isn't in lenient-parse mode, but is also false
389 * under some conditions even when the formatter _is_ in
390 * lenient-parse mode.)
391 * @return If there's a match, this is the result of composing
392 * baseValue with whatever was returned from matching the
393 * characters. This will be either a Long or a Double. If there's
394 * no match this is new Long(0) (not null), and parsePosition
395 * is left unchanged.
396 */
397 UBool
398 NFSubstitution::doParse(const UnicodeString& text,
399 ParsePosition& parsePosition,
400 double baseValue,
401 double upperBound,
402 UBool lenientParse,
403 Formattable& result) const
404 {
405 #ifdef RBNF_DEBUG
406 fprintf(stderr, "<nfsubs> %x bv: %g ub: %g\n", this, baseValue, upperBound);
407 #endif
408 // figure out the highest base value a rule can have and match
409 // the text being parsed (this varies according to the type of
410 // substitutions: multiplier, modulus, and numerator substitutions
411 // restrict the search to rules with base values lower than their
412 // own; same-value substitutions leave the upper bound wherever
413 // it was, and the others allow any rule to match
414 upperBound = calcUpperBound(upperBound);
415
416 // use our rule set to parse the text. If that fails and
417 // lenient parsing is enabled (this is always false if the
418 // formatter's lenient-parsing mode is off, but it may also
419 // be false even when the formatter's lenient-parse mode is
420 // on), then also try parsing the text using a default-
421 // constructed NumberFormat
422 if (ruleSet != NULL) {
423 ruleSet->parse(text, parsePosition, upperBound, result);
424 if (lenientParse && !ruleSet->isFractionRuleSet() && parsePosition.getIndex() == 0) {
425 UErrorCode status = U_ZERO_ERROR;
426 NumberFormat* fmt = NumberFormat::createInstance(status);
427 if (U_SUCCESS(status)) {
428 fmt->parse(text, result, parsePosition);
429 }
430 delete fmt;
431 }
432
433 // ...or use our DecimalFormat to parse the text
434 } else if (numberFormat != NULL) {
435 numberFormat->parse(text, result, parsePosition);
436 }
437
438 // if the parse was successful, we've already advanced the caller's
439 // parse position (this is the one function that doesn't have one
440 // of its own). Derive a parse result and return it as a Long,
441 // if possible, or a Double
442 if (parsePosition.getIndex() != 0) {
443 UErrorCode status = U_ZERO_ERROR;
444 double tempResult = result.getDouble(status);
445
446 // composeRuleValue() produces a full parse result from
447 // the partial parse result passed to this function from
448 // the caller (this is either the owning rule's base value
449 // or the partial result obtained from composing the
450 // owning rule's base value with its other substitution's
451 // parse result) and the partial parse result obtained by
452 // matching the substitution (which will be the same value
453 // the caller would get by parsing just this part of the
454 // text with RuleBasedNumberFormat.parse() ). How the two
455 // values are used to derive the full parse result depends
456 // on the types of substitutions: For a regular rule, the
457 // ultimate result is its multiplier substitution's result
458 // times the rule's divisor (or the rule's base value) plus
459 // the modulus substitution's result (which will actually
460 // supersede part of the rule's base value). For a negative-
461 // number rule, the result is the negative of its substitution's
462 // result. For a fraction rule, it's the sum of its two
463 // substitution results. For a rule in a fraction rule set,
464 // it's the numerator substitution's result divided by
465 // the rule's base value. Results from same-value substitutions
466 // propagate back upard, and null substitutions don't affect
467 // the result.
468 tempResult = composeRuleValue(tempResult, baseValue);
469 result.setDouble(tempResult);
470 return TRUE;
471 // if the parse was UNsuccessful, return 0
472 } else {
473 result.setLong(0);
474 return FALSE;
475 }
476 }
477
478 UBool
479 NFSubstitution::isNullSubstitution() const {
480 return FALSE;
481 }
482
483 /**
484 * Returns true if this is a modulus substitution. (We didn't do this
485 * with instanceof partially because it causes source files to
486 * proliferate and partially because we have to port this to C++.)
487 * @return true if this object is an instance of ModulusSubstitution
488 */
489 UBool
490 NFSubstitution::isModulusSubstitution() const {
491 return FALSE;
492 }
493
494 //===================================================================
495 // SameValueSubstitution
496 //===================================================================
497
498 /**
499 * A substitution that passes the value passed to it through unchanged.
500 * Represented by == in rule descriptions.
501 */
502 SameValueSubstitution::SameValueSubstitution(int32_t _pos,
503 const NFRuleSet* _ruleSet,
504 const RuleBasedNumberFormat* formatter,
505 const UnicodeString& description,
506 UErrorCode& status)
507 : NFSubstitution(_pos, _ruleSet, formatter, description, status)
508 {
509 if (description == gEqualsEquals) {
510 // throw new IllegalArgumentException("== is not a legal token");
511 status = U_PARSE_ERROR;
512 }
513 }
514
515 const char SameValueSubstitution::fgClassID = 0;
516
517 UClassID
518 SameValueSubstitution::getDynamicClassID() const {
519 return getStaticClassID();
520 }
521
522
523 //===================================================================
524 // MultiplierSubstitution
525 //===================================================================
526
527 const char MultiplierSubstitution::fgClassID = 0;
528
529 UClassID
530 MultiplierSubstitution::getDynamicClassID() const {
531 return getStaticClassID();
532 }
533
534 UBool MultiplierSubstitution::operator==(const NFSubstitution& rhs) const
535 {
536 return NFSubstitution::operator==(rhs) &&
537 divisor == ((const MultiplierSubstitution*)&rhs)->divisor;
538 }
539
540
541 //===================================================================
542 // ModulusSubstitution
543 //===================================================================
544
545 /**
546 * A substitution that divides the number being formatted by the its rule's
547 * divisor and formats the remainder. Represented by "&gt;&gt;" in a
548 * regular rule.
549 */
550 ModulusSubstitution::ModulusSubstitution(int32_t _pos,
551 double _divisor,
552 const NFRule* predecessor,
553 const NFRuleSet* _ruleSet,
554 const RuleBasedNumberFormat* formatter,
555 const UnicodeString& description,
556 UErrorCode& status)
557 : NFSubstitution(_pos, _ruleSet, formatter, description, status)
558 , divisor(_divisor)
559 , ruleToUse(NULL)
560 {
561 ldivisor = util64_fromDouble(_divisor);
562
563 // the owning rule's divisor controls the behavior of this
564 // substitution: rather than keeping a backpointer to the rule,
565 // we keep a copy of the divisor
566
567 if (ldivisor == 0) {
568 status = U_PARSE_ERROR;
569 }
570
571 if (description == gGreaterGreaterGreaterThan) {
572 // the >>> token doesn't alter how this substituion calculates the
573 // values it uses for formatting and parsing, but it changes
574 // what's done with that value after it's obtained: >>> short-
575 // circuits the rule-search process and goes straight to the
576 // specified rule to format the substitution value
577 ruleToUse = predecessor;
578 }
579 }
580
581 const char ModulusSubstitution::fgClassID = 0;
582
583 UClassID
584 ModulusSubstitution::getDynamicClassID() const {
585 return getStaticClassID();
586 }
587
588 UBool ModulusSubstitution::operator==(const NFSubstitution& rhs) const
589 {
590 return NFSubstitution::operator==(rhs) &&
591 divisor == ((const ModulusSubstitution*)&rhs)->divisor &&
592 ruleToUse == ((const ModulusSubstitution*)&rhs)->ruleToUse;
593 }
594
595 //-----------------------------------------------------------------------
596 // formatting
597 //-----------------------------------------------------------------------
598
599
600 /**
601 * If this is a &gt;&gt;&gt; substitution, use ruleToUse to fill in
602 * the substitution. Otherwise, just use the superclass function.
603 * @param number The number being formatted
604 * @toInsertInto The string to insert the result of this substitution
605 * into
606 * @param pos The position of the rule text in toInsertInto
607 */
608 void
609 ModulusSubstitution::doSubstitution(int64_t number, UnicodeString& toInsertInto, int32_t _pos) const
610 {
611 // if this isn't a >>> substitution, just use the inherited version
612 // of this function (which uses either a rule set or a DecimalFormat
613 // to format its substitution value)
614 if (ruleToUse == NULL) {
615 NFSubstitution::doSubstitution(number, toInsertInto, _pos);
616
617 // a >>> substitution goes straight to a particular rule to
618 // format the substitution value
619 } else {
620 int64_t numberToFormat = transformNumber(number);
621 ruleToUse->doFormat(numberToFormat, toInsertInto, _pos + getPos());
622 }
623 }
624
625 /**
626 * If this is a &gt;&gt;&gt; substitution, use ruleToUse to fill in
627 * the substitution. Otherwise, just use the superclass function.
628 * @param number The number being formatted
629 * @toInsertInto The string to insert the result of this substitution
630 * into
631 * @param pos The position of the rule text in toInsertInto
632 */
633 void
634 ModulusSubstitution::doSubstitution(double number, UnicodeString& toInsertInto, int32_t _pos) const
635 {
636 // if this isn't a >>> substitution, just use the inherited version
637 // of this function (which uses either a rule set or a DecimalFormat
638 // to format its substitution value)
639 if (ruleToUse == NULL) {
640 NFSubstitution::doSubstitution(number, toInsertInto, _pos);
641
642 // a >>> substitution goes straight to a particular rule to
643 // format the substitution value
644 } else {
645 double numberToFormat = transformNumber(number);
646
647 ruleToUse->doFormat(numberToFormat, toInsertInto, _pos + getPos());
648 }
649 }
650
651 //-----------------------------------------------------------------------
652 // parsing
653 //-----------------------------------------------------------------------
654
655 /**
656 * If this is a &gt;&gt;&gt; substitution, match only against ruleToUse.
657 * Otherwise, use the superclass function.
658 * @param text The string to parse
659 * @param parsePosition Ignored on entry, updated on exit to point to
660 * the first unmatched character.
661 * @param baseValue The partial parse result prior to calling this
662 * routine.
663 */
664 UBool
665 ModulusSubstitution::doParse(const UnicodeString& text,
666 ParsePosition& parsePosition,
667 double baseValue,
668 double upperBound,
669 UBool lenientParse,
670 Formattable& result) const
671 {
672 // if this isn't a >>> substitution, we can just use the
673 // inherited parse() routine to do the parsing
674 if (ruleToUse == NULL) {
675 return NFSubstitution::doParse(text, parsePosition, baseValue, upperBound, lenientParse, result);
676
677 // but if it IS a >>> substitution, we have to do it here: we
678 // use the specific rule's doParse() method, and then we have to
679 // do some of the other work of NFRuleSet.parse()
680 } else {
681 ruleToUse->doParse(text, parsePosition, FALSE, upperBound, result);
682
683 if (parsePosition.getIndex() != 0) {
684 UErrorCode status = U_ZERO_ERROR;
685 double tempResult = result.getDouble(status);
686 tempResult = composeRuleValue(tempResult, baseValue);
687 result.setDouble(tempResult);
688 }
689
690 return TRUE;
691 }
692 }
693
694
695 //===================================================================
696 // IntegralPartSubstitution
697 //===================================================================
698
699 const char IntegralPartSubstitution::fgClassID = 0;
700
701 UClassID
702 IntegralPartSubstitution::getDynamicClassID() const {
703 return getStaticClassID();
704 }
705
706
707 //===================================================================
708 // FractionalPartSubstitution
709 //===================================================================
710
711
712 /**
713 * Constructs a FractionalPartSubstitution. This object keeps a flag
714 * telling whether it should format by digits or not. In addition,
715 * it marks the rule set it calls (if any) as a fraction rule set.
716 */
717 FractionalPartSubstitution::FractionalPartSubstitution(int32_t _pos,
718 const NFRuleSet* _ruleSet,
719 const RuleBasedNumberFormat* formatter,
720 const UnicodeString& description,
721 UErrorCode& status)
722 : NFSubstitution(_pos, _ruleSet, formatter, description, status)
723 , byDigits(FALSE)
724 , useSpaces(TRUE)
725
726 {
727 // akk, ruleSet can change in superclass constructor
728 if (description == gGreaterGreaterThan ||
729 description == gGreaterGreaterGreaterThan ||
730 _ruleSet == getRuleSet()) {
731 byDigits = TRUE;
732 if (description == gGreaterGreaterGreaterThan) {
733 useSpaces = FALSE;
734 }
735 } else {
736 // cast away const
737 ((NFRuleSet*)getRuleSet())->makeIntoFractionRuleSet();
738 }
739 }
740
741 //-----------------------------------------------------------------------
742 // formatting
743 //-----------------------------------------------------------------------
744
745 /**
746 * If in "by digits" mode, fills in the substitution one decimal digit
747 * at a time using the rule set containing this substitution.
748 * Otherwise, uses the superclass function.
749 * @param number The number being formatted
750 * @param toInsertInto The string to insert the result of formatting
751 * the substitution into
752 * @param pos The position of the owning rule's rule text in
753 * toInsertInto
754 */
755 void
756 FractionalPartSubstitution::doSubstitution(double number, UnicodeString& toInsertInto, int32_t _pos) const
757 {
758 // if we're not in "byDigits" mode, just use the inherited
759 // doSubstitution() routine
760 if (!byDigits) {
761 NFSubstitution::doSubstitution(number, toInsertInto, _pos);
762
763 // if we're in "byDigits" mode, transform the value into an integer
764 // by moving the decimal point eight places to the right and
765 // pulling digits off the right one at a time, formatting each digit
766 // as an integer using this substitution's owning rule set
767 // (this is slower, but more accurate, than doing it from the
768 // other end)
769 } else {
770 // int32_t numberToFormat = (int32_t)uprv_round(transformNumber(number) * uprv_pow(10, kMaxDecimalDigits));
771 // // this flag keeps us from formatting trailing zeros. It starts
772 // // out false because we're pulling from the right, and switches
773 // // to true the first time we encounter a non-zero digit
774 // UBool doZeros = FALSE;
775 // for (int32_t i = 0; i < kMaxDecimalDigits; i++) {
776 // int64_t digit = numberToFormat % 10;
777 // if (digit != 0 || doZeros) {
778 // if (doZeros && useSpaces) {
779 // toInsertInto.insert(_pos + getPos(), gSpace);
780 // }
781 // doZeros = TRUE;
782 // getRuleSet()->format(digit, toInsertInto, _pos + getPos());
783 // }
784 // numberToFormat /= 10;
785 // }
786
787 DigitList dl;
788 dl.set(number, 20, TRUE);
789
790 UBool pad = FALSE;
791 while (dl.fCount > (dl.fDecimalAt <= 0 ? 0 : dl.fDecimalAt)) {
792 if (pad && useSpaces) {
793 toInsertInto.insert(_pos + getPos(), gSpace);
794 } else {
795 pad = TRUE;
796 }
797 getRuleSet()->format((int64_t)(dl.fDigits[--dl.fCount] - '0'), toInsertInto, _pos + getPos());
798 }
799 while (dl.fDecimalAt < 0) {
800 if (pad && useSpaces) {
801 toInsertInto.insert(_pos + getPos(), gSpace);
802 } else {
803 pad = TRUE;
804 }
805 getRuleSet()->format((int64_t)0, toInsertInto, _pos + getPos());
806 ++dl.fDecimalAt;
807 }
808
809 if (!pad) {
810 // hack around lack of precision in digitlist. if we would end up with
811 // "foo point" make sure we add a " zero" to the end.
812 getRuleSet()->format((int64_t)0, toInsertInto, _pos + getPos());
813 }
814 }
815 }
816
817 //-----------------------------------------------------------------------
818 // parsing
819 //-----------------------------------------------------------------------
820
821 /**
822 * If in "by digits" mode, parses the string as if it were a string
823 * of individual digits; otherwise, uses the superclass function.
824 * @param text The string to parse
825 * @param parsePosition Ignored on entry, but updated on exit to point
826 * to the first unmatched character
827 * @param baseValue The partial parse result prior to entering this
828 * function
829 * @param upperBound Only consider rules with base values lower than
830 * this when filling in the substitution
831 * @param lenientParse If true, try matching the text as numerals if
832 * matching as words doesn't work
833 * @return If the match was successful, the current partial parse
834 * result; otherwise new Long(0). The result is either a Long or
835 * a Double.
836 */
837
838 UBool
839 FractionalPartSubstitution::doParse(const UnicodeString& text,
840 ParsePosition& parsePosition,
841 double baseValue,
842 double /*upperBound*/,
843 UBool lenientParse,
844 Formattable& resVal) const
845 {
846 // if we're not in byDigits mode, we can just use the inherited
847 // doParse()
848 if (!byDigits) {
849 return NFSubstitution::doParse(text, parsePosition, baseValue, 0, lenientParse, resVal);
850
851 // if we ARE in byDigits mode, parse the text one digit at a time
852 // using this substitution's owning rule set (we do this by setting
853 // upperBound to 10 when calling doParse() ) until we reach
854 // nonmatching text
855 } else {
856 UnicodeString workText(text);
857 ParsePosition workPos(1);
858 double result = 0;
859 int32_t digit;
860 // double p10 = 0.1;
861
862 DigitList dl;
863 NumberFormat* fmt = NULL;
864 while (workText.length() > 0 && workPos.getIndex() != 0) {
865 workPos.setIndex(0);
866 Formattable temp;
867 getRuleSet()->parse(workText, workPos, 10, temp);
868 UErrorCode status = U_ZERO_ERROR;
869 digit = temp.getLong(status);
870 // digit = temp.getType() == Formattable::kLong ?
871 // temp.getLong() :
872 // (int32_t)temp.getDouble();
873
874 if (lenientParse && workPos.getIndex() == 0) {
875 if (!fmt) {
876 status = U_ZERO_ERROR;
877 fmt = NumberFormat::createInstance(status);
878 if (U_FAILURE(status)) {
879 delete fmt;
880 fmt = NULL;
881 }
882 }
883 if (fmt) {
884 fmt->parse(workText, temp, workPos);
885 digit = temp.getLong(status);
886 }
887 }
888
889 if (workPos.getIndex() != 0) {
890 dl.append((char)('0' + digit));
891 // result += digit * p10;
892 // p10 /= 10;
893 parsePosition.setIndex(parsePosition.getIndex() + workPos.getIndex());
894 workText.removeBetween(0, workPos.getIndex());
895 while (workText.length() > 0 && workText.charAt(0) == gSpace) {
896 workText.removeBetween(0, 1);
897 parsePosition.setIndex(parsePosition.getIndex() + 1);
898 }
899 }
900 }
901 delete fmt;
902
903 result = dl.fCount == 0 ? 0 : dl.getDouble();
904 result = composeRuleValue(result, baseValue);
905 resVal.setDouble(result);
906 return TRUE;
907 }
908 }
909
910 UBool
911 FractionalPartSubstitution::operator==(const NFSubstitution& rhs) const
912 {
913 return NFSubstitution::operator==(rhs) &&
914 ((const FractionalPartSubstitution*)&rhs)->byDigits == byDigits;
915 }
916
917 const char FractionalPartSubstitution::fgClassID = 0;
918
919 UClassID
920 FractionalPartSubstitution::getDynamicClassID() const {
921 return getStaticClassID();
922 }
923
924
925 //===================================================================
926 // AbsoluteValueSubstitution
927 //===================================================================
928
929 const char AbsoluteValueSubstitution::fgClassID = 0;
930
931 UClassID
932 AbsoluteValueSubstitution::getDynamicClassID() const {
933 return getStaticClassID();
934 }
935
936 //===================================================================
937 // NumeratorSubstitution
938 //===================================================================
939
940 void
941 NumeratorSubstitution::doSubstitution(double number, UnicodeString& toInsertInto, int32_t apos) const {
942 // perform a transformation on the number being formatted that
943 // is dependent on the type of substitution this is
944
945 double numberToFormat = transformNumber(number);
946 int64_t longNF = util64_fromDouble(numberToFormat);
947
948 const NFRuleSet* aruleSet = getRuleSet();
949 if (withZeros && aruleSet != NULL) {
950 // if there are leading zeros in the decimal expansion then emit them
951 int64_t nf =longNF;
952 int32_t len = toInsertInto.length();
953 while ((nf *= 10) < denominator) {
954 toInsertInto.insert(apos + getPos(), gSpace);
955 aruleSet->format((int64_t)0, toInsertInto, apos + getPos());
956 }
957 apos += toInsertInto.length() - len;
958 }
959
960 // if the result is an integer, from here on out we work in integer
961 // space (saving time and memory and preserving accuracy)
962 if (numberToFormat == longNF && aruleSet != NULL) {
963 aruleSet->format(longNF, toInsertInto, apos + getPos());
964
965 // if the result isn't an integer, then call either our rule set's
966 // format() method or our DecimalFormat's format() method to
967 // format the result
968 } else {
969 if (aruleSet != NULL) {
970 aruleSet->format(numberToFormat, toInsertInto, apos + getPos());
971 } else {
972 UErrorCode status = U_ZERO_ERROR;
973 UnicodeString temp;
974 getNumberFormat()->format(numberToFormat, temp, status);
975 toInsertInto.insert(apos + getPos(), temp);
976 }
977 }
978 }
979
980 UBool
981 NumeratorSubstitution::doParse(const UnicodeString& text,
982 ParsePosition& parsePosition,
983 double baseValue,
984 double upperBound,
985 UBool /*lenientParse*/,
986 Formattable& result) const
987 {
988 // we don't have to do anything special to do the parsing here,
989 // but we have to turn lenient parsing off-- if we leave it on,
990 // it SERIOUSLY messes up the algorithm
991
992 // if withZeros is true, we need to count the zeros
993 // and use that to adjust the parse result
994 UErrorCode status = U_ZERO_ERROR;
995 int32_t zeroCount = 0;
996 UnicodeString workText(text);
997
998 if (withZeros) {
999 ParsePosition workPos(1);
1000 Formattable temp;
1001
1002 while (workText.length() > 0 && workPos.getIndex() != 0) {
1003 workPos.setIndex(0);
1004 getRuleSet()->parse(workText, workPos, 1, temp); // parse zero or nothing at all
1005 if (workPos.getIndex() == 0) {
1006 // we failed, either there were no more zeros, or the number was formatted with digits
1007 // either way, we're done
1008 break;
1009 }
1010
1011 ++zeroCount;
1012 parsePosition.setIndex(parsePosition.getIndex() + workPos.getIndex());
1013 workText.remove(0, workPos.getIndex());
1014 while (workText.length() > 0 && workText.charAt(0) == gSpace) {
1015 workText.remove(0, 1);
1016 parsePosition.setIndex(parsePosition.getIndex() + 1);
1017 }
1018 }
1019
1020 workText = text;
1021 workText.remove(0, (int32_t)parsePosition.getIndex());
1022 parsePosition.setIndex(0);
1023 }
1024
1025 // we've parsed off the zeros, now let's parse the rest from our current position
1026 NFSubstitution::doParse(workText, parsePosition, withZeros ? 1 : baseValue, upperBound, FALSE, result);
1027
1028 if (withZeros) {
1029 // any base value will do in this case. is there a way to
1030 // force this to not bother trying all the base values?
1031
1032 // compute the 'effective' base and prescale the value down
1033 int64_t n = result.getLong(status); // force conversion!
1034 int64_t d = 1;
1035 int32_t pow = 0;
1036 while (d <= n) {
1037 d *= 10;
1038 ++pow;
1039 }
1040 // now add the zeros
1041 while (zeroCount > 0) {
1042 d *= 10;
1043 --zeroCount;
1044 }
1045 // d is now our true denominator
1046 result.setDouble((double)n/(double)d);
1047 }
1048
1049 return TRUE;
1050 }
1051
1052 UBool
1053 NumeratorSubstitution::operator==(const NFSubstitution& rhs) const
1054 {
1055 return NFSubstitution::operator==(rhs) &&
1056 denominator == ((const NumeratorSubstitution*)&rhs)->denominator;
1057 }
1058
1059 const char NumeratorSubstitution::fgClassID = 0;
1060
1061 UClassID
1062 NumeratorSubstitution::getDynamicClassID() const {
1063 return getStaticClassID();
1064 }
1065
1066 const UChar NumeratorSubstitution::LTLT[] = { 0x003c, 0x003c };
1067
1068 //===================================================================
1069 // NullSubstitution
1070 //===================================================================
1071
1072 const char NullSubstitution::fgClassID = 0;
1073
1074 UClassID
1075 NullSubstitution::getDynamicClassID() const {
1076 return getStaticClassID();
1077 }
1078
1079 /* U_HAVE_RBNF */
1080 #endif
1081