icuSources/i18n/msgfmt.cpp

   1 // © 2016 and later: Unicode, Inc. and others.
   2 // License & terms of use: http://www.unicode.org/copyright.html
   3 /********************************************************************
   4  * COPYRIGHT:
   5  * Copyright (c) 1997-2015, International Business Machines Corporation and
   6  * others. All Rights Reserved.
   7  ********************************************************************
   8  *
   9  * File MSGFMT.CPP
  10  *
  11  * Modification History:
  12  *
  13  *   Date        Name        Description
  14  *   02/19/97    aliu        Converted from java.
  15  *   03/20/97    helena      Finished first cut of implementation.
  16  *   04/10/97    aliu        Made to work on AIX.  Added stoi to replace wtoi.
  17  *   06/11/97    helena      Fixed addPattern to take the pattern correctly.
  18  *   06/17/97    helena      Fixed the getPattern to return the correct pattern.
  19  *   07/09/97    helena      Made ParsePosition into a class.
  20  *   02/22/99    stephen     Removed character literals for EBCDIC safety
  21  *   11/01/09    kirtig      Added SelectFormat
  22  ********************************************************************/
  23
  24 #include "unicode/utypes.h"
  25
  26 #if !UCONFIG_NO_FORMATTING
  27
  28 #include "unicode/appendable.h"
  29 #include "unicode/choicfmt.h"
  30 #include "unicode/datefmt.h"
  31 #include "unicode/decimfmt.h"
  32 #include "unicode/localpointer.h"
  33 #include "unicode/msgfmt.h"
  34 #include "unicode/numberformatter.h"
  35 #include "unicode/plurfmt.h"
  36 #include "unicode/rbnf.h"
  37 #include "unicode/selfmt.h"
  38 #include "unicode/smpdtfmt.h"
  39 #include "unicode/umsg.h"
  40 #include "unicode/ustring.h"
  41 #include "cmemory.h"
  42 #include "patternprops.h"
  43 #include "messageimpl.h"
  44 #include "msgfmt_impl.h"
  45 #include "plurrule_impl.h"
  46 #include "uassert.h"
  47 #include "uelement.h"
  48 #include "uhash.h"
  49 #include "ustrfmt.h"
  50 #include "util.h"
  51 #include "uvector.h"
  52 #include "number_decimalquantity.h"
  53
  54 // *****************************************************************************
  55 // class MessageFormat
  56 // *****************************************************************************
  57
  58 #define SINGLE_QUOTE      ((UChar)0x0027)
  59 #define COMMA             ((UChar)0x002C)
  60 #define LEFT_CURLY_BRACE  ((UChar)0x007B)
  61 #define RIGHT_CURLY_BRACE ((UChar)0x007D)
  62
  63 //---------------------------------------
  64 // static data
  65
  66 static const UChar ID_NUMBER[]    = {
  67     0x6E, 0x75, 0x6D, 0x62, 0x65, 0x72, 0  /* "number" */
  68 };
  69 static const UChar ID_DATE[]      = {
  70     0x64, 0x61, 0x74, 0x65, 0              /* "date" */
  71 };
  72 static const UChar ID_TIME[]      = {
  73     0x74, 0x69, 0x6D, 0x65, 0              /* "time" */
  74 };
  75 static const UChar ID_SPELLOUT[]  = {
  76     0x73, 0x70, 0x65, 0x6c, 0x6c, 0x6f, 0x75, 0x74, 0 /* "spellout" */
  77 };
  78 static const UChar ID_ORDINAL[]   = {
  79     0x6f, 0x72, 0x64, 0x69, 0x6e, 0x61, 0x6c, 0 /* "ordinal" */
  80 };
  81 static const UChar ID_DURATION[]  = {
  82     0x64, 0x75, 0x72, 0x61, 0x74, 0x69, 0x6f, 0x6e, 0 /* "duration" */
  83 };
  84
  85 // MessageFormat Type List  Number, Date, Time or Choice
  86 static const UChar * const TYPE_IDS[] = {
  87     ID_NUMBER,
  88     ID_DATE,
  89     ID_TIME,
  90     ID_SPELLOUT,
  91     ID_ORDINAL,
  92     ID_DURATION,
  93     NULL,
  94 };
  95
  96 static const UChar ID_EMPTY[]     = {
  97     0 /* empty string, used for default so that null can mark end of list */
  98 };
  99 static const UChar ID_CURRENCY[]  = {
 100     0x63, 0x75, 0x72, 0x72, 0x65, 0x6E, 0x63, 0x79, 0  /* "currency" */
 101 };
 102 static const UChar ID_PERCENT[]   = {
 103     0x70, 0x65, 0x72, 0x63, 0x65, 0x6E, 0x74, 0        /* "percent" */
 104 };
 105 static const UChar ID_INTEGER[]   = {
 106     0x69, 0x6E, 0x74, 0x65, 0x67, 0x65, 0x72, 0        /* "integer" */
 107 };
 108
 109 // NumberFormat modifier list, default, currency, percent or integer
 110 static const UChar * const NUMBER_STYLE_IDS[] = {
 111     ID_EMPTY,
 112     ID_CURRENCY,
 113     ID_PERCENT,
 114     ID_INTEGER,
 115     NULL,
 116 };
 117
 118 static const UChar ID_SHORT[]     = {
 119     0x73, 0x68, 0x6F, 0x72, 0x74, 0        /* "short" */
 120 };
 121 static const UChar ID_MEDIUM[]    = {
 122     0x6D, 0x65, 0x64, 0x69, 0x75, 0x6D, 0  /* "medium" */
 123 };
 124 static const UChar ID_LONG[]      = {
 125     0x6C, 0x6F, 0x6E, 0x67, 0              /* "long" */
 126 };
 127 static const UChar ID_FULL[]      = {
 128     0x66, 0x75, 0x6C, 0x6C, 0              /* "full" */
 129 };
 130
 131 // DateFormat modifier list, default, short, medium, long or full
 132 static const UChar * const DATE_STYLE_IDS[] = {
 133     ID_EMPTY,
 134     ID_SHORT,
 135     ID_MEDIUM,
 136     ID_LONG,
 137     ID_FULL,
 138     NULL,
 139 };
 140
 141 static const icu::DateFormat::EStyle DATE_STYLES[] = {
 142     icu::DateFormat::kDefault,
 143     icu::DateFormat::kShort,
 144     icu::DateFormat::kMedium,
 145     icu::DateFormat::kLong,
 146     icu::DateFormat::kFull,
 147 };
 148
 149 static const int32_t DEFAULT_INITIAL_CAPACITY = 10;
 150
 151 static const UChar NULL_STRING[] = {
 152     0x6E, 0x75, 0x6C, 0x6C, 0  // "null"
 153 };
 154
 155 static const UChar OTHER_STRING[] = {
 156     0x6F, 0x74, 0x68, 0x65, 0x72, 0  // "other"
 157 };
 158
 159 U_CDECL_BEGIN
 160 static UBool U_CALLCONV equalFormatsForHash(const UHashTok key1,
 161                                             const UHashTok key2) {
 162     return icu::MessageFormat::equalFormats(key1.pointer, key2.pointer);
 163 }
 164
 165 U_CDECL_END
 166
 167 U_NAMESPACE_BEGIN
 168
 169 // -------------------------------------
 170 UOBJECT_DEFINE_RTTI_IMPLEMENTATION(MessageFormat)
 171 UOBJECT_DEFINE_RTTI_IMPLEMENTATION(FormatNameEnumeration)
 172
 173 //--------------------------------------------------------------------
 174
 175 /**
 176  * Convert an integer value to a string and append the result to
 177  * the given UnicodeString.
 178  */
 179 static UnicodeString& itos(int32_t i, UnicodeString& appendTo) {
 180     UChar temp[16];
 181     uprv_itou(temp,16,i,10,0); // 10 == radix
 182     appendTo.append(temp, -1);
 183     return appendTo;
 184 }
 185
 186
 187 // AppendableWrapper: encapsulates the result of formatting, keeping track
 188 // of the string and its length.
 189 class AppendableWrapper : public UMemory {
 190 public:
 191     AppendableWrapper(Appendable& appendable) : app(appendable), len(0) {
 192     }
 193     void append(const UnicodeString& s) {
 194         app.appendString(s.getBuffer(), s.length());
 195         len += s.length();
 196     }
 197     void append(const UChar* s, const int32_t sLength) {
 198         app.appendString(s, sLength);
 199         len += sLength;
 200     }
 201     void append(const UnicodeString& s, int32_t start, int32_t length) {
 202         append(s.tempSubString(start, length));
 203     }
 204     void formatAndAppend(const Format* formatter, const Formattable& arg, UErrorCode& ec) {
 205         UnicodeString s;
 206         formatter->format(arg, s, ec);
 207         if (U_SUCCESS(ec)) {
 208             append(s);
 209         }
 210     }
 211     void formatAndAppend(const Format* formatter, const Formattable& arg,
 212                          const UnicodeString &argString, UErrorCode& ec) {
 213         if (!argString.isEmpty()) {
 214             if (U_SUCCESS(ec)) {
 215                 append(argString);
 216             }
 217         } else {
 218             formatAndAppend(formatter, arg, ec);
 219         }
 220     }
 221     int32_t length() {
 222         return len;
 223     }
 224 private:
 225     Appendable& app;
 226     int32_t len;
 227 };
 228
 229
 230 // -------------------------------------
 231 // Creates a MessageFormat instance based on the pattern.
 232
 233 MessageFormat::MessageFormat(const UnicodeString& pattern,
 234                              UErrorCode& success)
 235 : fLocale(Locale::getDefault()),  // Uses the default locale
 236   msgPattern(success),
 237   formatAliases(NULL),
 238   formatAliasesCapacity(0),
 239   argTypes(NULL),
 240   argTypeCount(0),
 241   argTypeCapacity(0),
 242   hasArgTypeConflicts(FALSE),
 243   defaultNumberFormat(NULL),
 244   defaultDateFormat(NULL),
 245   cachedFormatters(NULL),
 246   customFormatArgStarts(NULL),
 247   pluralProvider(*this, UPLURAL_TYPE_CARDINAL),
 248   ordinalProvider(*this, UPLURAL_TYPE_ORDINAL)
 249 {
 250     setLocaleIDs(fLocale.getName(), fLocale.getName());
 251     applyPattern(pattern, success);
 252 }
 253
 254 MessageFormat::MessageFormat(const UnicodeString& pattern,
 255                              const Locale& newLocale,
 256                              UErrorCode& success)
 257 : fLocale(newLocale),
 258   msgPattern(success),
 259   formatAliases(NULL),
 260   formatAliasesCapacity(0),
 261   argTypes(NULL),
 262   argTypeCount(0),
 263   argTypeCapacity(0),
 264   hasArgTypeConflicts(FALSE),
 265   defaultNumberFormat(NULL),
 266   defaultDateFormat(NULL),
 267   cachedFormatters(NULL),
 268   customFormatArgStarts(NULL),
 269   pluralProvider(*this, UPLURAL_TYPE_CARDINAL),
 270   ordinalProvider(*this, UPLURAL_TYPE_ORDINAL)
 271 {
 272     setLocaleIDs(fLocale.getName(), fLocale.getName());
 273     applyPattern(pattern, success);
 274 }
 275
 276 MessageFormat::MessageFormat(const UnicodeString& pattern,
 277                              const Locale& newLocale,
 278                              UParseError& parseError,
 279                              UErrorCode& success)
 280 : fLocale(newLocale),
 281   msgPattern(success),
 282   formatAliases(NULL),
 283   formatAliasesCapacity(0),
 284   argTypes(NULL),
 285   argTypeCount(0),
 286   argTypeCapacity(0),
 287   hasArgTypeConflicts(FALSE),
 288   defaultNumberFormat(NULL),
 289   defaultDateFormat(NULL),
 290   cachedFormatters(NULL),
 291   customFormatArgStarts(NULL),
 292   pluralProvider(*this, UPLURAL_TYPE_CARDINAL),
 293   ordinalProvider(*this, UPLURAL_TYPE_ORDINAL)
 294 {
 295     setLocaleIDs(fLocale.getName(), fLocale.getName());
 296     applyPattern(pattern, parseError, success);
 297 }
 298
 299 MessageFormat::MessageFormat(const MessageFormat& that)
 300 :
 301   Format(that),
 302   fLocale(that.fLocale),
 303   msgPattern(that.msgPattern),
 304   formatAliases(NULL),
 305   formatAliasesCapacity(0),
 306   argTypes(NULL),
 307   argTypeCount(0),
 308   argTypeCapacity(0),
 309   hasArgTypeConflicts(that.hasArgTypeConflicts),
 310   defaultNumberFormat(NULL),
 311   defaultDateFormat(NULL),
 312   cachedFormatters(NULL),
 313   customFormatArgStarts(NULL),
 314   pluralProvider(*this, UPLURAL_TYPE_CARDINAL),
 315   ordinalProvider(*this, UPLURAL_TYPE_ORDINAL)
 316 {
 317     // This will take care of creating the hash tables (since they are NULL).
 318     UErrorCode ec = U_ZERO_ERROR;
 319     copyObjects(that, ec);
 320     if (U_FAILURE(ec)) {
 321         resetPattern();
 322     }
 323 }
 324
 325 MessageFormat::~MessageFormat()
 326 {
 327     uhash_close(cachedFormatters);
 328     uhash_close(customFormatArgStarts);
 329
 330     uprv_free(argTypes);
 331     uprv_free(formatAliases);
 332     delete defaultNumberFormat;
 333     delete defaultDateFormat;
 334 }
 335
 336 //--------------------------------------------------------------------
 337 // Variable-size array management
 338
 339 /**
 340  * Allocate argTypes[] to at least the given capacity and return
 341  * TRUE if successful.  If not, leave argTypes[] unchanged.
 342  *
 343  * If argTypes is NULL, allocate it.  If it is not NULL, enlarge it
 344  * if necessary to be at least as large as specified.
 345  */
 346 UBool MessageFormat::allocateArgTypes(int32_t capacity, UErrorCode& status) {
 347     if (U_FAILURE(status)) {
 348         return FALSE;
 349     }
 350     if (argTypeCapacity >= capacity) {
 351         return TRUE;
 352     }
 353     if (capacity < DEFAULT_INITIAL_CAPACITY) {
 354         capacity = DEFAULT_INITIAL_CAPACITY;
 355     } else if (capacity < 2*argTypeCapacity) {
 356         capacity = 2*argTypeCapacity;
 357     }
 358     Formattable::Type* a = (Formattable::Type*)
 359             uprv_realloc(argTypes, sizeof(*argTypes) * capacity);
 360     if (a == NULL) {
 361         status = U_MEMORY_ALLOCATION_ERROR;
 362         return FALSE;
 363     }
 364     argTypes = a;
 365     argTypeCapacity = capacity;
 366     return TRUE;
 367 }
 368
 369 // -------------------------------------
 370 // assignment operator
 371
 372 const MessageFormat&
 373 MessageFormat::operator=(const MessageFormat& that)
 374 {
 375     if (this != &that) {
 376         // Calls the super class for assignment first.
 377         Format::operator=(that);
 378
 379         setLocale(that.fLocale);
 380         msgPattern = that.msgPattern;
 381         hasArgTypeConflicts = that.hasArgTypeConflicts;
 382
 383         UErrorCode ec = U_ZERO_ERROR;
 384         copyObjects(that, ec);
 385         if (U_FAILURE(ec)) {
 386             resetPattern();
 387         }
 388     }
 389     return *this;
 390 }
 391
 392 UBool
 393 MessageFormat::operator==(const Format& rhs) const
 394 {
 395     if (this == &rhs) return TRUE;
 396
 397     MessageFormat& that = (MessageFormat&)rhs;
 398
 399     // Check class ID before checking MessageFormat members
 400     if (!Format::operator==(rhs) ||
 401         msgPattern != that.msgPattern ||
 402         fLocale != that.fLocale) {
 403         return FALSE;
 404     }
 405
 406     // Compare hashtables.
 407     if ((customFormatArgStarts == NULL) != (that.customFormatArgStarts == NULL)) {
 408         return FALSE;
 409     }
 410     if (customFormatArgStarts == NULL) {
 411         return TRUE;
 412     }
 413
 414     UErrorCode ec = U_ZERO_ERROR;
 415     const int32_t count = uhash_count(customFormatArgStarts);
 416     const int32_t rhs_count = uhash_count(that.customFormatArgStarts);
 417     if (count != rhs_count) {
 418         return FALSE;
 419     }
 420     int32_t idx = 0, rhs_idx = 0, pos = UHASH_FIRST, rhs_pos = UHASH_FIRST;
 421     for (; idx < count && rhs_idx < rhs_count && U_SUCCESS(ec); ++idx, ++rhs_idx) {
 422         const UHashElement* cur = uhash_nextElement(customFormatArgStarts, &pos);
 423         const UHashElement* rhs_cur = uhash_nextElement(that.customFormatArgStarts, &rhs_pos);
 424         if (cur->key.integer != rhs_cur->key.integer) {
 425             return FALSE;
 426         }
 427         const Format* format = (const Format*)uhash_iget(cachedFormatters, cur->key.integer);
 428         const Format* rhs_format = (const Format*)uhash_iget(that.cachedFormatters, rhs_cur->key.integer);
 429         if (*format != *rhs_format) {
 430             return FALSE;
 431         }
 432     }
 433     return TRUE;
 434 }
 435
 436 // -------------------------------------
 437 // Creates a copy of this MessageFormat, the caller owns the copy.
 438
 439 MessageFormat*
 440 MessageFormat::clone() const
 441 {
 442     return new MessageFormat(*this);
 443 }
 444
 445 // -------------------------------------
 446 // Sets the locale of this MessageFormat object to theLocale.
 447
 448 void
 449 MessageFormat::setLocale(const Locale& theLocale)
 450 {
 451     if (fLocale != theLocale) {
 452         delete defaultNumberFormat;
 453         defaultNumberFormat = NULL;
 454         delete defaultDateFormat;
 455         defaultDateFormat = NULL;
 456         fLocale = theLocale;
 457         setLocaleIDs(fLocale.getName(), fLocale.getName());
 458         pluralProvider.reset();
 459         ordinalProvider.reset();
 460     }
 461 }
 462
 463 // -------------------------------------
 464 // Gets the locale of this MessageFormat object.
 465
 466 const Locale&
 467 MessageFormat::getLocale() const
 468 {
 469     return fLocale;
 470 }
 471
 472 void
 473 MessageFormat::applyPattern(const UnicodeString& newPattern,
 474                             UErrorCode& status)
 475 {
 476     UParseError parseError;
 477     applyPattern(newPattern,parseError,status);
 478 }
 479
 480
 481 // -------------------------------------
 482 // Applies the new pattern and returns an error if the pattern
 483 // is not correct.
 484 void
 485 MessageFormat::applyPattern(const UnicodeString& pattern,
 486                             UParseError& parseError,
 487                             UErrorCode& ec)
 488 {
 489     if(U_FAILURE(ec)) {
 490         return;
 491     }
 492     msgPattern.parse(pattern, &parseError, ec);
 493     cacheExplicitFormats(ec);
 494
 495     if (U_FAILURE(ec)) {
 496         resetPattern();
 497     }
 498 }
 499
 500 void MessageFormat::resetPattern() {
 501     msgPattern.clear();
 502     uhash_close(cachedFormatters);
 503     cachedFormatters = NULL;
 504     uhash_close(customFormatArgStarts);
 505     customFormatArgStarts = NULL;
 506     argTypeCount = 0;
 507     hasArgTypeConflicts = FALSE;
 508 }
 509
 510 void
 511 MessageFormat::applyPattern(const UnicodeString& pattern,
 512                             UMessagePatternApostropheMode aposMode,
 513                             UParseError* parseError,
 514                             UErrorCode& status) {
 515     if (aposMode != msgPattern.getApostropheMode()) {
 516         msgPattern.clearPatternAndSetApostropheMode(aposMode);
 517     }
 518     applyPattern(pattern, *parseError, status);
 519 }
 520
 521 // -------------------------------------
 522 // Converts this MessageFormat instance to a pattern.
 523
 524 UnicodeString&
 525 MessageFormat::toPattern(UnicodeString& appendTo) const {
 526     if ((customFormatArgStarts != NULL && 0 != uhash_count(customFormatArgStarts)) ||
 527         0 == msgPattern.countParts()
 528     ) {
 529         appendTo.setToBogus();
 530         return appendTo;
 531     }
 532     return appendTo.append(msgPattern.getPatternString());
 533 }
 534
 535 int32_t MessageFormat::nextTopLevelArgStart(int32_t partIndex) const {
 536     if (partIndex != 0) {
 537         partIndex = msgPattern.getLimitPartIndex(partIndex);
 538     }
 539     for (;;) {
 540         UMessagePatternPartType type = msgPattern.getPartType(++partIndex);
 541         if (type == UMSGPAT_PART_TYPE_ARG_START) {
 542             return partIndex;
 543         }
 544         if (type == UMSGPAT_PART_TYPE_MSG_LIMIT) {
 545             return -1;
 546         }
 547     }
 548 }
 549
 550 void MessageFormat::setArgStartFormat(int32_t argStart,
 551                                       Format* formatter,
 552                                       UErrorCode& status) {
 553     if (U_FAILURE(status)) {
 554         delete formatter;
 555         return;
 556     }
 557     if (cachedFormatters == NULL) {
 558         cachedFormatters=uhash_open(uhash_hashLong, uhash_compareLong,
 559                                     equalFormatsForHash, &status);
 560         if (U_FAILURE(status)) {
 561             delete formatter;
 562             return;
 563         }
 564         uhash_setValueDeleter(cachedFormatters, uprv_deleteUObject);
 565     }
 566     if (formatter == NULL) {
 567         formatter = new DummyFormat();
 568     }
 569     uhash_iput(cachedFormatters, argStart, formatter, &status);
 570 }
 571
 572
 573 UBool MessageFormat::argNameMatches(int32_t partIndex, const UnicodeString& argName, int32_t argNumber) {
 574     const MessagePattern::Part& part = msgPattern.getPart(partIndex);
 575     return part.getType() == UMSGPAT_PART_TYPE_ARG_NAME ?
 576         msgPattern.partSubstringMatches(part, argName) :
 577         part.getValue() == argNumber;  // ARG_NUMBER
 578 }
 579
 580 // Sets a custom formatter for a MessagePattern ARG_START part index.
 581 // "Custom" formatters are provided by the user via setFormat() or similar APIs.
 582 void MessageFormat::setCustomArgStartFormat(int32_t argStart,
 583                                             Format* formatter,
 584                                             UErrorCode& status) {
 585     setArgStartFormat(argStart, formatter, status);
 586     if (customFormatArgStarts == NULL) {
 587         customFormatArgStarts=uhash_open(uhash_hashLong, uhash_compareLong,
 588                                          NULL, &status);
 589     }
 590     uhash_iputi(customFormatArgStarts, argStart, 1, &status);
 591 }
 592
 593 Format* MessageFormat::getCachedFormatter(int32_t argumentNumber) const {
 594     if (cachedFormatters == NULL) {
 595         return NULL;
 596     }
 597     void* ptr = uhash_iget(cachedFormatters, argumentNumber);
 598     if (ptr != NULL && dynamic_cast<DummyFormat*>((Format*)ptr) == NULL) {
 599         return (Format*) ptr;
 600     } else {
 601         // Not cached, or a DummyFormat representing setFormat(NULL).
 602         return NULL;
 603     }
 604 }
 605
 606 // -------------------------------------
 607 // Adopts the new formats array and updates the array count.
 608 // This MessageFormat instance owns the new formats.
 609 void
 610 MessageFormat::adoptFormats(Format** newFormats,
 611                             int32_t count) {
 612     if (newFormats == NULL || count < 0) {
 613         return;
 614     }
 615     // Throw away any cached formatters.
 616     if (cachedFormatters != NULL) {
 617         uhash_removeAll(cachedFormatters);
 618     }
 619     if (customFormatArgStarts != NULL) {
 620         uhash_removeAll(customFormatArgStarts);
 621     }
 622
 623     int32_t formatNumber = 0;
 624     UErrorCode status = U_ZERO_ERROR;
 625     for (int32_t partIndex = 0;
 626         formatNumber < count && U_SUCCESS(status) &&
 627             (partIndex = nextTopLevelArgStart(partIndex)) >= 0;) {
 628         setCustomArgStartFormat(partIndex, newFormats[formatNumber], status);
 629         ++formatNumber;
 630     }
 631     // Delete those that didn't get used (if any).
 632     for (; formatNumber < count; ++formatNumber) {
 633         delete newFormats[formatNumber];
 634     }
 635
 636 }
 637
 638 // -------------------------------------
 639 // Sets the new formats array and updates the array count.
 640 // This MessageFormat instance maks a copy of the new formats.
 641
 642 void
 643 MessageFormat::setFormats(const Format** newFormats,
 644                           int32_t count) {
 645     if (newFormats == NULL || count < 0) {
 646         return;
 647     }
 648     // Throw away any cached formatters.
 649     if (cachedFormatters != NULL) {
 650         uhash_removeAll(cachedFormatters);
 651     }
 652     if (customFormatArgStarts != NULL) {
 653         uhash_removeAll(customFormatArgStarts);
 654     }
 655
 656     UErrorCode status = U_ZERO_ERROR;
 657     int32_t formatNumber = 0;
 658     for (int32_t partIndex = 0;
 659         formatNumber < count && U_SUCCESS(status) && (partIndex = nextTopLevelArgStart(partIndex)) >= 0;) {
 660       Format* newFormat = NULL;
 661       if (newFormats[formatNumber] != NULL) {
 662           newFormat = newFormats[formatNumber]->clone();
 663           if (newFormat == NULL) {
 664               status = U_MEMORY_ALLOCATION_ERROR;
 665           }
 666       }
 667       setCustomArgStartFormat(partIndex, newFormat, status);
 668       ++formatNumber;
 669     }
 670     if (U_FAILURE(status)) {
 671         resetPattern();
 672     }
 673 }
 674
 675 // -------------------------------------
 676 // Adopt a single format by format number.
 677 // Do nothing if the format number is not less than the array count.
 678
 679 void
 680 MessageFormat::adoptFormat(int32_t n, Format *newFormat) {
 681     LocalPointer<Format> p(newFormat);
 682     if (n >= 0) {
 683         int32_t formatNumber = 0;
 684         for (int32_t partIndex = 0; (partIndex = nextTopLevelArgStart(partIndex)) >= 0;) {
 685             if (n == formatNumber) {
 686                 UErrorCode status = U_ZERO_ERROR;
 687                 setCustomArgStartFormat(partIndex, p.orphan(), status);
 688                 return;
 689             }
 690             ++formatNumber;
 691         }
 692     }
 693 }
 694
 695 // -------------------------------------
 696 // Adopt a single format by format name.
 697 // Do nothing if there is no match of formatName.
 698 void
 699 MessageFormat::adoptFormat(const UnicodeString& formatName,
 700                            Format* formatToAdopt,
 701                            UErrorCode& status) {
 702     LocalPointer<Format> p(formatToAdopt);
 703     if (U_FAILURE(status)) {
 704         return;
 705     }
 706     int32_t argNumber = MessagePattern::validateArgumentName(formatName);
 707     if (argNumber < UMSGPAT_ARG_NAME_NOT_NUMBER) {
 708         status = U_ILLEGAL_ARGUMENT_ERROR;
 709         return;
 710     }
 711     for (int32_t partIndex = 0;
 712         (partIndex = nextTopLevelArgStart(partIndex)) >= 0 && U_SUCCESS(status);
 713     ) {
 714         if (argNameMatches(partIndex + 1, formatName, argNumber)) {
 715             Format* f;
 716             if (p.isValid()) {
 717                 f = p.orphan();
 718             } else if (formatToAdopt == NULL) {
 719                 f = NULL;
 720             } else {
 721                 f = formatToAdopt->clone();
 722                 if (f == NULL) {
 723                     status = U_MEMORY_ALLOCATION_ERROR;
 724                     return;
 725                 }
 726             }
 727             setCustomArgStartFormat(partIndex, f, status);
 728         }
 729     }
 730 }
 731
 732 // -------------------------------------
 733 // Set a single format.
 734 // Do nothing if the variable is not less than the array count.
 735 void
 736 MessageFormat::setFormat(int32_t n, const Format& newFormat) {
 737
 738     if (n >= 0) {
 739         int32_t formatNumber = 0;
 740         for (int32_t partIndex = 0;
 741              (partIndex = nextTopLevelArgStart(partIndex)) >= 0;) {
 742             if (n == formatNumber) {
 743                 Format* new_format = newFormat.clone();
 744                 if (new_format) {
 745                     UErrorCode status = U_ZERO_ERROR;
 746                     setCustomArgStartFormat(partIndex, new_format, status);
 747                 }
 748                 return;
 749             }
 750             ++formatNumber;
 751         }
 752     }
 753 }
 754
 755 // -------------------------------------
 756 // Get a single format by format name.
 757 // Do nothing if the variable is not less than the array count.
 758 Format *
 759 MessageFormat::getFormat(const UnicodeString& formatName, UErrorCode& status) {
 760     if (U_FAILURE(status) || cachedFormatters == NULL) return NULL;
 761
 762     int32_t argNumber = MessagePattern::validateArgumentName(formatName);
 763     if (argNumber < UMSGPAT_ARG_NAME_NOT_NUMBER) {
 764         status = U_ILLEGAL_ARGUMENT_ERROR;
 765         return NULL;
 766     }
 767     for (int32_t partIndex = 0; (partIndex = nextTopLevelArgStart(partIndex)) >= 0;) {
 768         if (argNameMatches(partIndex + 1, formatName, argNumber)) {
 769             return getCachedFormatter(partIndex);
 770         }
 771     }
 772     return NULL;
 773 }
 774
 775 // -------------------------------------
 776 // Set a single format by format name
 777 // Do nothing if the variable is not less than the array count.
 778 void
 779 MessageFormat::setFormat(const UnicodeString& formatName,
 780                          const Format& newFormat,
 781                          UErrorCode& status) {
 782     if (U_FAILURE(status)) return;
 783
 784     int32_t argNumber = MessagePattern::validateArgumentName(formatName);
 785     if (argNumber < UMSGPAT_ARG_NAME_NOT_NUMBER) {
 786         status = U_ILLEGAL_ARGUMENT_ERROR;
 787         return;
 788     }
 789     for (int32_t partIndex = 0;
 790         (partIndex = nextTopLevelArgStart(partIndex)) >= 0 && U_SUCCESS(status);
 791     ) {
 792         if (argNameMatches(partIndex + 1, formatName, argNumber)) {
 793             Format* new_format = newFormat.clone();
 794             if (new_format == NULL) {
 795                 status = U_MEMORY_ALLOCATION_ERROR;
 796                 return;
 797             }
 798             setCustomArgStartFormat(partIndex, new_format, status);
 799         }
 800     }
 801 }
 802
 803 // -------------------------------------
 804 // Gets the format array.
 805 const Format**
 806 MessageFormat::getFormats(int32_t& cnt) const
 807 {
 808     // This old API returns an array (which we hold) of Format*
 809     // pointers.  The array is valid up to the next call to any
 810     // method on this object.  We construct and resize an array
 811     // on demand that contains aliases to the subformats[i].format
 812     // pointers.
 813
 814     // Get total required capacity first (it's refreshed on each call).
 815     int32_t totalCapacity = 0;
 816     for (int32_t partIndex = 0; (partIndex = nextTopLevelArgStart(partIndex)) >= 0; ++totalCapacity) {}
 817
 818     MessageFormat* t = const_cast<MessageFormat*> (this);
 819     cnt = 0;
 820     if (formatAliases == nullptr) {
 821         t->formatAliasesCapacity = totalCapacity;
 822         Format** a = (Format**)
 823             uprv_malloc(sizeof(Format*) * formatAliasesCapacity);
 824         if (a == nullptr) {
 825             t->formatAliasesCapacity = 0;
 826             return nullptr;
 827         }
 828         t->formatAliases = a;
 829     } else if (totalCapacity > formatAliasesCapacity) {
 830         Format** a = (Format**)
 831             uprv_realloc(formatAliases, sizeof(Format*) * totalCapacity);
 832         if (a == nullptr) {
 833             t->formatAliasesCapacity = 0;
 834             return nullptr;
 835         }
 836         t->formatAliases = a;
 837         t->formatAliasesCapacity = totalCapacity;
 838     }
 839
 840     for (int32_t partIndex = 0; (partIndex = nextTopLevelArgStart(partIndex)) >= 0;) {
 841         t->formatAliases[cnt++] = getCachedFormatter(partIndex);
 842     }
 843
 844     return (const Format**)formatAliases;
 845 }
 846
 847
 848 UnicodeString MessageFormat::getArgName(int32_t partIndex) {
 849     const MessagePattern::Part& part = msgPattern.getPart(partIndex);
 850     return msgPattern.getSubstring(part);
 851 }
 852
 853 StringEnumeration*
 854 MessageFormat::getFormatNames(UErrorCode& status) {
 855     if (U_FAILURE(status))  return NULL;
 856
 857     UVector *fFormatNames = new UVector(status);
 858     if (U_FAILURE(status)) {
 859         status = U_MEMORY_ALLOCATION_ERROR;
 860         return NULL;
 861     }
 862     fFormatNames->setDeleter(uprv_deleteUObject);
 863
 864     for (int32_t partIndex = 0; (partIndex = nextTopLevelArgStart(partIndex)) >= 0;) {
 865         fFormatNames->addElement(new UnicodeString(getArgName(partIndex + 1)), status);
 866     }
 867
 868     StringEnumeration* nameEnumerator = new FormatNameEnumeration(fFormatNames, status);
 869     return nameEnumerator;
 870 }
 871
 872 // -------------------------------------
 873 // Formats the source Formattable array and copy into the result buffer.
 874 // Ignore the FieldPosition result for error checking.
 875
 876 UnicodeString&
 877 MessageFormat::format(const Formattable* source,
 878                       int32_t cnt,
 879                       UnicodeString& appendTo,
 880                       FieldPosition& ignore,
 881                       UErrorCode& success) const
 882 {
 883     return format(source, NULL, cnt, appendTo, &ignore, success);
 884 }
 885
 886 // -------------------------------------
 887 // Internally creates a MessageFormat instance based on the
 888 // pattern and formats the arguments Formattable array and
 889 // copy into the appendTo buffer.
 890
 891 UnicodeString&
 892 MessageFormat::format(  const UnicodeString& pattern,
 893                         const Formattable* arguments,
 894                         int32_t cnt,
 895                         UnicodeString& appendTo,
 896                         UErrorCode& success)
 897 {
 898     MessageFormat temp(pattern, success);
 899     return temp.format(arguments, NULL, cnt, appendTo, NULL, success);
 900 }
 901
 902 // -------------------------------------
 903 // Formats the source Formattable object and copy into the
 904 // appendTo buffer.  The Formattable object must be an array
 905 // of Formattable instances, returns error otherwise.
 906
 907 UnicodeString&
 908 MessageFormat::format(const Formattable& source,
 909                       UnicodeString& appendTo,
 910                       FieldPosition& ignore,
 911                       UErrorCode& success) const
 912 {
 913     if (U_FAILURE(success))
 914         return appendTo;
 915     if (source.getType() != Formattable::kArray) {
 916         success = U_ILLEGAL_ARGUMENT_ERROR;
 917         return appendTo;
 918     }
 919     int32_t cnt;
 920     const Formattable* tmpPtr = source.getArray(cnt);
 921     return format(tmpPtr, NULL, cnt, appendTo, &ignore, success);
 922 }
 923
 924 UnicodeString&
 925 MessageFormat::format(const UnicodeString* argumentNames,
 926                       const Formattable* arguments,
 927                       int32_t count,
 928                       UnicodeString& appendTo,
 929                       UErrorCode& success) const {
 930     return format(arguments, argumentNames, count, appendTo, NULL, success);
 931 }
 932
 933 // Does linear search to find the match for an ArgName.
 934 const Formattable* MessageFormat::getArgFromListByName(const Formattable* arguments,
 935                                                        const UnicodeString *argumentNames,
 936                                                        int32_t cnt, UnicodeString& name) const {
 937     for (int32_t i = 0; i < cnt; ++i) {
 938         if (0 == argumentNames[i].compare(name)) {
 939             return arguments + i;
 940         }
 941     }
 942     return NULL;
 943 }
 944
 945
 946 UnicodeString&
 947 MessageFormat::format(const Formattable* arguments,
 948                       const UnicodeString *argumentNames,
 949                       int32_t cnt,
 950                       UnicodeString& appendTo,
 951                       FieldPosition* pos,
 952                       UErrorCode& status) const {
 953     if (U_FAILURE(status)) {
 954         return appendTo;
 955     }
 956
 957     UnicodeStringAppendable usapp(appendTo);
 958     AppendableWrapper app(usapp);
 959     format(0, NULL, arguments, argumentNames, cnt, app, pos, status);
 960     return appendTo;
 961 }
 962
 963 namespace {
 964
 965 /**
 966  * Mutable input/output values for the PluralSelectorProvider.
 967  * Separate so that it is possible to make MessageFormat Freezable.
 968  */
 969 class PluralSelectorContext {
 970 public:
 971     PluralSelectorContext(int32_t start, const UnicodeString &name,
 972                           const Formattable &num, double off, UErrorCode &errorCode)
 973             : startIndex(start), argName(name), offset(off),
 974               numberArgIndex(-1), formatter(NULL), forReplaceNumber(FALSE) {
 975         // number needs to be set even when select() is not called.
 976         // Keep it as a Number/Formattable:
 977         // For format() methods, and to preserve information (e.g., BigDecimal).
 978         if(off == 0) {
 979             number = num;
 980         } else {
 981             number = num.getDouble(errorCode) - off;
 982         }
 983     }
 984
 985     // Input values for plural selection with decimals.
 986     int32_t startIndex;
 987     const UnicodeString &argName;
 988     /** argument number - plural offset */
 989     Formattable number;
 990     double offset;
 991     // Output values for plural selection with decimals.
 992     /** -1 if REPLACE_NUMBER, 0 arg not found, >0 ARG_START index */
 993     int32_t numberArgIndex;
 994     const Format *formatter;
 995     /** formatted argument number - plural offset */
 996     UnicodeString numberString;
 997     /** TRUE if number-offset was formatted with the stock number formatter */
 998     UBool forReplaceNumber;
 999 };
1000
1001 }  // namespace
1002
1003 // if argumentNames is NULL, this means arguments is a numeric array.
1004 // arguments can not be NULL.
1005 // We use const void *plNumber rather than const PluralSelectorContext *pluralNumber
1006 // so that we need not declare the PluralSelectorContext in the public header file.
1007 void MessageFormat::format(int32_t msgStart, const void *plNumber,
1008                            const Formattable* arguments,
1009                            const UnicodeString *argumentNames,
1010                            int32_t cnt,
1011                            AppendableWrapper& appendTo,
1012                            FieldPosition* ignore,
1013                            UErrorCode& success) const {
1014     if (U_FAILURE(success)) {
1015         return;
1016     }
1017
1018     const UnicodeString& msgString = msgPattern.getPatternString();
1019     int32_t prevIndex = msgPattern.getPart(msgStart).getLimit();
1020     for (int32_t i = msgStart + 1; U_SUCCESS(success) ; ++i) {
1021         const MessagePattern::Part* part = &msgPattern.getPart(i);
1022         const UMessagePatternPartType type = part->getType();
1023         int32_t index = part->getIndex();
1024         appendTo.append(msgString, prevIndex, index - prevIndex);
1025         if (type == UMSGPAT_PART_TYPE_MSG_LIMIT) {
1026             return;
1027         }
1028         prevIndex = part->getLimit();
1029         if (type == UMSGPAT_PART_TYPE_REPLACE_NUMBER) {
1030             const PluralSelectorContext &pluralNumber =
1031                 *static_cast<const PluralSelectorContext *>(plNumber);
1032             if(pluralNumber.forReplaceNumber) {
1033                 // number-offset was already formatted.
1034                 appendTo.formatAndAppend(pluralNumber.formatter,
1035                         pluralNumber.number, pluralNumber.numberString, success);
1036             } else {
1037                 const NumberFormat* nf = getDefaultNumberFormat(success);
1038                 appendTo.formatAndAppend(nf, pluralNumber.number, success);
1039             }
1040             continue;
1041         }
1042         if (type != UMSGPAT_PART_TYPE_ARG_START) {
1043             continue;
1044         }
1045         int32_t argLimit = msgPattern.getLimitPartIndex(i);
1046         UMessagePatternArgType argType = part->getArgType();
1047         part = &msgPattern.getPart(++i);
1048         const Formattable* arg;
1049         UBool noArg = FALSE;
1050         UnicodeString argName = msgPattern.getSubstring(*part);
1051         if (argumentNames == NULL) {
1052             int32_t argNumber = part->getValue();  // ARG_NUMBER
1053             if (0 <= argNumber && argNumber < cnt) {
1054                 arg = arguments + argNumber;
1055             } else {
1056                 arg = NULL;
1057                 noArg = TRUE;
1058             }
1059         } else {
1060             arg = getArgFromListByName(arguments, argumentNames, cnt, argName);
1061             if (arg == NULL) {
1062                 noArg = TRUE;
1063             }
1064         }
1065         ++i;
1066         int32_t prevDestLength = appendTo.length();
1067         const Format* formatter = NULL;
1068         if (noArg) {
1069             appendTo.append(
1070                 UnicodeString(LEFT_CURLY_BRACE).append(argName).append(RIGHT_CURLY_BRACE));
1071         } else if (arg == NULL) {
1072             appendTo.append(NULL_STRING, 4);
1073         } else if(plNumber!=NULL &&
1074                 static_cast<const PluralSelectorContext *>(plNumber)->numberArgIndex==(i-2)) {
1075             const PluralSelectorContext &pluralNumber =
1076                 *static_cast<const PluralSelectorContext *>(plNumber);
1077             if(pluralNumber.offset == 0) {
1078                 // The number was already formatted with this formatter.
1079                 appendTo.formatAndAppend(pluralNumber.formatter, pluralNumber.number,
1080                                          pluralNumber.numberString, success);
1081             } else {
1082                 // Do not use the formatted (number-offset) string for a named argument
1083                 // that formats the number without subtracting the offset.
1084                 appendTo.formatAndAppend(pluralNumber.formatter, *arg, success);
1085             }
1086         } else if ((formatter = getCachedFormatter(i -2)) != 0) {
1087             // Handles all ArgType.SIMPLE, and formatters from setFormat() and its siblings.
1088             if (dynamic_cast<const ChoiceFormat*>(formatter) ||
1089                 dynamic_cast<const PluralFormat*>(formatter) ||
1090                 dynamic_cast<const SelectFormat*>(formatter)) {
1091                 // We only handle nested formats here if they were provided via
1092                 // setFormat() or its siblings. Otherwise they are not cached and instead
1093                 // handled below according to argType.
1094                 UnicodeString subMsgString;
1095                 formatter->format(*arg, subMsgString, success);
1096                 if (subMsgString.indexOf(LEFT_CURLY_BRACE) >= 0 ||
1097                     (subMsgString.indexOf(SINGLE_QUOTE) >= 0 && !MessageImpl::jdkAposMode(msgPattern))
1098                 ) {
1099                     MessageFormat subMsgFormat(subMsgString, fLocale, success);
1100                     subMsgFormat.format(0, NULL, arguments, argumentNames, cnt, appendTo, ignore, success);
1101                 } else {
1102                     appendTo.append(subMsgString);
1103                 }
1104             } else {
1105                 appendTo.formatAndAppend(formatter, *arg, success);
1106             }
1107         } else if (argType == UMSGPAT_ARG_TYPE_NONE || (cachedFormatters && uhash_iget(cachedFormatters, i - 2))) {
1108             // We arrive here if getCachedFormatter returned NULL, but there was actually an element in the hash table.
1109             // This can only happen if the hash table contained a DummyFormat, so the if statement above is a check
1110             // for the hash table containind DummyFormat.
1111             if (arg->isNumeric()) {
1112                 const NumberFormat* nf = getDefaultNumberFormat(success);
1113                 appendTo.formatAndAppend(nf, *arg, success);
1114             } else if (arg->getType() == Formattable::kDate) {
1115                 const DateFormat* df = getDefaultDateFormat(success);
1116                 appendTo.formatAndAppend(df, *arg, success);
1117             } else {
1118                 appendTo.append(arg->getString(success));
1119             }
1120         } else if (argType == UMSGPAT_ARG_TYPE_CHOICE) {
1121             if (!arg->isNumeric()) {
1122                 success = U_ILLEGAL_ARGUMENT_ERROR;
1123                 return;
1124             }
1125             // We must use the Formattable::getDouble() variant with the UErrorCode parameter
1126             // because only this one converts non-double numeric types to double.
1127             const double number = arg->getDouble(success);
1128             int32_t subMsgStart = ChoiceFormat::findSubMessage(msgPattern, i, number);
1129             formatComplexSubMessage(subMsgStart, NULL, arguments, argumentNames,
1130                                     cnt, appendTo, success);
1131         } else if (UMSGPAT_ARG_TYPE_HAS_PLURAL_STYLE(argType)) {
1132             if (!arg->isNumeric()) {
1133                 success = U_ILLEGAL_ARGUMENT_ERROR;
1134                 return;
1135             }
1136             const PluralSelectorProvider &selector =
1137                 argType == UMSGPAT_ARG_TYPE_PLURAL ? pluralProvider : ordinalProvider;
1138             // We must use the Formattable::getDouble() variant with the UErrorCode parameter
1139             // because only this one converts non-double numeric types to double.
1140             double offset = msgPattern.getPluralOffset(i);
1141             PluralSelectorContext context(i, argName, *arg, offset, success);
1142             int32_t subMsgStart = PluralFormat::findSubMessage(
1143                     msgPattern, i, selector, &context, arg->getDouble(success), success);
1144             formatComplexSubMessage(subMsgStart, &context, arguments, argumentNames,
1145                                     cnt, appendTo, success);
1146         } else if (argType == UMSGPAT_ARG_TYPE_SELECT) {
1147             int32_t subMsgStart = SelectFormat::findSubMessage(msgPattern, i, arg->getString(success), success);
1148             formatComplexSubMessage(subMsgStart, NULL, arguments, argumentNames,
1149                                     cnt, appendTo, success);
1150         } else {
1151             // This should never happen.
1152             success = U_INTERNAL_PROGRAM_ERROR;
1153             return;
1154         }
1155         ignore = updateMetaData(appendTo, prevDestLength, ignore, arg);
1156         prevIndex = msgPattern.getPart(argLimit).getLimit();
1157         i = argLimit;
1158     }
1159 }
1160
1161
1162 void MessageFormat::formatComplexSubMessage(int32_t msgStart,
1163                                             const void *plNumber,
1164                                             const Formattable* arguments,
1165                                             const UnicodeString *argumentNames,
1166                                             int32_t cnt,
1167                                             AppendableWrapper& appendTo,
1168                                             UErrorCode& success) const {
1169     if (U_FAILURE(success)) {
1170         return;
1171     }
1172
1173     if (!MessageImpl::jdkAposMode(msgPattern)) {
1174         format(msgStart, plNumber, arguments, argumentNames, cnt, appendTo, NULL, success);
1175         return;
1176     }
1177
1178     // JDK compatibility mode: (see JDK MessageFormat.format() API docs)
1179     // - remove SKIP_SYNTAX; that is, remove half of the apostrophes
1180     // - if the result string contains an open curly brace '{' then
1181     //   instantiate a temporary MessageFormat object and format again;
1182     //   otherwise just append the result string
1183     const UnicodeString& msgString = msgPattern.getPatternString();
1184     UnicodeString sb;
1185     int32_t prevIndex = msgPattern.getPart(msgStart).getLimit();
1186     for (int32_t i = msgStart;;) {
1187         const MessagePattern::Part& part = msgPattern.getPart(++i);
1188         const UMessagePatternPartType type = part.getType();
1189         int32_t index = part.getIndex();
1190         if (type == UMSGPAT_PART_TYPE_MSG_LIMIT) {
1191             sb.append(msgString, prevIndex, index - prevIndex);
1192             break;
1193         } else if (type == UMSGPAT_PART_TYPE_REPLACE_NUMBER || type == UMSGPAT_PART_TYPE_SKIP_SYNTAX) {
1194             sb.append(msgString, prevIndex, index - prevIndex);
1195             if (type == UMSGPAT_PART_TYPE_REPLACE_NUMBER) {
1196                 const PluralSelectorContext &pluralNumber =
1197                     *static_cast<const PluralSelectorContext *>(plNumber);
1198                 if(pluralNumber.forReplaceNumber) {
1199                     // number-offset was already formatted.
1200                     sb.append(pluralNumber.numberString);
1201                 } else {
1202                     const NumberFormat* nf = getDefaultNumberFormat(success);
1203                     sb.append(nf->format(pluralNumber.number, sb, success));
1204                 }
1205             }
1206             prevIndex = part.getLimit();
1207         } else if (type == UMSGPAT_PART_TYPE_ARG_START) {
1208             sb.append(msgString, prevIndex, index - prevIndex);
1209             prevIndex = index;
1210             i = msgPattern.getLimitPartIndex(i);
1211             index = msgPattern.getPart(i).getLimit();
1212             MessageImpl::appendReducedApostrophes(msgString, prevIndex, index, sb);
1213             prevIndex = index;
1214         }
1215     }
1216     if (sb.indexOf(LEFT_CURLY_BRACE) >= 0) {
1217         UnicodeString emptyPattern;  // gcc 3.3.3 fails with "UnicodeString()" as the first parameter.
1218         MessageFormat subMsgFormat(emptyPattern, fLocale, success);
1219         subMsgFormat.applyPattern(sb, UMSGPAT_APOS_DOUBLE_REQUIRED, NULL, success);
1220         subMsgFormat.format(0, NULL, arguments, argumentNames, cnt, appendTo, NULL, success);
1221     } else {
1222         appendTo.append(sb);
1223     }
1224 }
1225
1226
1227 UnicodeString MessageFormat::getLiteralStringUntilNextArgument(int32_t from) const {
1228     const UnicodeString& msgString=msgPattern.getPatternString();
1229     int32_t prevIndex=msgPattern.getPart(from).getLimit();
1230     UnicodeString b;
1231     for (int32_t i = from + 1; ; ++i) {
1232         const MessagePattern::Part& part = msgPattern.getPart(i);
1233         const UMessagePatternPartType type=part.getType();
1234         int32_t index=part.getIndex();
1235         b.append(msgString, prevIndex, index - prevIndex);
1236         if(type==UMSGPAT_PART_TYPE_ARG_START || type==UMSGPAT_PART_TYPE_MSG_LIMIT) {
1237             return b;
1238         }
1239         // Unexpected Part "part" in parsed message.
1240         U_ASSERT(type==UMSGPAT_PART_TYPE_SKIP_SYNTAX || type==UMSGPAT_PART_TYPE_INSERT_CHAR);
1241         prevIndex=part.getLimit();
1242     }
1243 }
1244
1245
1246 FieldPosition* MessageFormat::updateMetaData(AppendableWrapper& /*dest*/, int32_t /*prevLength*/,
1247                              FieldPosition* /*fp*/, const Formattable* /*argId*/) const {
1248     // Unlike in Java, there are no field attributes defined for MessageFormat. Do nothing.
1249     return NULL;
1250     /*
1251       if (fp != NULL && Field.ARGUMENT.equals(fp.getFieldAttribute())) {
1252           fp->setBeginIndex(prevLength);
1253           fp->setEndIndex(dest.get_length());
1254           return NULL;
1255       }
1256       return fp;
1257     */
1258 }
1259
1260 int32_t
1261 MessageFormat::findOtherSubMessage(int32_t partIndex) const {
1262     int32_t count=msgPattern.countParts();
1263     const MessagePattern::Part *part = &msgPattern.getPart(partIndex);
1264     if(MessagePattern::Part::hasNumericValue(part->getType())) {
1265         ++partIndex;
1266     }
1267     // Iterate over (ARG_SELECTOR [ARG_INT|ARG_DOUBLE] message) tuples
1268     // until ARG_LIMIT or end of plural-only pattern.
1269     UnicodeString other(FALSE, OTHER_STRING, 5);
1270     do {
1271         part=&msgPattern.getPart(partIndex++);
1272         UMessagePatternPartType type=part->getType();
1273         if(type==UMSGPAT_PART_TYPE_ARG_LIMIT) {
1274             break;
1275         }
1276         U_ASSERT(type==UMSGPAT_PART_TYPE_ARG_SELECTOR);
1277         // part is an ARG_SELECTOR followed by an optional explicit value, and then a message
1278         if(msgPattern.partSubstringMatches(*part, other)) {
1279             return partIndex;
1280         }
1281         if(MessagePattern::Part::hasNumericValue(msgPattern.getPartType(partIndex))) {
1282             ++partIndex;  // skip the numeric-value part of "=1" etc.
1283         }
1284         partIndex=msgPattern.getLimitPartIndex(partIndex);
1285     } while(++partIndex<count);
1286     return 0;
1287 }
1288
1289 int32_t
1290 MessageFormat::findFirstPluralNumberArg(int32_t msgStart, const UnicodeString &argName) const {
1291     for(int32_t i=msgStart+1;; ++i) {
1292         const MessagePattern::Part &part=msgPattern.getPart(i);
1293         UMessagePatternPartType type=part.getType();
1294         if(type==UMSGPAT_PART_TYPE_MSG_LIMIT) {
1295             return 0;
1296         }
1297         if(type==UMSGPAT_PART_TYPE_REPLACE_NUMBER) {
1298             return -1;
1299         }
1300         if(type==UMSGPAT_PART_TYPE_ARG_START) {
1301             UMessagePatternArgType argType=part.getArgType();
1302             if(!argName.isEmpty() && (argType==UMSGPAT_ARG_TYPE_NONE || argType==UMSGPAT_ARG_TYPE_SIMPLE)) {
1303                 // ARG_NUMBER or ARG_NAME
1304                 if(msgPattern.partSubstringMatches(msgPattern.getPart(i+1), argName)) {
1305                     return i;
1306                 }
1307             }
1308             i=msgPattern.getLimitPartIndex(i);
1309         }
1310     }
1311 }
1312
1313 void MessageFormat::copyObjects(const MessageFormat& that, UErrorCode& ec) {
1314     // Deep copy pointer fields.
1315     // We need not copy the formatAliases because they are re-filled
1316     // in each getFormats() call.
1317     // The defaultNumberFormat, defaultDateFormat and pluralProvider.rules
1318     // also get created on demand.
1319     argTypeCount = that.argTypeCount;
1320     if (argTypeCount > 0) {
1321         if (!allocateArgTypes(argTypeCount, ec)) {
1322             return;
1323         }
1324         uprv_memcpy(argTypes, that.argTypes, argTypeCount * sizeof(argTypes[0]));
1325     }
1326     if (cachedFormatters != NULL) {
1327         uhash_removeAll(cachedFormatters);
1328     }
1329     if (customFormatArgStarts != NULL) {
1330         uhash_removeAll(customFormatArgStarts);
1331     }
1332     if (that.cachedFormatters) {
1333         if (cachedFormatters == NULL) {
1334             cachedFormatters=uhash_open(uhash_hashLong, uhash_compareLong,
1335                                         equalFormatsForHash, &ec);
1336             if (U_FAILURE(ec)) {
1337                 return;
1338             }
1339             uhash_setValueDeleter(cachedFormatters, uprv_deleteUObject);
1340         }
1341
1342         const int32_t count = uhash_count(that.cachedFormatters);
1343         int32_t pos, idx;
1344         for (idx = 0, pos = UHASH_FIRST; idx < count && U_SUCCESS(ec); ++idx) {
1345             const UHashElement* cur = uhash_nextElement(that.cachedFormatters, &pos);
1346             Format* newFormat = ((Format*)(cur->value.pointer))->clone();
1347             if (newFormat) {
1348                 uhash_iput(cachedFormatters, cur->key.integer, newFormat, &ec);
1349             } else {
1350                 ec = U_MEMORY_ALLOCATION_ERROR;
1351                 return;
1352             }
1353         }
1354     }
1355     if (that.customFormatArgStarts) {
1356         if (customFormatArgStarts == NULL) {
1357             customFormatArgStarts=uhash_open(uhash_hashLong, uhash_compareLong,
1358                                               NULL, &ec);
1359         }
1360         const int32_t count = uhash_count(that.customFormatArgStarts);
1361         int32_t pos, idx;
1362         for (idx = 0, pos = UHASH_FIRST; idx < count && U_SUCCESS(ec); ++idx) {
1363             const UHashElement* cur = uhash_nextElement(that.customFormatArgStarts, &pos);
1364             uhash_iputi(customFormatArgStarts, cur->key.integer, cur->value.integer, &ec);
1365         }
1366     }
1367 }
1368
1369
1370 Formattable*
1371 MessageFormat::parse(int32_t msgStart,
1372                      const UnicodeString& source,
1373                      ParsePosition& pos,
1374                      int32_t& count,
1375                      UErrorCode& ec) const {
1376     count = 0;
1377     if (U_FAILURE(ec)) {
1378         pos.setErrorIndex(pos.getIndex());
1379         return NULL;
1380     }
1381     // parse() does not work with named arguments.
1382     if (msgPattern.hasNamedArguments()) {
1383         ec = U_ARGUMENT_TYPE_MISMATCH;
1384         pos.setErrorIndex(pos.getIndex());
1385         return NULL;
1386     }
1387     LocalArray<Formattable> resultArray(new Formattable[argTypeCount ? argTypeCount : 1]);
1388     const UnicodeString& msgString=msgPattern.getPatternString();
1389     int32_t prevIndex=msgPattern.getPart(msgStart).getLimit();
1390     int32_t sourceOffset = pos.getIndex();
1391     ParsePosition tempStatus(0);
1392
1393     for(int32_t i=msgStart+1; ; ++i) {
1394         UBool haveArgResult = FALSE;
1395         const MessagePattern::Part* part=&msgPattern.getPart(i);
1396         const UMessagePatternPartType type=part->getType();
1397         int32_t index=part->getIndex();
1398         // Make sure the literal string matches.
1399         int32_t len = index - prevIndex;
1400         if (len == 0 || (0 == msgString.compare(prevIndex, len, source, sourceOffset, len))) {
1401             sourceOffset += len;
1402             prevIndex += len;
1403         } else {
1404             pos.setErrorIndex(sourceOffset);
1405             return NULL; // leave index as is to signal error
1406         }
1407         if(type==UMSGPAT_PART_TYPE_MSG_LIMIT) {
1408             // Things went well! Done.
1409             pos.setIndex(sourceOffset);
1410             return resultArray.orphan();
1411         }
1412         if(type==UMSGPAT_PART_TYPE_SKIP_SYNTAX || type==UMSGPAT_PART_TYPE_INSERT_CHAR) {
1413             prevIndex=part->getLimit();
1414             continue;
1415         }
1416         // We do not support parsing Plural formats. (No REPLACE_NUMBER here.)
1417         // Unexpected Part "part" in parsed message.
1418         U_ASSERT(type==UMSGPAT_PART_TYPE_ARG_START);
1419         int32_t argLimit=msgPattern.getLimitPartIndex(i);
1420
1421         UMessagePatternArgType argType=part->getArgType();
1422         part=&msgPattern.getPart(++i);
1423         int32_t argNumber = part->getValue();  // ARG_NUMBER
1424         UnicodeString key;
1425         ++i;
1426         const Format* formatter = NULL;
1427         Formattable& argResult = resultArray[argNumber];
1428
1429         if(cachedFormatters!=NULL && (formatter = getCachedFormatter(i - 2))!=NULL) {
1430             // Just parse using the formatter.
1431             tempStatus.setIndex(sourceOffset);
1432             formatter->parseObject(source, argResult, tempStatus);
1433             if (tempStatus.getIndex() == sourceOffset) {
1434                 pos.setErrorIndex(sourceOffset);
1435                 return NULL; // leave index as is to signal error
1436             }
1437             sourceOffset = tempStatus.getIndex();
1438             haveArgResult = TRUE;
1439         } else if(
1440             argType==UMSGPAT_ARG_TYPE_NONE || (cachedFormatters && uhash_iget(cachedFormatters, i -2))) {
1441             // We arrive here if getCachedFormatter returned NULL, but there was actually an element in the hash table.
1442             // This can only happen if the hash table contained a DummyFormat, so the if statement above is a check
1443             // for the hash table containind DummyFormat.
1444
1445             // Match as a string.
1446             // if at end, use longest possible match
1447             // otherwise uses first match to intervening string
1448             // does NOT recursively try all possibilities
1449             UnicodeString stringAfterArgument = getLiteralStringUntilNextArgument(argLimit);
1450             int32_t next;
1451             if (!stringAfterArgument.isEmpty()) {
1452                 next = source.indexOf(stringAfterArgument, sourceOffset);
1453             } else {
1454                 next = source.length();
1455             }
1456             if (next < 0) {
1457                 pos.setErrorIndex(sourceOffset);
1458                 return NULL; // leave index as is to signal error
1459             } else {
1460                 UnicodeString strValue(source.tempSubString(sourceOffset, next - sourceOffset));
1461                 UnicodeString compValue;
1462                 compValue.append(LEFT_CURLY_BRACE);
1463                 itos(argNumber, compValue);
1464                 compValue.append(RIGHT_CURLY_BRACE);
1465                 if (0 != strValue.compare(compValue)) {
1466                     argResult.setString(strValue);
1467                     haveArgResult = TRUE;
1468                 }
1469                 sourceOffset = next;
1470             }
1471         } else if(argType==UMSGPAT_ARG_TYPE_CHOICE) {
1472             tempStatus.setIndex(sourceOffset);
1473             double choiceResult = ChoiceFormat::parseArgument(msgPattern, i, source, tempStatus);
1474             if (tempStatus.getIndex() == sourceOffset) {
1475                 pos.setErrorIndex(sourceOffset);
1476                 return NULL; // leave index as is to signal error
1477             }
1478             argResult.setDouble(choiceResult);
1479             haveArgResult = TRUE;
1480             sourceOffset = tempStatus.getIndex();
1481         } else if(UMSGPAT_ARG_TYPE_HAS_PLURAL_STYLE(argType) || argType==UMSGPAT_ARG_TYPE_SELECT) {
1482             // Parsing not supported.
1483             ec = U_UNSUPPORTED_ERROR;
1484             return NULL;
1485         } else {
1486             // This should never happen.
1487             ec = U_INTERNAL_PROGRAM_ERROR;
1488             return NULL;
1489         }
1490         if (haveArgResult && count <= argNumber) {
1491             count = argNumber + 1;
1492         }
1493         prevIndex=msgPattern.getPart(argLimit).getLimit();
1494         i=argLimit;
1495     }
1496 }
1497 // -------------------------------------
1498 // Parses the source pattern and returns the Formattable objects array,
1499 // the array count and the ending parse position.  The caller of this method
1500 // owns the array.
1501
1502 Formattable*
1503 MessageFormat::parse(const UnicodeString& source,
1504                      ParsePosition& pos,
1505                      int32_t& count) const {
1506     UErrorCode ec = U_ZERO_ERROR;
1507     return parse(0, source, pos, count, ec);
1508 }
1509
1510 // -------------------------------------
1511 // Parses the source string and returns the array of
1512 // Formattable objects and the array count.  The caller
1513 // owns the returned array.
1514
1515 Formattable*
1516 MessageFormat::parse(const UnicodeString& source,
1517                      int32_t& cnt,
1518                      UErrorCode& success) const
1519 {
1520     if (msgPattern.hasNamedArguments()) {
1521         success = U_ARGUMENT_TYPE_MISMATCH;
1522         return NULL;
1523     }
1524     ParsePosition status(0);
1525     // Calls the actual implementation method and starts
1526     // from zero offset of the source text.
1527     Formattable* result = parse(source, status, cnt);
1528     if (status.getIndex() == 0) {
1529         success = U_MESSAGE_PARSE_ERROR;
1530         delete[] result;
1531         return NULL;
1532     }
1533     return result;
1534 }
1535
1536 // -------------------------------------
1537 // Parses the source text and copy into the result buffer.
1538
1539 void
1540 MessageFormat::parseObject( const UnicodeString& source,
1541                             Formattable& result,
1542                             ParsePosition& status) const
1543 {
1544     int32_t cnt = 0;
1545     Formattable* tmpResult = parse(source, status, cnt);
1546     if (tmpResult != NULL)
1547         result.adoptArray(tmpResult, cnt);
1548 }
1549
1550 UnicodeString
1551 MessageFormat::autoQuoteApostrophe(const UnicodeString& pattern, UErrorCode& status) {
1552     UnicodeString result;
1553     if (U_SUCCESS(status)) {
1554         int32_t plen = pattern.length();
1555         const UChar* pat = pattern.getBuffer();
1556         int32_t blen = plen * 2 + 1; // space for null termination, convenience
1557         UChar* buf = result.getBuffer(blen);
1558         if (buf == NULL) {
1559             status = U_MEMORY_ALLOCATION_ERROR;
1560         } else {
1561             int32_t len = umsg_autoQuoteApostrophe(pat, plen, buf, blen, &status);
1562             result.releaseBuffer(U_SUCCESS(status) ? len : 0);
1563         }
1564     }
1565     if (U_FAILURE(status)) {
1566         result.setToBogus();
1567     }
1568     return result;
1569 }
1570
1571 // -------------------------------------
1572
1573 static Format* makeRBNF(URBNFRuleSetTag tag, const Locale& locale, const UnicodeString& defaultRuleSet, UErrorCode& ec) {
1574     RuleBasedNumberFormat* fmt = new RuleBasedNumberFormat(tag, locale, ec);
1575     if (fmt == NULL) {
1576         ec = U_MEMORY_ALLOCATION_ERROR;
1577     } else if (U_SUCCESS(ec) && defaultRuleSet.length() > 0) {
1578         UErrorCode localStatus = U_ZERO_ERROR; // ignore unrecognized default rule set
1579         fmt->setDefaultRuleSet(defaultRuleSet, localStatus);
1580     }
1581     return fmt;
1582 }
1583
1584 void MessageFormat::cacheExplicitFormats(UErrorCode& status) {
1585     if (U_FAILURE(status)) {
1586         return;
1587     }
1588
1589     if (cachedFormatters != NULL) {
1590         uhash_removeAll(cachedFormatters);
1591     }
1592     if (customFormatArgStarts != NULL) {
1593         uhash_removeAll(customFormatArgStarts);
1594     }
1595
1596     // The last two "parts" can at most be ARG_LIMIT and MSG_LIMIT
1597     // which we need not examine.
1598     int32_t limit = msgPattern.countParts() - 2;
1599     argTypeCount = 0;
1600     // We also need not look at the first two "parts"
1601     // (at most MSG_START and ARG_START) in this loop.
1602     // We determine the argTypeCount first so that we can allocateArgTypes
1603     // so that the next loop can set argTypes[argNumber].
1604     // (This is for the C API which needs the argTypes to read its va_arg list.)
1605     for (int32_t i = 2; i < limit && U_SUCCESS(status); ++i) {
1606         const MessagePattern::Part& part = msgPattern.getPart(i);
1607         if (part.getType() == UMSGPAT_PART_TYPE_ARG_NUMBER) {
1608             const int argNumber = part.getValue();
1609             if (argNumber >= argTypeCount) {
1610                 argTypeCount = argNumber + 1;
1611             }
1612         }
1613     }
1614     if (!allocateArgTypes(argTypeCount, status)) {
1615         return;
1616     }
1617     // Set all argTypes to kObject, as a "none" value, for lack of any better value.
1618     // We never use kObject for real arguments.
1619     // We use it as "no argument yet" for the check for hasArgTypeConflicts.
1620     for (int32_t i = 0; i < argTypeCount; ++i) {
1621         argTypes[i] = Formattable::kObject;
1622     }
1623     hasArgTypeConflicts = FALSE;
1624
1625     // This loop starts at part index 1 because we do need to examine
1626     // ARG_START parts. (But we can ignore the MSG_START.)
1627     for (int32_t i = 1; i < limit && U_SUCCESS(status); ++i) {
1628         const MessagePattern::Part* part = &msgPattern.getPart(i);
1629         if (part->getType() != UMSGPAT_PART_TYPE_ARG_START) {
1630             continue;
1631         }
1632         UMessagePatternArgType argType = part->getArgType();
1633
1634         int32_t argNumber = -1;
1635         part = &msgPattern.getPart(i + 1);
1636         if (part->getType() == UMSGPAT_PART_TYPE_ARG_NUMBER) {
1637             argNumber = part->getValue();
1638         }
1639         Formattable::Type formattableType;
1640
1641         switch (argType) {
1642         case UMSGPAT_ARG_TYPE_NONE:
1643             formattableType = Formattable::kString;
1644             break;
1645         case UMSGPAT_ARG_TYPE_SIMPLE: {
1646             int32_t index = i;
1647             i += 2;
1648             UnicodeString explicitType = msgPattern.getSubstring(msgPattern.getPart(i++));
1649             UnicodeString style;
1650             if ((part = &msgPattern.getPart(i))->getType() == UMSGPAT_PART_TYPE_ARG_STYLE) {
1651                 style = msgPattern.getSubstring(*part);
1652                 ++i;
1653             }
1654             UParseError parseError;
1655             Format* formatter = createAppropriateFormat(explicitType, style, formattableType, parseError, status);
1656             setArgStartFormat(index, formatter, status);
1657             break;
1658         }
1659         case UMSGPAT_ARG_TYPE_CHOICE:
1660         case UMSGPAT_ARG_TYPE_PLURAL:
1661         case UMSGPAT_ARG_TYPE_SELECTORDINAL:
1662             formattableType = Formattable::kDouble;
1663             break;
1664         case UMSGPAT_ARG_TYPE_SELECT:
1665             formattableType = Formattable::kString;
1666             break;
1667         default:
1668             status = U_INTERNAL_PROGRAM_ERROR;  // Should be unreachable.
1669             formattableType = Formattable::kString;
1670             break;
1671         }
1672         if (argNumber != -1) {
1673             if (argTypes[argNumber] != Formattable::kObject && argTypes[argNumber] != formattableType) {
1674                 hasArgTypeConflicts = TRUE;
1675             }
1676             argTypes[argNumber] = formattableType;
1677         }
1678     }
1679 }
1680
1681 Format* MessageFormat::createAppropriateFormat(UnicodeString& type, UnicodeString& style,
1682                                                Formattable::Type& formattableType, UParseError& parseError,
1683                                                UErrorCode& ec) {
1684     if (U_FAILURE(ec)) {
1685         return NULL;
1686     }
1687     Format* fmt = NULL;
1688     int32_t typeID, styleID;
1689     DateFormat::EStyle date_style;
1690     int32_t firstNonSpace;
1691
1692     switch (typeID = findKeyword(type, TYPE_IDS)) {
1693     case 0: // number
1694         formattableType = Formattable::kDouble;
1695         switch (findKeyword(style, NUMBER_STYLE_IDS)) {
1696         case 0: // default
1697             fmt = NumberFormat::createInstance(fLocale, ec);
1698             break;
1699         case 1: // currency
1700             fmt = NumberFormat::createCurrencyInstance(fLocale, ec);
1701             break;
1702         case 2: // percent
1703             fmt = NumberFormat::createPercentInstance(fLocale, ec);
1704             break;
1705         case 3: // integer
1706             formattableType = Formattable::kLong;
1707             fmt = createIntegerFormat(fLocale, ec);
1708             break;
1709         default: // pattern or skeleton
1710             firstNonSpace = PatternProps::skipWhiteSpace(style, 0);
1711             if (style.compare(firstNonSpace, 2, u"::", 0, 2) == 0) {
1712                 // Skeleton
1713                 UnicodeString skeleton = style.tempSubString(firstNonSpace + 2);
1714                 fmt = number::NumberFormatter::forSkeleton(skeleton, ec).locale(fLocale).toFormat(ec);
1715             } else {
1716                 // Pattern
1717                 fmt = NumberFormat::createInstance(fLocale, ec);
1718                 if (fmt) {
1719                     auto* decfmt = dynamic_cast<DecimalFormat*>(fmt);
1720                     if (decfmt != nullptr) {
1721                         decfmt->applyPattern(style, parseError, ec);
1722                     }
1723                 }
1724             }
1725             break;
1726         }
1727         break;
1728
1729     case 1: // date
1730     case 2: // time
1731         formattableType = Formattable::kDate;
1732         firstNonSpace = PatternProps::skipWhiteSpace(style, 0);
1733         if (style.compare(firstNonSpace, 2, u"::", 0, 2) == 0) {
1734             // Skeleton
1735             UnicodeString skeleton = style.tempSubString(firstNonSpace + 2);
1736             fmt = DateFormat::createInstanceForSkeleton(skeleton, fLocale, ec);
1737         } else {
1738             // Pattern
1739             styleID = findKeyword(style, DATE_STYLE_IDS);
1740             date_style = (styleID >= 0) ? DATE_STYLES[styleID] : DateFormat::kDefault;
1741
1742             if (typeID == 1) {
1743                 fmt = DateFormat::createDateInstance(date_style, fLocale);
1744             } else {
1745                 fmt = DateFormat::createTimeInstance(date_style, fLocale);
1746             }
1747
1748             if (styleID < 0 && fmt != NULL) {
1749                 SimpleDateFormat* sdtfmt = dynamic_cast<SimpleDateFormat*>(fmt);
1750                 if (sdtfmt != NULL) {
1751                     sdtfmt->applyPattern(style);
1752                 }
1753             }
1754         }
1755         break;
1756
1757     case 3: // spellout
1758         formattableType = Formattable::kDouble;
1759         fmt = makeRBNF(URBNF_SPELLOUT, fLocale, style, ec);
1760         break;
1761     case 4: // ordinal
1762         formattableType = Formattable::kDouble;
1763         fmt = makeRBNF(URBNF_ORDINAL, fLocale, style, ec);
1764         break;
1765     case 5: // duration
1766         formattableType = Formattable::kDouble;
1767         fmt = makeRBNF(URBNF_DURATION, fLocale, style, ec);
1768         break;
1769     default:
1770         formattableType = Formattable::kString;
1771         ec = U_ILLEGAL_ARGUMENT_ERROR;
1772         break;
1773     }
1774
1775     return fmt;
1776 }
1777
1778
1779 //-------------------------------------
1780 // Finds the string, s, in the string array, list.
1781 int32_t MessageFormat::findKeyword(const UnicodeString& s,
1782                                    const UChar * const *list)
1783 {
1784     if (s.isEmpty()) {
1785         return 0; // default
1786     }
1787
1788     int32_t length = s.length();
1789     const UChar *ps = PatternProps::trimWhiteSpace(s.getBuffer(), length);
1790     UnicodeString buffer(FALSE, ps, length);
1791     // Trims the space characters and turns all characters
1792     // in s to lower case.
1793     buffer.toLower("");
1794     for (int32_t i = 0; list[i]; ++i) {
1795         if (!buffer.compare(list[i], u_strlen(list[i]))) {
1796             return i;
1797         }
1798     }
1799     return -1;
1800 }
1801
1802 /**
1803  * Convenience method that ought to be in NumberFormat
1804  */
1805 NumberFormat*
1806 MessageFormat::createIntegerFormat(const Locale& locale, UErrorCode& status) const {
1807     NumberFormat *temp = NumberFormat::createInstance(locale, status);
1808     DecimalFormat *temp2;
1809     if (temp != NULL && (temp2 = dynamic_cast<DecimalFormat*>(temp)) != NULL) {
1810         temp2->setMaximumFractionDigits(0);
1811         temp2->setDecimalSeparatorAlwaysShown(FALSE);
1812         temp2->setParseIntegerOnly(TRUE);
1813     }
1814
1815     return temp;
1816 }
1817
1818 /**
1819  * Return the default number format.  Used to format a numeric
1820  * argument when subformats[i].format is NULL.  Returns NULL
1821  * on failure.
1822  *
1823  * Semantically const but may modify *this.
1824  */
1825 const NumberFormat* MessageFormat::getDefaultNumberFormat(UErrorCode& ec) const {
1826     if (defaultNumberFormat == NULL) {
1827         MessageFormat* t = (MessageFormat*) this;
1828         t->defaultNumberFormat = NumberFormat::createInstance(fLocale, ec);
1829         if (U_FAILURE(ec)) {
1830             delete t->defaultNumberFormat;
1831             t->defaultNumberFormat = NULL;
1832         } else if (t->defaultNumberFormat == NULL) {
1833             ec = U_MEMORY_ALLOCATION_ERROR;
1834         }
1835     }
1836     return defaultNumberFormat;
1837 }
1838
1839 /**
1840  * Return the default date format.  Used to format a date
1841  * argument when subformats[i].format is NULL.  Returns NULL
1842  * on failure.
1843  *
1844  * Semantically const but may modify *this.
1845  */
1846 const DateFormat* MessageFormat::getDefaultDateFormat(UErrorCode& ec) const {
1847     if (defaultDateFormat == NULL) {
1848         MessageFormat* t = (MessageFormat*) this;
1849         t->defaultDateFormat = DateFormat::createDateTimeInstance(DateFormat::kShort, DateFormat::kShort, fLocale);
1850         if (t->defaultDateFormat == NULL) {
1851             ec = U_MEMORY_ALLOCATION_ERROR;
1852         }
1853     }
1854     return defaultDateFormat;
1855 }
1856
1857 UBool
1858 MessageFormat::usesNamedArguments() const {
1859     return msgPattern.hasNamedArguments();
1860 }
1861
1862 int32_t
1863 MessageFormat::getArgTypeCount() const {
1864     return argTypeCount;
1865 }
1866
1867 UBool MessageFormat::equalFormats(const void* left, const void* right) {
1868     return *(const Format*)left==*(const Format*)right;
1869 }
1870
1871
1872 UBool MessageFormat::DummyFormat::operator==(const Format&) const {
1873     return TRUE;
1874 }
1875
1876 MessageFormat::DummyFormat* MessageFormat::DummyFormat::clone() const {
1877     return new DummyFormat();
1878 }
1879
1880 UnicodeString& MessageFormat::DummyFormat::format(const Formattable&,
1881                           UnicodeString& appendTo,
1882                           UErrorCode& status) const {
1883     if (U_SUCCESS(status)) {
1884         status = U_UNSUPPORTED_ERROR;
1885     }
1886     return appendTo;
1887 }
1888
1889 UnicodeString& MessageFormat::DummyFormat::format(const Formattable&,
1890                           UnicodeString& appendTo,
1891                           FieldPosition&,
1892                           UErrorCode& status) const {
1893     if (U_SUCCESS(status)) {
1894         status = U_UNSUPPORTED_ERROR;
1895     }
1896     return appendTo;
1897 }
1898
1899 UnicodeString& MessageFormat::DummyFormat::format(const Formattable&,
1900                           UnicodeString& appendTo,
1901                           FieldPositionIterator*,
1902                           UErrorCode& status) const {
1903     if (U_SUCCESS(status)) {
1904         status = U_UNSUPPORTED_ERROR;
1905     }
1906     return appendTo;
1907 }
1908
1909 void MessageFormat::DummyFormat::parseObject(const UnicodeString&,
1910                                                      Formattable&,
1911                                                      ParsePosition& ) const {
1912 }
1913
1914
1915 FormatNameEnumeration::FormatNameEnumeration(UVector *fNameList, UErrorCode& /*status*/) {
1916     pos=0;
1917     fFormatNames = fNameList;
1918 }
1919
1920 const UnicodeString*
1921 FormatNameEnumeration::snext(UErrorCode& status) {
1922     if (U_SUCCESS(status) && pos < fFormatNames->size()) {
1923         return (const UnicodeString*)fFormatNames->elementAt(pos++);
1924     }
1925     return NULL;
1926 }
1927
1928 void
1929 FormatNameEnumeration::reset(UErrorCode& /*status*/) {
1930     pos=0;
1931 }
1932
1933 int32_t
1934 FormatNameEnumeration::count(UErrorCode& /*status*/) const {
1935     return (fFormatNames==NULL) ? 0 : fFormatNames->size();
1936 }
1937
1938 FormatNameEnumeration::~FormatNameEnumeration() {
1939     delete fFormatNames;
1940 }
1941
1942 MessageFormat::PluralSelectorProvider::PluralSelectorProvider(const MessageFormat &mf, UPluralType t)
1943         : msgFormat(mf), rules(NULL), type(t) {
1944 }
1945
1946 MessageFormat::PluralSelectorProvider::~PluralSelectorProvider() {
1947     delete rules;
1948 }
1949
1950 UnicodeString MessageFormat::PluralSelectorProvider::select(void *ctx, double number,
1951                                                             UErrorCode& ec) const {
1952     if (U_FAILURE(ec)) {
1953         return UnicodeString(FALSE, OTHER_STRING, 5);
1954     }
1955     MessageFormat::PluralSelectorProvider* t = const_cast<MessageFormat::PluralSelectorProvider*>(this);
1956     if(rules == NULL) {
1957         t->rules = PluralRules::forLocale(msgFormat.fLocale, type, ec);
1958         if (U_FAILURE(ec)) {
1959             return UnicodeString(FALSE, OTHER_STRING, 5);
1960         }
1961     }
1962     // Select a sub-message according to how the number is formatted,
1963     // which is specified in the selected sub-message.
1964     // We avoid this circle by looking at how
1965     // the number is formatted in the "other" sub-message
1966     // which must always be present and usually contains the number.
1967     // Message authors should be consistent across sub-messages.
1968     PluralSelectorContext &context = *static_cast<PluralSelectorContext *>(ctx);
1969     int32_t otherIndex = msgFormat.findOtherSubMessage(context.startIndex);
1970     context.numberArgIndex = msgFormat.findFirstPluralNumberArg(otherIndex, context.argName);
1971     if(context.numberArgIndex > 0 && msgFormat.cachedFormatters != NULL) {
1972         context.formatter =
1973             (const Format*)uhash_iget(msgFormat.cachedFormatters, context.numberArgIndex);
1974     }
1975     if(context.formatter == NULL) {
1976         context.formatter = msgFormat.getDefaultNumberFormat(ec);
1977         context.forReplaceNumber = TRUE;
1978     }
1979     if (context.number.getDouble(ec) != number) {
1980         ec = U_INTERNAL_PROGRAM_ERROR;
1981         return UnicodeString(FALSE, OTHER_STRING, 5);
1982     }
1983     context.formatter->format(context.number, context.numberString, ec);
1984     auto* decFmt = dynamic_cast<const DecimalFormat *>(context.formatter);
1985     if(decFmt != NULL) {
1986         number::impl::DecimalQuantity dq;
1987         decFmt->formatToDecimalQuantity(context.number, dq, ec);
1988         if (U_FAILURE(ec)) {
1989             return UnicodeString(FALSE, OTHER_STRING, 5);
1990         }
1991         return rules->select(dq);
1992     } else {
1993         return rules->select(number);
1994     }
1995 }
1996
1997 void MessageFormat::PluralSelectorProvider::reset() {
1998     delete rules;
1999     rules = NULL;
2000 }
2001
2002
2003 U_NAMESPACE_END
2004
2005 #endif /* #if !UCONFIG_NO_FORMATTING */
2006
2007 //eof