icuSources/test/intltest/ustrtest.cpp

   1 /********************************************************************
   2  * COPYRIGHT:
   3  * Copyright (c) 1997-2014, International Business Machines Corporation and
   4  * others. All Rights Reserved.
   5  ********************************************************************/
   6
   7 #include "ustrtest.h"
   8 #include "unicode/appendable.h"
   9 #include "unicode/std_string.h"
  10 #include "unicode/unistr.h"
  11 #include "unicode/uchar.h"
  12 #include "unicode/ustring.h"
  13 #include "unicode/locid.h"
  14 #include "unicode/ucnv.h"
  15 #include "unicode/uenum.h"
  16 #include "unicode/utf16.h"
  17 #include "cmemory.h"
  18 #include "charstr.h"
  19
  20 #if 0
  21 #include "unicode/ustream.h"
  22
  23 #include <iostream>
  24 using namespace std;
  25
  26 #endif
  27
  28 UnicodeStringTest::~UnicodeStringTest() {}
  29
  30 void UnicodeStringTest::runIndexedTest( int32_t index, UBool exec, const char* &name, char *par)
  31 {
  32     if (exec) logln("TestSuite UnicodeStringTest: ");
  33     switch (index) {
  34         case 0:
  35             name = "StringCaseTest";
  36             if (exec) {
  37                 logln("StringCaseTest---"); logln("");
  38                 StringCaseTest test;
  39                 callTest(test, par);
  40             }
  41             break;
  42         case 1: name = "TestBasicManipulation"; if (exec) TestBasicManipulation(); break;
  43         case 2: name = "TestCompare"; if (exec) TestCompare(); break;
  44         case 3: name = "TestExtract"; if (exec) TestExtract(); break;
  45         case 4: name = "TestRemoveReplace"; if (exec) TestRemoveReplace(); break;
  46         case 5: name = "TestSearching"; if (exec) TestSearching(); break;
  47         case 6: name = "TestSpacePadding"; if (exec) TestSpacePadding(); break;
  48         case 7: name = "TestPrefixAndSuffix"; if (exec) TestPrefixAndSuffix(); break;
  49         case 8: name = "TestFindAndReplace"; if (exec) TestFindAndReplace(); break;
  50         case 9: name = "TestBogus"; if (exec) TestBogus(); break;
  51         case 10: name = "TestReverse"; if (exec) TestReverse(); break;
  52         case 11: name = "TestMiscellaneous"; if (exec) TestMiscellaneous(); break;
  53         case 12: name = "TestStackAllocation"; if (exec) TestStackAllocation(); break;
  54         case 13: name = "TestUnescape"; if (exec) TestUnescape(); break;
  55         case 14: name = "TestCountChar32"; if (exec) TestCountChar32(); break;
  56         case 15: name = "TestStringEnumeration"; if (exec) TestStringEnumeration(); break;
  57         case 16: name = "TestNameSpace"; if (exec) TestNameSpace(); break;
  58         case 17: name = "TestUTF32"; if (exec) TestUTF32(); break;
  59         case 18: name = "TestUTF8"; if (exec) TestUTF8(); break;
  60         case 19: name = "TestReadOnlyAlias"; if (exec) TestReadOnlyAlias(); break;
  61         case 20: name = "TestAppendable"; if (exec) TestAppendable(); break;
  62         case 21: name = "TestUnicodeStringImplementsAppendable"; if (exec) TestUnicodeStringImplementsAppendable(); break;
  63         case 22: name = "TestSizeofUnicodeString"; if (exec) TestSizeofUnicodeString(); break;
  64         case 23: name = "TestStartsWithAndEndsWithNulTerminated"; if (exec) TestStartsWithAndEndsWithNulTerminated(); break;
  65
  66         default: name = ""; break; //needed to end loop
  67     }
  68 }
  69
  70 void
  71 UnicodeStringTest::TestBasicManipulation()
  72 {
  73     UnicodeString   test1("Now is the time for all men to come swiftly to the aid of the party.\n");
  74     UnicodeString   expectedValue;
  75     UnicodeString   *c;
  76
  77     c=(UnicodeString *)test1.clone();
  78     test1.insert(24, "good ");
  79     expectedValue = "Now is the time for all good men to come swiftly to the aid of the party.\n";
  80     if (test1 != expectedValue)
  81         errln("insert() failed:  expected \"" + expectedValue + "\"\n,got \"" + test1 + "\"");
  82
  83     c->insert(24, "good ");
  84     if(*c != expectedValue) {
  85         errln("clone()->insert() failed:  expected \"" + expectedValue + "\"\n,got \"" + *c + "\"");
  86     }
  87     delete c;
  88
  89     test1.remove(41, 8);
  90     expectedValue = "Now is the time for all good men to come to the aid of the party.\n";
  91     if (test1 != expectedValue)
  92         errln("remove() failed:  expected \"" + expectedValue + "\"\n,got \"" + test1 + "\"");
  93
  94     test1.replace(58, 6, "ir country");
  95     expectedValue = "Now is the time for all good men to come to the aid of their country.\n";
  96     if (test1 != expectedValue)
  97         errln("replace() failed:  expected \"" + expectedValue + "\"\n,got \"" + test1 + "\"");
  98
  99     UChar     temp[80];
 100     test1.extract(0, 15, temp);
 101
 102     UnicodeString       test2(temp, 15);
 103
 104     expectedValue = "Now is the time";
 105     if (test2 != expectedValue)
 106         errln("extract() failed:  expected \"" + expectedValue + "\"\n,got \"" + test2 + "\"");
 107
 108     test2 += " for me to go!\n";
 109     expectedValue = "Now is the time for me to go!\n";
 110     if (test2 != expectedValue)
 111         errln("operator+=() failed:  expected \"" + expectedValue + "\"\n,got \"" + test2 + "\"");
 112
 113     if (test1.length() != 70)
 114         errln(UnicodeString("length() failed: expected 70, got ") + test1.length());
 115     if (test2.length() != 30)
 116         errln(UnicodeString("length() failed: expected 30, got ") + test2.length());
 117
 118     UnicodeString test3;
 119     test3.append((UChar32)0x20402);
 120     if(test3 != CharsToUnicodeString("\\uD841\\uDC02")){
 121         errln((UnicodeString)"append failed for UChar32, expected \"\\\\ud841\\\\udc02\", got " + prettify(test3));
 122     }
 123     if(test3.length() != 2){
 124         errln(UnicodeString("append or length failed for UChar32, expected 2, got ") + test3.length());
 125     }
 126     test3.append((UChar32)0x0074);
 127     if(test3 != CharsToUnicodeString("\\uD841\\uDC02t")){
 128         errln((UnicodeString)"append failed for UChar32, expected \"\\\\uD841\\\\uDC02t\", got " + prettify(test3));
 129     }
 130     if(test3.length() != 3){
 131         errln((UnicodeString)"append or length failed for UChar32, expected 2, got " + test3.length());
 132     }
 133
 134     // test some UChar32 overloads
 135     if( test3.setTo((UChar32)0x10330).length() != 2 ||
 136         test3.insert(0, (UChar32)0x20100).length() != 4 ||
 137         test3.replace(2, 2, (UChar32)0xe0061).length() != 4 ||
 138         (test3 = (UChar32)0x14001).length() != 2
 139     ) {
 140         errln((UnicodeString)"simple UChar32 overloads for replace, insert, setTo or = failed");
 141     }
 142
 143     {
 144         // test moveIndex32()
 145         UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape();
 146
 147         if(
 148             s.moveIndex32(2, -1)!=0 ||
 149             s.moveIndex32(2, 1)!=4 ||
 150             s.moveIndex32(2, 2)!=5 ||
 151             s.moveIndex32(5, -2)!=2 ||
 152             s.moveIndex32(0, -1)!=0 ||
 153             s.moveIndex32(6, 1)!=6
 154         ) {
 155             errln("UnicodeString::moveIndex32() failed");
 156         }
 157
 158         if(s.getChar32Start(1)!=0 || s.getChar32Start(2)!=2) {
 159             errln("UnicodeString::getChar32Start() failed");
 160         }
 161
 162         if(s.getChar32Limit(1)!=2 || s.getChar32Limit(2)!=2) {
 163             errln("UnicodeString::getChar32Limit() failed");
 164         }
 165     }
 166
 167     {
 168         // test new 2.2 constructors and setTo function that parallel Java's substring function.
 169         UnicodeString src("Hello folks how are you?");
 170         UnicodeString target1("how are you?");
 171         if (target1 != UnicodeString(src, 12)) {
 172             errln("UnicodeString(const UnicodeString&, int32_t) failed");
 173         }
 174         UnicodeString target2("folks");
 175         if (target2 != UnicodeString(src, 6, 5)) {
 176             errln("UnicodeString(const UnicodeString&, int32_t, int32_t) failed");
 177         }
 178         if (target1 != target2.setTo(src, 12)) {
 179             errln("UnicodeString::setTo(const UnicodeString&, int32_t) failed");
 180         }
 181     }
 182
 183     {
 184         // op+ is new in ICU 2.8
 185         UnicodeString s=UnicodeString("abc", "")+UnicodeString("def", "")+UnicodeString("ghi", "");
 186         if(s!=UnicodeString("abcdefghi", "")) {
 187             errln("operator+(UniStr, UniStr) failed");
 188         }
 189     }
 190
 191     {
 192         // tests for Jitterbug 2360
 193         // verify that APIs with source pointer + length accept length == -1
 194         // mostly test only where modified, only few functions did not already do this
 195         if(UnicodeString("abc", -1, "")!=UnicodeString("abc", "")) {
 196             errln("UnicodeString(codepageData, dataLength, codepage) does not work with dataLength==-1");
 197         }
 198
 199         UChar buffer[10]={ 0x61, 0x62, 0x20ac, 0xd900, 0xdc05, 0,   0x62, 0xffff, 0xdbff, 0xdfff };
 200         UnicodeString s, t(buffer, -1, UPRV_LENGTHOF(buffer));
 201
 202         if(s.setTo(buffer, -1, UPRV_LENGTHOF(buffer)).length()!=u_strlen(buffer)) {
 203             errln("UnicodeString.setTo(buffer, length, capacity) does not work with length==-1");
 204         }
 205         if(t.length()!=u_strlen(buffer)) {
 206             errln("UnicodeString(buffer, length, capacity) does not work with length==-1");
 207         }
 208
 209         if(0!=s.caseCompare(buffer, -1, U_FOLD_CASE_DEFAULT)) {
 210             errln("UnicodeString.caseCompare(const UChar *, length, options) does not work with length==-1");
 211         }
 212         if(0!=s.caseCompare(0, s.length(), buffer, U_FOLD_CASE_DEFAULT)) {
 213             errln("UnicodeString.caseCompare(start, _length, const UChar *, options) does not work");
 214         }
 215
 216         buffer[u_strlen(buffer)]=0xe4;
 217         UnicodeString u(buffer, -1, UPRV_LENGTHOF(buffer));
 218         if(s.setTo(buffer, -1, UPRV_LENGTHOF(buffer)).length()!=UPRV_LENGTHOF(buffer)) {
 219             errln("UnicodeString.setTo(buffer without NUL, length, capacity) does not work with length==-1");
 220         }
 221         if(u.length()!=UPRV_LENGTHOF(buffer)) {
 222             errln("UnicodeString(buffer without NUL, length, capacity) does not work with length==-1");
 223         }
 224
 225         static const char cs[]={ 0x61, (char)0xe4, (char)0x85, 0 };
 226         UConverter *cnv;
 227         UErrorCode errorCode=U_ZERO_ERROR;
 228
 229         cnv=ucnv_open("ISO-8859-1", &errorCode);
 230         UnicodeString v(cs, -1, cnv, errorCode);
 231         ucnv_close(cnv);
 232         if(v!=CharsToUnicodeString("a\\xe4\\x85")) {
 233             errln("UnicodeString(const char *, length, cnv, errorCode) does not work with length==-1");
 234         }
 235     }
 236
 237 #if U_CHARSET_IS_UTF8
 238     {
 239         // Test the hardcoded-UTF-8 UnicodeString optimizations.
 240         static const uint8_t utf8[]={ 0x61, 0xC3, 0xA4, 0xC3, 0x9F, 0xE4, 0xB8, 0x80, 0 };
 241         static const UChar utf16[]={ 0x61, 0xE4, 0xDF, 0x4E00 };
 242         UnicodeString from8a = UnicodeString((const char *)utf8);
 243         UnicodeString from8b = UnicodeString((const char *)utf8, (int32_t)sizeof(utf8)-1);
 244         UnicodeString from16(FALSE, utf16, UPRV_LENGTHOF(utf16));
 245         if(from8a != from16 || from8b != from16) {
 246             errln("UnicodeString(const char * U_CHARSET_IS_UTF8) failed");
 247         }
 248         char buffer[16];
 249         int32_t length8=from16.extract(0, 0x7fffffff, buffer, (uint32_t)sizeof(buffer));
 250         if(length8!=((int32_t)sizeof(utf8)-1) || 0!=uprv_memcmp(buffer, utf8, sizeof(utf8))) {
 251             errln("UnicodeString::extract(char * U_CHARSET_IS_UTF8) failed");
 252         }
 253         length8=from16.extract(1, 2, buffer, (uint32_t)sizeof(buffer));
 254         if(length8!=4 || buffer[length8]!=0 || 0!=uprv_memcmp(buffer, utf8+1, length8)) {
 255             errln("UnicodeString::extract(substring to char * U_CHARSET_IS_UTF8) failed");
 256         }
 257     }
 258 #endif
 259 }
 260
 261 void
 262 UnicodeStringTest::TestCompare()
 263 {
 264     UnicodeString   test1("this is a test");
 265     UnicodeString   test2("this is a test");
 266     UnicodeString   test3("this is a test of the emergency broadcast system");
 267     UnicodeString   test4("never say, \"this is a test\"!!");
 268
 269     UnicodeString   test5((UChar)0x5000);
 270     UnicodeString   test6((UChar)0x5100);
 271
 272     UChar         uniChars[] = { 0x74, 0x68, 0x69, 0x73, 0x20, 0x69, 0x73,
 273                  0x20, 0x61, 0x20, 0x74, 0x65, 0x73, 0x74, 0 };
 274     char            chars[] = "this is a test";
 275
 276     // test operator== and operator!=
 277     if (test1 != test2 || test1 == test3 || test1 == test4)
 278         errln("operator== or operator!= failed");
 279
 280     // test operator> and operator<
 281     if (test1 > test2 || test1 < test2 || !(test1 < test3) || !(test1 > test4) ||
 282         !(test5 < test6)
 283     ) {
 284         errln("operator> or operator< failed");
 285     }
 286
 287     // test operator>= and operator<=
 288     if (!(test1 >= test2) || !(test1 <= test2) || !(test1 <= test3) || !(test1 >= test4))
 289         errln("operator>= or operator<= failed");
 290
 291     // test compare(UnicodeString)
 292     if (test1.compare(test2) != 0 || test1.compare(test3) >= 0 || test1.compare(test4) <= 0)
 293         errln("compare(UnicodeString) failed");
 294
 295     //test compare(offset, length, UnicodeString)
 296     if(test1.compare(0, 14, test2) != 0 ||
 297         test3.compare(0, 14, test2) != 0 ||
 298         test4.compare(12, 14, test2) != 0 ||
 299         test3.compare(0, 18, test1) <=0  )
 300         errln("compare(offset, length, UnicodeString) failes");
 301
 302     // test compare(UChar*)
 303     if (test2.compare(uniChars) != 0 || test3.compare(uniChars) <= 0 || test4.compare(uniChars) >= 0)
 304         errln("compare(UChar*) failed");
 305
 306     // test compare(char*)
 307     if (test2.compare(chars) != 0 || test3.compare(chars) <= 0 || test4.compare(chars) >= 0)
 308         errln("compare(char*) failed");
 309
 310     // test compare(UChar*, length)
 311     if (test1.compare(uniChars, 4) <= 0 || test1.compare(uniChars, 4) <= 0)
 312         errln("compare(UChar*, length) failed");
 313
 314     // test compare(thisOffset, thisLength, that, thatOffset, thatLength)
 315     if (test1.compare(0, 14, test2, 0, 14) != 0
 316     || test1.compare(0, 14, test3, 0, 14) != 0
 317     || test1.compare(0, 14, test4, 12, 14) != 0)
 318         errln("1. compare(thisOffset, thisLength, that, thatOffset, thatLength) failed");
 319
 320     if (test1.compare(10, 4, test2, 0, 4) >= 0
 321     || test1.compare(10, 4, test3, 22, 9) <= 0
 322     || test1.compare(10, 4, test4, 22, 4) != 0)
 323         errln("2. compare(thisOffset, thisLength, that, thatOffset, thatLength) failed");
 324
 325     // test compareBetween
 326     if (test1.compareBetween(0, 14, test2, 0, 14) != 0 || test1.compareBetween(0, 14, test3, 0, 14) != 0
 327                     || test1.compareBetween(0, 14, test4, 12, 26) != 0)
 328         errln("compareBetween failed");
 329
 330     if (test1.compareBetween(10, 14, test2, 0, 4) >= 0 || test1.compareBetween(10, 14, test3, 22, 31) <= 0
 331                     || test1.compareBetween(10, 14, test4, 22, 26) != 0)
 332         errln("compareBetween failed");
 333
 334     // test compare() etc. with strings that share a buffer but are not equal
 335     test2=test1; // share the buffer, length() too large for the stackBuffer
 336     test2.truncate(1); // change only the length, not the buffer
 337     if( test1==test2 || test1<=test2 ||
 338         test1.compare(test2)<=0 ||
 339         test1.compareCodePointOrder(test2)<=0 ||
 340         test1.compareCodePointOrder(0, INT32_MAX, test2)<=0 ||
 341         test1.compareCodePointOrder(0, INT32_MAX, test2, 0, INT32_MAX)<=0 ||
 342         test1.compareCodePointOrderBetween(0, INT32_MAX, test2, 0, INT32_MAX)<=0 ||
 343         test1.caseCompare(test2, U_FOLD_CASE_DEFAULT)<=0
 344     ) {
 345         errln("UnicodeStrings that share a buffer but have different lengths compare as equal");
 346     }
 347
 348     /* test compareCodePointOrder() */
 349     {
 350         /* these strings are in ascending order */
 351         static const UChar strings[][4]={
 352             { 0x61, 0 },                    /* U+0061 */
 353             { 0x20ac, 0xd801, 0 },          /* U+20ac U+d801 */
 354             { 0x20ac, 0xd800, 0xdc00, 0 },  /* U+20ac U+10000 */
 355             { 0xd800, 0 },                  /* U+d800 */
 356             { 0xd800, 0xff61, 0 },          /* U+d800 U+ff61 */
 357             { 0xdfff, 0 },                  /* U+dfff */
 358             { 0xff61, 0xdfff, 0 },          /* U+ff61 U+dfff */
 359             { 0xff61, 0xd800, 0xdc02, 0 },  /* U+ff61 U+10002 */
 360             { 0xd800, 0xdc02, 0 },          /* U+10002 */
 361             { 0xd84d, 0xdc56, 0 }           /* U+23456 */
 362         };
 363         UnicodeString u[20]; // must be at least as long as strings[]
 364         int32_t i;
 365
 366         for(i=0; i<(int32_t)(sizeof(strings)/sizeof(strings[0])); ++i) {
 367             u[i]=UnicodeString(TRUE, strings[i], -1);
 368         }
 369
 370         for(i=0; i<(int32_t)(sizeof(strings)/sizeof(strings[0])-1); ++i) {
 371             if(u[i].compareCodePointOrder(u[i+1])>=0 || u[i].compareCodePointOrder(0, INT32_MAX, u[i+1].getBuffer())>=0) {
 372                 errln("error: UnicodeString::compareCodePointOrder() fails for string %d and the following one\n", i);
 373             }
 374         }
 375     }
 376
 377     /* test caseCompare() */
 378     {
 379         static const UChar
 380         _mixed[]=               { 0x61, 0x42, 0x131, 0x3a3, 0xdf,       0x130,       0x49,  0xfb03,           0xd93f, 0xdfff, 0 },
 381         _otherDefault[]=        { 0x41, 0x62, 0x131, 0x3c3, 0x73, 0x53, 0x69, 0x307, 0x69,  0x46, 0x66, 0x49, 0xd93f, 0xdfff, 0 },
 382         _otherExcludeSpecialI[]={ 0x41, 0x62, 0x131, 0x3c3, 0x53, 0x73, 0x69,        0x131, 0x66, 0x46, 0x69, 0xd93f, 0xdfff, 0 },
 383         _different[]=           { 0x41, 0x62, 0x131, 0x3c3, 0x73, 0x53, 0x130,       0x49,  0x46, 0x66, 0x49, 0xd93f, 0xdffd, 0 };
 384
 385         UnicodeString
 386             mixed(TRUE, _mixed, -1),
 387             otherDefault(TRUE, _otherDefault, -1),
 388             otherExcludeSpecialI(TRUE, _otherExcludeSpecialI, -1),
 389             different(TRUE, _different, -1);
 390
 391         int8_t result;
 392
 393         /* test caseCompare() */
 394         result=mixed.caseCompare(otherDefault, U_FOLD_CASE_DEFAULT);
 395         if(result!=0 || 0!=mixed.caseCompareBetween(0, INT32_MAX, otherDefault, 0, INT32_MAX, U_FOLD_CASE_DEFAULT)) {
 396             errln("error: mixed.caseCompare(other, default)=%ld instead of 0\n", result);
 397         }
 398         result=mixed.caseCompare(otherExcludeSpecialI, U_FOLD_CASE_EXCLUDE_SPECIAL_I);
 399         if(result!=0) {
 400             errln("error: mixed.caseCompare(otherExcludeSpecialI, U_FOLD_CASE_EXCLUDE_SPECIAL_I)=%ld instead of 0\n", result);
 401         }
 402         result=mixed.caseCompare(otherDefault, U_FOLD_CASE_EXCLUDE_SPECIAL_I);
 403         if(result==0 || 0==mixed.caseCompareBetween(0, INT32_MAX, otherDefault, 0, INT32_MAX, U_FOLD_CASE_EXCLUDE_SPECIAL_I)) {
 404             errln("error: mixed.caseCompare(other, U_FOLD_CASE_EXCLUDE_SPECIAL_I)=0 instead of !=0\n");
 405         }
 406
 407         /* test caseCompare() */
 408         result=mixed.caseCompare(different, U_FOLD_CASE_DEFAULT);
 409         if(result<=0) {
 410             errln("error: mixed.caseCompare(different, default)=%ld instead of positive\n", result);
 411         }
 412
 413         /* test caseCompare() - include the folded sharp s (U+00df) with different lengths */
 414         result=mixed.caseCompare(1, 4, different, 1, 5, U_FOLD_CASE_DEFAULT);
 415         if(result!=0 || 0!=mixed.caseCompareBetween(1, 5, different, 1, 6, U_FOLD_CASE_DEFAULT)) {
 416             errln("error: mixed.caseCompare(mixed, 1, 4, different, 1, 5, default)=%ld instead of 0\n", result);
 417         }
 418
 419         /* test caseCompare() - stop in the middle of the sharp s (U+00df) */
 420         result=mixed.caseCompare(1, 4, different, 1, 4, U_FOLD_CASE_DEFAULT);
 421         if(result<=0) {
 422             errln("error: mixed.caseCompare(1, 4, different, 1, 4, default)=%ld instead of positive\n", result);
 423         }
 424     }
 425
 426     // test that srcLength=-1 is handled in functions that
 427     // take input const UChar */int32_t srcLength (j785)
 428     {
 429         static const UChar u[]={ 0x61, 0x308, 0x62, 0 };
 430         UnicodeString s=UNICODE_STRING("a\\u0308b", 8).unescape();
 431
 432         if(s.compare(u, -1)!=0 || s.compare(0, 999, u, 0, -1)!=0) {
 433             errln("error UnicodeString::compare(..., const UChar *, srcLength=-1) does not work");
 434         }
 435
 436         if(s.compareCodePointOrder(u, -1)!=0 || s.compareCodePointOrder(0, 999, u, 0, -1)!=0) {
 437             errln("error UnicodeString::compareCodePointOrder(..., const UChar *, srcLength=-1, ...) does not work");
 438         }
 439
 440         if(s.caseCompare(u, -1, U_FOLD_CASE_DEFAULT)!=0 || s.caseCompare(0, 999, u, 0, -1, U_FOLD_CASE_DEFAULT)!=0) {
 441             errln("error UnicodeString::caseCompare(..., const UChar *, srcLength=-1, ...) does not work");
 442         }
 443
 444         if(s.indexOf(u, 1, -1, 0, 999)!=1 || s.indexOf(u+1, -1, 0, 999)!=1 || s.indexOf(u+1, -1, 0)!=1) {
 445             errln("error UnicodeString::indexOf(const UChar *, srcLength=-1, ...) does not work");
 446         }
 447
 448         if(s.lastIndexOf(u, 1, -1, 0, 999)!=1 || s.lastIndexOf(u+1, -1, 0, 999)!=1 || s.lastIndexOf(u+1, -1, 0)!=1) {
 449             errln("error UnicodeString::lastIndexOf(const UChar *, srcLength=-1, ...) does not work");
 450         }
 451
 452         UnicodeString s2, s3;
 453         s2.replace(0, 0, u+1, -1);
 454         s3.replace(0, 0, u, 1, -1);
 455         if(s.compare(1, 999, s2)!=0 || s2!=s3) {
 456             errln("error UnicodeString::replace(..., const UChar *, srcLength=-1, ...) does not work");
 457         }
 458     }
 459 }
 460
 461 void
 462 UnicodeStringTest::TestExtract()
 463 {
 464     UnicodeString  test1("Now is the time for all good men to come to the aid of their country.", "");
 465     UnicodeString  test2;
 466     UChar          test3[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13};
 467     char           test4[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13};
 468     UnicodeString  test5;
 469     char           test6[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13};
 470
 471     test1.extract(11, 12, test2);
 472     test1.extract(11, 12, test3);
 473     if (test1.extract(11, 12, test4) != 12 || test4[12] != 0) {
 474         errln("UnicodeString.extract(char *) failed to return the correct size of destination buffer.");
 475     }
 476
 477     // test proper pinning in extractBetween()
 478     test1.extractBetween(-3, 7, test5);
 479     if(test5!=UNICODE_STRING("Now is ", 7)) {
 480         errln("UnicodeString.extractBetween(-3, 7) did not pin properly.");
 481     }
 482
 483     test1.extractBetween(11, 23, test5);
 484     if (test1.extract(60, 71, test6) != 9) {
 485         errln("UnicodeString.extract() failed to return the correct size of destination buffer for end of buffer.");
 486     }
 487     if (test1.extract(11, 12, test6) != 12) {
 488         errln("UnicodeString.extract() failed to return the correct size of destination buffer.");
 489     }
 490
 491     // convert test4 back to Unicode for comparison
 492     UnicodeString test4b(test4, 12);
 493
 494     if (test1.extract(11, 12, (char *)NULL) != 12) {
 495         errln("UnicodeString.extract(NULL) failed to return the correct size of destination buffer.");
 496     }
 497     if (test1.extract(11, -1, test6) != 0) {
 498         errln("UnicodeString.extract(-1) failed to stop reading the string.");
 499     }
 500
 501     for (int32_t i = 0; i < 12; i++) {
 502         if (test1.charAt((int32_t)(11 + i)) != test2.charAt(i)) {
 503             errln(UnicodeString("extracting into a UnicodeString failed at position ") + i);
 504             break;
 505         }
 506         if (test1.charAt((int32_t)(11 + i)) != test3[i]) {
 507             errln(UnicodeString("extracting into an array of UChar failed at position ") + i);
 508             break;
 509         }
 510         if (((char)test1.charAt((int32_t)(11 + i))) != test4b.charAt(i)) {
 511             errln(UnicodeString("extracting into an array of char failed at position ") + i);
 512             break;
 513         }
 514         if (test1.charAt((int32_t)(11 + i)) != test5.charAt(i)) {
 515             errln(UnicodeString("extracting with extractBetween failed at position ") + i);
 516             break;
 517         }
 518     }
 519
 520     // test preflighting and overflows with invariant conversion
 521     if (test1.extract(0, 10, (char *)NULL, "") != 10) {
 522         errln("UnicodeString.extract(0, 10, (char *)NULL, \"\") != 10");
 523     }
 524
 525     test4[2] = (char)0xff;
 526     if (test1.extract(0, 10, test4, 2, "") != 10) {
 527         errln("UnicodeString.extract(0, 10, test4, 2, \"\") != 10");
 528     }
 529     if (test4[2] != (char)0xff) {
 530         errln("UnicodeString.extract(0, 10, test4, 2, \"\") overwrote test4[2]");
 531     }
 532
 533     {
 534         // test new, NUL-terminating extract() function
 535         UnicodeString s("terminate", "");
 536         UChar dest[20]={
 537             0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5,
 538             0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5
 539         };
 540         UErrorCode errorCode;
 541         int32_t length;
 542
 543         errorCode=U_ZERO_ERROR;
 544         length=s.extract((UChar *)NULL, 0, errorCode);
 545         if(errorCode!=U_BUFFER_OVERFLOW_ERROR || length!=s.length()) {
 546             errln("UnicodeString.extract(NULL, 0)==%d (%s) expected %d (U_BUFFER_OVERFLOW_ERROR)", length, s.length(), u_errorName(errorCode));
 547         }
 548
 549         errorCode=U_ZERO_ERROR;
 550         length=s.extract(dest, s.length()-1, errorCode);
 551         if(errorCode!=U_BUFFER_OVERFLOW_ERROR || length!=s.length()) {
 552             errln("UnicodeString.extract(dest too short)==%d (%s) expected %d (U_BUFFER_OVERFLOW_ERROR)",
 553                 length, u_errorName(errorCode), s.length());
 554         }
 555
 556         errorCode=U_ZERO_ERROR;
 557         length=s.extract(dest, s.length(), errorCode);
 558         if(errorCode!=U_STRING_NOT_TERMINATED_WARNING || length!=s.length()) {
 559             errln("UnicodeString.extract(dest just right without NUL)==%d (%s) expected %d (U_STRING_NOT_TERMINATED_WARNING)",
 560                 length, u_errorName(errorCode), s.length());
 561         }
 562         if(dest[length-1]!=s[length-1] || dest[length]!=0xa5) {
 563             errln("UnicodeString.extract(dest just right without NUL) did not extract the string correctly");
 564         }
 565
 566         errorCode=U_ZERO_ERROR;
 567         length=s.extract(dest, s.length()+1, errorCode);
 568         if(errorCode!=U_ZERO_ERROR || length!=s.length()) {
 569             errln("UnicodeString.extract(dest large enough)==%d (%s) expected %d (U_ZERO_ERROR)",
 570                 length, u_errorName(errorCode), s.length());
 571         }
 572         if(dest[length-1]!=s[length-1] || dest[length]!=0 || dest[length+1]!=0xa5) {
 573             errln("UnicodeString.extract(dest large enough) did not extract the string correctly");
 574         }
 575     }
 576
 577     {
 578         // test new UConverter extract() and constructor
 579         UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape();
 580         char buffer[32];
 581         static const char expect[]={
 582             (char)0xf0, (char)0xaf, (char)0xa6, (char)0x99,
 583             (char)0xf0, (char)0x9d, (char)0x85, (char)0x9f,
 584             (char)0xc3, (char)0x84,
 585             (char)0xe1, (char)0xbb, (char)0x90
 586         };
 587         UErrorCode errorCode=U_ZERO_ERROR;
 588         UConverter *cnv=ucnv_open("UTF-8", &errorCode);
 589         int32_t length;
 590
 591         if(U_SUCCESS(errorCode)) {
 592             // test preflighting
 593             if( (length=s.extract(NULL, 0, cnv, errorCode))!=13 ||
 594                 errorCode!=U_BUFFER_OVERFLOW_ERROR
 595             ) {
 596                 errln("UnicodeString::extract(NULL, UConverter) preflighting failed (length=%ld, %s)",
 597                       length, u_errorName(errorCode));
 598             }
 599             errorCode=U_ZERO_ERROR;
 600             if( (length=s.extract(buffer, 2, cnv, errorCode))!=13 ||
 601                 errorCode!=U_BUFFER_OVERFLOW_ERROR
 602             ) {
 603                 errln("UnicodeString::extract(too small, UConverter) preflighting failed (length=%ld, %s)",
 604                       length, u_errorName(errorCode));
 605             }
 606
 607             // try error cases
 608             errorCode=U_ZERO_ERROR;
 609             if( s.extract(NULL, 2, cnv, errorCode)==13 || U_SUCCESS(errorCode)) {
 610                 errln("UnicodeString::extract(UConverter) succeeded with an illegal destination");
 611             }
 612             errorCode=U_ILLEGAL_ARGUMENT_ERROR;
 613             if( s.extract(NULL, 0, cnv, errorCode)==13 || U_SUCCESS(errorCode)) {
 614                 errln("UnicodeString::extract(UConverter) succeeded with a previous error code");
 615             }
 616             errorCode=U_ZERO_ERROR;
 617
 618             // extract for real
 619             if( (length=s.extract(buffer, sizeof(buffer), cnv, errorCode))!=13 ||
 620                 uprv_memcmp(buffer, expect, 13)!=0 ||
 621                 buffer[13]!=0 ||
 622                 U_FAILURE(errorCode)
 623             ) {
 624                 errln("UnicodeString::extract(UConverter) conversion failed (length=%ld, %s)",
 625                       length, u_errorName(errorCode));
 626             }
 627             // Test again with just the converter name.
 628             if( (length=s.extract(0, s.length(), buffer, sizeof(buffer), "UTF-8"))!=13 ||
 629                 uprv_memcmp(buffer, expect, 13)!=0 ||
 630                 buffer[13]!=0 ||
 631                 U_FAILURE(errorCode)
 632             ) {
 633                 errln("UnicodeString::extract(\"UTF-8\") conversion failed (length=%ld, %s)",
 634                       length, u_errorName(errorCode));
 635             }
 636
 637             // try the constructor
 638             UnicodeString t(expect, sizeof(expect), cnv, errorCode);
 639             if(U_FAILURE(errorCode) || s!=t) {
 640                 errln("UnicodeString(UConverter) conversion failed (%s)",
 641                       u_errorName(errorCode));
 642             }
 643
 644             ucnv_close(cnv);
 645         }
 646     }
 647 }
 648
 649 void
 650 UnicodeStringTest::TestRemoveReplace()
 651 {
 652     UnicodeString   test1("The rain in Spain stays mainly on the plain");
 653     UnicodeString   test2("eat SPAMburgers!");
 654     UChar         test3[] = { 0x53, 0x50, 0x41, 0x4d, 0x4d, 0 };
 655     char            test4[] = "SPAM";
 656     UnicodeString&  test5 = test1;
 657
 658     test1.replace(4, 4, test2, 4, 4);
 659     test1.replace(12, 5, test3, 4);
 660     test3[4] = 0;
 661     test1.replace(17, 4, test3);
 662     test1.replace(23, 4, test4);
 663     test1.replaceBetween(37, 42, test2, 4, 8);
 664
 665     if (test1 != "The SPAM in SPAM SPAMs SPAMly on the SPAM")
 666         errln("One of the replace methods failed:\n"
 667               "  expected \"The SPAM in SPAM SPAMs SPAMly on the SPAM\",\n"
 668               "  got \"" + test1 + "\"");
 669
 670     test1.remove(21, 1);
 671     test1.removeBetween(26, 28);
 672
 673     if (test1 != "The SPAM in SPAM SPAM SPAM on the SPAM")
 674         errln("One of the remove methods failed:\n"
 675               "  expected \"The SPAM in SPAM SPAM SPAM on the SPAM\",\n"
 676               "  got \"" + test1 + "\"");
 677
 678     for (int32_t i = 0; i < test1.length(); i++) {
 679         if (test5[i] != 0x53 && test5[i] != 0x50 && test5[i] != 0x41 && test5[i] != 0x4d && test5[i] != 0x20) {
 680             test1.setCharAt(i, 0x78);
 681         }
 682     }
 683
 684     if (test1 != "xxx SPAM xx SPAM SPAM SPAM xx xxx SPAM")
 685         errln("One of the remove methods failed:\n"
 686               "  expected \"xxx SPAM xx SPAM SPAM SPAM xx xxx SPAM\",\n"
 687               "  got \"" + test1 + "\"");
 688
 689     test1.remove();
 690     if (test1.length() != 0)
 691         errln("Remove() failed: expected empty string, got \"" + test1 + "\"");
 692 }
 693
 694 void
 695 UnicodeStringTest::TestSearching()
 696 {
 697     UnicodeString test1("test test ttest tetest testesteststt");
 698     UnicodeString test2("test");
 699     UChar testChar = 0x74;
 700
 701     UChar32 testChar32 = 0x20402;
 702     UChar testData[]={
 703         //   0       1       2       3       4       5       6       7
 704         0xd841, 0xdc02, 0x0071, 0xdc02, 0xd841, 0x0071, 0xd841, 0xdc02,
 705
 706         //   8       9      10      11      12      13      14      15
 707         0x0071, 0x0072, 0xd841, 0xdc02, 0x0071, 0xd841, 0xdc02, 0x0071,
 708
 709         //  16      17      18      19
 710         0xdc02, 0xd841, 0x0073, 0x0000
 711     };
 712     UnicodeString test3(testData);
 713     UnicodeString test4(testChar32);
 714
 715     uint16_t occurrences = 0;
 716     int32_t startPos = 0;
 717     for ( ;
 718           startPos != -1 && startPos < test1.length();
 719           (startPos = test1.indexOf(test2, startPos)) != -1 ? (++occurrences, startPos += 4) : 0)
 720         ;
 721     if (occurrences != 6)
 722         errln(UnicodeString("indexOf failed: expected to find 6 occurrences, found ") + occurrences);
 723
 724     for ( occurrences = 0, startPos = 10;
 725           startPos != -1 && startPos < test1.length();
 726           (startPos = test1.indexOf(test2, startPos)) != -1 ? (++occurrences, startPos += 4) : 0)
 727         ;
 728     if (occurrences != 4)
 729         errln(UnicodeString("indexOf with starting offset failed: "
 730                             "expected to find 4 occurrences, found ") + occurrences);
 731
 732     int32_t endPos = 28;
 733     for ( occurrences = 0, startPos = 5;
 734           startPos != -1 && startPos < test1.length();
 735           (startPos = test1.indexOf(test2, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 4) : 0)
 736         ;
 737     if (occurrences != 4)
 738         errln(UnicodeString("indexOf with starting and ending offsets failed: "
 739                             "expected to find 4 occurrences, found ") + occurrences);
 740
 741     //using UChar32 string
 742     for ( startPos=0, occurrences=0;
 743           startPos != -1 && startPos < test3.length();
 744           (startPos = test3.indexOf(test4, startPos)) != -1 ? (++occurrences, startPos += 2) : 0)
 745         ;
 746     if (occurrences != 4)
 747         errln((UnicodeString)"indexOf failed: expected to find 4 occurrences, found " + occurrences);
 748
 749     for ( startPos=10, occurrences=0;
 750           startPos != -1 && startPos < test3.length();
 751           (startPos = test3.indexOf(test4, startPos)) != -1 ? (++occurrences, startPos += 2) : 0)
 752         ;
 753     if (occurrences != 2)
 754         errln(UnicodeString("indexOf failed: expected to find 2 occurrences, found ") + occurrences);
 755     //---
 756
 757     for ( occurrences = 0, startPos = 0;
 758           startPos != -1 && startPos < test1.length();
 759           (startPos = test1.indexOf(testChar, startPos)) != -1 ? (++occurrences, startPos += 1) : 0)
 760         ;
 761     if (occurrences != 16)
 762         errln(UnicodeString("indexOf with character failed: "
 763                             "expected to find 16 occurrences, found ") + occurrences);
 764
 765     for ( occurrences = 0, startPos = 10;
 766           startPos != -1 && startPos < test1.length();
 767           (startPos = test1.indexOf(testChar, startPos)) != -1 ? (++occurrences, startPos += 1) : 0)
 768         ;
 769     if (occurrences != 12)
 770         errln(UnicodeString("indexOf with character & start offset failed: "
 771                             "expected to find 12 occurrences, found ") + occurrences);
 772
 773     for ( occurrences = 0, startPos = 5, endPos = 28;
 774           startPos != -1 && startPos < test1.length();
 775           (startPos = test1.indexOf(testChar, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 1) : 0)
 776         ;
 777     if (occurrences != 10)
 778         errln(UnicodeString("indexOf with character & start & end offsets failed: "
 779                             "expected to find 10 occurrences, found ") + occurrences);
 780
 781     //testing for UChar32
 782     UnicodeString subString;
 783     for( occurrences =0, startPos=0; startPos < test3.length(); startPos +=1){
 784         subString.append(test3, startPos, test3.length());
 785         if(subString.indexOf(testChar32) != -1 ){
 786              ++occurrences;
 787         }
 788         subString.remove();
 789     }
 790     if (occurrences != 14)
 791         errln((UnicodeString)"indexOf failed: expected to find 14 occurrences, found " + occurrences);
 792
 793     for ( occurrences = 0, startPos = 0;
 794           startPos != -1 && startPos < test3.length();
 795           (startPos = test3.indexOf(testChar32, startPos)) != -1 ? (++occurrences, startPos += 1) : 0)
 796         ;
 797     if (occurrences != 4)
 798         errln((UnicodeString)"indexOf failed: expected to find 4 occurrences, found " + occurrences);
 799
 800     endPos=test3.length();
 801     for ( occurrences = 0, startPos = 5;
 802           startPos != -1 && startPos < test3.length();
 803           (startPos = test3.indexOf(testChar32, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 1) : 0)
 804         ;
 805     if (occurrences != 3)
 806         errln((UnicodeString)"indexOf with character & start & end offsets failed: expected to find 2 occurrences, found " + occurrences);
 807     //---
 808
 809     if(test1.lastIndexOf(test2)!=29) {
 810         errln("test1.lastIndexOf(test2)!=29");
 811     }
 812
 813     if(test1.lastIndexOf(test2, 15)!=29 || test1.lastIndexOf(test2, 29)!=29 || test1.lastIndexOf(test2, 30)!=-1) {
 814         errln("test1.lastIndexOf(test2, start) failed");
 815     }
 816
 817     for ( occurrences = 0, startPos = 32;
 818           startPos != -1;
 819           (startPos = test1.lastIndexOf(test2, 5, startPos - 5)) != -1 ? ++occurrences : 0)
 820         ;
 821     if (occurrences != 4)
 822         errln(UnicodeString("lastIndexOf with starting and ending offsets failed: "
 823                             "expected to find 4 occurrences, found ") + occurrences);
 824
 825     for ( occurrences = 0, startPos = 32;
 826           startPos != -1;
 827           (startPos = test1.lastIndexOf(testChar, 5, startPos - 5)) != -1 ? ++occurrences : 0)
 828         ;
 829     if (occurrences != 11)
 830         errln(UnicodeString("lastIndexOf with character & start & end offsets failed: "
 831                             "expected to find 11 occurrences, found ") + occurrences);
 832
 833     //testing UChar32
 834     startPos=test3.length();
 835     for ( occurrences = 0;
 836           startPos != -1;
 837           (startPos = test3.lastIndexOf(testChar32, 5, startPos - 5)) != -1 ? ++occurrences : 0)
 838         ;
 839     if (occurrences != 3)
 840         errln((UnicodeString)"lastIndexOf with character & start & end offsets failed: expected to find 3 occurrences, found " + occurrences);
 841
 842
 843     for ( occurrences = 0, endPos = test3.length();  endPos > 0; endPos -= 1){
 844         subString.remove();
 845         subString.append(test3, 0, endPos);
 846         if(subString.lastIndexOf(testChar32) != -1 ){
 847             ++occurrences;
 848         }
 849     }
 850     if (occurrences != 18)
 851         errln((UnicodeString)"indexOf failed: expected to find 18 occurrences, found " + occurrences);
 852     //---
 853
 854     // test that indexOf(UChar32) and lastIndexOf(UChar32)
 855     // do not find surrogate code points when they are part of matched pairs
 856     // (= part of supplementary code points)
 857     // Jitterbug 1542
 858     if(test3.indexOf((UChar32)0xd841) != 4 || test3.indexOf((UChar32)0xdc02) != 3) {
 859         errln("error: UnicodeString::indexOf(UChar32 surrogate) finds a partial supplementary code point");
 860     }
 861     if( UnicodeString(test3, 0, 17).lastIndexOf((UChar)0xd841, 0) != 4 ||
 862         UnicodeString(test3, 0, 17).lastIndexOf((UChar32)0xd841, 2) != 4 ||
 863         test3.lastIndexOf((UChar32)0xd841, 0, 17) != 4 || test3.lastIndexOf((UChar32)0xdc02, 0, 17) != 16
 864     ) {
 865         errln("error: UnicodeString::lastIndexOf(UChar32 surrogate) finds a partial supplementary code point");
 866     }
 867 }
 868
 869 void
 870 UnicodeStringTest::TestSpacePadding()
 871 {
 872     UnicodeString test1("hello");
 873     UnicodeString test2("   there");
 874     UnicodeString test3("Hi!  How ya doin'?  Beautiful day, isn't it?");
 875     UnicodeString test4;
 876     UBool returnVal;
 877     UnicodeString expectedValue;
 878
 879     returnVal = test1.padLeading(15);
 880     expectedValue = "          hello";
 881     if (returnVal == FALSE || test1 != expectedValue)
 882         errln("padLeading() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\".");
 883
 884     returnVal = test2.padTrailing(15);
 885     expectedValue = "   there       ";
 886     if (returnVal == FALSE || test2 != expectedValue)
 887         errln("padTrailing() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\".");
 888
 889     expectedValue = test3;
 890     returnVal = test3.padTrailing(15);
 891     if (returnVal == TRUE || test3 != expectedValue)
 892         errln("padTrailing() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\".");
 893
 894     expectedValue = "hello";
 895     test4.setTo(test1).trim();
 896
 897     if (test4 != expectedValue || test1 == expectedValue || test4 != expectedValue)
 898         errln("trim(UnicodeString&) failed");
 899
 900     test1.trim();
 901     if (test1 != expectedValue)
 902         errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\".");
 903
 904     test2.trim();
 905     expectedValue = "there";
 906     if (test2 != expectedValue)
 907         errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\".");
 908
 909     test3.trim();
 910     expectedValue = "Hi!  How ya doin'?  Beautiful day, isn't it?";
 911     if (test3 != expectedValue)
 912         errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\".");
 913
 914     returnVal = test1.truncate(15);
 915     expectedValue = "hello";
 916     if (returnVal == TRUE || test1 != expectedValue)
 917         errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\".");
 918
 919     returnVal = test2.truncate(15);
 920     expectedValue = "there";
 921     if (returnVal == TRUE || test2 != expectedValue)
 922         errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\".");
 923
 924     returnVal = test3.truncate(15);
 925     expectedValue = "Hi!  How ya doi";
 926     if (returnVal == FALSE || test3 != expectedValue)
 927         errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\".");
 928 }
 929
 930 void
 931 UnicodeStringTest::TestPrefixAndSuffix()
 932 {
 933     UnicodeString test1("Now is the time for all good men to come to the aid of their country.");
 934     UnicodeString test2("Now");
 935     UnicodeString test3("country.");
 936     UnicodeString test4("count");
 937
 938     if (!test1.startsWith(test2) || !test1.startsWith(test2, 0, test2.length())) {
 939         errln("startsWith() failed: \"" + test2 + "\" should be a prefix of \"" + test1 + "\".");
 940     }
 941
 942     if (test1.startsWith(test3) ||
 943         test1.startsWith(test3.getBuffer(), test3.length()) ||
 944         test1.startsWith(test3.getTerminatedBuffer(), 0, -1)
 945     ) {
 946         errln("startsWith() failed: \"" + test3 + "\" shouldn't be a prefix of \"" + test1 + "\".");
 947     }
 948
 949     if (test1.endsWith(test2)) {
 950         errln("endsWith() failed: \"" + test2 + "\" shouldn't be a suffix of \"" + test1 + "\".");
 951     }
 952
 953     if (!test1.endsWith(test3)) {
 954         errln("endsWith(test3) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\".");
 955     }
 956     if (!test1.endsWith(test3, 0, INT32_MAX)) {
 957         errln("endsWith(test3, 0, INT32_MAX) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\".");
 958     }
 959
 960     if(!test1.endsWith(test3.getBuffer(), test3.length())) {
 961         errln("endsWith(test3.getBuffer(), test3.length()) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\".");
 962     }
 963     if(!test1.endsWith(test3.getTerminatedBuffer(), 0, -1)) {
 964         errln("endsWith(test3.getTerminatedBuffer(), 0, -1) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\".");
 965     }
 966
 967     if (!test3.startsWith(test4)) {
 968         errln("endsWith(test4) failed: \"" + test4 + "\" should be a prefix of \"" + test3 + "\".");
 969     }
 970
 971     if (test4.startsWith(test3)) {
 972         errln("startsWith(test3) failed: \"" + test3 + "\" shouldn't be a prefix of \"" + test4 + "\".");
 973     }
 974 }
 975
 976 void
 977 UnicodeStringTest::TestStartsWithAndEndsWithNulTerminated() {
 978     UnicodeString test("abcde");
 979     const UChar ab[] = { 0x61, 0x62, 0 };
 980     const UChar de[] = { 0x64, 0x65, 0 };
 981     assertTrue("abcde.startsWith(ab, -1)", test.startsWith(ab, -1));
 982     assertTrue("abcde.startsWith(ab, 0, -1)", test.startsWith(ab, 0, -1));
 983     assertTrue("abcde.endsWith(de, -1)", test.endsWith(de, -1));
 984     assertTrue("abcde.endsWith(de, 0, -1)", test.endsWith(de, 0, -1));
 985 }
 986
 987 void
 988 UnicodeStringTest::TestFindAndReplace()
 989 {
 990     UnicodeString test1("One potato, two potato, three potato, four\n");
 991     UnicodeString test2("potato");
 992     UnicodeString test3("MISSISSIPPI");
 993
 994     UnicodeString expectedValue;
 995
 996     test1.findAndReplace(test2, test3);
 997     expectedValue = "One MISSISSIPPI, two MISSISSIPPI, three MISSISSIPPI, four\n";
 998     if (test1 != expectedValue)
 999         errln("findAndReplace failed: expected \"" + expectedValue + "\", got \"" + test1 + "\".");
1000     test1.findAndReplace(2, 32, test3, test2);
1001     expectedValue = "One potato, two potato, three MISSISSIPPI, four\n";
1002     if (test1 != expectedValue)
1003         errln("findAndReplace failed: expected \"" + expectedValue + "\", got \"" + test1 + "\".");
1004 }
1005
1006 void
1007 UnicodeStringTest::TestReverse()
1008 {
1009     UnicodeString test("backwards words say to used I");
1010
1011     test.reverse();
1012     test.reverse(2, 4);
1013     test.reverse(7, 2);
1014     test.reverse(10, 3);
1015     test.reverse(14, 5);
1016     test.reverse(20, 9);
1017
1018     if (test != "I used to say words backwards")
1019         errln("reverse() failed:  Expected \"I used to say words backwards\",\n got \""
1020             + test + "\"");
1021
1022     test=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape();
1023     test.reverse();
1024     if(test.char32At(0)!=0x1ed0 || test.char32At(1)!=0xc4 || test.char32At(2)!=0x1d15f || test.char32At(4)!=0x2f999) {
1025         errln("reverse() failed with supplementary characters");
1026     }
1027
1028     // Test case for ticket #8091:
1029     // UnicodeString::reverse() failed to see a lead surrogate in the middle of
1030     // an odd-length string that contains no other lead surrogates.
1031     test=UNICODE_STRING_SIMPLE("ab\\U0001F4A9e").unescape();
1032     UnicodeString expected=UNICODE_STRING_SIMPLE("e\\U0001F4A9ba").unescape();
1033     test.reverse();
1034     if(test!=expected) {
1035         errln("reverse() failed with only lead surrogate in the middle");
1036     }
1037 }
1038
1039 void
1040 UnicodeStringTest::TestMiscellaneous()
1041 {
1042     UnicodeString   test1("This is a test");
1043     UnicodeString   test2("This is a test");
1044     UnicodeString   test3("Me too!");
1045
1046     // test getBuffer(minCapacity) and releaseBuffer()
1047     test1=UnicodeString(); // make sure that it starts with its stackBuffer
1048     UChar *p=test1.getBuffer(20);
1049     if(test1.getCapacity()<20) {
1050         errln("UnicodeString::getBuffer(20).getCapacity()<20");
1051     }
1052
1053     test1.append((UChar)7); // must not be able to modify the string here
1054     test1.setCharAt(3, 7);
1055     test1.reverse();
1056     if( test1.length()!=0 ||
1057         test1.charAt(0)!=0xffff || test1.charAt(3)!=0xffff ||
1058         test1.getBuffer(10)!=0 || test1.getBuffer()!=0
1059     ) {
1060         errln("UnicodeString::getBuffer(minCapacity) allows read or write access to the UnicodeString");
1061     }
1062
1063     p[0]=1;
1064     p[1]=2;
1065     p[2]=3;
1066     test1.releaseBuffer(3);
1067     test1.append((UChar)4);
1068
1069     if(test1.length()!=4 || test1.charAt(0)!=1 || test1.charAt(1)!=2 || test1.charAt(2)!=3 || test1.charAt(3)!=4) {
1070         errln("UnicodeString::releaseBuffer(newLength) does not properly reallow access to the UnicodeString");
1071     }
1072
1073     // test releaseBuffer() without getBuffer(minCapacity) - must not have any effect
1074     test1.releaseBuffer(1);
1075     if(test1.length()!=4 || test1.charAt(0)!=1 || test1.charAt(1)!=2 || test1.charAt(2)!=3 || test1.charAt(3)!=4) {
1076         errln("UnicodeString::releaseBuffer(newLength) without getBuffer(minCapacity) changed the UnicodeString");
1077     }
1078
1079     // test getBuffer(const)
1080     const UChar *q=test1.getBuffer(), *r=test1.getBuffer();
1081     if( test1.length()!=4 ||
1082         q[0]!=1 || q[1]!=2 || q[2]!=3 || q[3]!=4 ||
1083         r[0]!=1 || r[1]!=2 || r[2]!=3 || r[3]!=4
1084     ) {
1085         errln("UnicodeString::getBuffer(const) does not return a usable buffer pointer");
1086     }
1087
1088     // test releaseBuffer() with a NUL-terminated buffer
1089     test1.getBuffer(20)[2]=0;
1090     test1.releaseBuffer(); // implicit -1
1091     if(test1.length()!=2 || test1.charAt(0)!=1 || test1.charAt(1) !=2) {
1092         errln("UnicodeString::releaseBuffer(-1) does not properly set the length of the UnicodeString");
1093     }
1094
1095     // test releaseBuffer() with a non-NUL-terminated buffer
1096     p=test1.getBuffer(256);
1097     for(int32_t i=0; i<test1.getCapacity(); ++i) {
1098         p[i]=(UChar)1;      // fill the buffer with all non-NUL code units
1099     }
1100     test1.releaseBuffer();  // implicit -1
1101     if(test1.length()!=test1.getCapacity() || test1.charAt(1)!=1 || test1.charAt(100)!=1 || test1.charAt(test1.getCapacity()-1)!=1) {
1102         errln("UnicodeString::releaseBuffer(-1 but no NUL) does not properly set the length of the UnicodeString");
1103     }
1104
1105     // test getTerminatedBuffer()
1106     test1=UnicodeString("This is another test.", "");
1107     test2=UnicodeString("This is another test.", "");
1108     q=test1.getTerminatedBuffer();
1109     if(q[test1.length()]!=0 || test1!=test2 || test2.compare(q, -1)!=0) {
1110         errln("getTerminatedBuffer()[length]!=0");
1111     }
1112
1113     const UChar u[]={ 5, 6, 7, 8, 0 };
1114     test1.setTo(FALSE, u, 3);
1115     q=test1.getTerminatedBuffer();
1116     if(q==u || q[0]!=5 || q[1]!=6 || q[2]!=7 || q[3]!=0) {
1117         errln("UnicodeString(u[3]).getTerminatedBuffer() returns a bad buffer");
1118     }
1119
1120     test1.setTo(TRUE, u, -1);
1121     q=test1.getTerminatedBuffer();
1122     if(q!=u || test1.length()!=4 || q[3]!=8 || q[4]!=0) {
1123         errln("UnicodeString(u[-1]).getTerminatedBuffer() returns a bad buffer");
1124     }
1125
1126     test1=UNICODE_STRING("la", 2);
1127     test1.append(UNICODE_STRING(" lila", 5).getTerminatedBuffer(), 0, -1);
1128     if(test1!=UNICODE_STRING("la lila", 7)) {
1129         errln("UnicodeString::append(const UChar *, start, length) failed");
1130     }
1131
1132     test1.insert(3, UNICODE_STRING("dudum ", 6), 0, INT32_MAX);
1133     if(test1!=UNICODE_STRING("la dudum lila", 13)) {
1134         errln("UnicodeString::insert(start, const UniStr &, start, length) failed");
1135     }
1136
1137     static const UChar ucs[]={ 0x68, 0x6d, 0x20, 0 };
1138     test1.insert(9, ucs, -1);
1139     if(test1!=UNICODE_STRING("la dudum hm lila", 16)) {
1140         errln("UnicodeString::insert(start, const UChar *, length) failed");
1141     }
1142
1143     test1.replace(9, 2, (UChar)0x2b);
1144     if(test1!=UNICODE_STRING("la dudum + lila", 15)) {
1145         errln("UnicodeString::replace(start, length, UChar) failed");
1146     }
1147
1148     if(test1.hasMetaData() || UnicodeString().hasMetaData()) {
1149         errln("UnicodeString::hasMetaData() returns TRUE");
1150     }
1151
1152     // test getTerminatedBuffer() on a truncated, shared, heap-allocated string
1153     test1=UNICODE_STRING_SIMPLE("abcdefghijklmnopqrstuvwxyz0123456789.");
1154     test1.truncate(36);  // ensure length()<getCapacity()
1155     test2=test1;  // share the buffer
1156     test1.truncate(5);
1157     if(test1.length()!=5 || test1.getTerminatedBuffer()[5]!=0) {
1158         errln("UnicodeString(shared buffer).truncate() failed");
1159     }
1160     if(test2.length()!=36 || test2[5]!=0x66 || u_strlen(test2.getTerminatedBuffer())!=36) {
1161         errln("UnicodeString(shared buffer).truncate().getTerminatedBuffer() "
1162               "modified another copy of the string!");
1163     }
1164     test1=UNICODE_STRING_SIMPLE("abcdefghijklmnopqrstuvwxyz0123456789.");
1165     test1.truncate(36);  // ensure length()<getCapacity()
1166     test2=test1;  // share the buffer
1167     test1.remove();
1168     if(test1.length()!=0 || test1.getTerminatedBuffer()[0]!=0) {
1169         errln("UnicodeString(shared buffer).remove() failed");
1170     }
1171     if(test2.length()!=36 || test2[0]!=0x61 || u_strlen(test2.getTerminatedBuffer())!=36) {
1172         errln("UnicodeString(shared buffer).remove().getTerminatedBuffer() "
1173               "modified another copy of the string!");
1174     }
1175
1176     // ticket #9740
1177     test1.setTo(TRUE, ucs, 3);
1178     assertEquals("length of read-only alias", 3, test1.length());
1179     test1.trim();
1180     assertEquals("length of read-only alias after trim()", 2, test1.length());
1181     assertEquals("length of terminated buffer of read-only alias + trim()",
1182                  2, u_strlen(test1.getTerminatedBuffer()));
1183 }
1184
1185 void
1186 UnicodeStringTest::TestStackAllocation()
1187 {
1188     UChar           testString[] ={
1189         0x54, 0x68, 0x69, 0x73, 0x20, 0x69, 0x73, 0x20, 0x61, 0x20, 0x63, 0x72, 0x61, 0x7a, 0x79, 0x20, 0x74, 0x65, 0x73, 0x74, 0x2e, 0 };
1190     UChar           guardWord = 0x4DED;
1191     UnicodeString*  test = 0;
1192
1193     test = new  UnicodeString(testString);
1194     if (*test != "This is a crazy test.")
1195         errln("Test string failed to initialize properly.");
1196     if (guardWord != 0x04DED)
1197         errln("Test string initialization overwrote guard word!");
1198
1199     test->insert(8, "only ");
1200     test->remove(15, 6);
1201     if (*test != "This is only a test.")
1202         errln("Manipulation of test string failed to work right.");
1203     if (guardWord != 0x4DED)
1204         errln("Manipulation of test string overwrote guard word!");
1205
1206     // we have to deinitialize and release the backing store by calling the destructor
1207     // explicitly, since we can't overload operator delete
1208     delete test;
1209
1210     UChar workingBuffer[] = {
1211         0x4e, 0x6f, 0x77, 0x20, 0x69, 0x73, 0x20, 0x74, 0x68, 0x65, 0x20, 0x74, 0x69, 0x6d, 0x65, 0x20,
1212         0x66, 0x6f, 0x72, 0x20, 0x61, 0x6c, 0x6c, 0x20, 0x6d, 0x65, 0x6e, 0x20, 0x74, 0x6f, 0x20,
1213         0x63, 0x6f, 0x6d, 0x65, 0xffff, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1214         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1215         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 };
1216     UChar guardWord2 = 0x4DED;
1217
1218     test = new UnicodeString(workingBuffer, 35, 100);
1219     if (*test != "Now is the time for all men to come")
1220         errln("Stack-allocated backing store failed to initialize correctly.");
1221     if (guardWord2 != 0x4DED)
1222         errln("Stack-allocated backing store overwrote guard word!");
1223
1224     test->insert(24, "good ");
1225     if (*test != "Now is the time for all good men to come")
1226         errln("insert() on stack-allocated UnicodeString didn't work right");
1227     if (guardWord2 != 0x4DED)
1228         errln("insert() on stack-allocated UnicodeString overwrote guard word!");
1229
1230     if (workingBuffer[24] != 0x67)
1231         errln("insert() on stack-allocated UnicodeString didn't affect backing store");
1232
1233     *test += " to the aid of their country.";
1234     if (*test != "Now is the time for all good men to come to the aid of their country.")
1235         errln("Stack-allocated UnicodeString overflow didn't work");
1236     if (guardWord2 != 0x4DED)
1237         errln("Stack-allocated UnicodeString overflow overwrote guard word!");
1238
1239     *test = "ha!";
1240     if (*test != "ha!")
1241         errln("Assignment to stack-allocated UnicodeString didn't work");
1242     if (workingBuffer[0] != 0x4e)
1243         errln("Change to UnicodeString after overflow are still affecting original buffer");
1244     if (guardWord2 != 0x4DED)
1245         errln("Change to UnicodeString after overflow overwrote guard word!");
1246
1247     // test read-only aliasing with setTo()
1248     workingBuffer[0] = 0x20ac;
1249     workingBuffer[1] = 0x125;
1250     workingBuffer[2] = 0;
1251     test->setTo(TRUE, workingBuffer, 2);
1252     if(test->length() != 2 || test->charAt(0) != 0x20ac || test->charAt(1) != 0x125) {
1253         errln("UnicodeString.setTo(readonly alias) does not alias correctly");
1254     }
1255
1256     UnicodeString *c=(UnicodeString *)test->clone();
1257
1258     workingBuffer[1] = 0x109;
1259     if(test->charAt(1) != 0x109) {
1260         errln("UnicodeString.setTo(readonly alias) made a copy: did not see change in buffer");
1261     }
1262
1263     if(c->length() != 2 || c->charAt(1) != 0x125) {
1264         errln("clone(alias) did not copy the buffer");
1265     }
1266     delete c;
1267
1268     test->setTo(TRUE, workingBuffer, -1);
1269     if(test->length() != 2 || test->charAt(0) != 0x20ac || test->charAt(1) != 0x109) {
1270         errln("UnicodeString.setTo(readonly alias, length -1) does not alias correctly");
1271     }
1272
1273     test->setTo(FALSE, workingBuffer, -1);
1274     if(!test->isBogus()) {
1275         errln("UnicodeString.setTo(unterminated readonly alias, length -1) does not result in isBogus()");
1276     }
1277
1278     delete test;
1279
1280     test=new UnicodeString();
1281     UChar buffer[]={0x0061, 0x0062, 0x20ac, 0x0043, 0x0042, 0x0000};
1282     test->setTo(buffer, 4, 10);
1283     if(test->length() !=4 || test->charAt(0) != 0x0061 || test->charAt(1) != 0x0062 ||
1284         test->charAt(2) != 0x20ac || test->charAt(3) != 0x0043){
1285         errln((UnicodeString)"UnicodeString.setTo(UChar*, length, capacity) does not work correctly\n" + prettify(*test));
1286     }
1287     delete test;
1288
1289
1290     // test the UChar32 constructor
1291     UnicodeString c32Test((UChar32)0x10ff2a);
1292     if( c32Test.length() != U16_LENGTH(0x10ff2a) ||
1293         c32Test.char32At(c32Test.length() - 1) != 0x10ff2a
1294     ) {
1295         errln("The UnicodeString(UChar32) constructor does not work with a 0x10ff2a filler");
1296     }
1297
1298     // test the (new) capacity constructor
1299     UnicodeString capTest(5, (UChar32)0x2a, 5);
1300     if( capTest.length() != 5 * U16_LENGTH(0x2a) ||
1301         capTest.char32At(0) != 0x2a ||
1302         capTest.char32At(4) != 0x2a
1303     ) {
1304         errln("The UnicodeString capacity constructor does not work with an ASCII filler");
1305     }
1306
1307     capTest = UnicodeString(5, (UChar32)0x10ff2a, 5);
1308     if( capTest.length() != 5 * U16_LENGTH(0x10ff2a) ||
1309         capTest.char32At(0) != 0x10ff2a ||
1310         capTest.char32At(4) != 0x10ff2a
1311     ) {
1312         errln("The UnicodeString capacity constructor does not work with a 0x10ff2a filler");
1313     }
1314
1315     capTest = UnicodeString(5, (UChar32)0, 0);
1316     if(capTest.length() != 0) {
1317         errln("The UnicodeString capacity constructor does not work with a 0x10ff2a filler");
1318     }
1319 }
1320
1321 /**
1322  * Test the unescape() function.
1323  */
1324 void UnicodeStringTest::TestUnescape(void) {
1325     UnicodeString IN("abc\\u4567 \\n\\r \\U00101234xyz\\x1\\x{5289}\\x1b", -1, US_INV);
1326     UnicodeString OUT("abc");
1327     OUT.append((UChar)0x4567);
1328     OUT.append(" ");
1329     OUT.append((UChar)0xA);
1330     OUT.append((UChar)0xD);
1331     OUT.append(" ");
1332     OUT.append((UChar32)0x00101234);
1333     OUT.append("xyz");
1334     OUT.append((UChar32)1).append((UChar32)0x5289).append((UChar)0x1b);
1335     UnicodeString result = IN.unescape();
1336     if (result != OUT) {
1337         errln("FAIL: " + prettify(IN) + ".unescape() -> " +
1338               prettify(result) + ", expected " +
1339               prettify(OUT));
1340     }
1341
1342     // test that an empty string is returned in case of an error
1343     if (!UNICODE_STRING("wrong \\u sequence", 17).unescape().isEmpty()) {
1344         errln("FAIL: unescaping of a string with an illegal escape sequence did not return an empty string");
1345     }
1346 }
1347
1348 /* test code point counting functions --------------------------------------- */
1349
1350 /* reference implementation of UnicodeString::hasMoreChar32Than() */
1351 static int32_t
1352 _refUnicodeStringHasMoreChar32Than(const UnicodeString &s, int32_t start, int32_t length, int32_t number) {
1353     int32_t count=s.countChar32(start, length);
1354     return count>number;
1355 }
1356
1357 /* compare the real function against the reference */
1358 void
1359 UnicodeStringTest::_testUnicodeStringHasMoreChar32Than(const UnicodeString &s, int32_t start, int32_t length, int32_t number) {
1360     if(s.hasMoreChar32Than(start, length, number)!=_refUnicodeStringHasMoreChar32Than(s, start, length, number)) {
1361         errln("hasMoreChar32Than(%d, %d, %d)=%hd is wrong\n",
1362                 start, length, number, s.hasMoreChar32Than(start, length, number));
1363     }
1364 }
1365
1366 void
1367 UnicodeStringTest::TestCountChar32(void) {
1368     {
1369         UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape();
1370
1371         // test countChar32()
1372         // note that this also calls and tests u_countChar32(length>=0)
1373         if(
1374             s.countChar32()!=4 ||
1375             s.countChar32(1)!=4 ||
1376             s.countChar32(2)!=3 ||
1377             s.countChar32(2, 3)!=2 ||
1378             s.countChar32(2, 0)!=0
1379         ) {
1380             errln("UnicodeString::countChar32() failed");
1381         }
1382
1383         // NUL-terminate the string buffer and test u_countChar32(length=-1)
1384         const UChar *buffer=s.getTerminatedBuffer();
1385         if(
1386             u_countChar32(buffer, -1)!=4 ||
1387             u_countChar32(buffer+1, -1)!=4 ||
1388             u_countChar32(buffer+2, -1)!=3 ||
1389             u_countChar32(buffer+3, -1)!=3 ||
1390             u_countChar32(buffer+4, -1)!=2 ||
1391             u_countChar32(buffer+5, -1)!=1 ||
1392             u_countChar32(buffer+6, -1)!=0
1393         ) {
1394             errln("u_countChar32(length=-1) failed");
1395         }
1396
1397         // test u_countChar32() with bad input
1398         if(u_countChar32(NULL, 5)!=0 || u_countChar32(buffer, -2)!=0) {
1399             errln("u_countChar32(bad input) failed (returned non-zero counts)");
1400         }
1401     }
1402
1403     /* test data and variables for hasMoreChar32Than() */
1404     static const UChar str[]={
1405         0x61, 0x62, 0xd800, 0xdc00,
1406         0xd801, 0xdc01, 0x63, 0xd802,
1407         0x64, 0xdc03, 0x65, 0x66,
1408         0xd804, 0xdc04, 0xd805, 0xdc05,
1409         0x67
1410     };
1411     UnicodeString string(str, UPRV_LENGTHOF(str));
1412     int32_t start, length, number;
1413
1414     /* test hasMoreChar32Than() */
1415     for(length=string.length(); length>=0; --length) {
1416         for(start=0; start<=length; ++start) {
1417             for(number=-1; number<=((length-start)+2); ++number) {
1418                 _testUnicodeStringHasMoreChar32Than(string, start, length-start, number);
1419             }
1420         }
1421     }
1422
1423     /* test hasMoreChar32Than() with pinning */
1424     for(start=-1; start<=string.length()+1; ++start) {
1425         for(number=-1; number<=((string.length()-start)+2); ++number) {
1426             _testUnicodeStringHasMoreChar32Than(string, start, 0x7fffffff, number);
1427         }
1428     }
1429
1430     /* test hasMoreChar32Than() with a bogus string */
1431     string.setToBogus();
1432     for(length=-1; length<=1; ++length) {
1433         for(start=-1; start<=length; ++start) {
1434             for(number=-1; number<=((length-start)+2); ++number) {
1435                 _testUnicodeStringHasMoreChar32Than(string, start, length-start, number);
1436             }
1437         }
1438     }
1439 }
1440
1441 void
1442 UnicodeStringTest::TestBogus() {
1443     UnicodeString   test1("This is a test");
1444     UnicodeString   test2("This is a test");
1445     UnicodeString   test3("Me too!");
1446
1447     // test isBogus() and setToBogus()
1448     if (test1.isBogus() || test2.isBogus() || test3.isBogus()) {
1449         errln("A string returned TRUE for isBogus()!");
1450     }
1451
1452     // NULL pointers are treated like empty strings
1453     // use other illegal arguments to make a bogus string
1454     test3.setTo(FALSE, test1.getBuffer(), -2);
1455     if(!test3.isBogus()) {
1456         errln("A bogus string returned FALSE for isBogus()!");
1457     }
1458     if (test1.hashCode() != test2.hashCode() || test1.hashCode() == test3.hashCode()) {
1459         errln("hashCode() failed");
1460     }
1461     if(test3.getBuffer()!=0 || test3.getBuffer(20)!=0 || test3.getTerminatedBuffer()!=0) {
1462         errln("bogus.getBuffer()!=0");
1463     }
1464     if (test1.indexOf(test3) != -1) {
1465         errln("bogus.indexOf() != -1");
1466     }
1467     if (test1.lastIndexOf(test3) != -1) {
1468         errln("bogus.lastIndexOf() != -1");
1469     }
1470     if (test1.caseCompare(test3, U_FOLD_CASE_DEFAULT) != 1 || test3.caseCompare(test1, U_FOLD_CASE_DEFAULT) != -1) {
1471         errln("caseCompare() doesn't work with bogus strings");
1472     }
1473     if (test1.compareCodePointOrder(test3) != 1 || test3.compareCodePointOrder(test1) != -1) {
1474         errln("compareCodePointOrder() doesn't work with bogus strings");
1475     }
1476
1477     // verify that non-assignment modifications fail and do not revive a bogus string
1478     test3.setToBogus();
1479     test3.append((UChar)0x61);
1480     if(!test3.isBogus() || test3.getBuffer()!=0) {
1481         errln("bogus.append('a') worked but must not");
1482     }
1483
1484     test3.setToBogus();
1485     test3.findAndReplace(UnicodeString((UChar)0x61), test2);
1486     if(!test3.isBogus() || test3.getBuffer()!=0) {
1487         errln("bogus.findAndReplace() worked but must not");
1488     }
1489
1490     test3.setToBogus();
1491     test3.trim();
1492     if(!test3.isBogus() || test3.getBuffer()!=0) {
1493         errln("bogus.trim() revived bogus but must not");
1494     }
1495
1496     test3.setToBogus();
1497     test3.remove(1);
1498     if(!test3.isBogus() || test3.getBuffer()!=0) {
1499         errln("bogus.remove(1) revived bogus but must not");
1500     }
1501
1502     test3.setToBogus();
1503     if(!test3.setCharAt(0, 0x62).isBogus() || !test3.isEmpty()) {
1504         errln("bogus.setCharAt(0, 'b') worked but must not");
1505     }
1506
1507     test3.setToBogus();
1508     if(test3.truncate(1) || !test3.isBogus() || !test3.isEmpty()) {
1509         errln("bogus.truncate(1) revived bogus but must not");
1510     }
1511
1512     // verify that assignments revive a bogus string
1513     test3.setToBogus();
1514     if(!test3.isBogus() || (test3=test1).isBogus() || test3!=test1) {
1515         errln("bogus.operator=() failed");
1516     }
1517
1518     test3.setToBogus();
1519     if(!test3.isBogus() || test3.fastCopyFrom(test1).isBogus() || test3!=test1) {
1520         errln("bogus.fastCopyFrom() failed");
1521     }
1522
1523     test3.setToBogus();
1524     if(!test3.isBogus() || test3.setTo(test1).isBogus() || test3!=test1) {
1525         errln("bogus.setTo(UniStr) failed");
1526     }
1527
1528     test3.setToBogus();
1529     if(!test3.isBogus() || test3.setTo(test1, 0).isBogus() || test3!=test1) {
1530         errln("bogus.setTo(UniStr, 0) failed");
1531     }
1532
1533     test3.setToBogus();
1534     if(!test3.isBogus() || test3.setTo(test1, 0, 0x7fffffff).isBogus() || test3!=test1) {
1535         errln("bogus.setTo(UniStr, 0, len) failed");
1536     }
1537
1538     test3.setToBogus();
1539     if(!test3.isBogus() || test3.setTo(test1.getBuffer(), test1.length()).isBogus() || test3!=test1) {
1540         errln("bogus.setTo(const UChar *, len) failed");
1541     }
1542
1543     test3.setToBogus();
1544     if(!test3.isBogus() || test3.setTo((UChar)0x2028).isBogus() || test3!=UnicodeString((UChar)0x2028)) {
1545         errln("bogus.setTo(UChar) failed");
1546     }
1547
1548     test3.setToBogus();
1549     if(!test3.isBogus() || test3.setTo((UChar32)0x1d157).isBogus() || test3!=UnicodeString((UChar32)0x1d157)) {
1550         errln("bogus.setTo(UChar32) failed");
1551     }
1552
1553     test3.setToBogus();
1554     if(!test3.isBogus() || test3.setTo(FALSE, test1.getBuffer(), test1.length()).isBogus() || test3!=test1) {
1555         errln("bogus.setTo(readonly alias) failed");
1556     }
1557
1558     // writable alias to another string's buffer: very bad idea, just convenient for this test
1559     test3.setToBogus();
1560     if(!test3.isBogus() || test3.setTo((UChar *)test1.getBuffer(), test1.length(), test1.getCapacity()).isBogus() || test3!=test1) {
1561         errln("bogus.setTo(writable alias) failed");
1562     }
1563
1564     // verify simple, documented ways to turn a bogus string into an empty one
1565     test3.setToBogus();
1566     if(!test3.isBogus() || (test3=UnicodeString()).isBogus() || !test3.isEmpty()) {
1567         errln("bogus.operator=(UnicodeString()) failed");
1568     }
1569
1570     test3.setToBogus();
1571     if(!test3.isBogus() || test3.setTo(UnicodeString()).isBogus() || !test3.isEmpty()) {
1572         errln("bogus.setTo(UnicodeString()) failed");
1573     }
1574
1575     test3.setToBogus();
1576     if(test3.remove().isBogus() || test3.getBuffer()==0 || !test3.isEmpty()) {
1577         errln("bogus.remove() failed");
1578     }
1579
1580     test3.setToBogus();
1581     if(test3.remove(0, INT32_MAX).isBogus() || test3.getBuffer()==0 || !test3.isEmpty()) {
1582         errln("bogus.remove(0, INT32_MAX) failed");
1583     }
1584
1585     test3.setToBogus();
1586     if(test3.truncate(0) || test3.isBogus() || !test3.isEmpty()) {
1587         errln("bogus.truncate(0) failed");
1588     }
1589
1590     test3.setToBogus();
1591     if(!test3.isBogus() || test3.setTo((UChar32)-1).isBogus() || !test3.isEmpty()) {
1592         errln("bogus.setTo((UChar32)-1) failed");
1593     }
1594
1595     static const UChar nul=0;
1596
1597     test3.setToBogus();
1598     if(!test3.isBogus() || test3.setTo(&nul, 0).isBogus() || !test3.isEmpty()) {
1599         errln("bogus.setTo(&nul, 0) failed");
1600     }
1601
1602     test3.setToBogus();
1603     if(!test3.isBogus() || test3.getBuffer()!=0) {
1604         errln("setToBogus() failed to make a string bogus");
1605     }
1606
1607     test3.setToBogus();
1608     if(test1.isBogus() || !(test1=test3).isBogus()) {
1609         errln("normal=bogus failed to make the left string bogus");
1610     }
1611
1612     // test that NULL primitive input string values are treated like
1613     // empty strings, not errors (bogus)
1614     test2.setTo((UChar32)0x10005);
1615     if(test2.insert(1, NULL, 1).length()!=2) {
1616         errln("UniStr.insert(...NULL...) should not modify the string but does");
1617     }
1618
1619     UErrorCode errorCode=U_ZERO_ERROR;
1620     UnicodeString
1621         test4((const UChar *)NULL),
1622         test5(TRUE, (const UChar *)NULL, 1),
1623         test6((UChar *)NULL, 5, 5),
1624         test7((const char *)NULL, 3, NULL, errorCode);
1625     if(test4.isBogus() || test5.isBogus() || test6.isBogus() || test7.isBogus()) {
1626         errln("a constructor set to bogus for a NULL input string, should be empty");
1627     }
1628
1629     test4.setTo(NULL, 3);
1630     test5.setTo(TRUE, (const UChar *)NULL, 1);
1631     test6.setTo((UChar *)NULL, 5, 5);
1632     if(test4.isBogus() || test5.isBogus() || test6.isBogus()) {
1633         errln("a setTo() set to bogus for a NULL input string, should be empty");
1634     }
1635
1636     // test that bogus==bogus<any
1637     if(test1!=test3 || test1.compare(test3)!=0) {
1638         errln("bogus==bogus failed");
1639     }
1640
1641     test2.remove();
1642     if(test1>=test2 || !(test2>test1) || test1.compare(test2)>=0 || !(test2.compare(test1)>0)) {
1643         errln("bogus<empty failed");
1644     }
1645 }
1646
1647 // StringEnumeration ------------------------------------------------------- ***
1648 // most of StringEnumeration is tested elsewhere
1649 // this test improves code coverage
1650
1651 static const char *const
1652 testEnumStrings[]={
1653     "a",
1654     "b",
1655     "c",
1656     "this is a long string which helps us test some buffer limits",
1657     "eeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeee"
1658 };
1659
1660 class TestEnumeration : public StringEnumeration {
1661 public:
1662     TestEnumeration() : i(0) {}
1663
1664     virtual int32_t count(UErrorCode& /*status*/) const {
1665         return UPRV_LENGTHOF(testEnumStrings);
1666     }
1667
1668     virtual const UnicodeString *snext(UErrorCode &status) {
1669         if(U_SUCCESS(status) && i<UPRV_LENGTHOF(testEnumStrings)) {
1670             unistr=UnicodeString(testEnumStrings[i++], "");
1671             return &unistr;
1672         }
1673
1674         return NULL;
1675     }
1676
1677     virtual void reset(UErrorCode& /*status*/) {
1678         i=0;
1679     }
1680
1681     static inline UClassID getStaticClassID() {
1682         return (UClassID)&fgClassID;
1683     }
1684     virtual UClassID getDynamicClassID() const {
1685         return getStaticClassID();
1686     }
1687
1688 private:
1689     static const char fgClassID;
1690
1691     int32_t i;
1692 };
1693
1694 const char TestEnumeration::fgClassID=0;
1695
1696 void
1697 UnicodeStringTest::TestStringEnumeration() {
1698     UnicodeString s;
1699     TestEnumeration ten;
1700     int32_t i, length;
1701     UErrorCode status;
1702
1703     const UChar *pu;
1704     const char *pc;
1705
1706     // test the next() default implementation and ensureCharsCapacity()
1707     for(i=0; i<UPRV_LENGTHOF(testEnumStrings); ++i) {
1708         status=U_ZERO_ERROR;
1709         pc=ten.next(&length, status);
1710         s=UnicodeString(testEnumStrings[i], "");
1711         if(U_FAILURE(status) || pc==NULL || length!=s.length() || UnicodeString(pc, length, "")!=s) {
1712             errln("StringEnumeration.next(%d) failed", i);
1713         }
1714     }
1715     status=U_ZERO_ERROR;
1716     if(ten.next(&length, status)!=NULL) {
1717         errln("StringEnumeration.next(done)!=NULL");
1718     }
1719
1720     // test the unext() default implementation
1721     ten.reset(status);
1722     for(i=0; i<UPRV_LENGTHOF(testEnumStrings); ++i) {
1723         status=U_ZERO_ERROR;
1724         pu=ten.unext(&length, status);
1725         s=UnicodeString(testEnumStrings[i], "");
1726         if(U_FAILURE(status) || pu==NULL || length!=s.length() || UnicodeString(TRUE, pu, length)!=s) {
1727             errln("StringEnumeration.unext(%d) failed", i);
1728         }
1729     }
1730     status=U_ZERO_ERROR;
1731     if(ten.unext(&length, status)!=NULL) {
1732         errln("StringEnumeration.unext(done)!=NULL");
1733     }
1734
1735     // test that the default clone() implementation works, and returns NULL
1736     if(ten.clone()!=NULL) {
1737         errln("StringEnumeration.clone()!=NULL");
1738     }
1739
1740     // test that uenum_openFromStringEnumeration() works
1741     // Need a heap allocated string enumeration because it is adopted by the UEnumeration.
1742     StringEnumeration *newTen = new TestEnumeration;
1743     status=U_ZERO_ERROR;
1744     UEnumeration *uten = uenum_openFromStringEnumeration(newTen, &status);
1745     if (uten==NULL || U_FAILURE(status)) {
1746         errln("fail at file %s, line %d, UErrorCode is %s\n", __FILE__, __LINE__, u_errorName(status));
1747         return;
1748     }
1749
1750     // test  uenum_next()
1751     for(i=0; i<UPRV_LENGTHOF(testEnumStrings); ++i) {
1752         status=U_ZERO_ERROR;
1753         pc=uenum_next(uten, &length, &status);
1754         if(U_FAILURE(status) || pc==NULL || strcmp(pc, testEnumStrings[i]) != 0) {
1755             errln("File %s, line %d, StringEnumeration.next(%d) failed", __FILE__, __LINE__, i);
1756         }
1757     }
1758     status=U_ZERO_ERROR;
1759     if(uenum_next(uten, &length, &status)!=NULL) {
1760         errln("File %s, line %d, uenum_next(done)!=NULL");
1761     }
1762
1763     // test the uenum_unext()
1764     uenum_reset(uten, &status);
1765     for(i=0; i<UPRV_LENGTHOF(testEnumStrings); ++i) {
1766         status=U_ZERO_ERROR;
1767         pu=uenum_unext(uten, &length, &status);
1768         s=UnicodeString(testEnumStrings[i], "");
1769         if(U_FAILURE(status) || pu==NULL || length!=s.length() || UnicodeString(TRUE, pu, length)!=s) {
1770             errln("File %s, Line %d, uenum_unext(%d) failed", __FILE__, __LINE__, i);
1771         }
1772     }
1773     status=U_ZERO_ERROR;
1774     if(uenum_unext(uten, &length, &status)!=NULL) {
1775         errln("File %s, Line %d, uenum_unext(done)!=NULL" __FILE__, __LINE__);
1776     }
1777
1778     uenum_close(uten);
1779 }
1780
1781 /*
1782  * Namespace test, to make sure that macros like UNICODE_STRING include the
1783  * namespace qualifier.
1784  *
1785  * Define a (bogus) UnicodeString class in another namespace and check for ambiguity.
1786  */
1787 namespace bogus {
1788     class UnicodeString {
1789     public:
1790         enum EInvariant { kInvariant };
1791         UnicodeString() : i(1) {}
1792         UnicodeString(UBool /*isTerminated*/, const UChar * /*text*/, int32_t textLength) : i(textLength) {(void)i;}
1793         UnicodeString(const char * /*src*/, int32_t length, enum EInvariant /*inv*/
1794 ) : i(length) {}
1795     private:
1796         int32_t i;
1797     };
1798 }
1799
1800 void
1801 UnicodeStringTest::TestNameSpace() {
1802     // Provoke name collision unless the UnicodeString macros properly
1803     // qualify the icu::UnicodeString class.
1804     using namespace bogus;
1805
1806     // Use all UnicodeString macros from unistr.h.
1807     icu::UnicodeString s1=icu::UnicodeString("abc", 3, US_INV);
1808     icu::UnicodeString s2=UNICODE_STRING("def", 3);
1809     icu::UnicodeString s3=UNICODE_STRING_SIMPLE("ghi");
1810
1811     // Make sure the compiler does not optimize away instantiation of s1, s2, s3.
1812     icu::UnicodeString s4=s1+s2+s3;
1813     if(s4.length()!=9) {
1814         errln("Something wrong with UnicodeString::operator+().");
1815     }
1816 }
1817
1818 void
1819 UnicodeStringTest::TestUTF32() {
1820     // Input string length US_STACKBUF_SIZE to cause overflow of the
1821     // initially chosen fStackBuffer due to supplementary characters.
1822     static const UChar32 utf32[] = {
1823         0x41, 0xd900, 0x61, 0xdc00, -1, 0x110000, 0x5a, 0x50000, 0x7a,
1824         0x10000, 0x20000, 0xe0000, 0x10ffff
1825     };
1826     static const UChar expected_utf16[] = {
1827         0x41, 0xfffd, 0x61, 0xfffd, 0xfffd, 0xfffd, 0x5a, 0xd900, 0xdc00, 0x7a,
1828         0xd800, 0xdc00, 0xd840, 0xdc00, 0xdb40, 0xdc00, 0xdbff, 0xdfff
1829     };
1830     UnicodeString from32 = UnicodeString::fromUTF32(utf32, UPRV_LENGTHOF(utf32));
1831     UnicodeString expected(FALSE, expected_utf16, UPRV_LENGTHOF(expected_utf16));
1832     if(from32 != expected) {
1833         errln("UnicodeString::fromUTF32() did not create the expected string.");
1834     }
1835
1836     static const UChar utf16[] = {
1837         0x41, 0xd900, 0x61, 0xdc00, 0x5a, 0xd900, 0xdc00, 0x7a, 0xd800, 0xdc00, 0xdbff, 0xdfff
1838     };
1839     static const UChar32 expected_utf32[] = {
1840         0x41, 0xfffd, 0x61, 0xfffd, 0x5a, 0x50000, 0x7a, 0x10000, 0x10ffff
1841     };
1842     UChar32 result32[16];
1843     UErrorCode errorCode = U_ZERO_ERROR;
1844     int32_t length32 =
1845         UnicodeString(FALSE, utf16, UPRV_LENGTHOF(utf16)).
1846         toUTF32(result32, UPRV_LENGTHOF(result32), errorCode);
1847     if( length32 != UPRV_LENGTHOF(expected_utf32) ||
1848         0 != uprv_memcmp(result32, expected_utf32, length32*4) ||
1849         result32[length32] != 0
1850     ) {
1851         errln("UnicodeString::toUTF32() did not create the expected string.");
1852     }
1853 }
1854
1855 class TestCheckedArrayByteSink : public CheckedArrayByteSink {
1856 public:
1857     TestCheckedArrayByteSink(char* outbuf, int32_t capacity)
1858             : CheckedArrayByteSink(outbuf, capacity), calledFlush(FALSE) {}
1859     virtual void Flush() { calledFlush = TRUE; }
1860     UBool calledFlush;
1861 };
1862
1863 void
1864 UnicodeStringTest::TestUTF8() {
1865     static const uint8_t utf8[] = {
1866         // Code points:
1867         // 0x41, 0xd900,
1868         // 0x61, 0xdc00,
1869         // 0x110000, 0x5a,
1870         // 0x50000, 0x7a,
1871         // 0x10000, 0x20000,
1872         // 0xe0000, 0x10ffff
1873         0x41, 0xed, 0xa4, 0x80,
1874         0x61, 0xed, 0xb0, 0x80,
1875         0xf4, 0x90, 0x80, 0x80, 0x5a,
1876         0xf1, 0x90, 0x80, 0x80, 0x7a,
1877         0xf0, 0x90, 0x80, 0x80, 0xf0, 0xa0, 0x80, 0x80,
1878         0xf3, 0xa0, 0x80, 0x80, 0xf4, 0x8f, 0xbf, 0xbf
1879     };
1880     static const UChar expected_utf16[] = {
1881         0x41, 0xfffd,
1882         0x61, 0xfffd,
1883         0xfffd, 0x5a,
1884         0xd900, 0xdc00, 0x7a,
1885         0xd800, 0xdc00, 0xd840, 0xdc00,
1886         0xdb40, 0xdc00, 0xdbff, 0xdfff
1887     };
1888     UnicodeString from8 = UnicodeString::fromUTF8(StringPiece((const char *)utf8, (int32_t)sizeof(utf8)));
1889     UnicodeString expected(FALSE, expected_utf16, UPRV_LENGTHOF(expected_utf16));
1890
1891     if(from8 != expected) {
1892         errln("UnicodeString::fromUTF8(StringPiece) did not create the expected string.");
1893     }
1894 #if U_HAVE_STD_STRING
1895     std::string utf8_string((const char *)utf8, sizeof(utf8));
1896     UnicodeString from8b = UnicodeString::fromUTF8(utf8_string);
1897     if(from8b != expected) {
1898         errln("UnicodeString::fromUTF8(std::string) did not create the expected string.");
1899     }
1900 #endif
1901
1902     static const UChar utf16[] = {
1903         0x41, 0xd900, 0x61, 0xdc00, 0x5a, 0xd900, 0xdc00, 0x7a, 0xd800, 0xdc00, 0xdbff, 0xdfff
1904     };
1905     static const uint8_t expected_utf8[] = {
1906         0x41, 0xef, 0xbf, 0xbd, 0x61, 0xef, 0xbf, 0xbd, 0x5a, 0xf1, 0x90, 0x80, 0x80, 0x7a,
1907         0xf0, 0x90, 0x80, 0x80, 0xf4, 0x8f, 0xbf, 0xbf
1908     };
1909     UnicodeString us(FALSE, utf16, UPRV_LENGTHOF(utf16));
1910
1911     char buffer[64];
1912     TestCheckedArrayByteSink sink(buffer, (int32_t)sizeof(buffer));
1913     us.toUTF8(sink);
1914     if( sink.NumberOfBytesWritten() != (int32_t)sizeof(expected_utf8) ||
1915         0 != uprv_memcmp(buffer, expected_utf8, sizeof(expected_utf8))
1916     ) {
1917         errln("UnicodeString::toUTF8() did not create the expected string.");
1918     }
1919     if(!sink.calledFlush) {
1920         errln("UnicodeString::toUTF8(sink) did not sink.Flush().");
1921     }
1922 #if U_HAVE_STD_STRING
1923     // Initial contents for testing that toUTF8String() appends.
1924     std::string result8 = "-->";
1925     std::string expected8 = "-->" + std::string((const char *)expected_utf8, sizeof(expected_utf8));
1926     // Use the return value just for testing.
1927     std::string &result8r = us.toUTF8String(result8);
1928     if(result8r != expected8 || &result8r != &result8) {
1929         errln("UnicodeString::toUTF8String() did not create the expected string.");
1930     }
1931 #endif
1932 }
1933
1934 // Test if this compiler supports Return Value Optimization of unnamed temporary objects.
1935 static UnicodeString wrapUChars(const UChar *uchars) {
1936     return UnicodeString(TRUE, uchars, -1);
1937 }
1938
1939 void
1940 UnicodeStringTest::TestReadOnlyAlias() {
1941     UChar uchars[]={ 0x61, 0x62, 0 };
1942     UnicodeString alias(TRUE, uchars, 2);
1943     if(alias.length()!=2 || alias.getBuffer()!=uchars || alias.getTerminatedBuffer()!=uchars) {
1944         errln("UnicodeString read-only-aliasing constructor does not behave as expected.");
1945         return;
1946     }
1947     alias.truncate(1);
1948     if(alias.length()!=1 || alias.getBuffer()!=uchars) {
1949         errln("UnicodeString(read-only-alias).truncate() did not preserve aliasing as expected.");
1950     }
1951     if(alias.getTerminatedBuffer()==uchars) {
1952         errln("UnicodeString(read-only-alias).truncate().getTerminatedBuffer() "
1953               "did not allocate and copy as expected.");
1954     }
1955     if(uchars[1]!=0x62) {
1956         errln("UnicodeString(read-only-alias).truncate().getTerminatedBuffer() "
1957               "modified the original buffer.");
1958     }
1959     if(1!=u_strlen(alias.getTerminatedBuffer())) {
1960         errln("UnicodeString(read-only-alias).truncate().getTerminatedBuffer() "
1961               "does not return a buffer terminated at the proper length.");
1962     }
1963
1964     alias.setTo(TRUE, uchars, 2);
1965     if(alias.length()!=2 || alias.getBuffer()!=uchars || alias.getTerminatedBuffer()!=uchars) {
1966         errln("UnicodeString read-only-aliasing setTo() does not behave as expected.");
1967         return;
1968     }
1969     alias.remove();
1970     if(alias.length()!=0) {
1971         errln("UnicodeString(read-only-alias).remove() did not work.");
1972     }
1973     if(alias.getTerminatedBuffer()==uchars) {
1974         errln("UnicodeString(read-only-alias).remove().getTerminatedBuffer() "
1975               "did not un-alias as expected.");
1976     }
1977     if(uchars[0]!=0x61) {
1978         errln("UnicodeString(read-only-alias).remove().getTerminatedBuffer() "
1979               "modified the original buffer.");
1980     }
1981     if(0!=u_strlen(alias.getTerminatedBuffer())) {
1982         errln("UnicodeString.setTo(read-only-alias).remove().getTerminatedBuffer() "
1983               "does not return a buffer terminated at length 0.");
1984     }
1985
1986     UnicodeString longString=UNICODE_STRING_SIMPLE("abcdefghijklmnopqrstuvwxyz0123456789");
1987     alias.setTo(FALSE, longString.getBuffer(), longString.length());
1988     alias.remove(0, 10);
1989     if(longString.compare(10, INT32_MAX, alias)!=0 || alias.getBuffer()!=longString.getBuffer()+10) {
1990         errln("UnicodeString.setTo(read-only-alias).remove(0, 10) did not preserve aliasing as expected.");
1991     }
1992     alias.setTo(FALSE, longString.getBuffer(), longString.length());
1993     alias.remove(27, 99);
1994     if(longString.compare(0, 27, alias)!=0 || alias.getBuffer()!=longString.getBuffer()) {
1995         errln("UnicodeString.setTo(read-only-alias).remove(27, 99) did not preserve aliasing as expected.");
1996     }
1997     alias.setTo(FALSE, longString.getBuffer(), longString.length());
1998     alias.retainBetween(6, 30);
1999     if(longString.compare(6, 24, alias)!=0 || alias.getBuffer()!=longString.getBuffer()+6) {
2000         errln("UnicodeString.setTo(read-only-alias).retainBetween(6, 30) did not preserve aliasing as expected.");
2001     }
2002
2003     UChar abc[]={ 0x61, 0x62, 0x63, 0 };
2004     UBool hasRVO= wrapUChars(abc).getBuffer()==abc;
2005
2006     UnicodeString temp;
2007     temp.fastCopyFrom(longString.tempSubString());
2008     if(temp!=longString || (hasRVO && temp.getBuffer()!=longString.getBuffer())) {
2009         errln("UnicodeString.tempSubString() failed");
2010     }
2011     temp.fastCopyFrom(longString.tempSubString(-3, 5));
2012     if(longString.compare(0, 5, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer())) {
2013         errln("UnicodeString.tempSubString(-3, 5) failed");
2014     }
2015     temp.fastCopyFrom(longString.tempSubString(17));
2016     if(longString.compare(17, INT32_MAX, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer()+17)) {
2017         errln("UnicodeString.tempSubString(17) failed");
2018     }
2019     temp.fastCopyFrom(longString.tempSubString(99));
2020     if(!temp.isEmpty()) {
2021         errln("UnicodeString.tempSubString(99) failed");
2022     }
2023     temp.fastCopyFrom(longString.tempSubStringBetween(6));
2024     if(longString.compare(6, INT32_MAX, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer()+6)) {
2025         errln("UnicodeString.tempSubStringBetween(6) failed");
2026     }
2027     temp.fastCopyFrom(longString.tempSubStringBetween(8, 18));
2028     if(longString.compare(8, 10, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer()+8)) {
2029         errln("UnicodeString.tempSubStringBetween(8, 18) failed");
2030     }
2031     UnicodeString bogusString;
2032     bogusString.setToBogus();
2033     temp.fastCopyFrom(bogusString.tempSubStringBetween(8, 18));
2034     if(!temp.isBogus()) {
2035         errln("UnicodeString.setToBogus().tempSubStringBetween(8, 18) failed");
2036     }
2037 }
2038
2039 void
2040 UnicodeStringTest::doTestAppendable(UnicodeString &dest, Appendable &app) {
2041     static const UChar cde[3]={ 0x63, 0x64, 0x65 };
2042     static const UChar fg[3]={ 0x66, 0x67, 0 };
2043     if(!app.reserveAppendCapacity(12)) {
2044         errln("Appendable.reserve(12) failed");
2045     }
2046     app.appendCodeUnit(0x61);
2047     app.appendCodePoint(0x62);
2048     app.appendCodePoint(0x50000);
2049     app.appendString(cde, 3);
2050     app.appendString(fg, -1);
2051     UChar scratch[3];
2052     int32_t capacity=-1;
2053     UChar *buffer=app.getAppendBuffer(3, 3, scratch, 3, &capacity);
2054     if(capacity<3) {
2055         errln("Appendable.getAppendBuffer(min=3) returned capacity=%d<3", (int)capacity);
2056         return;
2057     }
2058     static const UChar hij[3]={ 0x68, 0x69, 0x6a };
2059     u_memcpy(buffer, hij, 3);
2060     app.appendString(buffer, 3);
2061     if(dest!=UNICODE_STRING_SIMPLE("ab\\U00050000cdefghij").unescape()) {
2062         errln("Appendable.append(...) failed");
2063     }
2064     buffer=app.getAppendBuffer(0, 3, scratch, 3, &capacity);
2065     if(buffer!=NULL || capacity!=0) {
2066         errln("Appendable.getAppendBuffer(min=0) failed");
2067     }
2068     capacity=1;
2069     buffer=app.getAppendBuffer(3, 3, scratch, 2, &capacity);
2070     if(buffer!=NULL || capacity!=0) {
2071         errln("Appendable.getAppendBuffer(scratch<min) failed");
2072     }
2073 }
2074
2075 class SimpleAppendable : public Appendable {
2076 public:
2077     explicit SimpleAppendable(UnicodeString &dest) : str(dest) {}
2078     virtual UBool appendCodeUnit(UChar c) { str.append(c); return TRUE; }
2079     SimpleAppendable &reset() { str.remove(); return *this; }
2080 private:
2081     UnicodeString &str;
2082 };
2083
2084 void
2085 UnicodeStringTest::TestAppendable() {
2086     UnicodeString dest;
2087     SimpleAppendable app(dest);
2088     doTestAppendable(dest, app);
2089 }
2090
2091 void
2092 UnicodeStringTest::TestUnicodeStringImplementsAppendable() {
2093     UnicodeString dest;
2094     UnicodeStringAppendable app(dest);
2095     doTestAppendable(dest, app);
2096 }
2097
2098 void
2099 UnicodeStringTest::TestSizeofUnicodeString() {
2100     // See the comments in unistr.h near the declaration of UnicodeString's fields.
2101     size_t sizeofUniStr=sizeof(UnicodeString);
2102     size_t expected;
2103     switch(sizeof(void *)) {
2104     case 4:
2105         expected=32;
2106         break;
2107     case 8:
2108         expected=40;
2109         break;
2110     default:
2111         logln("This platform has neither 32-bit nor 64-bit pointers.");
2112         return;
2113     }
2114     if(expected!=sizeofUniStr) {
2115         errln("sizeof(UnicodeString)=%d, expected %d", (int)sizeofUniStr, (int)expected);
2116     }
2117 }