git.saurik.com Git - apple/icu.git/blame_incremental - icuSources/test/intltest/ustrtest.cpp

... / ...

Commit	Line	Data
	1	/********************************************************************
	2	* COPYRIGHT:
	3	* Copyright (c) 1997-2008, International Business Machines Corporation and
	4	* others. All Rights Reserved.
	5	********************************************************************/
	6
	7	#include "ustrtest.h"
	8	#include "unicode/unistr.h"
	9	#include "unicode/uchar.h"
	10	#include "unicode/ustring.h"
	11	#include "unicode/locid.h"
	12	#include "unicode/ucnv.h"
	13	#include "cmemory.h"
	14	#include "charstr.h"
	15
	16	#if 0
	17	#include "unicode/ustream.h"
	18
	19	#if U_IOSTREAM_SOURCE >= 199711
	20	#include <iostream>
	21	using namespace std;
	22	#elif U_IOSTREAM_SOURCE >= 198506
	23	#include <iostream.h>
	24	#endif
	25
	26	#endif
	27
	28	#define LENGTHOF(array) (int32_t)((sizeof(array)/sizeof((array)[0])))
	29
	30	UnicodeStringTest::~UnicodeStringTest() {}
	31
	32	void UnicodeStringTest::runIndexedTest( int32_t index, UBool exec, const char* &name, char *par)
	33	{
	34	if (exec) logln("TestSuite UnicodeStringTest: ");
	35	switch (index) {
	36	case 0:
	37	name = "StringCaseTest";
	38	if (exec) {
	39	logln("StringCaseTest---"); logln("");
	40	StringCaseTest test;
	41	callTest(test, par);
	42	}
	43	break;
	44	case 1: name = "TestBasicManipulation"; if (exec) TestBasicManipulation(); break;
	45	case 2: name = "TestCompare"; if (exec) TestCompare(); break;
	46	case 3: name = "TestExtract"; if (exec) TestExtract(); break;
	47	case 4: name = "TestRemoveReplace"; if (exec) TestRemoveReplace(); break;
	48	case 5: name = "TestSearching"; if (exec) TestSearching(); break;
	49	case 6: name = "TestSpacePadding"; if (exec) TestSpacePadding(); break;
	50	case 7: name = "TestPrefixAndSuffix"; if (exec) TestPrefixAndSuffix(); break;
	51	case 8: name = "TestFindAndReplace"; if (exec) TestFindAndReplace(); break;
	52	case 9: name = "TestBogus"; if (exec) TestBogus(); break;
	53	case 10: name = "TestReverse"; if (exec) TestReverse(); break;
	54	case 11: name = "TestMiscellaneous"; if (exec) TestMiscellaneous(); break;
	55	case 12: name = "TestStackAllocation"; if (exec) TestStackAllocation(); break;
	56	case 13: name = "TestUnescape"; if (exec) TestUnescape(); break;
	57	case 14: name = "TestCountChar32"; if (exec) TestCountChar32(); break;
	58	case 15: name = "TestStringEnumeration"; if (exec) TestStringEnumeration(); break;
	59	case 16: name = "TestCharString"; if (exec) TestCharString(); break;
	60	case 17: name = "TestNameSpace"; if (exec) TestNameSpace(); break;
	61
	62	default: name = ""; break; //needed to end loop
	63	}
	64	}
	65
	66	void
	67	UnicodeStringTest::TestBasicManipulation()
	68	{
	69	UnicodeString test1("Now is the time for all men to come swiftly to the aid of the party.\n");
	70	UnicodeString expectedValue;
	71	UnicodeString *c;
	72
	73	c=(UnicodeString *)test1.clone();
	74	test1.insert(24, "good ");
	75	expectedValue = "Now is the time for all good men to come swiftly to the aid of the party.\n";
	76	if (test1 != expectedValue)
	77	errln("insert() failed: expected \"" + expectedValue + "\"\n,got \"" + test1 + "\"");
	78
	79	c->insert(24, "good ");
	80	if(*c != expectedValue) {
	81	errln("clone()->insert() failed: expected \"" + expectedValue + "\"\n,got \"" + *c + "\"");
	82	}
	83	delete c;
	84
	85	test1.remove(41, 8);
	86	expectedValue = "Now is the time for all good men to come to the aid of the party.\n";
	87	if (test1 != expectedValue)
	88	errln("remove() failed: expected \"" + expectedValue + "\"\n,got \"" + test1 + "\"");
	89
	90	test1.replace(58, 6, "ir country");
	91	expectedValue = "Now is the time for all good men to come to the aid of their country.\n";
	92	if (test1 != expectedValue)
	93	errln("replace() failed: expected \"" + expectedValue + "\"\n,got \"" + test1 + "\"");
	94
	95	UChar temp[80];
	96	test1.extract(0, 15, temp);
	97
	98	UnicodeString test2(temp, 15);
	99
	100	expectedValue = "Now is the time";
	101	if (test2 != expectedValue)
	102	errln("extract() failed: expected \"" + expectedValue + "\"\n,got \"" + test2 + "\"");
	103
	104	test2 += " for me to go!\n";
	105	expectedValue = "Now is the time for me to go!\n";
	106	if (test2 != expectedValue)
	107	errln("operator+=() failed: expected \"" + expectedValue + "\"\n,got \"" + test2 + "\"");
	108
	109	if (test1.length() != 70)
	110	errln("length() failed: expected 70, got " + test1.length());
	111	if (test2.length() != 30)
	112	errln("length() failed: expected 30, got " + test2.length());
	113
	114	UnicodeString test3;
	115	test3.append((UChar32)0x20402);
	116	if(test3 != CharsToUnicodeString("\\uD841\\uDC02")){
	117	errln((UnicodeString)"append failed for UChar32, expected \"\\\\ud841\\\\udc02\", got " + prettify(test3));
	118	}
	119	if(test3.length() != 2){
	120	errln("append or length failed for UChar32, expected 2, got " + test3.length());
	121	}
	122	test3.append((UChar32)0x0074);
	123	if(test3 != CharsToUnicodeString("\\uD841\\uDC02t")){
	124	errln((UnicodeString)"append failed for UChar32, expected \"\\\\uD841\\\\uDC02t\", got " + prettify(test3));
	125	}
	126	if(test3.length() != 3){
	127	errln((UnicodeString)"append or length failed for UChar32, expected 2, got " + test3.length());
	128	}
	129
	130	// test some UChar32 overloads
	131	if( test3.setTo((UChar32)0x10330).length() != 2 \|\|
	132	test3.insert(0, (UChar32)0x20100).length() != 4 \|\|
	133	test3.replace(2, 2, (UChar32)0xe0061).length() != 4 \|\|
	134	(test3 = (UChar32)0x14001).length() != 2
	135	) {
	136	errln((UnicodeString)"simple UChar32 overloads for replace, insert, setTo or = failed");
	137	}
	138
	139	{
	140	// test moveIndex32()
	141	UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape();
	142
	143	if(
	144	s.moveIndex32(2, -1)!=0 \|\|
	145	s.moveIndex32(2, 1)!=4 \|\|
	146	s.moveIndex32(2, 2)!=5 \|\|
	147	s.moveIndex32(5, -2)!=2 \|\|
	148	s.moveIndex32(0, -1)!=0 \|\|
	149	s.moveIndex32(6, 1)!=6
	150	) {
	151	errln("UnicodeString::moveIndex32() failed");
	152	}
	153
	154	if(s.getChar32Start(1)!=0 \|\| s.getChar32Start(2)!=2) {
	155	errln("UnicodeString::getChar32Start() failed");
	156	}
	157
	158	if(s.getChar32Limit(1)!=2 \|\| s.getChar32Limit(2)!=2) {
	159	errln("UnicodeString::getChar32Limit() failed");
	160	}
	161	}
	162
	163	{
	164	// test new 2.2 constructors and setTo function that parallel Java's substring function.
	165	UnicodeString src("Hello folks how are you?");
	166	UnicodeString target1("how are you?");
	167	if (target1 != UnicodeString(src, 12)) {
	168	errln("UnicodeString(const UnicodeString&, int32_t) failed");
	169	}
	170	UnicodeString target2("folks");
	171	if (target2 != UnicodeString(src, 6, 5)) {
	172	errln("UnicodeString(const UnicodeString&, int32_t, int32_t) failed");
	173	}
	174	if (target1 != target2.setTo(src, 12)) {
	175	errln("UnicodeString::setTo(const UnicodeString&, int32_t) failed");
	176	}
	177	}
	178
	179	{
	180	// op+ is new in ICU 2.8
	181	UnicodeString s=UnicodeString("abc", "")+UnicodeString("def", "")+UnicodeString("ghi", "");
	182	if(s!=UnicodeString("abcdefghi", "")) {
	183	errln("operator+(UniStr, UniStr) failed");
	184	}
	185	}
	186
	187	{
	188	// tests for Jitterbug 2360
	189	// verify that APIs with source pointer + length accept length == -1
	190	// mostly test only where modified, only few functions did not already do this
	191	if(UnicodeString("abc", -1, "")!=UnicodeString("abc", "")) {
	192	errln("UnicodeString(codepageData, dataLength, codepage) does not work with dataLength==-1");
	193	}
	194
	195	UChar buffer[10]={ 0x61, 0x62, 0x20ac, 0xd900, 0xdc05, 0, 0x62, 0xffff, 0xdbff, 0xdfff };
	196	UnicodeString s, t(buffer, -1, LENGTHOF(buffer));
	197
	198	if(s.setTo(buffer, -1, LENGTHOF(buffer)).length()!=u_strlen(buffer)) {
	199	errln("UnicodeString.setTo(buffer, length, capacity) does not work with length==-1");
	200	}
	201	if(t.length()!=u_strlen(buffer)) {
	202	errln("UnicodeString(buffer, length, capacity) does not work with length==-1");
	203	}
	204
	205	if(0!=s.caseCompare(buffer, -1, U_FOLD_CASE_DEFAULT)) {
	206	errln("UnicodeString.caseCompare(const UChar *, length, options) does not work with length==-1");
	207	}
	208	if(0!=s.caseCompare(0, s.length(), buffer, U_FOLD_CASE_DEFAULT)) {
	209	errln("UnicodeString.caseCompare(start, _length, const UChar *, options) does not work");
	210	}
	211
	212	buffer[u_strlen(buffer)]=0xe4;
	213	UnicodeString u(buffer, -1, LENGTHOF(buffer));
	214	if(s.setTo(buffer, -1, LENGTHOF(buffer)).length()!=LENGTHOF(buffer)) {
	215	errln("UnicodeString.setTo(buffer without NUL, length, capacity) does not work with length==-1");
	216	}
	217	if(u.length()!=LENGTHOF(buffer)) {
	218	errln("UnicodeString(buffer without NUL, length, capacity) does not work with length==-1");
	219	}
	220
	221	static const char cs[]={ 0x61, (char)0xe4, (char)0x85, 0 };
	222	UConverter *cnv;
	223	UErrorCode errorCode=U_ZERO_ERROR;
	224
	225	cnv=ucnv_open("ISO-8859-1", &errorCode);
	226	UnicodeString v(cs, -1, cnv, errorCode);
	227	ucnv_close(cnv);
	228	if(v!=CharsToUnicodeString("a\\xe4\\x85")) {
	229	errln("UnicodeString(const char *, length, cnv, errorCode) does not work with length==-1");
	230	}
	231	}
	232	}
	233
	234	void
	235	UnicodeStringTest::TestCompare()
	236	{
	237	UnicodeString test1("this is a test");
	238	UnicodeString test2("this is a test");
	239	UnicodeString test3("this is a test of the emergency broadcast system");
	240	UnicodeString test4("never say, \"this is a test\"!!");
	241
	242	UnicodeString test5((UChar)0x5000);
	243	UnicodeString test6((UChar)0x5100);
	244
	245	UChar uniChars[] = { 0x74, 0x68, 0x69, 0x73, 0x20, 0x69, 0x73,
	246	0x20, 0x61, 0x20, 0x74, 0x65, 0x73, 0x74, 0 };
	247	char chars[] = "this is a test";
	248
	249	// test operator== and operator!=
	250	if (test1 != test2 \|\| test1 == test3 \|\| test1 == test4)
	251	errln("operator== or operator!= failed");
	252
	253	// test operator> and operator<
	254	if (test1 > test2 \|\| test1 < test2 \|\| !(test1 < test3) \|\| !(test1 > test4) \|\|
	255	!(test5 < test6)
	256	) {
	257	errln("operator> or operator< failed");
	258	}
	259
	260	// test operator>= and operator<=
	261	if (!(test1 >= test2) \|\| !(test1 <= test2) \|\| !(test1 <= test3) \|\| !(test1 >= test4))
	262	errln("operator>= or operator<= failed");
	263
	264	// test compare(UnicodeString)
	265	if (test1.compare(test2) != 0 \|\| test1.compare(test3) >= 0 \|\| test1.compare(test4) <= 0)
	266	errln("compare(UnicodeString) failed");
	267
	268	//test compare(offset, length, UnicodeString)
	269	if(test1.compare(0, 14, test2) != 0 \|\|
	270	test3.compare(0, 14, test2) != 0 \|\|
	271	test4.compare(12, 14, test2) != 0 \|\|
	272	test3.compare(0, 18, test1) <=0 )
	273	errln("compare(offset, length, UnicodeString) failes");
	274
	275	// test compare(UChar*)
	276	if (test2.compare(uniChars) != 0 \|\| test3.compare(uniChars) <= 0 \|\| test4.compare(uniChars) >= 0)
	277	errln("compare(UChar*) failed");
	278
	279	// test compare(char*)
	280	if (test2.compare(chars) != 0 \|\| test3.compare(chars) <= 0 \|\| test4.compare(chars) >= 0)
	281	errln("compare(char*) failed");
	282
	283	// test compare(UChar*, length)
	284	if (test1.compare(uniChars, 4) <= 0 \|\| test1.compare(uniChars, 4) <= 0)
	285	errln("compare(UChar*, length) failed");
	286
	287	// test compare(thisOffset, thisLength, that, thatOffset, thatLength)
	288	if (test1.compare(0, 14, test2, 0, 14) != 0
	289	\|\| test1.compare(0, 14, test3, 0, 14) != 0
	290	\|\| test1.compare(0, 14, test4, 12, 14) != 0)
	291	errln("1. compare(thisOffset, thisLength, that, thatOffset, thatLength) failed");
	292
	293	if (test1.compare(10, 4, test2, 0, 4) >= 0
	294	\|\| test1.compare(10, 4, test3, 22, 9) <= 0
	295	\|\| test1.compare(10, 4, test4, 22, 4) != 0)
	296	errln("2. compare(thisOffset, thisLength, that, thatOffset, thatLength) failed");
	297
	298	// test compareBetween
	299	if (test1.compareBetween(0, 14, test2, 0, 14) != 0 \|\| test1.compareBetween(0, 14, test3, 0, 14) != 0
	300	\|\| test1.compareBetween(0, 14, test4, 12, 26) != 0)
	301	errln("compareBetween failed");
	302
	303	if (test1.compareBetween(10, 14, test2, 0, 4) >= 0 \|\| test1.compareBetween(10, 14, test3, 22, 31) <= 0
	304	\|\| test1.compareBetween(10, 14, test4, 22, 26) != 0)
	305	errln("compareBetween failed");
	306
	307	// test compare() etc. with strings that share a buffer but are not equal
	308	test2=test1; // share the buffer, length() too large for the stackBuffer
	309	test2.truncate(1); // change only the length, not the buffer
	310	if( test1==test2 \|\| test1<=test2 \|\|
	311	test1.compare(test2)<=0 \|\|
	312	test1.compareCodePointOrder(test2)<=0 \|\|
	313	test1.compareCodePointOrder(0, INT32_MAX, test2)<=0 \|\|
	314	test1.compareCodePointOrder(0, INT32_MAX, test2, 0, INT32_MAX)<=0 \|\|
	315	test1.compareCodePointOrderBetween(0, INT32_MAX, test2, 0, INT32_MAX)<=0 \|\|
	316	test1.caseCompare(test2, U_FOLD_CASE_DEFAULT)<=0
	317	) {
	318	errln("UnicodeStrings that share a buffer but have different lengths compare as equal");
	319	}
	320
	321	/* test compareCodePointOrder() */
	322	{
	323	/* these strings are in ascending order */
	324	static const UChar strings[][4]={
	325	{ 0x61, 0 }, /* U+0061 */
	326	{ 0x20ac, 0xd801, 0 }, /* U+20ac U+d801 */
	327	{ 0x20ac, 0xd800, 0xdc00, 0 }, /* U+20ac U+10000 */
	328	{ 0xd800, 0 }, /* U+d800 */
	329	{ 0xd800, 0xff61, 0 }, /* U+d800 U+ff61 */
	330	{ 0xdfff, 0 }, /* U+dfff */
	331	{ 0xff61, 0xdfff, 0 }, /* U+ff61 U+dfff */
	332	{ 0xff61, 0xd800, 0xdc02, 0 }, /* U+ff61 U+10002 */
	333	{ 0xd800, 0xdc02, 0 }, /* U+10002 */
	334	{ 0xd84d, 0xdc56, 0 } /* U+23456 */
	335	};
	336	UnicodeString u[20]; // must be at least as long as strings[]
	337	int32_t i;
	338
	339	for(i=0; i<(int32_t)(sizeof(strings)/sizeof(strings[0])); ++i) {
	340	u[i]=UnicodeString(TRUE, strings[i], -1);
	341	}
	342
	343	for(i=0; i<(int32_t)(sizeof(strings)/sizeof(strings[0])-1); ++i) {
	344	if(u[i].compareCodePointOrder(u[i+1])>=0 \|\| u[i].compareCodePointOrder(0, INT32_MAX, u[i+1].getBuffer())>=0) {
	345	errln("error: UnicodeString::compareCodePointOrder() fails for string %d and the following one\n", i);
	346	}
	347	}
	348	}
	349
	350	/* test caseCompare() */
	351	{
	352	static const UChar
	353	_mixed[]= { 0x61, 0x42, 0x131, 0x3a3, 0xdf, 0x130, 0x49, 0xfb03, 0xd93f, 0xdfff, 0 },
	354	_otherDefault[]= { 0x41, 0x62, 0x131, 0x3c3, 0x73, 0x53, 0x69, 0x307, 0x69, 0x46, 0x66, 0x49, 0xd93f, 0xdfff, 0 },
	355	_otherExcludeSpecialI[]={ 0x41, 0x62, 0x131, 0x3c3, 0x53, 0x73, 0x69, 0x131, 0x66, 0x46, 0x69, 0xd93f, 0xdfff, 0 },
	356	_different[]= { 0x41, 0x62, 0x131, 0x3c3, 0x73, 0x53, 0x130, 0x49, 0x46, 0x66, 0x49, 0xd93f, 0xdffd, 0 };
	357
	358	UnicodeString
	359	mixed(TRUE, _mixed, -1),
	360	otherDefault(TRUE, _otherDefault, -1),
	361	otherExcludeSpecialI(TRUE, _otherExcludeSpecialI, -1),
	362	different(TRUE, _different, -1);
	363
	364	int8_t result;
	365
	366	/* test caseCompare() */
	367	result=mixed.caseCompare(otherDefault, U_FOLD_CASE_DEFAULT);
	368	if(result!=0 \|\| 0!=mixed.caseCompareBetween(0, INT32_MAX, otherDefault, 0, INT32_MAX, U_FOLD_CASE_DEFAULT)) {
	369	errln("error: mixed.caseCompare(other, default)=%ld instead of 0\n", result);
	370	}
	371	result=mixed.caseCompare(otherExcludeSpecialI, U_FOLD_CASE_EXCLUDE_SPECIAL_I);
	372	if(result!=0) {
	373	errln("error: mixed.caseCompare(otherExcludeSpecialI, U_FOLD_CASE_EXCLUDE_SPECIAL_I)=%ld instead of 0\n", result);
	374	}
	375	result=mixed.caseCompare(otherDefault, U_FOLD_CASE_EXCLUDE_SPECIAL_I);
	376	if(result==0 \|\| 0==mixed.caseCompareBetween(0, INT32_MAX, otherDefault, 0, INT32_MAX, U_FOLD_CASE_EXCLUDE_SPECIAL_I)) {
	377	errln("error: mixed.caseCompare(other, U_FOLD_CASE_EXCLUDE_SPECIAL_I)=0 instead of !=0\n");
	378	}
	379
	380	/* test caseCompare() */
	381	result=mixed.caseCompare(different, U_FOLD_CASE_DEFAULT);
	382	if(result<=0) {
	383	errln("error: mixed.caseCompare(different, default)=%ld instead of positive\n", result);
	384	}
	385
	386	/* test caseCompare() - include the folded sharp s (U+00df) with different lengths */
	387	result=mixed.caseCompare(1, 4, different, 1, 5, U_FOLD_CASE_DEFAULT);
	388	if(result!=0 \|\| 0!=mixed.caseCompareBetween(1, 5, different, 1, 6, U_FOLD_CASE_DEFAULT)) {
	389	errln("error: mixed.caseCompare(mixed, 1, 4, different, 1, 5, default)=%ld instead of 0\n", result);
	390	}
	391
	392	/* test caseCompare() - stop in the middle of the sharp s (U+00df) */
	393	result=mixed.caseCompare(1, 4, different, 1, 4, U_FOLD_CASE_DEFAULT);
	394	if(result<=0) {
	395	errln("error: mixed.caseCompare(1, 4, different, 1, 4, default)=%ld instead of positive\n", result);
	396	}
	397	}
	398
	399	// test that srcLength=-1 is handled in functions that
	400	// take input const UChar */int32_t srcLength (j785)
	401	{
	402	static const UChar u[]={ 0x61, 0x308, 0x62, 0 };
	403	UnicodeString s=UNICODE_STRING("a\\u0308b", 8).unescape();
	404
	405	if(s.compare(u, -1)!=0 \|\| s.compare(0, 999, u, 0, -1)!=0) {
	406	errln("error UnicodeString::compare(..., const UChar *, srcLength=-1) does not work");
	407	}
	408
	409	if(s.compareCodePointOrder(u, -1)!=0 \|\| s.compareCodePointOrder(0, 999, u, 0, -1)!=0) {
	410	errln("error UnicodeString::compareCodePointOrder(..., const UChar *, srcLength=-1, ...) does not work");
	411	}
	412
	413	if(s.caseCompare(u, -1, U_FOLD_CASE_DEFAULT)!=0 \|\| s.caseCompare(0, 999, u, 0, -1, U_FOLD_CASE_DEFAULT)!=0) {
	414	errln("error UnicodeString::caseCompare(..., const UChar *, srcLength=-1, ...) does not work");
	415	}
	416
	417	if(s.indexOf(u, 1, -1, 0, 999)!=1 \|\| s.indexOf(u+1, -1, 0, 999)!=1 \|\| s.indexOf(u+1, -1, 0)!=1) {
	418	errln("error UnicodeString::indexOf(const UChar *, srcLength=-1, ...) does not work");
	419	}
	420
	421	if(s.lastIndexOf(u, 1, -1, 0, 999)!=1 \|\| s.lastIndexOf(u+1, -1, 0, 999)!=1 \|\| s.lastIndexOf(u+1, -1, 0)!=1) {
	422	errln("error UnicodeString::lastIndexOf(const UChar *, srcLength=-1, ...) does not work");
	423	}
	424
	425	UnicodeString s2, s3;
	426	s2.replace(0, 0, u+1, -1);
	427	s3.replace(0, 0, u, 1, -1);
	428	if(s.compare(1, 999, s2)!=0 \|\| s2!=s3) {
	429	errln("error UnicodeString::replace(..., const UChar *, srcLength=-1, ...) does not work");
	430	}
	431	}
	432	}
	433
	434	void
	435	UnicodeStringTest::TestExtract()
	436	{
	437	UnicodeString test1("Now is the time for all good men to come to the aid of their country.", "");
	438	UnicodeString test2;
	439	UChar test3[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13};
	440	char test4[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13};
	441	UnicodeString test5;
	442	char test6[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13};
	443
	444	test1.extract(11, 12, test2);
	445	test1.extract(11, 12, test3);
	446	if (test1.extract(11, 12, test4) != 12 \|\| test4[12] != 0) {
	447	errln("UnicodeString.extract(char *) failed to return the correct size of destination buffer.");
	448	}
	449
	450	// test proper pinning in extractBetween()
	451	test1.extractBetween(-3, 7, test5);
	452	if(test5!=UNICODE_STRING("Now is ", 7)) {
	453	errln("UnicodeString.extractBetween(-3, 7) did not pin properly.");
	454	}
	455
	456	test1.extractBetween(11, 23, test5);
	457	if (test1.extract(60, 71, test6) != 9) {
	458	errln("UnicodeString.extract() failed to return the correct size of destination buffer for end of buffer.");
	459	}
	460	if (test1.extract(11, 12, test6) != 12) {
	461	errln("UnicodeString.extract() failed to return the correct size of destination buffer.");
	462	}
	463
	464	// convert test4 back to Unicode for comparison
	465	UnicodeString test4b(test4, 12);
	466
	467	if (test1.extract(11, 12, (char *)NULL) != 12) {
	468	errln("UnicodeString.extract(NULL) failed to return the correct size of destination buffer.");
	469	}
	470	if (test1.extract(11, -1, test6) != 0) {
	471	errln("UnicodeString.extract(-1) failed to stop reading the string.");
	472	}
	473
	474	for (int32_t i = 0; i < 12; i++) {
	475	if (test1.charAt((int32_t)(11 + i)) != test2.charAt(i)) {
	476	errln(UnicodeString("extracting into a UnicodeString failed at position ") + i);
	477	break;
	478	}
	479	if (test1.charAt((int32_t)(11 + i)) != test3[i]) {
	480	errln(UnicodeString("extracting into an array of UChar failed at position ") + i);
	481	break;
	482	}
	483	if (((char)test1.charAt((int32_t)(11 + i))) != test4b.charAt(i)) {
	484	errln(UnicodeString("extracting into an array of char failed at position ") + i);
	485	break;
	486	}
	487	if (test1.charAt((int32_t)(11 + i)) != test5.charAt(i)) {
	488	errln(UnicodeString("extracting with extractBetween failed at position ") + i);
	489	break;
	490	}
	491	}
	492
	493	// test preflighting and overflows with invariant conversion
	494	if (test1.extract(0, 10, (char *)NULL, "") != 10) {
	495	errln("UnicodeString.extract(0, 10, (char *)NULL, \"\") != 10");
	496	}
	497
	498	test4[2] = (char)0xff;
	499	if (test1.extract(0, 10, test4, 2, "") != 10) {
	500	errln("UnicodeString.extract(0, 10, test4, 2, \"\") != 10");
	501	}
	502	if (test4[2] != (char)0xff) {
	503	errln("UnicodeString.extract(0, 10, test4, 2, \"\") overwrote test4[2]");
	504	}
	505
	506	{
	507	// test new, NUL-terminating extract() function
	508	UnicodeString s("terminate", "");
	509	UChar dest[20]={
	510	0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5,
	511	0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5
	512	};
	513	UErrorCode errorCode;
	514	int32_t length;
	515
	516	errorCode=U_ZERO_ERROR;
	517	length=s.extract((UChar *)NULL, 0, errorCode);
	518	if(errorCode!=U_BUFFER_OVERFLOW_ERROR \|\| length!=s.length()) {
	519	errln("UnicodeString.extract(NULL, 0)==%d (%s) expected %d (U_BUFFER_OVERFLOW_ERROR)", length, s.length(), u_errorName(errorCode));
	520	}
	521
	522	errorCode=U_ZERO_ERROR;
	523	length=s.extract(dest, s.length()-1, errorCode);
	524	if(errorCode!=U_BUFFER_OVERFLOW_ERROR \|\| length!=s.length()) {
	525	errln("UnicodeString.extract(dest too short)==%d (%s) expected %d (U_BUFFER_OVERFLOW_ERROR)",
	526	length, u_errorName(errorCode), s.length());
	527	}
	528
	529	errorCode=U_ZERO_ERROR;
	530	length=s.extract(dest, s.length(), errorCode);
	531	if(errorCode!=U_STRING_NOT_TERMINATED_WARNING \|\| length!=s.length()) {
	532	errln("UnicodeString.extract(dest just right without NUL)==%d (%s) expected %d (U_STRING_NOT_TERMINATED_WARNING)",
	533	length, u_errorName(errorCode), s.length());
	534	}
	535	if(dest[length-1]!=s[length-1] \|\| dest[length]!=0xa5) {
	536	errln("UnicodeString.extract(dest just right without NUL) did not extract the string correctly");
	537	}
	538
	539	errorCode=U_ZERO_ERROR;
	540	length=s.extract(dest, s.length()+1, errorCode);
	541	if(errorCode!=U_ZERO_ERROR \|\| length!=s.length()) {
	542	errln("UnicodeString.extract(dest large enough)==%d (%s) expected %d (U_ZERO_ERROR)",
	543	length, u_errorName(errorCode), s.length());
	544	}
	545	if(dest[length-1]!=s[length-1] \|\| dest[length]!=0 \|\| dest[length+1]!=0xa5) {
	546	errln("UnicodeString.extract(dest large enough) did not extract the string correctly");
	547	}
	548	}
	549
	550	{
	551	// test new UConverter extract() and constructor
	552	UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape();
	553	char buffer[32];
	554	static const char expect[]={
	555	(char)0xf0, (char)0xaf, (char)0xa6, (char)0x99,
	556	(char)0xf0, (char)0x9d, (char)0x85, (char)0x9f,
	557	(char)0xc3, (char)0x84,
	558	(char)0xe1, (char)0xbb, (char)0x90
	559	};
	560	UErrorCode errorCode=U_ZERO_ERROR;
	561	UConverter *cnv=ucnv_open("UTF-8", &errorCode);
	562	int32_t length;
	563
	564	if(U_SUCCESS(errorCode)) {
	565	// test preflighting
	566	if( (length=s.extract(NULL, 0, cnv, errorCode))!=13 \|\|
	567	errorCode!=U_BUFFER_OVERFLOW_ERROR
	568	) {
	569	errln("UnicodeString::extract(NULL, UConverter) preflighting failed (length=%ld, %s)",
	570	length, u_errorName(errorCode));
	571	}
	572	errorCode=U_ZERO_ERROR;
	573	if( (length=s.extract(buffer, 2, cnv, errorCode))!=13 \|\|
	574	errorCode!=U_BUFFER_OVERFLOW_ERROR
	575	) {
	576	errln("UnicodeString::extract(too small, UConverter) preflighting failed (length=%ld, %s)",
	577	length, u_errorName(errorCode));
	578	}
	579
	580	// try error cases
	581	errorCode=U_ZERO_ERROR;
	582	if( s.extract(NULL, 2, cnv, errorCode)==13 \|\| U_SUCCESS(errorCode)) {
	583	errln("UnicodeString::extract(UConverter) succeeded with an illegal destination");
	584	}
	585	errorCode=U_ILLEGAL_ARGUMENT_ERROR;
	586	if( s.extract(NULL, 0, cnv, errorCode)==13 \|\| U_SUCCESS(errorCode)) {
	587	errln("UnicodeString::extract(UConverter) succeeded with a previous error code");
	588	}
	589	errorCode=U_ZERO_ERROR;
	590
	591	// extract for real
	592	if( (length=s.extract(buffer, sizeof(buffer), cnv, errorCode))!=13 \|\|
	593	uprv_memcmp(buffer, expect, 13)!=0 \|\|
	594	buffer[13]!=0 \|\|
	595	U_FAILURE(errorCode)
	596	) {
	597	errln("UnicodeString::extract(UConverter) conversion failed (length=%ld, %s)",
	598	length, u_errorName(errorCode));
	599	}
	600	// Test again with just the converter name.
	601	if( (length=s.extract(0, s.length(), buffer, sizeof(buffer), "UTF-8"))!=13 \|\|
	602	uprv_memcmp(buffer, expect, 13)!=0 \|\|
	603	buffer[13]!=0 \|\|
	604	U_FAILURE(errorCode)
	605	) {
	606	errln("UnicodeString::extract(\"UTF-8\") conversion failed (length=%ld, %s)",
	607	length, u_errorName(errorCode));
	608	}
	609
	610	// try the constructor
	611	UnicodeString t(expect, sizeof(expect), cnv, errorCode);
	612	if(U_FAILURE(errorCode) \|\| s!=t) {
	613	errln("UnicodeString(UConverter) conversion failed (%s)",
	614	u_errorName(errorCode));
	615	}
	616
	617	ucnv_close(cnv);
	618	}
	619	}
	620	}
	621
	622	void
	623	UnicodeStringTest::TestRemoveReplace()
	624	{
	625	UnicodeString test1("The rain in Spain stays mainly on the plain");
	626	UnicodeString test2("eat SPAMburgers!");
	627	UChar test3[] = { 0x53, 0x50, 0x41, 0x4d, 0x4d, 0 };
	628	char test4[] = "SPAM";
	629	UnicodeString& test5 = test1;
	630
	631	test1.replace(4, 4, test2, 4, 4);
	632	test1.replace(12, 5, test3, 4);
	633	test3[4] = 0;
	634	test1.replace(17, 4, test3);
	635	test1.replace(23, 4, test4);
	636	test1.replaceBetween(37, 42, test2, 4, 8);
	637
	638	if (test1 != "The SPAM in SPAM SPAMs SPAMly on the SPAM")
	639	errln("One of the replace methods failed:\n"
	640	" expected \"The SPAM in SPAM SPAMs SPAMly on the SPAM\",\n"
	641	" got \"" + test1 + "\"");
	642
	643	test1.remove(21, 1);
	644	test1.removeBetween(26, 28);
	645
	646	if (test1 != "The SPAM in SPAM SPAM SPAM on the SPAM")
	647	errln("One of the remove methods failed:\n"
	648	" expected \"The SPAM in SPAM SPAM SPAM on the SPAM\",\n"
	649	" got \"" + test1 + "\"");
	650
	651	for (int32_t i = 0; i < test1.length(); i++) {
	652	if (test5[i] != 0x53 && test5[i] != 0x50 && test5[i] != 0x41 && test5[i] != 0x4d && test5[i] != 0x20) {
	653	test1.setCharAt(i, 0x78);
	654	}
	655	}
	656
	657	if (test1 != "xxx SPAM xx SPAM SPAM SPAM xx xxx SPAM")
	658	errln("One of the remove methods failed:\n"
	659	" expected \"xxx SPAM xx SPAM SPAM SPAM xx xxx SPAM\",\n"
	660	" got \"" + test1 + "\"");
	661
	662	test1.remove();
	663	if (test1.length() != 0)
	664	errln("Remove() failed: expected empty string, got \"" + test1 + "\"");
	665	}
	666
	667	void
	668	UnicodeStringTest::TestSearching()
	669	{
	670	UnicodeString test1("test test ttest tetest testesteststt");
	671	UnicodeString test2("test");
	672	UChar testChar = 0x74;
	673
	674	UChar32 testChar32 = 0x20402;
	675	UChar testData[]={
	676	// 0 1 2 3 4 5 6 7
	677	0xd841, 0xdc02, 0x0071, 0xdc02, 0xd841, 0x0071, 0xd841, 0xdc02,
	678
	679	// 8 9 10 11 12 13 14 15
	680	0x0071, 0x0072, 0xd841, 0xdc02, 0x0071, 0xd841, 0xdc02, 0x0071,
	681
	682	// 16 17 18 19
	683	0xdc02, 0xd841, 0x0073, 0x0000
	684	};
	685	UnicodeString test3(testData);
	686	UnicodeString test4(testChar32);
	687
	688	uint16_t occurrences = 0;
	689	int32_t startPos = 0;
	690	for ( ;
	691	startPos != -1 && startPos < test1.length();
	692	(startPos = test1.indexOf(test2, startPos)) != -1 ? (++occurrences, startPos += 4) : 0)
	693	;
	694	if (occurrences != 6)
	695	errln("indexOf failed: expected to find 6 occurrences, found " + occurrences);
	696
	697	for ( occurrences = 0, startPos = 10;
	698	startPos != -1 && startPos < test1.length();
	699	(startPos = test1.indexOf(test2, startPos)) != -1 ? (++occurrences, startPos += 4) : 0)
	700	;
	701	if (occurrences != 4)
	702	errln("indexOf with starting offset failed: expected to find 4 occurrences, found " + occurrences);
	703
	704	int32_t endPos = 28;
	705	for ( occurrences = 0, startPos = 5;
	706	startPos != -1 && startPos < test1.length();
	707	(startPos = test1.indexOf(test2, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 4) : 0)
	708	;
	709	if (occurrences != 4)
	710	errln("indexOf with starting and ending offsets failed: expected to find 4 occurrences, found " + occurrences);
	711
	712	//using UChar32 string
	713	for ( startPos=0, occurrences=0;
	714	startPos != -1 && startPos < test3.length();
	715	(startPos = test3.indexOf(test4, startPos)) != -1 ? (++occurrences, startPos += 2) : 0)
	716	;
	717	if (occurrences != 4)
	718	errln((UnicodeString)"indexOf failed: expected to find 4 occurrences, found " + occurrences);
	719
	720	for ( startPos=10, occurrences=0;
	721	startPos != -1 && startPos < test3.length();
	722	(startPos = test3.indexOf(test4, startPos)) != -1 ? (++occurrences, startPos += 2) : 0)
	723	;
	724	if (occurrences != 2)
	725	errln("indexOf failed: expected to find 2 occurrences, found " + occurrences);
	726	//---
	727
	728	for ( occurrences = 0, startPos = 0;
	729	startPos != -1 && startPos < test1.length();
	730	(startPos = test1.indexOf(testChar, startPos)) != -1 ? (++occurrences, startPos += 1) : 0)
	731	;
	732	if (occurrences != 16)
	733	errln("indexOf with character failed: expected to find 16 occurrences, found " + occurrences);
	734
	735	for ( occurrences = 0, startPos = 10;
	736	startPos != -1 && startPos < test1.length();
	737	(startPos = test1.indexOf(testChar, startPos)) != -1 ? (++occurrences, startPos += 1) : 0)
	738	;
	739	if (occurrences != 12)
	740	errln("indexOf with character & start offset failed: expected to find 12 occurrences, found " + occurrences);
	741
	742	for ( occurrences = 0, startPos = 5, endPos = 28;
	743	startPos != -1 && startPos < test1.length();
	744	(startPos = test1.indexOf(testChar, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 1) : 0)
	745	;
	746	if (occurrences != 10)
	747	errln("indexOf with character & start & end offsets failed: expected to find 10 occurrences, found " + occurrences);
	748
	749	//testing for UChar32
	750	UnicodeString subString;
	751	for( occurrences =0, startPos=0; startPos < test3.length(); startPos +=1){
	752	subString.append(test3, startPos, test3.length());
	753	if(subString.indexOf(testChar32) != -1 ){
	754	++occurrences;
	755	}
	756	subString.remove();
	757	}
	758	if (occurrences != 14)
	759	errln((UnicodeString)"indexOf failed: expected to find 14 occurrences, found " + occurrences);
	760
	761	for ( occurrences = 0, startPos = 0;
	762	startPos != -1 && startPos < test3.length();
	763	(startPos = test3.indexOf(testChar32, startPos)) != -1 ? (++occurrences, startPos += 1) : 0)
	764	;
	765	if (occurrences != 4)
	766	errln((UnicodeString)"indexOf failed: expected to find 4 occurrences, found " + occurrences);
	767
	768	endPos=test3.length();
	769	for ( occurrences = 0, startPos = 5;
	770	startPos != -1 && startPos < test3.length();
	771	(startPos = test3.indexOf(testChar32, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 1) : 0)
	772	;
	773	if (occurrences != 3)
	774	errln((UnicodeString)"indexOf with character & start & end offsets failed: expected to find 2 occurrences, found " + occurrences);
	775	//---
	776
	777	if(test1.lastIndexOf(test2)!=29) {
	778	errln("test1.lastIndexOf(test2)!=29");
	779	}
	780
	781	if(test1.lastIndexOf(test2, 15)!=29 \|\| test1.lastIndexOf(test2, 29)!=29 \|\| test1.lastIndexOf(test2, 30)!=-1) {
	782	errln("test1.lastIndexOf(test2, start) failed");
	783	}
	784
	785	for ( occurrences = 0, startPos = 32;
	786	startPos != -1;
	787	(startPos = test1.lastIndexOf(test2, 5, startPos - 5)) != -1 ? ++occurrences : 0)
	788	;
	789	if (occurrences != 4)
	790	errln("lastIndexOf with starting and ending offsets failed: expected to find 4 occurrences, found " + occurrences);
	791
	792	for ( occurrences = 0, startPos = 32;
	793	startPos != -1;
	794	(startPos = test1.lastIndexOf(testChar, 5, startPos - 5)) != -1 ? ++occurrences : 0)
	795	;
	796	if (occurrences != 11)
	797	errln("lastIndexOf with character & start & end offsets failed: expected to find 11 occurrences, found " + occurrences);
	798
	799	//testing UChar32
	800	startPos=test3.length();
	801	for ( occurrences = 0;
	802	startPos != -1;
	803	(startPos = test3.lastIndexOf(testChar32, 5, startPos - 5)) != -1 ? ++occurrences : 0)
	804	;
	805	if (occurrences != 3)
	806	errln((UnicodeString)"lastIndexOf with character & start & end offsets failed: expected to find 3 occurrences, found " + occurrences);
	807
	808
	809	for ( occurrences = 0, endPos = test3.length(); endPos > 0; endPos -= 1){
	810	subString.remove();
	811	subString.append(test3, 0, endPos);
	812	if(subString.lastIndexOf(testChar32) != -1 ){
	813	++occurrences;
	814	}
	815	}
	816	if (occurrences != 18)
	817	errln((UnicodeString)"indexOf failed: expected to find 18 occurrences, found " + occurrences);
	818	//---
	819
	820	// test that indexOf(UChar32) and lastIndexOf(UChar32)
	821	// do not find surrogate code points when they are part of matched pairs
	822	// (= part of supplementary code points)
	823	// Jitterbug 1542
	824	if(test3.indexOf((UChar32)0xd841) != 4 \|\| test3.indexOf((UChar32)0xdc02) != 3) {
	825	errln("error: UnicodeString::indexOf(UChar32 surrogate) finds a partial supplementary code point");
	826	}
	827	if( UnicodeString(test3, 0, 17).lastIndexOf((UChar)0xd841, 0) != 4 \|\|
	828	UnicodeString(test3, 0, 17).lastIndexOf((UChar32)0xd841, 2) != 4 \|\|
	829	test3.lastIndexOf((UChar32)0xd841, 0, 17) != 4 \|\| test3.lastIndexOf((UChar32)0xdc02, 0, 17) != 16
	830	) {
	831	errln("error: UnicodeString::lastIndexOf(UChar32 surrogate) finds a partial supplementary code point");
	832	}
	833	}
	834
	835	void
	836	UnicodeStringTest::TestSpacePadding()
	837	{
	838	UnicodeString test1("hello");
	839	UnicodeString test2(" there");
	840	UnicodeString test3("Hi! How ya doin'? Beautiful day, isn't it?");
	841	UnicodeString test4;
	842	UBool returnVal;
	843	UnicodeString expectedValue;
	844
	845	returnVal = test1.padLeading(15);
	846	expectedValue = " hello";
	847	if (returnVal == FALSE \|\| test1 != expectedValue)
	848	errln("padLeading() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\".");
	849
	850	returnVal = test2.padTrailing(15);
	851	expectedValue = " there ";
	852	if (returnVal == FALSE \|\| test2 != expectedValue)
	853	errln("padTrailing() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\".");
	854
	855	expectedValue = test3;
	856	returnVal = test3.padTrailing(15);
	857	if (returnVal == TRUE \|\| test3 != expectedValue)
	858	errln("padTrailing() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\".");
	859
	860	expectedValue = "hello";
	861	test4.setTo(test1).trim();
	862
	863	if (test4 != expectedValue \|\| test1 == expectedValue \|\| test4 != expectedValue)
	864	errln("trim(UnicodeString&) failed");
	865
	866	test1.trim();
	867	if (test1 != expectedValue)
	868	errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\".");
	869
	870	test2.trim();
	871	expectedValue = "there";
	872	if (test2 != expectedValue)
	873	errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\".");
	874
	875	test3.trim();
	876	expectedValue = "Hi! How ya doin'? Beautiful day, isn't it?";
	877	if (test3 != expectedValue)
	878	errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\".");
	879
	880	returnVal = test1.truncate(15);
	881	expectedValue = "hello";
	882	if (returnVal == TRUE \|\| test1 != expectedValue)
	883	errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\".");
	884
	885	returnVal = test2.truncate(15);
	886	expectedValue = "there";
	887	if (returnVal == TRUE \|\| test2 != expectedValue)
	888	errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\".");
	889
	890	returnVal = test3.truncate(15);
	891	expectedValue = "Hi! How ya doi";
	892	if (returnVal == FALSE \|\| test3 != expectedValue)
	893	errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\".");
	894	}
	895
	896	void
	897	UnicodeStringTest::TestPrefixAndSuffix()
	898	{
	899	UnicodeString test1("Now is the time for all good men to come to the aid of their country.");
	900	UnicodeString test2("Now");
	901	UnicodeString test3("country.");
	902	UnicodeString test4("count");
	903
	904	if (!test1.startsWith(test2) \|\| !test1.startsWith(test2, 0, test2.length())) {
	905	errln("startsWith() failed: \"" + test2 + "\" should be a prefix of \"" + test1 + "\".");
	906	}
	907
	908	if (test1.startsWith(test3) \|\|
	909	test1.startsWith(test3.getBuffer(), test3.length()) \|\|
	910	test1.startsWith(test3.getTerminatedBuffer(), 0, -1)
	911	) {
	912	errln("startsWith() failed: \"" + test3 + "\" shouldn't be a prefix of \"" + test1 + "\".");
	913	}
	914
	915	if (test1.endsWith(test2)) {
	916	errln("endsWith() failed: \"" + test2 + "\" shouldn't be a suffix of \"" + test1 + "\".");
	917	}
	918
	919	if (!test1.endsWith(test3)) {
	920	errln("endsWith(test3) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\".");
	921	}
	922	if (!test1.endsWith(test3, 0, INT32_MAX)) {
	923	errln("endsWith(test3, 0, INT32_MAX) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\".");
	924	}
	925
	926	if(!test1.endsWith(test3.getBuffer(), test3.length())) {
	927	errln("endsWith(test3.getBuffer(), test3.length()) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\".");
	928	}
	929	if(!test1.endsWith(test3.getTerminatedBuffer(), 0, -1)) {
	930	errln("endsWith(test3.getTerminatedBuffer(), 0, -1) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\".");
	931	}
	932
	933	if (!test3.startsWith(test4)) {
	934	errln("endsWith(test4) failed: \"" + test4 + "\" should be a prefix of \"" + test3 + "\".");
	935	}
	936
	937	if (test4.startsWith(test3)) {
	938	errln("startsWith(test3) failed: \"" + test3 + "\" shouldn't be a prefix of \"" + test4 + "\".");
	939	}
	940	}
	941
	942	void
	943	UnicodeStringTest::TestFindAndReplace()
	944	{
	945	UnicodeString test1("One potato, two potato, three potato, four\n");
	946	UnicodeString test2("potato");
	947	UnicodeString test3("MISSISSIPPI");
	948
	949	UnicodeString expectedValue;
	950
	951	test1.findAndReplace(test2, test3);
	952	expectedValue = "One MISSISSIPPI, two MISSISSIPPI, three MISSISSIPPI, four\n";
	953	if (test1 != expectedValue)
	954	errln("findAndReplace failed: expected \"" + expectedValue + "\", got \"" + test1 + "\".");
	955	test1.findAndReplace(2, 32, test3, test2);
	956	expectedValue = "One potato, two potato, three MISSISSIPPI, four\n";
	957	if (test1 != expectedValue)
	958	errln("findAndReplace failed: expected \"" + expectedValue + "\", got \"" + test1 + "\".");
	959	}
	960
	961	void
	962	UnicodeStringTest::TestReverse()
	963	{
	964	UnicodeString test("backwards words say to used I");
	965
	966	test.reverse();
	967	test.reverse(2, 4);
	968	test.reverse(7, 2);
	969	test.reverse(10, 3);
	970	test.reverse(14, 5);
	971	test.reverse(20, 9);
	972
	973	if (test != "I used to say words backwards")
	974	errln("reverse() failed: Expected \"I used to say words backwards\",\n got \""
	975	+ test + "\"");
	976
	977	test=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape();
	978	test.reverse();
	979	if(test.char32At(0)!=0x1ed0 \|\| test.char32At(1)!=0xc4 \|\| test.char32At(2)!=0x1d15f \|\| test.char32At(4)!=0x2f999) {
	980	errln("reverse() failed with supplementary characters");
	981	}
	982	}
	983
	984	void
	985	UnicodeStringTest::TestMiscellaneous()
	986	{
	987	UnicodeString test1("This is a test");
	988	UnicodeString test2("This is a test");
	989	UnicodeString test3("Me too!");
	990
	991	// test getBuffer(minCapacity) and releaseBuffer()
	992	test1=UnicodeString(); // make sure that it starts with its stackBuffer
	993	UChar *p=test1.getBuffer(20);
	994	if(test1.getCapacity()<20) {
	995	errln("UnicodeString::getBuffer(20).getCapacity()<20");
	996	}
	997
	998	test1.append((UChar)7); // must not be able to modify the string here
	999	test1.setCharAt(3, 7);
	1000	test1.reverse();
	1001	if( test1.length()!=0 \|\|
	1002	test1.charAt(0)!=0xffff \|\| test1.charAt(3)!=0xffff \|\|
	1003	test1.getBuffer(10)!=0 \|\| test1.getBuffer()!=0
	1004	) {
	1005	errln("UnicodeString::getBuffer(minCapacity) allows read or write access to the UnicodeString");
	1006	}
	1007
	1008	p[0]=1;
	1009	p[1]=2;
	1010	p[2]=3;
	1011	test1.releaseBuffer(3);
	1012	test1.append((UChar)4);
	1013
	1014	if(test1.length()!=4 \|\| test1.charAt(0)!=1 \|\| test1.charAt(1)!=2 \|\| test1.charAt(2)!=3 \|\| test1.charAt(3)!=4) {
	1015	errln("UnicodeString::releaseBuffer(newLength) does not properly reallow access to the UnicodeString");
	1016	}
	1017
	1018	// test releaseBuffer() without getBuffer(minCapacity) - must not have any effect
	1019	test1.releaseBuffer(1);
	1020	if(test1.length()!=4 \|\| test1.charAt(0)!=1 \|\| test1.charAt(1)!=2 \|\| test1.charAt(2)!=3 \|\| test1.charAt(3)!=4) {
	1021	errln("UnicodeString::releaseBuffer(newLength) without getBuffer(minCapacity) changed the UnicodeString");
	1022	}
	1023
	1024	// test getBuffer(const)
	1025	const UChar q=test1.getBuffer(), r=test1.getBuffer();
	1026	if( test1.length()!=4 \|\|
	1027	q[0]!=1 \|\| q[1]!=2 \|\| q[2]!=3 \|\| q[3]!=4 \|\|
	1028	r[0]!=1 \|\| r[1]!=2 \|\| r[2]!=3 \|\| r[3]!=4
	1029	) {
	1030	errln("UnicodeString::getBuffer(const) does not return a usable buffer pointer");
	1031	}
	1032
	1033	// test releaseBuffer() with a NUL-terminated buffer
	1034	test1.getBuffer(20)[2]=0;
	1035	test1.releaseBuffer(); // implicit -1
	1036	if(test1.length()!=2 \|\| test1.charAt(0)!=1 \|\| test1.charAt(1) !=2) {
	1037	errln("UnicodeString::releaseBuffer(-1) does not properly set the length of the UnicodeString");
	1038	}
	1039
	1040	// test releaseBuffer() with a non-NUL-terminated buffer
	1041	p=test1.getBuffer(256);
	1042	for(int32_t i=0; i<test1.getCapacity(); ++i) {
	1043	p[i]=(UChar)1; // fill the buffer with all non-NUL code units
	1044	}
	1045	test1.releaseBuffer(); // implicit -1
	1046	if(test1.length()!=test1.getCapacity() \|\| test1.charAt(1)!=1 \|\| test1.charAt(100)!=1 \|\| test1.charAt(test1.getCapacity()-1)!=1) {
	1047	errln("UnicodeString::releaseBuffer(-1 but no NUL) does not properly set the length of the UnicodeString");
	1048	}
	1049
	1050	// test getTerminatedBuffer()
	1051	test1=UnicodeString("This is another test.", "");
	1052	test2=UnicodeString("This is another test.", "");
	1053	q=test1.getTerminatedBuffer();
	1054	if(q[test1.length()]!=0 \|\| test1!=test2 \|\| test2.compare(q, -1)!=0) {
	1055	errln("getTerminatedBuffer()[length]!=0");
	1056	}
	1057
	1058	const UChar u[]={ 5, 6, 7, 8, 0 };
	1059	test1.setTo(FALSE, u, 3);
	1060	q=test1.getTerminatedBuffer();
	1061	if(q==u \|\| q[0]!=5 \|\| q[1]!=6 \|\| q[2]!=7 \|\| q[3]!=0) {
	1062	errln("UnicodeString(u[3]).getTerminatedBuffer() returns a bad buffer");
	1063	}
	1064
	1065	test1.setTo(TRUE, u, -1);
	1066	q=test1.getTerminatedBuffer();
	1067	if(q!=u \|\| test1.length()!=4 \|\| q[3]!=8 \|\| q[4]!=0) {
	1068	errln("UnicodeString(u[-1]).getTerminatedBuffer() returns a bad buffer");
	1069	}
	1070
	1071	test1=UNICODE_STRING("la", 2);
	1072	test1.append(UNICODE_STRING(" lila", 5).getTerminatedBuffer(), 0, -1);
	1073	if(test1!=UNICODE_STRING("la lila", 7)) {
	1074	errln("UnicodeString::append(const UChar *, start, length) failed");
	1075	}
	1076
	1077	test1.insert(3, UNICODE_STRING("dudum ", 6), 0, INT32_MAX);
	1078	if(test1!=UNICODE_STRING("la dudum lila", 13)) {
	1079	errln("UnicodeString::insert(start, const UniStr &, start, length) failed");
	1080	}
	1081
	1082	static const UChar ucs[]={ 0x68, 0x6d, 0x20, 0 };
	1083	test1.insert(9, ucs, -1);
	1084	if(test1!=UNICODE_STRING("la dudum hm lila", 16)) {
	1085	errln("UnicodeString::insert(start, const UChar *, length) failed");
	1086	}
	1087
	1088	test1.replace(9, 2, (UChar)0x2b);
	1089	if(test1!=UNICODE_STRING("la dudum + lila", 15)) {
	1090	errln("UnicodeString::replace(start, length, UChar) failed");
	1091	}
	1092
	1093	if(test1.hasMetaData() \|\| UnicodeString().hasMetaData()) {
	1094	errln("UnicodeString::hasMetaData() returns TRUE");
	1095	}
	1096	}
	1097
	1098	void
	1099	UnicodeStringTest::TestStackAllocation()
	1100	{
	1101	UChar testString[] ={
	1102	0x54, 0x68, 0x69, 0x73, 0x20, 0x69, 0x73, 0x20, 0x61, 0x20, 0x63, 0x72, 0x61, 0x7a, 0x79, 0x20, 0x74, 0x65, 0x73, 0x74, 0x2e, 0 };
	1103	UChar guardWord = 0x4DED;
	1104	UnicodeString* test = 0;
	1105
	1106	test = new UnicodeString(testString);
	1107	if (*test != "This is a crazy test.")
	1108	errln("Test string failed to initialize properly.");
	1109	if (guardWord != 0x04DED)
	1110	errln("Test string initialization overwrote guard word!");
	1111
	1112	test->insert(8, "only ");
	1113	test->remove(15, 6);
	1114	if (*test != "This is only a test.")
	1115	errln("Manipulation of test string failed to work right.");
	1116	if (guardWord != 0x4DED)
	1117	errln("Manipulation of test string overwrote guard word!");
	1118
	1119	// we have to deinitialize and release the backing store by calling the destructor
	1120	// explicitly, since we can't overload operator delete
	1121	delete test;
	1122
	1123	UChar workingBuffer[] = {
	1124	0x4e, 0x6f, 0x77, 0x20, 0x69, 0x73, 0x20, 0x74, 0x68, 0x65, 0x20, 0x74, 0x69, 0x6d, 0x65, 0x20,
	1125	0x66, 0x6f, 0x72, 0x20, 0x61, 0x6c, 0x6c, 0x20, 0x6d, 0x65, 0x6e, 0x20, 0x74, 0x6f, 0x20,
	1126	0x63, 0x6f, 0x6d, 0x65, 0xffff, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
	1127	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
	1128	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 };
	1129	UChar guardWord2 = 0x4DED;
	1130
	1131	test = new UnicodeString(workingBuffer, 35, 100);
	1132	if (*test != "Now is the time for all men to come")
	1133	errln("Stack-allocated backing store failed to initialize correctly.");
	1134	if (guardWord2 != 0x4DED)
	1135	errln("Stack-allocated backing store overwrote guard word!");
	1136
	1137	test->insert(24, "good ");
	1138	if (*test != "Now is the time for all good men to come")
	1139	errln("insert() on stack-allocated UnicodeString didn't work right");
	1140	if (guardWord2 != 0x4DED)
	1141	errln("insert() on stack-allocated UnicodeString overwrote guard word!");
	1142
	1143	if (workingBuffer[24] != 0x67)
	1144	errln("insert() on stack-allocated UnicodeString didn't affect backing store");
	1145
	1146	*test += " to the aid of their country.";
	1147	if (*test != "Now is the time for all good men to come to the aid of their country.")
	1148	errln("Stack-allocated UnicodeString overflow didn't work");
	1149	if (guardWord2 != 0x4DED)
	1150	errln("Stack-allocated UnicodeString overflow overwrote guard word!");
	1151
	1152	*test = "ha!";
	1153	if (*test != "ha!")
	1154	errln("Assignment to stack-allocated UnicodeString didn't work");
	1155	if (workingBuffer[0] != 0x4e)
	1156	errln("Change to UnicodeString after overflow are still affecting original buffer");
	1157	if (guardWord2 != 0x4DED)
	1158	errln("Change to UnicodeString after overflow overwrote guard word!");
	1159
	1160	// test read-only aliasing with setTo()
	1161	workingBuffer[0] = 0x20ac;
	1162	workingBuffer[1] = 0x125;
	1163	workingBuffer[2] = 0;
	1164	test->setTo(TRUE, workingBuffer, 2);
	1165	if(test->length() != 2 \|\| test->charAt(0) != 0x20ac \|\| test->charAt(1) != 0x125) {
	1166	errln("UnicodeString.setTo(readonly alias) does not alias correctly");
	1167	}
	1168
	1169	UnicodeString c=(UnicodeString )test->clone();
	1170
	1171	workingBuffer[1] = 0x109;
	1172	if(test->charAt(1) != 0x109) {
	1173	errln("UnicodeString.setTo(readonly alias) made a copy: did not see change in buffer");
	1174	}
	1175
	1176	if(c->length() != 2 \|\| c->charAt(1) != 0x125) {
	1177	errln("clone(alias) did not copy the buffer");
	1178	}
	1179	delete c;
	1180
	1181	test->setTo(TRUE, workingBuffer, -1);
	1182	if(test->length() != 2 \|\| test->charAt(0) != 0x20ac \|\| test->charAt(1) != 0x109) {
	1183	errln("UnicodeString.setTo(readonly alias, length -1) does not alias correctly");
	1184	}
	1185
	1186	test->setTo(FALSE, workingBuffer, -1);
	1187	if(!test->isBogus()) {
	1188	errln("UnicodeString.setTo(unterminated readonly alias, length -1) does not result in isBogus()");
	1189	}
	1190
	1191	delete test;
	1192
	1193	test=new UnicodeString();
	1194	UChar buffer[]={0x0061, 0x0062, 0x20ac, 0x0043, 0x0042, 0x0000};
	1195	test->setTo(buffer, 4, 10);
	1196	if(test->length() !=4 \|\| test->charAt(0) != 0x0061 \|\| test->charAt(1) != 0x0062 \|\|
	1197	test->charAt(2) != 0x20ac \|\| test->charAt(3) != 0x0043){
	1198	errln((UnicodeString)"UnicodeString.setTo(UChar, length, capacity) does not work correctly\n" + prettify(test));
	1199	}
	1200	delete test;
	1201
	1202
	1203	// test the UChar32 constructor
	1204	UnicodeString c32Test((UChar32)0x10ff2a);
	1205	if( c32Test.length() != UTF_CHAR_LENGTH(0x10ff2a) \|\|
	1206	c32Test.char32At(c32Test.length() - 1) != 0x10ff2a
	1207	) {
	1208	errln("The UnicodeString(UChar32) constructor does not work with a 0x10ff2a filler");
	1209	}
	1210
	1211	// test the (new) capacity constructor
	1212	UnicodeString capTest(5, (UChar32)0x2a, 5);
	1213	if( capTest.length() != 5 * UTF_CHAR_LENGTH(0x2a) \|\|
	1214	capTest.char32At(0) != 0x2a \|\|
	1215	capTest.char32At(4) != 0x2a
	1216	) {
	1217	errln("The UnicodeString capacity constructor does not work with an ASCII filler");
	1218	}
	1219
	1220	capTest = UnicodeString(5, (UChar32)0x10ff2a, 5);
	1221	if( capTest.length() != 5 * UTF_CHAR_LENGTH(0x10ff2a) \|\|
	1222	capTest.char32At(0) != 0x10ff2a \|\|
	1223	capTest.char32At(4) != 0x10ff2a
	1224	) {
	1225	errln("The UnicodeString capacity constructor does not work with a 0x10ff2a filler");
	1226	}
	1227
	1228	capTest = UnicodeString(5, (UChar32)0, 0);
	1229	if(capTest.length() != 0) {
	1230	errln("The UnicodeString capacity constructor does not work with a 0x10ff2a filler");
	1231	}
	1232	}
	1233
	1234	/**
	1235	* Test the unescape() function.
	1236	*/
	1237	void UnicodeStringTest::TestUnescape(void) {
	1238	UnicodeString IN("abc\\u4567 \\n\\r \\U00101234xyz\\x1\\x{5289}\\x1b", -1, US_INV);
	1239	UnicodeString OUT("abc");
	1240	OUT.append((UChar)0x4567);
	1241	OUT.append(" ");
	1242	OUT.append((UChar)0xA);
	1243	OUT.append((UChar)0xD);
	1244	OUT.append(" ");
	1245	OUT.append((UChar32)0x00101234);
	1246	OUT.append("xyz");
	1247	OUT.append((UChar32)1).append((UChar32)0x5289).append((UChar)0x1b);
	1248	UnicodeString result = IN.unescape();
	1249	if (result != OUT) {
	1250	errln("FAIL: " + prettify(IN) + ".unescape() -> " +
	1251	prettify(result) + ", expected " +
	1252	prettify(OUT));
	1253	}
	1254
	1255	// test that an empty string is returned in case of an error
	1256	if (!UNICODE_STRING("wrong \\u sequence", 17).unescape().isEmpty()) {
	1257	errln("FAIL: unescaping of a string with an illegal escape sequence did not return an empty string");
	1258	}
	1259	}
	1260
	1261	/* test code point counting functions --------------------------------------- */
	1262
	1263	/* reference implementation of UnicodeString::hasMoreChar32Than() */
	1264	static int32_t
	1265	_refUnicodeStringHasMoreChar32Than(const UnicodeString &s, int32_t start, int32_t length, int32_t number) {
	1266	int32_t count=s.countChar32(start, length);
	1267	return count>number;
	1268	}
	1269
	1270	/* compare the real function against the reference */
	1271	void
	1272	UnicodeStringTest::_testUnicodeStringHasMoreChar32Than(const UnicodeString &s, int32_t start, int32_t length, int32_t number) {
	1273	if(s.hasMoreChar32Than(start, length, number)!=_refUnicodeStringHasMoreChar32Than(s, start, length, number)) {
	1274	errln("hasMoreChar32Than(%d, %d, %d)=%hd is wrong\n",
	1275	start, length, number, s.hasMoreChar32Than(start, length, number));
	1276	}
	1277	}
	1278
	1279	void
	1280	UnicodeStringTest::TestCountChar32(void) {
	1281	{
	1282	UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape();
	1283
	1284	// test countChar32()
	1285	// note that this also calls and tests u_countChar32(length>=0)
	1286	if(
	1287	s.countChar32()!=4 \|\|
	1288	s.countChar32(1)!=4 \|\|
	1289	s.countChar32(2)!=3 \|\|
	1290	s.countChar32(2, 3)!=2 \|\|
	1291	s.countChar32(2, 0)!=0
	1292	) {
	1293	errln("UnicodeString::countChar32() failed");
	1294	}
	1295
	1296	// NUL-terminate the string buffer and test u_countChar32(length=-1)
	1297	const UChar *buffer=s.getTerminatedBuffer();
	1298	if(
	1299	u_countChar32(buffer, -1)!=4 \|\|
	1300	u_countChar32(buffer+1, -1)!=4 \|\|
	1301	u_countChar32(buffer+2, -1)!=3 \|\|
	1302	u_countChar32(buffer+3, -1)!=3 \|\|
	1303	u_countChar32(buffer+4, -1)!=2 \|\|
	1304	u_countChar32(buffer+5, -1)!=1 \|\|
	1305	u_countChar32(buffer+6, -1)!=0
	1306	) {
	1307	errln("u_countChar32(length=-1) failed");
	1308	}
	1309
	1310	// test u_countChar32() with bad input
	1311	if(u_countChar32(NULL, 5)!=0 \|\| u_countChar32(buffer, -2)!=0) {
	1312	errln("u_countChar32(bad input) failed (returned non-zero counts)");
	1313	}
	1314	}
	1315
	1316	/* test data and variables for hasMoreChar32Than() */
	1317	static const UChar str[]={
	1318	0x61, 0x62, 0xd800, 0xdc00,
	1319	0xd801, 0xdc01, 0x63, 0xd802,
	1320	0x64, 0xdc03, 0x65, 0x66,
	1321	0xd804, 0xdc04, 0xd805, 0xdc05,
	1322	0x67
	1323	};
	1324	UnicodeString string(str, LENGTHOF(str));
	1325	int32_t start, length, number;
	1326
	1327	/* test hasMoreChar32Than() */
	1328	for(length=string.length(); length>=0; --length) {
	1329	for(start=0; start<=length; ++start) {
	1330	for(number=-1; number<=((length-start)+2); ++number) {
	1331	_testUnicodeStringHasMoreChar32Than(string, start, length-start, number);
	1332	}
	1333	}
	1334	}
	1335
	1336	/* test hasMoreChar32Than() with pinning */
	1337	for(start=-1; start<=string.length()+1; ++start) {
	1338	for(number=-1; number<=((string.length()-start)+2); ++number) {
	1339	_testUnicodeStringHasMoreChar32Than(string, start, 0x7fffffff, number);
	1340	}
	1341	}
	1342
	1343	/* test hasMoreChar32Than() with a bogus string */
	1344	string.setToBogus();
	1345	for(length=-1; length<=1; ++length) {
	1346	for(start=-1; start<=length; ++start) {
	1347	for(number=-1; number<=((length-start)+2); ++number) {
	1348	_testUnicodeStringHasMoreChar32Than(string, start, length-start, number);
	1349	}
	1350	}
	1351	}
	1352	}
	1353
	1354	void
	1355	UnicodeStringTest::TestBogus() {
	1356	UnicodeString test1("This is a test");
	1357	UnicodeString test2("This is a test");
	1358	UnicodeString test3("Me too!");
	1359
	1360	// test isBogus() and setToBogus()
	1361	if (test1.isBogus() \|\| test2.isBogus() \|\| test3.isBogus()) {
	1362	errln("A string returned TRUE for isBogus()!");
	1363	}
	1364
	1365	// NULL pointers are treated like empty strings
	1366	// use other illegal arguments to make a bogus string
	1367	test3.setTo(FALSE, test1.getBuffer(), -2);
	1368	if(!test3.isBogus()) {
	1369	errln("A bogus string returned FALSE for isBogus()!");
	1370	}
	1371	if (test1.hashCode() != test2.hashCode() \|\| test1.hashCode() == test3.hashCode()) {
	1372	errln("hashCode() failed");
	1373	}
	1374	if(test3.getBuffer()!=0 \|\| test3.getBuffer(20)!=0 \|\| test3.getTerminatedBuffer()!=0) {
	1375	errln("bogus.getBuffer()!=0");
	1376	}
	1377	if (test1.indexOf(test3) != -1) {
	1378	errln("bogus.indexOf() != -1");
	1379	}
	1380	if (test1.lastIndexOf(test3) != -1) {
	1381	errln("bogus.lastIndexOf() != -1");
	1382	}
	1383	if (test1.caseCompare(test3, U_FOLD_CASE_DEFAULT) != 1 \|\| test3.caseCompare(test1, U_FOLD_CASE_DEFAULT) != -1) {
	1384	errln("caseCompare() doesn't work with bogus strings");
	1385	}
	1386	if (test1.compareCodePointOrder(test3) != 1 \|\| test3.compareCodePointOrder(test1) != -1) {
	1387	errln("compareCodePointOrder() doesn't work with bogus strings");
	1388	}
	1389
	1390	// verify that non-assignment modifications fail and do not revive a bogus string
	1391	test3.setToBogus();
	1392	test3.append((UChar)0x61);
	1393	if(!test3.isBogus() \|\| test3.getBuffer()!=0) {
	1394	errln("bogus.append('a') worked but must not");
	1395	}
	1396
	1397	test3.setToBogus();
	1398	test3.findAndReplace(UnicodeString((UChar)0x61), test2);
	1399	if(!test3.isBogus() \|\| test3.getBuffer()!=0) {
	1400	errln("bogus.findAndReplace() worked but must not");
	1401	}
	1402
	1403	test3.setToBogus();
	1404	test3.trim();
	1405	if(!test3.isBogus() \|\| test3.getBuffer()!=0) {
	1406	errln("bogus.trim() revived bogus but must not");
	1407	}
	1408
	1409	test3.setToBogus();
	1410	test3.remove(1);
	1411	if(!test3.isBogus() \|\| test3.getBuffer()!=0) {
	1412	errln("bogus.remove(1) revived bogus but must not");
	1413	}
	1414
	1415	test3.setToBogus();
	1416	if(!test3.setCharAt(0, 0x62).isBogus() \|\| !test3.isEmpty()) {
	1417	errln("bogus.setCharAt(0, 'b') worked but must not");
	1418	}
	1419
	1420	test3.setToBogus();
	1421	if(test3.truncate(1) \|\| !test3.isBogus() \|\| !test3.isEmpty()) {
	1422	errln("bogus.truncate(1) revived bogus but must not");
	1423	}
	1424
	1425	// verify that assignments revive a bogus string
	1426	test3.setToBogus();
	1427	if(!test3.isBogus() \|\| (test3=test1).isBogus() \|\| test3!=test1) {
	1428	errln("bogus.operator=() failed");
	1429	}
	1430
	1431	test3.setToBogus();
	1432	if(!test3.isBogus() \|\| test3.fastCopyFrom(test1).isBogus() \|\| test3!=test1) {
	1433	errln("bogus.fastCopyFrom() failed");
	1434	}
	1435
	1436	test3.setToBogus();
	1437	if(!test3.isBogus() \|\| test3.setTo(test1).isBogus() \|\| test3!=test1) {
	1438	errln("bogus.setTo(UniStr) failed");
	1439	}
	1440
	1441	test3.setToBogus();
	1442	if(!test3.isBogus() \|\| test3.setTo(test1, 0).isBogus() \|\| test3!=test1) {
	1443	errln("bogus.setTo(UniStr, 0) failed");
	1444	}
	1445
	1446	test3.setToBogus();
	1447	if(!test3.isBogus() \|\| test3.setTo(test1, 0, 0x7fffffff).isBogus() \|\| test3!=test1) {
	1448	errln("bogus.setTo(UniStr, 0, len) failed");
	1449	}
	1450
	1451	test3.setToBogus();
	1452	if(!test3.isBogus() \|\| test3.setTo(test1.getBuffer(), test1.length()).isBogus() \|\| test3!=test1) {
	1453	errln("bogus.setTo(const UChar *, len) failed");
	1454	}
	1455
	1456	test3.setToBogus();
	1457	if(!test3.isBogus() \|\| test3.setTo((UChar)0x2028).isBogus() \|\| test3!=UnicodeString((UChar)0x2028)) {
	1458	errln("bogus.setTo(UChar) failed");
	1459	}
	1460
	1461	test3.setToBogus();
	1462	if(!test3.isBogus() \|\| test3.setTo((UChar32)0x1d157).isBogus() \|\| test3!=UnicodeString((UChar32)0x1d157)) {
	1463	errln("bogus.setTo(UChar32) failed");
	1464	}
	1465
	1466	test3.setToBogus();
	1467	if(!test3.isBogus() \|\| test3.setTo(FALSE, test1.getBuffer(), test1.length()).isBogus() \|\| test3!=test1) {
	1468	errln("bogus.setTo(readonly alias) failed");
	1469	}
	1470
	1471	// writable alias to another string's buffer: very bad idea, just convenient for this test
	1472	test3.setToBogus();
	1473	if(!test3.isBogus() \|\| test3.setTo((UChar *)test1.getBuffer(), test1.length(), test1.getCapacity()).isBogus() \|\| test3!=test1) {
	1474	errln("bogus.setTo(writable alias) failed");
	1475	}
	1476
	1477	// verify simple, documented ways to turn a bogus string into an empty one
	1478	test3.setToBogus();
	1479	if(!test3.isBogus() \|\| (test3=UnicodeString()).isBogus() \|\| !test3.isEmpty()) {
	1480	errln("bogus.operator=(UnicodeString()) failed");
	1481	}
	1482
	1483	test3.setToBogus();
	1484	if(!test3.isBogus() \|\| test3.setTo(UnicodeString()).isBogus() \|\| !test3.isEmpty()) {
	1485	errln("bogus.setTo(UnicodeString()) failed");
	1486	}
	1487
	1488	test3.setToBogus();
	1489	if(test3.remove().isBogus() \|\| test3.getBuffer()==0 \|\| !test3.isEmpty()) {
	1490	errln("bogus.remove() failed");
	1491	}
	1492
	1493	test3.setToBogus();
	1494	if(test3.remove(0, INT32_MAX).isBogus() \|\| test3.getBuffer()==0 \|\| !test3.isEmpty()) {
	1495	errln("bogus.remove(0, INT32_MAX) failed");
	1496	}
	1497
	1498	test3.setToBogus();
	1499	if(test3.truncate(0) \|\| test3.isBogus() \|\| !test3.isEmpty()) {
	1500	errln("bogus.truncate(0) failed");
	1501	}
	1502
	1503	test3.setToBogus();
	1504	if(!test3.isBogus() \|\| test3.setTo((UChar32)-1).isBogus() \|\| !test3.isEmpty()) {
	1505	errln("bogus.setTo((UChar32)-1) failed");
	1506	}
	1507
	1508	static const UChar nul=0;
	1509
	1510	test3.setToBogus();
	1511	if(!test3.isBogus() \|\| test3.setTo(&nul, 0).isBogus() \|\| !test3.isEmpty()) {
	1512	errln("bogus.setTo(&nul, 0) failed");
	1513	}
	1514
	1515	test3.setToBogus();
	1516	if(!test3.isBogus() \|\| test3.getBuffer()!=0) {
	1517	errln("setToBogus() failed to make a string bogus");
	1518	}
	1519
	1520	test3.setToBogus();
	1521	if(test1.isBogus() \|\| !(test1=test3).isBogus()) {
	1522	errln("normal=bogus failed to make the left string bogus");
	1523	}
	1524
	1525	// test that NULL primitive input string values are treated like
	1526	// empty strings, not errors (bogus)
	1527	test2.setTo((UChar32)0x10005);
	1528	if(test2.insert(1, NULL, 1).length()!=2) {
	1529	errln("UniStr.insert(...NULL...) should not modify the string but does");
	1530	}
	1531
	1532	UErrorCode errorCode=U_ZERO_ERROR;
	1533	UnicodeString
	1534	test4((const UChar *)NULL),
	1535	test5(TRUE, (const UChar *)NULL, 1),
	1536	test6((UChar *)NULL, 5, 5),
	1537	test7((const char *)NULL, 3, NULL, errorCode);
	1538	if(test4.isBogus() \|\| test5.isBogus() \|\| test6.isBogus() \|\| test7.isBogus()) {
	1539	errln("a constructor set to bogus for a NULL input string, should be empty");
	1540	}
	1541
	1542	test4.setTo(NULL, 3);
	1543	test5.setTo(TRUE, (const UChar *)NULL, 1);
	1544	test6.setTo((UChar *)NULL, 5, 5);
	1545	if(test4.isBogus() \|\| test5.isBogus() \|\| test6.isBogus()) {
	1546	errln("a setTo() set to bogus for a NULL input string, should be empty");
	1547	}
	1548
	1549	// test that bogus==bogus<any
	1550	if(test1!=test3 \|\| test1.compare(test3)!=0) {
	1551	errln("bogus==bogus failed");
	1552	}
	1553
	1554	test2.remove();
	1555	if(test1>=test2 \|\| !(test2>test1) \|\| test1.compare(test2)>=0 \|\| !(test2.compare(test1)>0)) {
	1556	errln("bogus<empty failed");
	1557	}
	1558	}
	1559
	1560	// StringEnumeration ------------------------------------------------------- ***
	1561	// most of StringEnumeration is tested elsewhere
	1562	// this test improves code coverage
	1563
	1564	static const char *const
	1565	testEnumStrings[]={
	1566	"a",
	1567	"b",
	1568	"c",
	1569	"this is a long string which helps us test some buffer limits",
	1570	"eeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeee"
	1571	};
	1572
	1573	class TestEnumeration : public StringEnumeration {
	1574	public:
	1575	TestEnumeration() : i(0) {}
	1576
	1577	virtual int32_t count(UErrorCode& /status/) const {
	1578	return LENGTHOF(testEnumStrings);
	1579	}
	1580
	1581	virtual const UnicodeString *snext(UErrorCode &status) {
	1582	if(U_SUCCESS(status) && i<LENGTHOF(testEnumStrings)) {
	1583	unistr=UnicodeString(testEnumStrings[i++], "");
	1584	return &unistr;
	1585	}
	1586
	1587	return NULL;
	1588	}
	1589
	1590	virtual void reset(UErrorCode& /status/) {
	1591	i=0;
	1592	}
	1593
	1594	static inline UClassID getStaticClassID() {
	1595	return (UClassID)&fgClassID;
	1596	}
	1597	virtual UClassID getDynamicClassID() const {
	1598	return getStaticClassID();
	1599	}
	1600
	1601	private:
	1602	static const char fgClassID;
	1603
	1604	int32_t i, length;
	1605	};
	1606
	1607	const char TestEnumeration::fgClassID=0;
	1608
	1609	void
	1610	UnicodeStringTest::TestStringEnumeration() {
	1611	UnicodeString s;
	1612	TestEnumeration ten;
	1613	int32_t i, length;
	1614	UErrorCode status;
	1615
	1616	const UChar *pu;
	1617	const char *pc;
	1618
	1619	// test the next() default implementation and ensureCharsCapacity()
	1620	for(i=0; i<LENGTHOF(testEnumStrings); ++i) {
	1621	status=U_ZERO_ERROR;
	1622	pc=ten.next(&length, status);
	1623	s=UnicodeString(testEnumStrings[i], "");
	1624	if(U_FAILURE(status) \|\| pc==NULL \|\| length!=s.length() \|\| UnicodeString(pc, length, "")!=s) {
	1625	errln("StringEnumeration.next(%d) failed", i);
	1626	}
	1627	}
	1628	status=U_ZERO_ERROR;
	1629	if(ten.next(&length, status)!=NULL) {
	1630	errln("StringEnumeration.next(done)!=NULL");
	1631	}
	1632
	1633	// test the unext() default implementation
	1634	ten.reset(status);
	1635	for(i=0; i<LENGTHOF(testEnumStrings); ++i) {
	1636	status=U_ZERO_ERROR;
	1637	pu=ten.unext(&length, status);
	1638	s=UnicodeString(testEnumStrings[i], "");
	1639	if(U_FAILURE(status) \|\| pu==NULL \|\| length!=s.length() \|\| UnicodeString(TRUE, pu, length)!=s) {
	1640	errln("StringEnumeration.unext(%d) failed", i);
	1641	}
	1642	}
	1643	status=U_ZERO_ERROR;
	1644	if(ten.unext(&length, status)!=NULL) {
	1645	errln("StringEnumeration.unext(done)!=NULL");
	1646	}
	1647
	1648	// test that the default clone() implementation works, and returns NULL
	1649	if(ten.clone()!=NULL) {
	1650	errln("StringEnumeration.clone()!=NULL");
	1651	}
	1652	}
	1653
	1654	void
	1655	UnicodeStringTest::TestCharString() {
	1656	static const char originalCStr[] =
	1657	"This is a large string that is meant to over flow the internal buffer of CharString. At the time of writing this test, the internal buffer is 128 bytes.";
	1658	CharString chStr(originalCStr);
	1659	if (strcmp(originalCStr, chStr) != 0) {
	1660	errln("CharString doesn't work with large strings.");
	1661	}
	1662	}
	1663
	1664	/*
	1665	* Namespace test, to make sure that macros like UNICODE_STRING include the
	1666	* namespace qualifier.
	1667	*
	1668	* Define a (bogus) UnicodeString class in another namespace and check for ambiguity.
	1669	*/
	1670	#if U_HAVE_NAMESPACE
	1671	namespace bogus {
	1672	class UnicodeString {
	1673	public:
	1674	enum EInvariant { kInvariant };
	1675	UnicodeString() : i(1) {}
	1676	UnicodeString(UBool /isTerminated/, const UChar * /text/, int32_t textLength) : i(textLength) {}
	1677	UnicodeString(const char * /src/, int32_t length, enum EInvariant /inv/
	1678	) : i(length) {}
	1679	private:
	1680	int32_t i;
	1681	};
	1682	}
	1683	#endif
	1684
	1685	void
	1686	UnicodeStringTest::TestNameSpace() {
	1687	#if U_HAVE_NAMESPACE
	1688	// Provoke name collision unless the UnicodeString macros properly
	1689	// qualify the icu::UnicodeString class.
	1690	using namespace bogus;
	1691
	1692	// Use all UnicodeString macros from unistr.h.
	1693	icu::UnicodeString s1=icu::UnicodeString("abc", 3, US_INV);
	1694	icu::UnicodeString s2=UNICODE_STRING("def", 3);
	1695	icu::UnicodeString s3=UNICODE_STRING_SIMPLE("ghi");
	1696
	1697	// Make sure the compiler does not optimize away instantiation of s1, s2, s3.
	1698	icu::UnicodeString s4=s1+s2+s3;
	1699	if(s4.length()!=9) {
	1700	errln("Something wrong with UnicodeString::operator+().");
	1701	}
	1702	#endif
	1703	}