]>
Commit | Line | Data |
---|---|---|
1 | /******************************************************************** | |
2 | * COPYRIGHT: | |
3 | * Copyright (c) 1997-2011, International Business Machines Corporation and | |
4 | * others. All Rights Reserved. | |
5 | ********************************************************************/ | |
6 | ||
7 | #include "ustrtest.h" | |
8 | #include "unicode/appendable.h" | |
9 | #include "unicode/std_string.h" | |
10 | #include "unicode/unistr.h" | |
11 | #include "unicode/uchar.h" | |
12 | #include "unicode/ustring.h" | |
13 | #include "unicode/locid.h" | |
14 | #include "unicode/ucnv.h" | |
15 | #include "unicode/uenum.h" | |
16 | #include "unicode/utf16.h" | |
17 | #include "cmemory.h" | |
18 | #include "charstr.h" | |
19 | ||
20 | #if 0 | |
21 | #include "unicode/ustream.h" | |
22 | ||
23 | #include <iostream> | |
24 | using namespace std; | |
25 | ||
26 | #endif | |
27 | ||
28 | #define LENGTHOF(array) (int32_t)((sizeof(array)/sizeof((array)[0]))) | |
29 | ||
30 | UnicodeStringTest::~UnicodeStringTest() {} | |
31 | ||
32 | void UnicodeStringTest::runIndexedTest( int32_t index, UBool exec, const char* &name, char *par) | |
33 | { | |
34 | if (exec) logln("TestSuite UnicodeStringTest: "); | |
35 | switch (index) { | |
36 | case 0: | |
37 | name = "StringCaseTest"; | |
38 | if (exec) { | |
39 | logln("StringCaseTest---"); logln(""); | |
40 | StringCaseTest test; | |
41 | callTest(test, par); | |
42 | } | |
43 | break; | |
44 | case 1: name = "TestBasicManipulation"; if (exec) TestBasicManipulation(); break; | |
45 | case 2: name = "TestCompare"; if (exec) TestCompare(); break; | |
46 | case 3: name = "TestExtract"; if (exec) TestExtract(); break; | |
47 | case 4: name = "TestRemoveReplace"; if (exec) TestRemoveReplace(); break; | |
48 | case 5: name = "TestSearching"; if (exec) TestSearching(); break; | |
49 | case 6: name = "TestSpacePadding"; if (exec) TestSpacePadding(); break; | |
50 | case 7: name = "TestPrefixAndSuffix"; if (exec) TestPrefixAndSuffix(); break; | |
51 | case 8: name = "TestFindAndReplace"; if (exec) TestFindAndReplace(); break; | |
52 | case 9: name = "TestBogus"; if (exec) TestBogus(); break; | |
53 | case 10: name = "TestReverse"; if (exec) TestReverse(); break; | |
54 | case 11: name = "TestMiscellaneous"; if (exec) TestMiscellaneous(); break; | |
55 | case 12: name = "TestStackAllocation"; if (exec) TestStackAllocation(); break; | |
56 | case 13: name = "TestUnescape"; if (exec) TestUnescape(); break; | |
57 | case 14: name = "TestCountChar32"; if (exec) TestCountChar32(); break; | |
58 | case 15: name = "TestStringEnumeration"; if (exec) TestStringEnumeration(); break; | |
59 | case 16: name = "TestNameSpace"; if (exec) TestNameSpace(); break; | |
60 | case 17: name = "TestUTF32"; if (exec) TestUTF32(); break; | |
61 | case 18: name = "TestUTF8"; if (exec) TestUTF8(); break; | |
62 | case 19: name = "TestReadOnlyAlias"; if (exec) TestReadOnlyAlias(); break; | |
63 | case 20: name = "TestAppendable"; if (exec) TestAppendable(); break; | |
64 | case 21: name = "TestUnicodeStringImplementsAppendable"; if (exec) TestUnicodeStringImplementsAppendable(); break; | |
65 | case 22: name = "TestSizeofUnicodeString"; if (exec) TestSizeofUnicodeString(); break; | |
66 | case 23: name = "TestStartsWithAndEndsWithNulTerminated"; if (exec) TestStartsWithAndEndsWithNulTerminated(); break; | |
67 | ||
68 | default: name = ""; break; //needed to end loop | |
69 | } | |
70 | } | |
71 | ||
72 | void | |
73 | UnicodeStringTest::TestBasicManipulation() | |
74 | { | |
75 | UnicodeString test1("Now is the time for all men to come swiftly to the aid of the party.\n"); | |
76 | UnicodeString expectedValue; | |
77 | UnicodeString *c; | |
78 | ||
79 | c=(UnicodeString *)test1.clone(); | |
80 | test1.insert(24, "good "); | |
81 | expectedValue = "Now is the time for all good men to come swiftly to the aid of the party.\n"; | |
82 | if (test1 != expectedValue) | |
83 | errln("insert() failed: expected \"" + expectedValue + "\"\n,got \"" + test1 + "\""); | |
84 | ||
85 | c->insert(24, "good "); | |
86 | if(*c != expectedValue) { | |
87 | errln("clone()->insert() failed: expected \"" + expectedValue + "\"\n,got \"" + *c + "\""); | |
88 | } | |
89 | delete c; | |
90 | ||
91 | test1.remove(41, 8); | |
92 | expectedValue = "Now is the time for all good men to come to the aid of the party.\n"; | |
93 | if (test1 != expectedValue) | |
94 | errln("remove() failed: expected \"" + expectedValue + "\"\n,got \"" + test1 + "\""); | |
95 | ||
96 | test1.replace(58, 6, "ir country"); | |
97 | expectedValue = "Now is the time for all good men to come to the aid of their country.\n"; | |
98 | if (test1 != expectedValue) | |
99 | errln("replace() failed: expected \"" + expectedValue + "\"\n,got \"" + test1 + "\""); | |
100 | ||
101 | UChar temp[80]; | |
102 | test1.extract(0, 15, temp); | |
103 | ||
104 | UnicodeString test2(temp, 15); | |
105 | ||
106 | expectedValue = "Now is the time"; | |
107 | if (test2 != expectedValue) | |
108 | errln("extract() failed: expected \"" + expectedValue + "\"\n,got \"" + test2 + "\""); | |
109 | ||
110 | test2 += " for me to go!\n"; | |
111 | expectedValue = "Now is the time for me to go!\n"; | |
112 | if (test2 != expectedValue) | |
113 | errln("operator+=() failed: expected \"" + expectedValue + "\"\n,got \"" + test2 + "\""); | |
114 | ||
115 | if (test1.length() != 70) | |
116 | errln("length() failed: expected 70, got " + test1.length()); | |
117 | if (test2.length() != 30) | |
118 | errln("length() failed: expected 30, got " + test2.length()); | |
119 | ||
120 | UnicodeString test3; | |
121 | test3.append((UChar32)0x20402); | |
122 | if(test3 != CharsToUnicodeString("\\uD841\\uDC02")){ | |
123 | errln((UnicodeString)"append failed for UChar32, expected \"\\\\ud841\\\\udc02\", got " + prettify(test3)); | |
124 | } | |
125 | if(test3.length() != 2){ | |
126 | errln("append or length failed for UChar32, expected 2, got " + test3.length()); | |
127 | } | |
128 | test3.append((UChar32)0x0074); | |
129 | if(test3 != CharsToUnicodeString("\\uD841\\uDC02t")){ | |
130 | errln((UnicodeString)"append failed for UChar32, expected \"\\\\uD841\\\\uDC02t\", got " + prettify(test3)); | |
131 | } | |
132 | if(test3.length() != 3){ | |
133 | errln((UnicodeString)"append or length failed for UChar32, expected 2, got " + test3.length()); | |
134 | } | |
135 | ||
136 | // test some UChar32 overloads | |
137 | if( test3.setTo((UChar32)0x10330).length() != 2 || | |
138 | test3.insert(0, (UChar32)0x20100).length() != 4 || | |
139 | test3.replace(2, 2, (UChar32)0xe0061).length() != 4 || | |
140 | (test3 = (UChar32)0x14001).length() != 2 | |
141 | ) { | |
142 | errln((UnicodeString)"simple UChar32 overloads for replace, insert, setTo or = failed"); | |
143 | } | |
144 | ||
145 | { | |
146 | // test moveIndex32() | |
147 | UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape(); | |
148 | ||
149 | if( | |
150 | s.moveIndex32(2, -1)!=0 || | |
151 | s.moveIndex32(2, 1)!=4 || | |
152 | s.moveIndex32(2, 2)!=5 || | |
153 | s.moveIndex32(5, -2)!=2 || | |
154 | s.moveIndex32(0, -1)!=0 || | |
155 | s.moveIndex32(6, 1)!=6 | |
156 | ) { | |
157 | errln("UnicodeString::moveIndex32() failed"); | |
158 | } | |
159 | ||
160 | if(s.getChar32Start(1)!=0 || s.getChar32Start(2)!=2) { | |
161 | errln("UnicodeString::getChar32Start() failed"); | |
162 | } | |
163 | ||
164 | if(s.getChar32Limit(1)!=2 || s.getChar32Limit(2)!=2) { | |
165 | errln("UnicodeString::getChar32Limit() failed"); | |
166 | } | |
167 | } | |
168 | ||
169 | { | |
170 | // test new 2.2 constructors and setTo function that parallel Java's substring function. | |
171 | UnicodeString src("Hello folks how are you?"); | |
172 | UnicodeString target1("how are you?"); | |
173 | if (target1 != UnicodeString(src, 12)) { | |
174 | errln("UnicodeString(const UnicodeString&, int32_t) failed"); | |
175 | } | |
176 | UnicodeString target2("folks"); | |
177 | if (target2 != UnicodeString(src, 6, 5)) { | |
178 | errln("UnicodeString(const UnicodeString&, int32_t, int32_t) failed"); | |
179 | } | |
180 | if (target1 != target2.setTo(src, 12)) { | |
181 | errln("UnicodeString::setTo(const UnicodeString&, int32_t) failed"); | |
182 | } | |
183 | } | |
184 | ||
185 | { | |
186 | // op+ is new in ICU 2.8 | |
187 | UnicodeString s=UnicodeString("abc", "")+UnicodeString("def", "")+UnicodeString("ghi", ""); | |
188 | if(s!=UnicodeString("abcdefghi", "")) { | |
189 | errln("operator+(UniStr, UniStr) failed"); | |
190 | } | |
191 | } | |
192 | ||
193 | { | |
194 | // tests for Jitterbug 2360 | |
195 | // verify that APIs with source pointer + length accept length == -1 | |
196 | // mostly test only where modified, only few functions did not already do this | |
197 | if(UnicodeString("abc", -1, "")!=UnicodeString("abc", "")) { | |
198 | errln("UnicodeString(codepageData, dataLength, codepage) does not work with dataLength==-1"); | |
199 | } | |
200 | ||
201 | UChar buffer[10]={ 0x61, 0x62, 0x20ac, 0xd900, 0xdc05, 0, 0x62, 0xffff, 0xdbff, 0xdfff }; | |
202 | UnicodeString s, t(buffer, -1, LENGTHOF(buffer)); | |
203 | ||
204 | if(s.setTo(buffer, -1, LENGTHOF(buffer)).length()!=u_strlen(buffer)) { | |
205 | errln("UnicodeString.setTo(buffer, length, capacity) does not work with length==-1"); | |
206 | } | |
207 | if(t.length()!=u_strlen(buffer)) { | |
208 | errln("UnicodeString(buffer, length, capacity) does not work with length==-1"); | |
209 | } | |
210 | ||
211 | if(0!=s.caseCompare(buffer, -1, U_FOLD_CASE_DEFAULT)) { | |
212 | errln("UnicodeString.caseCompare(const UChar *, length, options) does not work with length==-1"); | |
213 | } | |
214 | if(0!=s.caseCompare(0, s.length(), buffer, U_FOLD_CASE_DEFAULT)) { | |
215 | errln("UnicodeString.caseCompare(start, _length, const UChar *, options) does not work"); | |
216 | } | |
217 | ||
218 | buffer[u_strlen(buffer)]=0xe4; | |
219 | UnicodeString u(buffer, -1, LENGTHOF(buffer)); | |
220 | if(s.setTo(buffer, -1, LENGTHOF(buffer)).length()!=LENGTHOF(buffer)) { | |
221 | errln("UnicodeString.setTo(buffer without NUL, length, capacity) does not work with length==-1"); | |
222 | } | |
223 | if(u.length()!=LENGTHOF(buffer)) { | |
224 | errln("UnicodeString(buffer without NUL, length, capacity) does not work with length==-1"); | |
225 | } | |
226 | ||
227 | static const char cs[]={ 0x61, (char)0xe4, (char)0x85, 0 }; | |
228 | UConverter *cnv; | |
229 | UErrorCode errorCode=U_ZERO_ERROR; | |
230 | ||
231 | cnv=ucnv_open("ISO-8859-1", &errorCode); | |
232 | UnicodeString v(cs, -1, cnv, errorCode); | |
233 | ucnv_close(cnv); | |
234 | if(v!=CharsToUnicodeString("a\\xe4\\x85")) { | |
235 | errln("UnicodeString(const char *, length, cnv, errorCode) does not work with length==-1"); | |
236 | } | |
237 | } | |
238 | ||
239 | #if U_CHARSET_IS_UTF8 | |
240 | { | |
241 | // Test the hardcoded-UTF-8 UnicodeString optimizations. | |
242 | static const uint8_t utf8[]={ 0x61, 0xC3, 0xA4, 0xC3, 0x9F, 0xE4, 0xB8, 0x80, 0 }; | |
243 | static const UChar utf16[]={ 0x61, 0xE4, 0xDF, 0x4E00 }; | |
244 | UnicodeString from8a = UnicodeString((const char *)utf8); | |
245 | UnicodeString from8b = UnicodeString((const char *)utf8, (int32_t)sizeof(utf8)-1); | |
246 | UnicodeString from16(FALSE, utf16, LENGTHOF(utf16)); | |
247 | if(from8a != from16 || from8b != from16) { | |
248 | errln("UnicodeString(const char * U_CHARSET_IS_UTF8) failed"); | |
249 | } | |
250 | char buffer[16]; | |
251 | int32_t length8=from16.extract(0, 0x7fffffff, buffer, (uint32_t)sizeof(buffer)); | |
252 | if(length8!=((int32_t)sizeof(utf8)-1) || 0!=uprv_memcmp(buffer, utf8, sizeof(utf8))) { | |
253 | errln("UnicodeString::extract(char * U_CHARSET_IS_UTF8) failed"); | |
254 | } | |
255 | length8=from16.extract(1, 2, buffer, (uint32_t)sizeof(buffer)); | |
256 | if(length8!=4 || buffer[length8]!=0 || 0!=uprv_memcmp(buffer, utf8+1, length8)) { | |
257 | errln("UnicodeString::extract(substring to char * U_CHARSET_IS_UTF8) failed"); | |
258 | } | |
259 | } | |
260 | #endif | |
261 | } | |
262 | ||
263 | void | |
264 | UnicodeStringTest::TestCompare() | |
265 | { | |
266 | UnicodeString test1("this is a test"); | |
267 | UnicodeString test2("this is a test"); | |
268 | UnicodeString test3("this is a test of the emergency broadcast system"); | |
269 | UnicodeString test4("never say, \"this is a test\"!!"); | |
270 | ||
271 | UnicodeString test5((UChar)0x5000); | |
272 | UnicodeString test6((UChar)0x5100); | |
273 | ||
274 | UChar uniChars[] = { 0x74, 0x68, 0x69, 0x73, 0x20, 0x69, 0x73, | |
275 | 0x20, 0x61, 0x20, 0x74, 0x65, 0x73, 0x74, 0 }; | |
276 | char chars[] = "this is a test"; | |
277 | ||
278 | // test operator== and operator!= | |
279 | if (test1 != test2 || test1 == test3 || test1 == test4) | |
280 | errln("operator== or operator!= failed"); | |
281 | ||
282 | // test operator> and operator< | |
283 | if (test1 > test2 || test1 < test2 || !(test1 < test3) || !(test1 > test4) || | |
284 | !(test5 < test6) | |
285 | ) { | |
286 | errln("operator> or operator< failed"); | |
287 | } | |
288 | ||
289 | // test operator>= and operator<= | |
290 | if (!(test1 >= test2) || !(test1 <= test2) || !(test1 <= test3) || !(test1 >= test4)) | |
291 | errln("operator>= or operator<= failed"); | |
292 | ||
293 | // test compare(UnicodeString) | |
294 | if (test1.compare(test2) != 0 || test1.compare(test3) >= 0 || test1.compare(test4) <= 0) | |
295 | errln("compare(UnicodeString) failed"); | |
296 | ||
297 | //test compare(offset, length, UnicodeString) | |
298 | if(test1.compare(0, 14, test2) != 0 || | |
299 | test3.compare(0, 14, test2) != 0 || | |
300 | test4.compare(12, 14, test2) != 0 || | |
301 | test3.compare(0, 18, test1) <=0 ) | |
302 | errln("compare(offset, length, UnicodeString) failes"); | |
303 | ||
304 | // test compare(UChar*) | |
305 | if (test2.compare(uniChars) != 0 || test3.compare(uniChars) <= 0 || test4.compare(uniChars) >= 0) | |
306 | errln("compare(UChar*) failed"); | |
307 | ||
308 | // test compare(char*) | |
309 | if (test2.compare(chars) != 0 || test3.compare(chars) <= 0 || test4.compare(chars) >= 0) | |
310 | errln("compare(char*) failed"); | |
311 | ||
312 | // test compare(UChar*, length) | |
313 | if (test1.compare(uniChars, 4) <= 0 || test1.compare(uniChars, 4) <= 0) | |
314 | errln("compare(UChar*, length) failed"); | |
315 | ||
316 | // test compare(thisOffset, thisLength, that, thatOffset, thatLength) | |
317 | if (test1.compare(0, 14, test2, 0, 14) != 0 | |
318 | || test1.compare(0, 14, test3, 0, 14) != 0 | |
319 | || test1.compare(0, 14, test4, 12, 14) != 0) | |
320 | errln("1. compare(thisOffset, thisLength, that, thatOffset, thatLength) failed"); | |
321 | ||
322 | if (test1.compare(10, 4, test2, 0, 4) >= 0 | |
323 | || test1.compare(10, 4, test3, 22, 9) <= 0 | |
324 | || test1.compare(10, 4, test4, 22, 4) != 0) | |
325 | errln("2. compare(thisOffset, thisLength, that, thatOffset, thatLength) failed"); | |
326 | ||
327 | // test compareBetween | |
328 | if (test1.compareBetween(0, 14, test2, 0, 14) != 0 || test1.compareBetween(0, 14, test3, 0, 14) != 0 | |
329 | || test1.compareBetween(0, 14, test4, 12, 26) != 0) | |
330 | errln("compareBetween failed"); | |
331 | ||
332 | if (test1.compareBetween(10, 14, test2, 0, 4) >= 0 || test1.compareBetween(10, 14, test3, 22, 31) <= 0 | |
333 | || test1.compareBetween(10, 14, test4, 22, 26) != 0) | |
334 | errln("compareBetween failed"); | |
335 | ||
336 | // test compare() etc. with strings that share a buffer but are not equal | |
337 | test2=test1; // share the buffer, length() too large for the stackBuffer | |
338 | test2.truncate(1); // change only the length, not the buffer | |
339 | if( test1==test2 || test1<=test2 || | |
340 | test1.compare(test2)<=0 || | |
341 | test1.compareCodePointOrder(test2)<=0 || | |
342 | test1.compareCodePointOrder(0, INT32_MAX, test2)<=0 || | |
343 | test1.compareCodePointOrder(0, INT32_MAX, test2, 0, INT32_MAX)<=0 || | |
344 | test1.compareCodePointOrderBetween(0, INT32_MAX, test2, 0, INT32_MAX)<=0 || | |
345 | test1.caseCompare(test2, U_FOLD_CASE_DEFAULT)<=0 | |
346 | ) { | |
347 | errln("UnicodeStrings that share a buffer but have different lengths compare as equal"); | |
348 | } | |
349 | ||
350 | /* test compareCodePointOrder() */ | |
351 | { | |
352 | /* these strings are in ascending order */ | |
353 | static const UChar strings[][4]={ | |
354 | { 0x61, 0 }, /* U+0061 */ | |
355 | { 0x20ac, 0xd801, 0 }, /* U+20ac U+d801 */ | |
356 | { 0x20ac, 0xd800, 0xdc00, 0 }, /* U+20ac U+10000 */ | |
357 | { 0xd800, 0 }, /* U+d800 */ | |
358 | { 0xd800, 0xff61, 0 }, /* U+d800 U+ff61 */ | |
359 | { 0xdfff, 0 }, /* U+dfff */ | |
360 | { 0xff61, 0xdfff, 0 }, /* U+ff61 U+dfff */ | |
361 | { 0xff61, 0xd800, 0xdc02, 0 }, /* U+ff61 U+10002 */ | |
362 | { 0xd800, 0xdc02, 0 }, /* U+10002 */ | |
363 | { 0xd84d, 0xdc56, 0 } /* U+23456 */ | |
364 | }; | |
365 | UnicodeString u[20]; // must be at least as long as strings[] | |
366 | int32_t i; | |
367 | ||
368 | for(i=0; i<(int32_t)(sizeof(strings)/sizeof(strings[0])); ++i) { | |
369 | u[i]=UnicodeString(TRUE, strings[i], -1); | |
370 | } | |
371 | ||
372 | for(i=0; i<(int32_t)(sizeof(strings)/sizeof(strings[0])-1); ++i) { | |
373 | if(u[i].compareCodePointOrder(u[i+1])>=0 || u[i].compareCodePointOrder(0, INT32_MAX, u[i+1].getBuffer())>=0) { | |
374 | errln("error: UnicodeString::compareCodePointOrder() fails for string %d and the following one\n", i); | |
375 | } | |
376 | } | |
377 | } | |
378 | ||
379 | /* test caseCompare() */ | |
380 | { | |
381 | static const UChar | |
382 | _mixed[]= { 0x61, 0x42, 0x131, 0x3a3, 0xdf, 0x130, 0x49, 0xfb03, 0xd93f, 0xdfff, 0 }, | |
383 | _otherDefault[]= { 0x41, 0x62, 0x131, 0x3c3, 0x73, 0x53, 0x69, 0x307, 0x69, 0x46, 0x66, 0x49, 0xd93f, 0xdfff, 0 }, | |
384 | _otherExcludeSpecialI[]={ 0x41, 0x62, 0x131, 0x3c3, 0x53, 0x73, 0x69, 0x131, 0x66, 0x46, 0x69, 0xd93f, 0xdfff, 0 }, | |
385 | _different[]= { 0x41, 0x62, 0x131, 0x3c3, 0x73, 0x53, 0x130, 0x49, 0x46, 0x66, 0x49, 0xd93f, 0xdffd, 0 }; | |
386 | ||
387 | UnicodeString | |
388 | mixed(TRUE, _mixed, -1), | |
389 | otherDefault(TRUE, _otherDefault, -1), | |
390 | otherExcludeSpecialI(TRUE, _otherExcludeSpecialI, -1), | |
391 | different(TRUE, _different, -1); | |
392 | ||
393 | int8_t result; | |
394 | ||
395 | /* test caseCompare() */ | |
396 | result=mixed.caseCompare(otherDefault, U_FOLD_CASE_DEFAULT); | |
397 | if(result!=0 || 0!=mixed.caseCompareBetween(0, INT32_MAX, otherDefault, 0, INT32_MAX, U_FOLD_CASE_DEFAULT)) { | |
398 | errln("error: mixed.caseCompare(other, default)=%ld instead of 0\n", result); | |
399 | } | |
400 | result=mixed.caseCompare(otherExcludeSpecialI, U_FOLD_CASE_EXCLUDE_SPECIAL_I); | |
401 | if(result!=0) { | |
402 | errln("error: mixed.caseCompare(otherExcludeSpecialI, U_FOLD_CASE_EXCLUDE_SPECIAL_I)=%ld instead of 0\n", result); | |
403 | } | |
404 | result=mixed.caseCompare(otherDefault, U_FOLD_CASE_EXCLUDE_SPECIAL_I); | |
405 | if(result==0 || 0==mixed.caseCompareBetween(0, INT32_MAX, otherDefault, 0, INT32_MAX, U_FOLD_CASE_EXCLUDE_SPECIAL_I)) { | |
406 | errln("error: mixed.caseCompare(other, U_FOLD_CASE_EXCLUDE_SPECIAL_I)=0 instead of !=0\n"); | |
407 | } | |
408 | ||
409 | /* test caseCompare() */ | |
410 | result=mixed.caseCompare(different, U_FOLD_CASE_DEFAULT); | |
411 | if(result<=0) { | |
412 | errln("error: mixed.caseCompare(different, default)=%ld instead of positive\n", result); | |
413 | } | |
414 | ||
415 | /* test caseCompare() - include the folded sharp s (U+00df) with different lengths */ | |
416 | result=mixed.caseCompare(1, 4, different, 1, 5, U_FOLD_CASE_DEFAULT); | |
417 | if(result!=0 || 0!=mixed.caseCompareBetween(1, 5, different, 1, 6, U_FOLD_CASE_DEFAULT)) { | |
418 | errln("error: mixed.caseCompare(mixed, 1, 4, different, 1, 5, default)=%ld instead of 0\n", result); | |
419 | } | |
420 | ||
421 | /* test caseCompare() - stop in the middle of the sharp s (U+00df) */ | |
422 | result=mixed.caseCompare(1, 4, different, 1, 4, U_FOLD_CASE_DEFAULT); | |
423 | if(result<=0) { | |
424 | errln("error: mixed.caseCompare(1, 4, different, 1, 4, default)=%ld instead of positive\n", result); | |
425 | } | |
426 | } | |
427 | ||
428 | // test that srcLength=-1 is handled in functions that | |
429 | // take input const UChar */int32_t srcLength (j785) | |
430 | { | |
431 | static const UChar u[]={ 0x61, 0x308, 0x62, 0 }; | |
432 | UnicodeString s=UNICODE_STRING("a\\u0308b", 8).unescape(); | |
433 | ||
434 | if(s.compare(u, -1)!=0 || s.compare(0, 999, u, 0, -1)!=0) { | |
435 | errln("error UnicodeString::compare(..., const UChar *, srcLength=-1) does not work"); | |
436 | } | |
437 | ||
438 | if(s.compareCodePointOrder(u, -1)!=0 || s.compareCodePointOrder(0, 999, u, 0, -1)!=0) { | |
439 | errln("error UnicodeString::compareCodePointOrder(..., const UChar *, srcLength=-1, ...) does not work"); | |
440 | } | |
441 | ||
442 | if(s.caseCompare(u, -1, U_FOLD_CASE_DEFAULT)!=0 || s.caseCompare(0, 999, u, 0, -1, U_FOLD_CASE_DEFAULT)!=0) { | |
443 | errln("error UnicodeString::caseCompare(..., const UChar *, srcLength=-1, ...) does not work"); | |
444 | } | |
445 | ||
446 | if(s.indexOf(u, 1, -1, 0, 999)!=1 || s.indexOf(u+1, -1, 0, 999)!=1 || s.indexOf(u+1, -1, 0)!=1) { | |
447 | errln("error UnicodeString::indexOf(const UChar *, srcLength=-1, ...) does not work"); | |
448 | } | |
449 | ||
450 | if(s.lastIndexOf(u, 1, -1, 0, 999)!=1 || s.lastIndexOf(u+1, -1, 0, 999)!=1 || s.lastIndexOf(u+1, -1, 0)!=1) { | |
451 | errln("error UnicodeString::lastIndexOf(const UChar *, srcLength=-1, ...) does not work"); | |
452 | } | |
453 | ||
454 | UnicodeString s2, s3; | |
455 | s2.replace(0, 0, u+1, -1); | |
456 | s3.replace(0, 0, u, 1, -1); | |
457 | if(s.compare(1, 999, s2)!=0 || s2!=s3) { | |
458 | errln("error UnicodeString::replace(..., const UChar *, srcLength=-1, ...) does not work"); | |
459 | } | |
460 | } | |
461 | } | |
462 | ||
463 | void | |
464 | UnicodeStringTest::TestExtract() | |
465 | { | |
466 | UnicodeString test1("Now is the time for all good men to come to the aid of their country.", ""); | |
467 | UnicodeString test2; | |
468 | UChar test3[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13}; | |
469 | char test4[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13}; | |
470 | UnicodeString test5; | |
471 | char test6[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13}; | |
472 | ||
473 | test1.extract(11, 12, test2); | |
474 | test1.extract(11, 12, test3); | |
475 | if (test1.extract(11, 12, test4) != 12 || test4[12] != 0) { | |
476 | errln("UnicodeString.extract(char *) failed to return the correct size of destination buffer."); | |
477 | } | |
478 | ||
479 | // test proper pinning in extractBetween() | |
480 | test1.extractBetween(-3, 7, test5); | |
481 | if(test5!=UNICODE_STRING("Now is ", 7)) { | |
482 | errln("UnicodeString.extractBetween(-3, 7) did not pin properly."); | |
483 | } | |
484 | ||
485 | test1.extractBetween(11, 23, test5); | |
486 | if (test1.extract(60, 71, test6) != 9) { | |
487 | errln("UnicodeString.extract() failed to return the correct size of destination buffer for end of buffer."); | |
488 | } | |
489 | if (test1.extract(11, 12, test6) != 12) { | |
490 | errln("UnicodeString.extract() failed to return the correct size of destination buffer."); | |
491 | } | |
492 | ||
493 | // convert test4 back to Unicode for comparison | |
494 | UnicodeString test4b(test4, 12); | |
495 | ||
496 | if (test1.extract(11, 12, (char *)NULL) != 12) { | |
497 | errln("UnicodeString.extract(NULL) failed to return the correct size of destination buffer."); | |
498 | } | |
499 | if (test1.extract(11, -1, test6) != 0) { | |
500 | errln("UnicodeString.extract(-1) failed to stop reading the string."); | |
501 | } | |
502 | ||
503 | for (int32_t i = 0; i < 12; i++) { | |
504 | if (test1.charAt((int32_t)(11 + i)) != test2.charAt(i)) { | |
505 | errln(UnicodeString("extracting into a UnicodeString failed at position ") + i); | |
506 | break; | |
507 | } | |
508 | if (test1.charAt((int32_t)(11 + i)) != test3[i]) { | |
509 | errln(UnicodeString("extracting into an array of UChar failed at position ") + i); | |
510 | break; | |
511 | } | |
512 | if (((char)test1.charAt((int32_t)(11 + i))) != test4b.charAt(i)) { | |
513 | errln(UnicodeString("extracting into an array of char failed at position ") + i); | |
514 | break; | |
515 | } | |
516 | if (test1.charAt((int32_t)(11 + i)) != test5.charAt(i)) { | |
517 | errln(UnicodeString("extracting with extractBetween failed at position ") + i); | |
518 | break; | |
519 | } | |
520 | } | |
521 | ||
522 | // test preflighting and overflows with invariant conversion | |
523 | if (test1.extract(0, 10, (char *)NULL, "") != 10) { | |
524 | errln("UnicodeString.extract(0, 10, (char *)NULL, \"\") != 10"); | |
525 | } | |
526 | ||
527 | test4[2] = (char)0xff; | |
528 | if (test1.extract(0, 10, test4, 2, "") != 10) { | |
529 | errln("UnicodeString.extract(0, 10, test4, 2, \"\") != 10"); | |
530 | } | |
531 | if (test4[2] != (char)0xff) { | |
532 | errln("UnicodeString.extract(0, 10, test4, 2, \"\") overwrote test4[2]"); | |
533 | } | |
534 | ||
535 | { | |
536 | // test new, NUL-terminating extract() function | |
537 | UnicodeString s("terminate", ""); | |
538 | UChar dest[20]={ | |
539 | 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, | |
540 | 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5 | |
541 | }; | |
542 | UErrorCode errorCode; | |
543 | int32_t length; | |
544 | ||
545 | errorCode=U_ZERO_ERROR; | |
546 | length=s.extract((UChar *)NULL, 0, errorCode); | |
547 | if(errorCode!=U_BUFFER_OVERFLOW_ERROR || length!=s.length()) { | |
548 | errln("UnicodeString.extract(NULL, 0)==%d (%s) expected %d (U_BUFFER_OVERFLOW_ERROR)", length, s.length(), u_errorName(errorCode)); | |
549 | } | |
550 | ||
551 | errorCode=U_ZERO_ERROR; | |
552 | length=s.extract(dest, s.length()-1, errorCode); | |
553 | if(errorCode!=U_BUFFER_OVERFLOW_ERROR || length!=s.length()) { | |
554 | errln("UnicodeString.extract(dest too short)==%d (%s) expected %d (U_BUFFER_OVERFLOW_ERROR)", | |
555 | length, u_errorName(errorCode), s.length()); | |
556 | } | |
557 | ||
558 | errorCode=U_ZERO_ERROR; | |
559 | length=s.extract(dest, s.length(), errorCode); | |
560 | if(errorCode!=U_STRING_NOT_TERMINATED_WARNING || length!=s.length()) { | |
561 | errln("UnicodeString.extract(dest just right without NUL)==%d (%s) expected %d (U_STRING_NOT_TERMINATED_WARNING)", | |
562 | length, u_errorName(errorCode), s.length()); | |
563 | } | |
564 | if(dest[length-1]!=s[length-1] || dest[length]!=0xa5) { | |
565 | errln("UnicodeString.extract(dest just right without NUL) did not extract the string correctly"); | |
566 | } | |
567 | ||
568 | errorCode=U_ZERO_ERROR; | |
569 | length=s.extract(dest, s.length()+1, errorCode); | |
570 | if(errorCode!=U_ZERO_ERROR || length!=s.length()) { | |
571 | errln("UnicodeString.extract(dest large enough)==%d (%s) expected %d (U_ZERO_ERROR)", | |
572 | length, u_errorName(errorCode), s.length()); | |
573 | } | |
574 | if(dest[length-1]!=s[length-1] || dest[length]!=0 || dest[length+1]!=0xa5) { | |
575 | errln("UnicodeString.extract(dest large enough) did not extract the string correctly"); | |
576 | } | |
577 | } | |
578 | ||
579 | { | |
580 | // test new UConverter extract() and constructor | |
581 | UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape(); | |
582 | char buffer[32]; | |
583 | static const char expect[]={ | |
584 | (char)0xf0, (char)0xaf, (char)0xa6, (char)0x99, | |
585 | (char)0xf0, (char)0x9d, (char)0x85, (char)0x9f, | |
586 | (char)0xc3, (char)0x84, | |
587 | (char)0xe1, (char)0xbb, (char)0x90 | |
588 | }; | |
589 | UErrorCode errorCode=U_ZERO_ERROR; | |
590 | UConverter *cnv=ucnv_open("UTF-8", &errorCode); | |
591 | int32_t length; | |
592 | ||
593 | if(U_SUCCESS(errorCode)) { | |
594 | // test preflighting | |
595 | if( (length=s.extract(NULL, 0, cnv, errorCode))!=13 || | |
596 | errorCode!=U_BUFFER_OVERFLOW_ERROR | |
597 | ) { | |
598 | errln("UnicodeString::extract(NULL, UConverter) preflighting failed (length=%ld, %s)", | |
599 | length, u_errorName(errorCode)); | |
600 | } | |
601 | errorCode=U_ZERO_ERROR; | |
602 | if( (length=s.extract(buffer, 2, cnv, errorCode))!=13 || | |
603 | errorCode!=U_BUFFER_OVERFLOW_ERROR | |
604 | ) { | |
605 | errln("UnicodeString::extract(too small, UConverter) preflighting failed (length=%ld, %s)", | |
606 | length, u_errorName(errorCode)); | |
607 | } | |
608 | ||
609 | // try error cases | |
610 | errorCode=U_ZERO_ERROR; | |
611 | if( s.extract(NULL, 2, cnv, errorCode)==13 || U_SUCCESS(errorCode)) { | |
612 | errln("UnicodeString::extract(UConverter) succeeded with an illegal destination"); | |
613 | } | |
614 | errorCode=U_ILLEGAL_ARGUMENT_ERROR; | |
615 | if( s.extract(NULL, 0, cnv, errorCode)==13 || U_SUCCESS(errorCode)) { | |
616 | errln("UnicodeString::extract(UConverter) succeeded with a previous error code"); | |
617 | } | |
618 | errorCode=U_ZERO_ERROR; | |
619 | ||
620 | // extract for real | |
621 | if( (length=s.extract(buffer, sizeof(buffer), cnv, errorCode))!=13 || | |
622 | uprv_memcmp(buffer, expect, 13)!=0 || | |
623 | buffer[13]!=0 || | |
624 | U_FAILURE(errorCode) | |
625 | ) { | |
626 | errln("UnicodeString::extract(UConverter) conversion failed (length=%ld, %s)", | |
627 | length, u_errorName(errorCode)); | |
628 | } | |
629 | // Test again with just the converter name. | |
630 | if( (length=s.extract(0, s.length(), buffer, sizeof(buffer), "UTF-8"))!=13 || | |
631 | uprv_memcmp(buffer, expect, 13)!=0 || | |
632 | buffer[13]!=0 || | |
633 | U_FAILURE(errorCode) | |
634 | ) { | |
635 | errln("UnicodeString::extract(\"UTF-8\") conversion failed (length=%ld, %s)", | |
636 | length, u_errorName(errorCode)); | |
637 | } | |
638 | ||
639 | // try the constructor | |
640 | UnicodeString t(expect, sizeof(expect), cnv, errorCode); | |
641 | if(U_FAILURE(errorCode) || s!=t) { | |
642 | errln("UnicodeString(UConverter) conversion failed (%s)", | |
643 | u_errorName(errorCode)); | |
644 | } | |
645 | ||
646 | ucnv_close(cnv); | |
647 | } | |
648 | } | |
649 | } | |
650 | ||
651 | void | |
652 | UnicodeStringTest::TestRemoveReplace() | |
653 | { | |
654 | UnicodeString test1("The rain in Spain stays mainly on the plain"); | |
655 | UnicodeString test2("eat SPAMburgers!"); | |
656 | UChar test3[] = { 0x53, 0x50, 0x41, 0x4d, 0x4d, 0 }; | |
657 | char test4[] = "SPAM"; | |
658 | UnicodeString& test5 = test1; | |
659 | ||
660 | test1.replace(4, 4, test2, 4, 4); | |
661 | test1.replace(12, 5, test3, 4); | |
662 | test3[4] = 0; | |
663 | test1.replace(17, 4, test3); | |
664 | test1.replace(23, 4, test4); | |
665 | test1.replaceBetween(37, 42, test2, 4, 8); | |
666 | ||
667 | if (test1 != "The SPAM in SPAM SPAMs SPAMly on the SPAM") | |
668 | errln("One of the replace methods failed:\n" | |
669 | " expected \"The SPAM in SPAM SPAMs SPAMly on the SPAM\",\n" | |
670 | " got \"" + test1 + "\""); | |
671 | ||
672 | test1.remove(21, 1); | |
673 | test1.removeBetween(26, 28); | |
674 | ||
675 | if (test1 != "The SPAM in SPAM SPAM SPAM on the SPAM") | |
676 | errln("One of the remove methods failed:\n" | |
677 | " expected \"The SPAM in SPAM SPAM SPAM on the SPAM\",\n" | |
678 | " got \"" + test1 + "\""); | |
679 | ||
680 | for (int32_t i = 0; i < test1.length(); i++) { | |
681 | if (test5[i] != 0x53 && test5[i] != 0x50 && test5[i] != 0x41 && test5[i] != 0x4d && test5[i] != 0x20) { | |
682 | test1.setCharAt(i, 0x78); | |
683 | } | |
684 | } | |
685 | ||
686 | if (test1 != "xxx SPAM xx SPAM SPAM SPAM xx xxx SPAM") | |
687 | errln("One of the remove methods failed:\n" | |
688 | " expected \"xxx SPAM xx SPAM SPAM SPAM xx xxx SPAM\",\n" | |
689 | " got \"" + test1 + "\""); | |
690 | ||
691 | test1.remove(); | |
692 | if (test1.length() != 0) | |
693 | errln("Remove() failed: expected empty string, got \"" + test1 + "\""); | |
694 | } | |
695 | ||
696 | void | |
697 | UnicodeStringTest::TestSearching() | |
698 | { | |
699 | UnicodeString test1("test test ttest tetest testesteststt"); | |
700 | UnicodeString test2("test"); | |
701 | UChar testChar = 0x74; | |
702 | ||
703 | UChar32 testChar32 = 0x20402; | |
704 | UChar testData[]={ | |
705 | // 0 1 2 3 4 5 6 7 | |
706 | 0xd841, 0xdc02, 0x0071, 0xdc02, 0xd841, 0x0071, 0xd841, 0xdc02, | |
707 | ||
708 | // 8 9 10 11 12 13 14 15 | |
709 | 0x0071, 0x0072, 0xd841, 0xdc02, 0x0071, 0xd841, 0xdc02, 0x0071, | |
710 | ||
711 | // 16 17 18 19 | |
712 | 0xdc02, 0xd841, 0x0073, 0x0000 | |
713 | }; | |
714 | UnicodeString test3(testData); | |
715 | UnicodeString test4(testChar32); | |
716 | ||
717 | uint16_t occurrences = 0; | |
718 | int32_t startPos = 0; | |
719 | for ( ; | |
720 | startPos != -1 && startPos < test1.length(); | |
721 | (startPos = test1.indexOf(test2, startPos)) != -1 ? (++occurrences, startPos += 4) : 0) | |
722 | ; | |
723 | if (occurrences != 6) | |
724 | errln("indexOf failed: expected to find 6 occurrences, found " + occurrences); | |
725 | ||
726 | for ( occurrences = 0, startPos = 10; | |
727 | startPos != -1 && startPos < test1.length(); | |
728 | (startPos = test1.indexOf(test2, startPos)) != -1 ? (++occurrences, startPos += 4) : 0) | |
729 | ; | |
730 | if (occurrences != 4) | |
731 | errln("indexOf with starting offset failed: expected to find 4 occurrences, found " + occurrences); | |
732 | ||
733 | int32_t endPos = 28; | |
734 | for ( occurrences = 0, startPos = 5; | |
735 | startPos != -1 && startPos < test1.length(); | |
736 | (startPos = test1.indexOf(test2, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 4) : 0) | |
737 | ; | |
738 | if (occurrences != 4) | |
739 | errln("indexOf with starting and ending offsets failed: expected to find 4 occurrences, found " + occurrences); | |
740 | ||
741 | //using UChar32 string | |
742 | for ( startPos=0, occurrences=0; | |
743 | startPos != -1 && startPos < test3.length(); | |
744 | (startPos = test3.indexOf(test4, startPos)) != -1 ? (++occurrences, startPos += 2) : 0) | |
745 | ; | |
746 | if (occurrences != 4) | |
747 | errln((UnicodeString)"indexOf failed: expected to find 4 occurrences, found " + occurrences); | |
748 | ||
749 | for ( startPos=10, occurrences=0; | |
750 | startPos != -1 && startPos < test3.length(); | |
751 | (startPos = test3.indexOf(test4, startPos)) != -1 ? (++occurrences, startPos += 2) : 0) | |
752 | ; | |
753 | if (occurrences != 2) | |
754 | errln("indexOf failed: expected to find 2 occurrences, found " + occurrences); | |
755 | //--- | |
756 | ||
757 | for ( occurrences = 0, startPos = 0; | |
758 | startPos != -1 && startPos < test1.length(); | |
759 | (startPos = test1.indexOf(testChar, startPos)) != -1 ? (++occurrences, startPos += 1) : 0) | |
760 | ; | |
761 | if (occurrences != 16) | |
762 | errln("indexOf with character failed: expected to find 16 occurrences, found " + occurrences); | |
763 | ||
764 | for ( occurrences = 0, startPos = 10; | |
765 | startPos != -1 && startPos < test1.length(); | |
766 | (startPos = test1.indexOf(testChar, startPos)) != -1 ? (++occurrences, startPos += 1) : 0) | |
767 | ; | |
768 | if (occurrences != 12) | |
769 | errln("indexOf with character & start offset failed: expected to find 12 occurrences, found " + occurrences); | |
770 | ||
771 | for ( occurrences = 0, startPos = 5, endPos = 28; | |
772 | startPos != -1 && startPos < test1.length(); | |
773 | (startPos = test1.indexOf(testChar, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 1) : 0) | |
774 | ; | |
775 | if (occurrences != 10) | |
776 | errln("indexOf with character & start & end offsets failed: expected to find 10 occurrences, found " + occurrences); | |
777 | ||
778 | //testing for UChar32 | |
779 | UnicodeString subString; | |
780 | for( occurrences =0, startPos=0; startPos < test3.length(); startPos +=1){ | |
781 | subString.append(test3, startPos, test3.length()); | |
782 | if(subString.indexOf(testChar32) != -1 ){ | |
783 | ++occurrences; | |
784 | } | |
785 | subString.remove(); | |
786 | } | |
787 | if (occurrences != 14) | |
788 | errln((UnicodeString)"indexOf failed: expected to find 14 occurrences, found " + occurrences); | |
789 | ||
790 | for ( occurrences = 0, startPos = 0; | |
791 | startPos != -1 && startPos < test3.length(); | |
792 | (startPos = test3.indexOf(testChar32, startPos)) != -1 ? (++occurrences, startPos += 1) : 0) | |
793 | ; | |
794 | if (occurrences != 4) | |
795 | errln((UnicodeString)"indexOf failed: expected to find 4 occurrences, found " + occurrences); | |
796 | ||
797 | endPos=test3.length(); | |
798 | for ( occurrences = 0, startPos = 5; | |
799 | startPos != -1 && startPos < test3.length(); | |
800 | (startPos = test3.indexOf(testChar32, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 1) : 0) | |
801 | ; | |
802 | if (occurrences != 3) | |
803 | errln((UnicodeString)"indexOf with character & start & end offsets failed: expected to find 2 occurrences, found " + occurrences); | |
804 | //--- | |
805 | ||
806 | if(test1.lastIndexOf(test2)!=29) { | |
807 | errln("test1.lastIndexOf(test2)!=29"); | |
808 | } | |
809 | ||
810 | if(test1.lastIndexOf(test2, 15)!=29 || test1.lastIndexOf(test2, 29)!=29 || test1.lastIndexOf(test2, 30)!=-1) { | |
811 | errln("test1.lastIndexOf(test2, start) failed"); | |
812 | } | |
813 | ||
814 | for ( occurrences = 0, startPos = 32; | |
815 | startPos != -1; | |
816 | (startPos = test1.lastIndexOf(test2, 5, startPos - 5)) != -1 ? ++occurrences : 0) | |
817 | ; | |
818 | if (occurrences != 4) | |
819 | errln("lastIndexOf with starting and ending offsets failed: expected to find 4 occurrences, found " + occurrences); | |
820 | ||
821 | for ( occurrences = 0, startPos = 32; | |
822 | startPos != -1; | |
823 | (startPos = test1.lastIndexOf(testChar, 5, startPos - 5)) != -1 ? ++occurrences : 0) | |
824 | ; | |
825 | if (occurrences != 11) | |
826 | errln("lastIndexOf with character & start & end offsets failed: expected to find 11 occurrences, found " + occurrences); | |
827 | ||
828 | //testing UChar32 | |
829 | startPos=test3.length(); | |
830 | for ( occurrences = 0; | |
831 | startPos != -1; | |
832 | (startPos = test3.lastIndexOf(testChar32, 5, startPos - 5)) != -1 ? ++occurrences : 0) | |
833 | ; | |
834 | if (occurrences != 3) | |
835 | errln((UnicodeString)"lastIndexOf with character & start & end offsets failed: expected to find 3 occurrences, found " + occurrences); | |
836 | ||
837 | ||
838 | for ( occurrences = 0, endPos = test3.length(); endPos > 0; endPos -= 1){ | |
839 | subString.remove(); | |
840 | subString.append(test3, 0, endPos); | |
841 | if(subString.lastIndexOf(testChar32) != -1 ){ | |
842 | ++occurrences; | |
843 | } | |
844 | } | |
845 | if (occurrences != 18) | |
846 | errln((UnicodeString)"indexOf failed: expected to find 18 occurrences, found " + occurrences); | |
847 | //--- | |
848 | ||
849 | // test that indexOf(UChar32) and lastIndexOf(UChar32) | |
850 | // do not find surrogate code points when they are part of matched pairs | |
851 | // (= part of supplementary code points) | |
852 | // Jitterbug 1542 | |
853 | if(test3.indexOf((UChar32)0xd841) != 4 || test3.indexOf((UChar32)0xdc02) != 3) { | |
854 | errln("error: UnicodeString::indexOf(UChar32 surrogate) finds a partial supplementary code point"); | |
855 | } | |
856 | if( UnicodeString(test3, 0, 17).lastIndexOf((UChar)0xd841, 0) != 4 || | |
857 | UnicodeString(test3, 0, 17).lastIndexOf((UChar32)0xd841, 2) != 4 || | |
858 | test3.lastIndexOf((UChar32)0xd841, 0, 17) != 4 || test3.lastIndexOf((UChar32)0xdc02, 0, 17) != 16 | |
859 | ) { | |
860 | errln("error: UnicodeString::lastIndexOf(UChar32 surrogate) finds a partial supplementary code point"); | |
861 | } | |
862 | } | |
863 | ||
864 | void | |
865 | UnicodeStringTest::TestSpacePadding() | |
866 | { | |
867 | UnicodeString test1("hello"); | |
868 | UnicodeString test2(" there"); | |
869 | UnicodeString test3("Hi! How ya doin'? Beautiful day, isn't it?"); | |
870 | UnicodeString test4; | |
871 | UBool returnVal; | |
872 | UnicodeString expectedValue; | |
873 | ||
874 | returnVal = test1.padLeading(15); | |
875 | expectedValue = " hello"; | |
876 | if (returnVal == FALSE || test1 != expectedValue) | |
877 | errln("padLeading() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\"."); | |
878 | ||
879 | returnVal = test2.padTrailing(15); | |
880 | expectedValue = " there "; | |
881 | if (returnVal == FALSE || test2 != expectedValue) | |
882 | errln("padTrailing() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\"."); | |
883 | ||
884 | expectedValue = test3; | |
885 | returnVal = test3.padTrailing(15); | |
886 | if (returnVal == TRUE || test3 != expectedValue) | |
887 | errln("padTrailing() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\"."); | |
888 | ||
889 | expectedValue = "hello"; | |
890 | test4.setTo(test1).trim(); | |
891 | ||
892 | if (test4 != expectedValue || test1 == expectedValue || test4 != expectedValue) | |
893 | errln("trim(UnicodeString&) failed"); | |
894 | ||
895 | test1.trim(); | |
896 | if (test1 != expectedValue) | |
897 | errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\"."); | |
898 | ||
899 | test2.trim(); | |
900 | expectedValue = "there"; | |
901 | if (test2 != expectedValue) | |
902 | errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\"."); | |
903 | ||
904 | test3.trim(); | |
905 | expectedValue = "Hi! How ya doin'? Beautiful day, isn't it?"; | |
906 | if (test3 != expectedValue) | |
907 | errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\"."); | |
908 | ||
909 | returnVal = test1.truncate(15); | |
910 | expectedValue = "hello"; | |
911 | if (returnVal == TRUE || test1 != expectedValue) | |
912 | errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\"."); | |
913 | ||
914 | returnVal = test2.truncate(15); | |
915 | expectedValue = "there"; | |
916 | if (returnVal == TRUE || test2 != expectedValue) | |
917 | errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\"."); | |
918 | ||
919 | returnVal = test3.truncate(15); | |
920 | expectedValue = "Hi! How ya doi"; | |
921 | if (returnVal == FALSE || test3 != expectedValue) | |
922 | errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\"."); | |
923 | } | |
924 | ||
925 | void | |
926 | UnicodeStringTest::TestPrefixAndSuffix() | |
927 | { | |
928 | UnicodeString test1("Now is the time for all good men to come to the aid of their country."); | |
929 | UnicodeString test2("Now"); | |
930 | UnicodeString test3("country."); | |
931 | UnicodeString test4("count"); | |
932 | ||
933 | if (!test1.startsWith(test2) || !test1.startsWith(test2, 0, test2.length())) { | |
934 | errln("startsWith() failed: \"" + test2 + "\" should be a prefix of \"" + test1 + "\"."); | |
935 | } | |
936 | ||
937 | if (test1.startsWith(test3) || | |
938 | test1.startsWith(test3.getBuffer(), test3.length()) || | |
939 | test1.startsWith(test3.getTerminatedBuffer(), 0, -1) | |
940 | ) { | |
941 | errln("startsWith() failed: \"" + test3 + "\" shouldn't be a prefix of \"" + test1 + "\"."); | |
942 | } | |
943 | ||
944 | if (test1.endsWith(test2)) { | |
945 | errln("endsWith() failed: \"" + test2 + "\" shouldn't be a suffix of \"" + test1 + "\"."); | |
946 | } | |
947 | ||
948 | if (!test1.endsWith(test3)) { | |
949 | errln("endsWith(test3) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\"."); | |
950 | } | |
951 | if (!test1.endsWith(test3, 0, INT32_MAX)) { | |
952 | errln("endsWith(test3, 0, INT32_MAX) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\"."); | |
953 | } | |
954 | ||
955 | if(!test1.endsWith(test3.getBuffer(), test3.length())) { | |
956 | errln("endsWith(test3.getBuffer(), test3.length()) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\"."); | |
957 | } | |
958 | if(!test1.endsWith(test3.getTerminatedBuffer(), 0, -1)) { | |
959 | errln("endsWith(test3.getTerminatedBuffer(), 0, -1) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\"."); | |
960 | } | |
961 | ||
962 | if (!test3.startsWith(test4)) { | |
963 | errln("endsWith(test4) failed: \"" + test4 + "\" should be a prefix of \"" + test3 + "\"."); | |
964 | } | |
965 | ||
966 | if (test4.startsWith(test3)) { | |
967 | errln("startsWith(test3) failed: \"" + test3 + "\" shouldn't be a prefix of \"" + test4 + "\"."); | |
968 | } | |
969 | } | |
970 | ||
971 | void | |
972 | UnicodeStringTest::TestStartsWithAndEndsWithNulTerminated() { | |
973 | UnicodeString test("abcde"); | |
974 | const UChar ab[] = { 0x61, 0x62, 0 }; | |
975 | const UChar de[] = { 0x64, 0x65, 0 }; | |
976 | assertTrue("abcde.startsWith(ab, -1)", test.startsWith(ab, -1)); | |
977 | assertTrue("abcde.startsWith(ab, 0, -1)", test.startsWith(ab, 0, -1)); | |
978 | assertTrue("abcde.endsWith(de, -1)", test.endsWith(de, -1)); | |
979 | assertTrue("abcde.endsWith(de, 0, -1)", test.endsWith(de, 0, -1)); | |
980 | } | |
981 | ||
982 | void | |
983 | UnicodeStringTest::TestFindAndReplace() | |
984 | { | |
985 | UnicodeString test1("One potato, two potato, three potato, four\n"); | |
986 | UnicodeString test2("potato"); | |
987 | UnicodeString test3("MISSISSIPPI"); | |
988 | ||
989 | UnicodeString expectedValue; | |
990 | ||
991 | test1.findAndReplace(test2, test3); | |
992 | expectedValue = "One MISSISSIPPI, two MISSISSIPPI, three MISSISSIPPI, four\n"; | |
993 | if (test1 != expectedValue) | |
994 | errln("findAndReplace failed: expected \"" + expectedValue + "\", got \"" + test1 + "\"."); | |
995 | test1.findAndReplace(2, 32, test3, test2); | |
996 | expectedValue = "One potato, two potato, three MISSISSIPPI, four\n"; | |
997 | if (test1 != expectedValue) | |
998 | errln("findAndReplace failed: expected \"" + expectedValue + "\", got \"" + test1 + "\"."); | |
999 | } | |
1000 | ||
1001 | void | |
1002 | UnicodeStringTest::TestReverse() | |
1003 | { | |
1004 | UnicodeString test("backwards words say to used I"); | |
1005 | ||
1006 | test.reverse(); | |
1007 | test.reverse(2, 4); | |
1008 | test.reverse(7, 2); | |
1009 | test.reverse(10, 3); | |
1010 | test.reverse(14, 5); | |
1011 | test.reverse(20, 9); | |
1012 | ||
1013 | if (test != "I used to say words backwards") | |
1014 | errln("reverse() failed: Expected \"I used to say words backwards\",\n got \"" | |
1015 | + test + "\""); | |
1016 | ||
1017 | test=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape(); | |
1018 | test.reverse(); | |
1019 | if(test.char32At(0)!=0x1ed0 || test.char32At(1)!=0xc4 || test.char32At(2)!=0x1d15f || test.char32At(4)!=0x2f999) { | |
1020 | errln("reverse() failed with supplementary characters"); | |
1021 | } | |
1022 | ||
1023 | // Test case for ticket #8091: | |
1024 | // UnicodeString::reverse() failed to see a lead surrogate in the middle of | |
1025 | // an odd-length string that contains no other lead surrogates. | |
1026 | test=UNICODE_STRING_SIMPLE("ab\\U0001F4A9e").unescape(); | |
1027 | UnicodeString expected=UNICODE_STRING_SIMPLE("e\\U0001F4A9ba").unescape(); | |
1028 | test.reverse(); | |
1029 | if(test!=expected) { | |
1030 | errln("reverse() failed with only lead surrogate in the middle"); | |
1031 | } | |
1032 | } | |
1033 | ||
1034 | void | |
1035 | UnicodeStringTest::TestMiscellaneous() | |
1036 | { | |
1037 | UnicodeString test1("This is a test"); | |
1038 | UnicodeString test2("This is a test"); | |
1039 | UnicodeString test3("Me too!"); | |
1040 | ||
1041 | // test getBuffer(minCapacity) and releaseBuffer() | |
1042 | test1=UnicodeString(); // make sure that it starts with its stackBuffer | |
1043 | UChar *p=test1.getBuffer(20); | |
1044 | if(test1.getCapacity()<20) { | |
1045 | errln("UnicodeString::getBuffer(20).getCapacity()<20"); | |
1046 | } | |
1047 | ||
1048 | test1.append((UChar)7); // must not be able to modify the string here | |
1049 | test1.setCharAt(3, 7); | |
1050 | test1.reverse(); | |
1051 | if( test1.length()!=0 || | |
1052 | test1.charAt(0)!=0xffff || test1.charAt(3)!=0xffff || | |
1053 | test1.getBuffer(10)!=0 || test1.getBuffer()!=0 | |
1054 | ) { | |
1055 | errln("UnicodeString::getBuffer(minCapacity) allows read or write access to the UnicodeString"); | |
1056 | } | |
1057 | ||
1058 | p[0]=1; | |
1059 | p[1]=2; | |
1060 | p[2]=3; | |
1061 | test1.releaseBuffer(3); | |
1062 | test1.append((UChar)4); | |
1063 | ||
1064 | if(test1.length()!=4 || test1.charAt(0)!=1 || test1.charAt(1)!=2 || test1.charAt(2)!=3 || test1.charAt(3)!=4) { | |
1065 | errln("UnicodeString::releaseBuffer(newLength) does not properly reallow access to the UnicodeString"); | |
1066 | } | |
1067 | ||
1068 | // test releaseBuffer() without getBuffer(minCapacity) - must not have any effect | |
1069 | test1.releaseBuffer(1); | |
1070 | if(test1.length()!=4 || test1.charAt(0)!=1 || test1.charAt(1)!=2 || test1.charAt(2)!=3 || test1.charAt(3)!=4) { | |
1071 | errln("UnicodeString::releaseBuffer(newLength) without getBuffer(minCapacity) changed the UnicodeString"); | |
1072 | } | |
1073 | ||
1074 | // test getBuffer(const) | |
1075 | const UChar *q=test1.getBuffer(), *r=test1.getBuffer(); | |
1076 | if( test1.length()!=4 || | |
1077 | q[0]!=1 || q[1]!=2 || q[2]!=3 || q[3]!=4 || | |
1078 | r[0]!=1 || r[1]!=2 || r[2]!=3 || r[3]!=4 | |
1079 | ) { | |
1080 | errln("UnicodeString::getBuffer(const) does not return a usable buffer pointer"); | |
1081 | } | |
1082 | ||
1083 | // test releaseBuffer() with a NUL-terminated buffer | |
1084 | test1.getBuffer(20)[2]=0; | |
1085 | test1.releaseBuffer(); // implicit -1 | |
1086 | if(test1.length()!=2 || test1.charAt(0)!=1 || test1.charAt(1) !=2) { | |
1087 | errln("UnicodeString::releaseBuffer(-1) does not properly set the length of the UnicodeString"); | |
1088 | } | |
1089 | ||
1090 | // test releaseBuffer() with a non-NUL-terminated buffer | |
1091 | p=test1.getBuffer(256); | |
1092 | for(int32_t i=0; i<test1.getCapacity(); ++i) { | |
1093 | p[i]=(UChar)1; // fill the buffer with all non-NUL code units | |
1094 | } | |
1095 | test1.releaseBuffer(); // implicit -1 | |
1096 | if(test1.length()!=test1.getCapacity() || test1.charAt(1)!=1 || test1.charAt(100)!=1 || test1.charAt(test1.getCapacity()-1)!=1) { | |
1097 | errln("UnicodeString::releaseBuffer(-1 but no NUL) does not properly set the length of the UnicodeString"); | |
1098 | } | |
1099 | ||
1100 | // test getTerminatedBuffer() | |
1101 | test1=UnicodeString("This is another test.", ""); | |
1102 | test2=UnicodeString("This is another test.", ""); | |
1103 | q=test1.getTerminatedBuffer(); | |
1104 | if(q[test1.length()]!=0 || test1!=test2 || test2.compare(q, -1)!=0) { | |
1105 | errln("getTerminatedBuffer()[length]!=0"); | |
1106 | } | |
1107 | ||
1108 | const UChar u[]={ 5, 6, 7, 8, 0 }; | |
1109 | test1.setTo(FALSE, u, 3); | |
1110 | q=test1.getTerminatedBuffer(); | |
1111 | if(q==u || q[0]!=5 || q[1]!=6 || q[2]!=7 || q[3]!=0) { | |
1112 | errln("UnicodeString(u[3]).getTerminatedBuffer() returns a bad buffer"); | |
1113 | } | |
1114 | ||
1115 | test1.setTo(TRUE, u, -1); | |
1116 | q=test1.getTerminatedBuffer(); | |
1117 | if(q!=u || test1.length()!=4 || q[3]!=8 || q[4]!=0) { | |
1118 | errln("UnicodeString(u[-1]).getTerminatedBuffer() returns a bad buffer"); | |
1119 | } | |
1120 | ||
1121 | test1=UNICODE_STRING("la", 2); | |
1122 | test1.append(UNICODE_STRING(" lila", 5).getTerminatedBuffer(), 0, -1); | |
1123 | if(test1!=UNICODE_STRING("la lila", 7)) { | |
1124 | errln("UnicodeString::append(const UChar *, start, length) failed"); | |
1125 | } | |
1126 | ||
1127 | test1.insert(3, UNICODE_STRING("dudum ", 6), 0, INT32_MAX); | |
1128 | if(test1!=UNICODE_STRING("la dudum lila", 13)) { | |
1129 | errln("UnicodeString::insert(start, const UniStr &, start, length) failed"); | |
1130 | } | |
1131 | ||
1132 | static const UChar ucs[]={ 0x68, 0x6d, 0x20, 0 }; | |
1133 | test1.insert(9, ucs, -1); | |
1134 | if(test1!=UNICODE_STRING("la dudum hm lila", 16)) { | |
1135 | errln("UnicodeString::insert(start, const UChar *, length) failed"); | |
1136 | } | |
1137 | ||
1138 | test1.replace(9, 2, (UChar)0x2b); | |
1139 | if(test1!=UNICODE_STRING("la dudum + lila", 15)) { | |
1140 | errln("UnicodeString::replace(start, length, UChar) failed"); | |
1141 | } | |
1142 | ||
1143 | if(test1.hasMetaData() || UnicodeString().hasMetaData()) { | |
1144 | errln("UnicodeString::hasMetaData() returns TRUE"); | |
1145 | } | |
1146 | ||
1147 | // test getTerminatedBuffer() on a truncated, shared, heap-allocated string | |
1148 | test1=UNICODE_STRING_SIMPLE("abcdefghijklmnopqrstuvwxyz0123456789."); | |
1149 | test1.truncate(36); // ensure length()<getCapacity() | |
1150 | test2=test1; // share the buffer | |
1151 | test1.truncate(5); | |
1152 | if(test1.length()!=5 || test1.getTerminatedBuffer()[5]!=0) { | |
1153 | errln("UnicodeString(shared buffer).truncate() failed"); | |
1154 | } | |
1155 | if(test2.length()!=36 || test2[5]!=0x66 || u_strlen(test2.getTerminatedBuffer())!=36) { | |
1156 | errln("UnicodeString(shared buffer).truncate().getTerminatedBuffer() " | |
1157 | "modified another copy of the string!"); | |
1158 | } | |
1159 | test1=UNICODE_STRING_SIMPLE("abcdefghijklmnopqrstuvwxyz0123456789."); | |
1160 | test1.truncate(36); // ensure length()<getCapacity() | |
1161 | test2=test1; // share the buffer | |
1162 | test1.remove(); | |
1163 | if(test1.length()!=0 || test1.getTerminatedBuffer()[0]!=0) { | |
1164 | errln("UnicodeString(shared buffer).remove() failed"); | |
1165 | } | |
1166 | if(test2.length()!=36 || test2[0]!=0x61 || u_strlen(test2.getTerminatedBuffer())!=36) { | |
1167 | errln("UnicodeString(shared buffer).remove().getTerminatedBuffer() " | |
1168 | "modified another copy of the string!"); | |
1169 | } | |
1170 | } | |
1171 | ||
1172 | void | |
1173 | UnicodeStringTest::TestStackAllocation() | |
1174 | { | |
1175 | UChar testString[] ={ | |
1176 | 0x54, 0x68, 0x69, 0x73, 0x20, 0x69, 0x73, 0x20, 0x61, 0x20, 0x63, 0x72, 0x61, 0x7a, 0x79, 0x20, 0x74, 0x65, 0x73, 0x74, 0x2e, 0 }; | |
1177 | UChar guardWord = 0x4DED; | |
1178 | UnicodeString* test = 0; | |
1179 | ||
1180 | test = new UnicodeString(testString); | |
1181 | if (*test != "This is a crazy test.") | |
1182 | errln("Test string failed to initialize properly."); | |
1183 | if (guardWord != 0x04DED) | |
1184 | errln("Test string initialization overwrote guard word!"); | |
1185 | ||
1186 | test->insert(8, "only "); | |
1187 | test->remove(15, 6); | |
1188 | if (*test != "This is only a test.") | |
1189 | errln("Manipulation of test string failed to work right."); | |
1190 | if (guardWord != 0x4DED) | |
1191 | errln("Manipulation of test string overwrote guard word!"); | |
1192 | ||
1193 | // we have to deinitialize and release the backing store by calling the destructor | |
1194 | // explicitly, since we can't overload operator delete | |
1195 | delete test; | |
1196 | ||
1197 | UChar workingBuffer[] = { | |
1198 | 0x4e, 0x6f, 0x77, 0x20, 0x69, 0x73, 0x20, 0x74, 0x68, 0x65, 0x20, 0x74, 0x69, 0x6d, 0x65, 0x20, | |
1199 | 0x66, 0x6f, 0x72, 0x20, 0x61, 0x6c, 0x6c, 0x20, 0x6d, 0x65, 0x6e, 0x20, 0x74, 0x6f, 0x20, | |
1200 | 0x63, 0x6f, 0x6d, 0x65, 0xffff, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | |
1201 | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | |
1202 | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }; | |
1203 | UChar guardWord2 = 0x4DED; | |
1204 | ||
1205 | test = new UnicodeString(workingBuffer, 35, 100); | |
1206 | if (*test != "Now is the time for all men to come") | |
1207 | errln("Stack-allocated backing store failed to initialize correctly."); | |
1208 | if (guardWord2 != 0x4DED) | |
1209 | errln("Stack-allocated backing store overwrote guard word!"); | |
1210 | ||
1211 | test->insert(24, "good "); | |
1212 | if (*test != "Now is the time for all good men to come") | |
1213 | errln("insert() on stack-allocated UnicodeString didn't work right"); | |
1214 | if (guardWord2 != 0x4DED) | |
1215 | errln("insert() on stack-allocated UnicodeString overwrote guard word!"); | |
1216 | ||
1217 | if (workingBuffer[24] != 0x67) | |
1218 | errln("insert() on stack-allocated UnicodeString didn't affect backing store"); | |
1219 | ||
1220 | *test += " to the aid of their country."; | |
1221 | if (*test != "Now is the time for all good men to come to the aid of their country.") | |
1222 | errln("Stack-allocated UnicodeString overflow didn't work"); | |
1223 | if (guardWord2 != 0x4DED) | |
1224 | errln("Stack-allocated UnicodeString overflow overwrote guard word!"); | |
1225 | ||
1226 | *test = "ha!"; | |
1227 | if (*test != "ha!") | |
1228 | errln("Assignment to stack-allocated UnicodeString didn't work"); | |
1229 | if (workingBuffer[0] != 0x4e) | |
1230 | errln("Change to UnicodeString after overflow are still affecting original buffer"); | |
1231 | if (guardWord2 != 0x4DED) | |
1232 | errln("Change to UnicodeString after overflow overwrote guard word!"); | |
1233 | ||
1234 | // test read-only aliasing with setTo() | |
1235 | workingBuffer[0] = 0x20ac; | |
1236 | workingBuffer[1] = 0x125; | |
1237 | workingBuffer[2] = 0; | |
1238 | test->setTo(TRUE, workingBuffer, 2); | |
1239 | if(test->length() != 2 || test->charAt(0) != 0x20ac || test->charAt(1) != 0x125) { | |
1240 | errln("UnicodeString.setTo(readonly alias) does not alias correctly"); | |
1241 | } | |
1242 | ||
1243 | UnicodeString *c=(UnicodeString *)test->clone(); | |
1244 | ||
1245 | workingBuffer[1] = 0x109; | |
1246 | if(test->charAt(1) != 0x109) { | |
1247 | errln("UnicodeString.setTo(readonly alias) made a copy: did not see change in buffer"); | |
1248 | } | |
1249 | ||
1250 | if(c->length() != 2 || c->charAt(1) != 0x125) { | |
1251 | errln("clone(alias) did not copy the buffer"); | |
1252 | } | |
1253 | delete c; | |
1254 | ||
1255 | test->setTo(TRUE, workingBuffer, -1); | |
1256 | if(test->length() != 2 || test->charAt(0) != 0x20ac || test->charAt(1) != 0x109) { | |
1257 | errln("UnicodeString.setTo(readonly alias, length -1) does not alias correctly"); | |
1258 | } | |
1259 | ||
1260 | test->setTo(FALSE, workingBuffer, -1); | |
1261 | if(!test->isBogus()) { | |
1262 | errln("UnicodeString.setTo(unterminated readonly alias, length -1) does not result in isBogus()"); | |
1263 | } | |
1264 | ||
1265 | delete test; | |
1266 | ||
1267 | test=new UnicodeString(); | |
1268 | UChar buffer[]={0x0061, 0x0062, 0x20ac, 0x0043, 0x0042, 0x0000}; | |
1269 | test->setTo(buffer, 4, 10); | |
1270 | if(test->length() !=4 || test->charAt(0) != 0x0061 || test->charAt(1) != 0x0062 || | |
1271 | test->charAt(2) != 0x20ac || test->charAt(3) != 0x0043){ | |
1272 | errln((UnicodeString)"UnicodeString.setTo(UChar*, length, capacity) does not work correctly\n" + prettify(*test)); | |
1273 | } | |
1274 | delete test; | |
1275 | ||
1276 | ||
1277 | // test the UChar32 constructor | |
1278 | UnicodeString c32Test((UChar32)0x10ff2a); | |
1279 | if( c32Test.length() != U16_LENGTH(0x10ff2a) || | |
1280 | c32Test.char32At(c32Test.length() - 1) != 0x10ff2a | |
1281 | ) { | |
1282 | errln("The UnicodeString(UChar32) constructor does not work with a 0x10ff2a filler"); | |
1283 | } | |
1284 | ||
1285 | // test the (new) capacity constructor | |
1286 | UnicodeString capTest(5, (UChar32)0x2a, 5); | |
1287 | if( capTest.length() != 5 * U16_LENGTH(0x2a) || | |
1288 | capTest.char32At(0) != 0x2a || | |
1289 | capTest.char32At(4) != 0x2a | |
1290 | ) { | |
1291 | errln("The UnicodeString capacity constructor does not work with an ASCII filler"); | |
1292 | } | |
1293 | ||
1294 | capTest = UnicodeString(5, (UChar32)0x10ff2a, 5); | |
1295 | if( capTest.length() != 5 * U16_LENGTH(0x10ff2a) || | |
1296 | capTest.char32At(0) != 0x10ff2a || | |
1297 | capTest.char32At(4) != 0x10ff2a | |
1298 | ) { | |
1299 | errln("The UnicodeString capacity constructor does not work with a 0x10ff2a filler"); | |
1300 | } | |
1301 | ||
1302 | capTest = UnicodeString(5, (UChar32)0, 0); | |
1303 | if(capTest.length() != 0) { | |
1304 | errln("The UnicodeString capacity constructor does not work with a 0x10ff2a filler"); | |
1305 | } | |
1306 | } | |
1307 | ||
1308 | /** | |
1309 | * Test the unescape() function. | |
1310 | */ | |
1311 | void UnicodeStringTest::TestUnescape(void) { | |
1312 | UnicodeString IN("abc\\u4567 \\n\\r \\U00101234xyz\\x1\\x{5289}\\x1b", -1, US_INV); | |
1313 | UnicodeString OUT("abc"); | |
1314 | OUT.append((UChar)0x4567); | |
1315 | OUT.append(" "); | |
1316 | OUT.append((UChar)0xA); | |
1317 | OUT.append((UChar)0xD); | |
1318 | OUT.append(" "); | |
1319 | OUT.append((UChar32)0x00101234); | |
1320 | OUT.append("xyz"); | |
1321 | OUT.append((UChar32)1).append((UChar32)0x5289).append((UChar)0x1b); | |
1322 | UnicodeString result = IN.unescape(); | |
1323 | if (result != OUT) { | |
1324 | errln("FAIL: " + prettify(IN) + ".unescape() -> " + | |
1325 | prettify(result) + ", expected " + | |
1326 | prettify(OUT)); | |
1327 | } | |
1328 | ||
1329 | // test that an empty string is returned in case of an error | |
1330 | if (!UNICODE_STRING("wrong \\u sequence", 17).unescape().isEmpty()) { | |
1331 | errln("FAIL: unescaping of a string with an illegal escape sequence did not return an empty string"); | |
1332 | } | |
1333 | } | |
1334 | ||
1335 | /* test code point counting functions --------------------------------------- */ | |
1336 | ||
1337 | /* reference implementation of UnicodeString::hasMoreChar32Than() */ | |
1338 | static int32_t | |
1339 | _refUnicodeStringHasMoreChar32Than(const UnicodeString &s, int32_t start, int32_t length, int32_t number) { | |
1340 | int32_t count=s.countChar32(start, length); | |
1341 | return count>number; | |
1342 | } | |
1343 | ||
1344 | /* compare the real function against the reference */ | |
1345 | void | |
1346 | UnicodeStringTest::_testUnicodeStringHasMoreChar32Than(const UnicodeString &s, int32_t start, int32_t length, int32_t number) { | |
1347 | if(s.hasMoreChar32Than(start, length, number)!=_refUnicodeStringHasMoreChar32Than(s, start, length, number)) { | |
1348 | errln("hasMoreChar32Than(%d, %d, %d)=%hd is wrong\n", | |
1349 | start, length, number, s.hasMoreChar32Than(start, length, number)); | |
1350 | } | |
1351 | } | |
1352 | ||
1353 | void | |
1354 | UnicodeStringTest::TestCountChar32(void) { | |
1355 | { | |
1356 | UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape(); | |
1357 | ||
1358 | // test countChar32() | |
1359 | // note that this also calls and tests u_countChar32(length>=0) | |
1360 | if( | |
1361 | s.countChar32()!=4 || | |
1362 | s.countChar32(1)!=4 || | |
1363 | s.countChar32(2)!=3 || | |
1364 | s.countChar32(2, 3)!=2 || | |
1365 | s.countChar32(2, 0)!=0 | |
1366 | ) { | |
1367 | errln("UnicodeString::countChar32() failed"); | |
1368 | } | |
1369 | ||
1370 | // NUL-terminate the string buffer and test u_countChar32(length=-1) | |
1371 | const UChar *buffer=s.getTerminatedBuffer(); | |
1372 | if( | |
1373 | u_countChar32(buffer, -1)!=4 || | |
1374 | u_countChar32(buffer+1, -1)!=4 || | |
1375 | u_countChar32(buffer+2, -1)!=3 || | |
1376 | u_countChar32(buffer+3, -1)!=3 || | |
1377 | u_countChar32(buffer+4, -1)!=2 || | |
1378 | u_countChar32(buffer+5, -1)!=1 || | |
1379 | u_countChar32(buffer+6, -1)!=0 | |
1380 | ) { | |
1381 | errln("u_countChar32(length=-1) failed"); | |
1382 | } | |
1383 | ||
1384 | // test u_countChar32() with bad input | |
1385 | if(u_countChar32(NULL, 5)!=0 || u_countChar32(buffer, -2)!=0) { | |
1386 | errln("u_countChar32(bad input) failed (returned non-zero counts)"); | |
1387 | } | |
1388 | } | |
1389 | ||
1390 | /* test data and variables for hasMoreChar32Than() */ | |
1391 | static const UChar str[]={ | |
1392 | 0x61, 0x62, 0xd800, 0xdc00, | |
1393 | 0xd801, 0xdc01, 0x63, 0xd802, | |
1394 | 0x64, 0xdc03, 0x65, 0x66, | |
1395 | 0xd804, 0xdc04, 0xd805, 0xdc05, | |
1396 | 0x67 | |
1397 | }; | |
1398 | UnicodeString string(str, LENGTHOF(str)); | |
1399 | int32_t start, length, number; | |
1400 | ||
1401 | /* test hasMoreChar32Than() */ | |
1402 | for(length=string.length(); length>=0; --length) { | |
1403 | for(start=0; start<=length; ++start) { | |
1404 | for(number=-1; number<=((length-start)+2); ++number) { | |
1405 | _testUnicodeStringHasMoreChar32Than(string, start, length-start, number); | |
1406 | } | |
1407 | } | |
1408 | } | |
1409 | ||
1410 | /* test hasMoreChar32Than() with pinning */ | |
1411 | for(start=-1; start<=string.length()+1; ++start) { | |
1412 | for(number=-1; number<=((string.length()-start)+2); ++number) { | |
1413 | _testUnicodeStringHasMoreChar32Than(string, start, 0x7fffffff, number); | |
1414 | } | |
1415 | } | |
1416 | ||
1417 | /* test hasMoreChar32Than() with a bogus string */ | |
1418 | string.setToBogus(); | |
1419 | for(length=-1; length<=1; ++length) { | |
1420 | for(start=-1; start<=length; ++start) { | |
1421 | for(number=-1; number<=((length-start)+2); ++number) { | |
1422 | _testUnicodeStringHasMoreChar32Than(string, start, length-start, number); | |
1423 | } | |
1424 | } | |
1425 | } | |
1426 | } | |
1427 | ||
1428 | void | |
1429 | UnicodeStringTest::TestBogus() { | |
1430 | UnicodeString test1("This is a test"); | |
1431 | UnicodeString test2("This is a test"); | |
1432 | UnicodeString test3("Me too!"); | |
1433 | ||
1434 | // test isBogus() and setToBogus() | |
1435 | if (test1.isBogus() || test2.isBogus() || test3.isBogus()) { | |
1436 | errln("A string returned TRUE for isBogus()!"); | |
1437 | } | |
1438 | ||
1439 | // NULL pointers are treated like empty strings | |
1440 | // use other illegal arguments to make a bogus string | |
1441 | test3.setTo(FALSE, test1.getBuffer(), -2); | |
1442 | if(!test3.isBogus()) { | |
1443 | errln("A bogus string returned FALSE for isBogus()!"); | |
1444 | } | |
1445 | if (test1.hashCode() != test2.hashCode() || test1.hashCode() == test3.hashCode()) { | |
1446 | errln("hashCode() failed"); | |
1447 | } | |
1448 | if(test3.getBuffer()!=0 || test3.getBuffer(20)!=0 || test3.getTerminatedBuffer()!=0) { | |
1449 | errln("bogus.getBuffer()!=0"); | |
1450 | } | |
1451 | if (test1.indexOf(test3) != -1) { | |
1452 | errln("bogus.indexOf() != -1"); | |
1453 | } | |
1454 | if (test1.lastIndexOf(test3) != -1) { | |
1455 | errln("bogus.lastIndexOf() != -1"); | |
1456 | } | |
1457 | if (test1.caseCompare(test3, U_FOLD_CASE_DEFAULT) != 1 || test3.caseCompare(test1, U_FOLD_CASE_DEFAULT) != -1) { | |
1458 | errln("caseCompare() doesn't work with bogus strings"); | |
1459 | } | |
1460 | if (test1.compareCodePointOrder(test3) != 1 || test3.compareCodePointOrder(test1) != -1) { | |
1461 | errln("compareCodePointOrder() doesn't work with bogus strings"); | |
1462 | } | |
1463 | ||
1464 | // verify that non-assignment modifications fail and do not revive a bogus string | |
1465 | test3.setToBogus(); | |
1466 | test3.append((UChar)0x61); | |
1467 | if(!test3.isBogus() || test3.getBuffer()!=0) { | |
1468 | errln("bogus.append('a') worked but must not"); | |
1469 | } | |
1470 | ||
1471 | test3.setToBogus(); | |
1472 | test3.findAndReplace(UnicodeString((UChar)0x61), test2); | |
1473 | if(!test3.isBogus() || test3.getBuffer()!=0) { | |
1474 | errln("bogus.findAndReplace() worked but must not"); | |
1475 | } | |
1476 | ||
1477 | test3.setToBogus(); | |
1478 | test3.trim(); | |
1479 | if(!test3.isBogus() || test3.getBuffer()!=0) { | |
1480 | errln("bogus.trim() revived bogus but must not"); | |
1481 | } | |
1482 | ||
1483 | test3.setToBogus(); | |
1484 | test3.remove(1); | |
1485 | if(!test3.isBogus() || test3.getBuffer()!=0) { | |
1486 | errln("bogus.remove(1) revived bogus but must not"); | |
1487 | } | |
1488 | ||
1489 | test3.setToBogus(); | |
1490 | if(!test3.setCharAt(0, 0x62).isBogus() || !test3.isEmpty()) { | |
1491 | errln("bogus.setCharAt(0, 'b') worked but must not"); | |
1492 | } | |
1493 | ||
1494 | test3.setToBogus(); | |
1495 | if(test3.truncate(1) || !test3.isBogus() || !test3.isEmpty()) { | |
1496 | errln("bogus.truncate(1) revived bogus but must not"); | |
1497 | } | |
1498 | ||
1499 | // verify that assignments revive a bogus string | |
1500 | test3.setToBogus(); | |
1501 | if(!test3.isBogus() || (test3=test1).isBogus() || test3!=test1) { | |
1502 | errln("bogus.operator=() failed"); | |
1503 | } | |
1504 | ||
1505 | test3.setToBogus(); | |
1506 | if(!test3.isBogus() || test3.fastCopyFrom(test1).isBogus() || test3!=test1) { | |
1507 | errln("bogus.fastCopyFrom() failed"); | |
1508 | } | |
1509 | ||
1510 | test3.setToBogus(); | |
1511 | if(!test3.isBogus() || test3.setTo(test1).isBogus() || test3!=test1) { | |
1512 | errln("bogus.setTo(UniStr) failed"); | |
1513 | } | |
1514 | ||
1515 | test3.setToBogus(); | |
1516 | if(!test3.isBogus() || test3.setTo(test1, 0).isBogus() || test3!=test1) { | |
1517 | errln("bogus.setTo(UniStr, 0) failed"); | |
1518 | } | |
1519 | ||
1520 | test3.setToBogus(); | |
1521 | if(!test3.isBogus() || test3.setTo(test1, 0, 0x7fffffff).isBogus() || test3!=test1) { | |
1522 | errln("bogus.setTo(UniStr, 0, len) failed"); | |
1523 | } | |
1524 | ||
1525 | test3.setToBogus(); | |
1526 | if(!test3.isBogus() || test3.setTo(test1.getBuffer(), test1.length()).isBogus() || test3!=test1) { | |
1527 | errln("bogus.setTo(const UChar *, len) failed"); | |
1528 | } | |
1529 | ||
1530 | test3.setToBogus(); | |
1531 | if(!test3.isBogus() || test3.setTo((UChar)0x2028).isBogus() || test3!=UnicodeString((UChar)0x2028)) { | |
1532 | errln("bogus.setTo(UChar) failed"); | |
1533 | } | |
1534 | ||
1535 | test3.setToBogus(); | |
1536 | if(!test3.isBogus() || test3.setTo((UChar32)0x1d157).isBogus() || test3!=UnicodeString((UChar32)0x1d157)) { | |
1537 | errln("bogus.setTo(UChar32) failed"); | |
1538 | } | |
1539 | ||
1540 | test3.setToBogus(); | |
1541 | if(!test3.isBogus() || test3.setTo(FALSE, test1.getBuffer(), test1.length()).isBogus() || test3!=test1) { | |
1542 | errln("bogus.setTo(readonly alias) failed"); | |
1543 | } | |
1544 | ||
1545 | // writable alias to another string's buffer: very bad idea, just convenient for this test | |
1546 | test3.setToBogus(); | |
1547 | if(!test3.isBogus() || test3.setTo((UChar *)test1.getBuffer(), test1.length(), test1.getCapacity()).isBogus() || test3!=test1) { | |
1548 | errln("bogus.setTo(writable alias) failed"); | |
1549 | } | |
1550 | ||
1551 | // verify simple, documented ways to turn a bogus string into an empty one | |
1552 | test3.setToBogus(); | |
1553 | if(!test3.isBogus() || (test3=UnicodeString()).isBogus() || !test3.isEmpty()) { | |
1554 | errln("bogus.operator=(UnicodeString()) failed"); | |
1555 | } | |
1556 | ||
1557 | test3.setToBogus(); | |
1558 | if(!test3.isBogus() || test3.setTo(UnicodeString()).isBogus() || !test3.isEmpty()) { | |
1559 | errln("bogus.setTo(UnicodeString()) failed"); | |
1560 | } | |
1561 | ||
1562 | test3.setToBogus(); | |
1563 | if(test3.remove().isBogus() || test3.getBuffer()==0 || !test3.isEmpty()) { | |
1564 | errln("bogus.remove() failed"); | |
1565 | } | |
1566 | ||
1567 | test3.setToBogus(); | |
1568 | if(test3.remove(0, INT32_MAX).isBogus() || test3.getBuffer()==0 || !test3.isEmpty()) { | |
1569 | errln("bogus.remove(0, INT32_MAX) failed"); | |
1570 | } | |
1571 | ||
1572 | test3.setToBogus(); | |
1573 | if(test3.truncate(0) || test3.isBogus() || !test3.isEmpty()) { | |
1574 | errln("bogus.truncate(0) failed"); | |
1575 | } | |
1576 | ||
1577 | test3.setToBogus(); | |
1578 | if(!test3.isBogus() || test3.setTo((UChar32)-1).isBogus() || !test3.isEmpty()) { | |
1579 | errln("bogus.setTo((UChar32)-1) failed"); | |
1580 | } | |
1581 | ||
1582 | static const UChar nul=0; | |
1583 | ||
1584 | test3.setToBogus(); | |
1585 | if(!test3.isBogus() || test3.setTo(&nul, 0).isBogus() || !test3.isEmpty()) { | |
1586 | errln("bogus.setTo(&nul, 0) failed"); | |
1587 | } | |
1588 | ||
1589 | test3.setToBogus(); | |
1590 | if(!test3.isBogus() || test3.getBuffer()!=0) { | |
1591 | errln("setToBogus() failed to make a string bogus"); | |
1592 | } | |
1593 | ||
1594 | test3.setToBogus(); | |
1595 | if(test1.isBogus() || !(test1=test3).isBogus()) { | |
1596 | errln("normal=bogus failed to make the left string bogus"); | |
1597 | } | |
1598 | ||
1599 | // test that NULL primitive input string values are treated like | |
1600 | // empty strings, not errors (bogus) | |
1601 | test2.setTo((UChar32)0x10005); | |
1602 | if(test2.insert(1, NULL, 1).length()!=2) { | |
1603 | errln("UniStr.insert(...NULL...) should not modify the string but does"); | |
1604 | } | |
1605 | ||
1606 | UErrorCode errorCode=U_ZERO_ERROR; | |
1607 | UnicodeString | |
1608 | test4((const UChar *)NULL), | |
1609 | test5(TRUE, (const UChar *)NULL, 1), | |
1610 | test6((UChar *)NULL, 5, 5), | |
1611 | test7((const char *)NULL, 3, NULL, errorCode); | |
1612 | if(test4.isBogus() || test5.isBogus() || test6.isBogus() || test7.isBogus()) { | |
1613 | errln("a constructor set to bogus for a NULL input string, should be empty"); | |
1614 | } | |
1615 | ||
1616 | test4.setTo(NULL, 3); | |
1617 | test5.setTo(TRUE, (const UChar *)NULL, 1); | |
1618 | test6.setTo((UChar *)NULL, 5, 5); | |
1619 | if(test4.isBogus() || test5.isBogus() || test6.isBogus()) { | |
1620 | errln("a setTo() set to bogus for a NULL input string, should be empty"); | |
1621 | } | |
1622 | ||
1623 | // test that bogus==bogus<any | |
1624 | if(test1!=test3 || test1.compare(test3)!=0) { | |
1625 | errln("bogus==bogus failed"); | |
1626 | } | |
1627 | ||
1628 | test2.remove(); | |
1629 | if(test1>=test2 || !(test2>test1) || test1.compare(test2)>=0 || !(test2.compare(test1)>0)) { | |
1630 | errln("bogus<empty failed"); | |
1631 | } | |
1632 | } | |
1633 | ||
1634 | // StringEnumeration ------------------------------------------------------- *** | |
1635 | // most of StringEnumeration is tested elsewhere | |
1636 | // this test improves code coverage | |
1637 | ||
1638 | static const char *const | |
1639 | testEnumStrings[]={ | |
1640 | "a", | |
1641 | "b", | |
1642 | "c", | |
1643 | "this is a long string which helps us test some buffer limits", | |
1644 | "eeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeee" | |
1645 | }; | |
1646 | ||
1647 | class TestEnumeration : public StringEnumeration { | |
1648 | public: | |
1649 | TestEnumeration() : i(0) {} | |
1650 | ||
1651 | virtual int32_t count(UErrorCode& /*status*/) const { | |
1652 | return LENGTHOF(testEnumStrings); | |
1653 | } | |
1654 | ||
1655 | virtual const UnicodeString *snext(UErrorCode &status) { | |
1656 | if(U_SUCCESS(status) && i<LENGTHOF(testEnumStrings)) { | |
1657 | unistr=UnicodeString(testEnumStrings[i++], ""); | |
1658 | return &unistr; | |
1659 | } | |
1660 | ||
1661 | return NULL; | |
1662 | } | |
1663 | ||
1664 | virtual void reset(UErrorCode& /*status*/) { | |
1665 | i=0; | |
1666 | } | |
1667 | ||
1668 | static inline UClassID getStaticClassID() { | |
1669 | return (UClassID)&fgClassID; | |
1670 | } | |
1671 | virtual UClassID getDynamicClassID() const { | |
1672 | return getStaticClassID(); | |
1673 | } | |
1674 | ||
1675 | private: | |
1676 | static const char fgClassID; | |
1677 | ||
1678 | int32_t i, length; | |
1679 | }; | |
1680 | ||
1681 | const char TestEnumeration::fgClassID=0; | |
1682 | ||
1683 | void | |
1684 | UnicodeStringTest::TestStringEnumeration() { | |
1685 | UnicodeString s; | |
1686 | TestEnumeration ten; | |
1687 | int32_t i, length; | |
1688 | UErrorCode status; | |
1689 | ||
1690 | const UChar *pu; | |
1691 | const char *pc; | |
1692 | ||
1693 | // test the next() default implementation and ensureCharsCapacity() | |
1694 | for(i=0; i<LENGTHOF(testEnumStrings); ++i) { | |
1695 | status=U_ZERO_ERROR; | |
1696 | pc=ten.next(&length, status); | |
1697 | s=UnicodeString(testEnumStrings[i], ""); | |
1698 | if(U_FAILURE(status) || pc==NULL || length!=s.length() || UnicodeString(pc, length, "")!=s) { | |
1699 | errln("StringEnumeration.next(%d) failed", i); | |
1700 | } | |
1701 | } | |
1702 | status=U_ZERO_ERROR; | |
1703 | if(ten.next(&length, status)!=NULL) { | |
1704 | errln("StringEnumeration.next(done)!=NULL"); | |
1705 | } | |
1706 | ||
1707 | // test the unext() default implementation | |
1708 | ten.reset(status); | |
1709 | for(i=0; i<LENGTHOF(testEnumStrings); ++i) { | |
1710 | status=U_ZERO_ERROR; | |
1711 | pu=ten.unext(&length, status); | |
1712 | s=UnicodeString(testEnumStrings[i], ""); | |
1713 | if(U_FAILURE(status) || pu==NULL || length!=s.length() || UnicodeString(TRUE, pu, length)!=s) { | |
1714 | errln("StringEnumeration.unext(%d) failed", i); | |
1715 | } | |
1716 | } | |
1717 | status=U_ZERO_ERROR; | |
1718 | if(ten.unext(&length, status)!=NULL) { | |
1719 | errln("StringEnumeration.unext(done)!=NULL"); | |
1720 | } | |
1721 | ||
1722 | // test that the default clone() implementation works, and returns NULL | |
1723 | if(ten.clone()!=NULL) { | |
1724 | errln("StringEnumeration.clone()!=NULL"); | |
1725 | } | |
1726 | ||
1727 | // test that uenum_openFromStringEnumeration() works | |
1728 | // Need a heap allocated string enumeration because it is adopted by the UEnumeration. | |
1729 | StringEnumeration *newTen = new TestEnumeration; | |
1730 | status=U_ZERO_ERROR; | |
1731 | UEnumeration *uten = uenum_openFromStringEnumeration(newTen, &status); | |
1732 | if (uten==NULL || U_FAILURE(status)) { | |
1733 | errln("fail at file %s, line %d, UErrorCode is %s\n", __FILE__, __LINE__, u_errorName(status)); | |
1734 | return; | |
1735 | } | |
1736 | ||
1737 | // test uenum_next() | |
1738 | for(i=0; i<LENGTHOF(testEnumStrings); ++i) { | |
1739 | status=U_ZERO_ERROR; | |
1740 | pc=uenum_next(uten, &length, &status); | |
1741 | if(U_FAILURE(status) || pc==NULL || strcmp(pc, testEnumStrings[i]) != 0) { | |
1742 | errln("File %s, line %d, StringEnumeration.next(%d) failed", __FILE__, __LINE__, i); | |
1743 | } | |
1744 | } | |
1745 | status=U_ZERO_ERROR; | |
1746 | if(uenum_next(uten, &length, &status)!=NULL) { | |
1747 | errln("File %s, line %d, uenum_next(done)!=NULL"); | |
1748 | } | |
1749 | ||
1750 | // test the uenum_unext() | |
1751 | uenum_reset(uten, &status); | |
1752 | for(i=0; i<LENGTHOF(testEnumStrings); ++i) { | |
1753 | status=U_ZERO_ERROR; | |
1754 | pu=uenum_unext(uten, &length, &status); | |
1755 | s=UnicodeString(testEnumStrings[i], ""); | |
1756 | if(U_FAILURE(status) || pu==NULL || length!=s.length() || UnicodeString(TRUE, pu, length)!=s) { | |
1757 | errln("File %s, Line %d, uenum_unext(%d) failed", __FILE__, __LINE__, i); | |
1758 | } | |
1759 | } | |
1760 | status=U_ZERO_ERROR; | |
1761 | if(uenum_unext(uten, &length, &status)!=NULL) { | |
1762 | errln("File %s, Line %d, uenum_unext(done)!=NULL" __FILE__, __LINE__); | |
1763 | } | |
1764 | ||
1765 | uenum_close(uten); | |
1766 | } | |
1767 | ||
1768 | /* | |
1769 | * Namespace test, to make sure that macros like UNICODE_STRING include the | |
1770 | * namespace qualifier. | |
1771 | * | |
1772 | * Define a (bogus) UnicodeString class in another namespace and check for ambiguity. | |
1773 | */ | |
1774 | namespace bogus { | |
1775 | class UnicodeString { | |
1776 | public: | |
1777 | enum EInvariant { kInvariant }; | |
1778 | UnicodeString() : i(1) {} | |
1779 | UnicodeString(UBool /*isTerminated*/, const UChar * /*text*/, int32_t textLength) : i(textLength) {} | |
1780 | UnicodeString(const char * /*src*/, int32_t length, enum EInvariant /*inv*/ | |
1781 | ) : i(length) {} | |
1782 | private: | |
1783 | int32_t i; | |
1784 | }; | |
1785 | } | |
1786 | ||
1787 | void | |
1788 | UnicodeStringTest::TestNameSpace() { | |
1789 | // Provoke name collision unless the UnicodeString macros properly | |
1790 | // qualify the icu::UnicodeString class. | |
1791 | using namespace bogus; | |
1792 | ||
1793 | // Use all UnicodeString macros from unistr.h. | |
1794 | icu::UnicodeString s1=icu::UnicodeString("abc", 3, US_INV); | |
1795 | icu::UnicodeString s2=UNICODE_STRING("def", 3); | |
1796 | icu::UnicodeString s3=UNICODE_STRING_SIMPLE("ghi"); | |
1797 | ||
1798 | // Make sure the compiler does not optimize away instantiation of s1, s2, s3. | |
1799 | icu::UnicodeString s4=s1+s2+s3; | |
1800 | if(s4.length()!=9) { | |
1801 | errln("Something wrong with UnicodeString::operator+()."); | |
1802 | } | |
1803 | } | |
1804 | ||
1805 | void | |
1806 | UnicodeStringTest::TestUTF32() { | |
1807 | // Input string length US_STACKBUF_SIZE to cause overflow of the | |
1808 | // initially chosen fStackBuffer due to supplementary characters. | |
1809 | static const UChar32 utf32[] = { | |
1810 | 0x41, 0xd900, 0x61, 0xdc00, -1, 0x110000, 0x5a, 0x50000, 0x7a, | |
1811 | 0x10000, 0x20000, 0xe0000, 0x10ffff | |
1812 | }; | |
1813 | static const UChar expected_utf16[] = { | |
1814 | 0x41, 0xfffd, 0x61, 0xfffd, 0xfffd, 0xfffd, 0x5a, 0xd900, 0xdc00, 0x7a, | |
1815 | 0xd800, 0xdc00, 0xd840, 0xdc00, 0xdb40, 0xdc00, 0xdbff, 0xdfff | |
1816 | }; | |
1817 | UnicodeString from32 = UnicodeString::fromUTF32(utf32, LENGTHOF(utf32)); | |
1818 | UnicodeString expected(FALSE, expected_utf16, LENGTHOF(expected_utf16)); | |
1819 | if(from32 != expected) { | |
1820 | errln("UnicodeString::fromUTF32() did not create the expected string."); | |
1821 | } | |
1822 | ||
1823 | static const UChar utf16[] = { | |
1824 | 0x41, 0xd900, 0x61, 0xdc00, 0x5a, 0xd900, 0xdc00, 0x7a, 0xd800, 0xdc00, 0xdbff, 0xdfff | |
1825 | }; | |
1826 | static const UChar32 expected_utf32[] = { | |
1827 | 0x41, 0xfffd, 0x61, 0xfffd, 0x5a, 0x50000, 0x7a, 0x10000, 0x10ffff | |
1828 | }; | |
1829 | UChar32 result32[16]; | |
1830 | UErrorCode errorCode = U_ZERO_ERROR; | |
1831 | int32_t length32 = | |
1832 | UnicodeString(FALSE, utf16, LENGTHOF(utf16)). | |
1833 | toUTF32(result32, LENGTHOF(result32), errorCode); | |
1834 | if( length32 != LENGTHOF(expected_utf32) || | |
1835 | 0 != uprv_memcmp(result32, expected_utf32, length32*4) || | |
1836 | result32[length32] != 0 | |
1837 | ) { | |
1838 | errln("UnicodeString::toUTF32() did not create the expected string."); | |
1839 | } | |
1840 | } | |
1841 | ||
1842 | class TestCheckedArrayByteSink : public CheckedArrayByteSink { | |
1843 | public: | |
1844 | TestCheckedArrayByteSink(char* outbuf, int32_t capacity) | |
1845 | : CheckedArrayByteSink(outbuf, capacity), calledFlush(FALSE) {} | |
1846 | virtual void Flush() { calledFlush = TRUE; } | |
1847 | UBool calledFlush; | |
1848 | }; | |
1849 | ||
1850 | void | |
1851 | UnicodeStringTest::TestUTF8() { | |
1852 | static const uint8_t utf8[] = { | |
1853 | // Code points: | |
1854 | // 0x41, 0xd900, | |
1855 | // 0x61, 0xdc00, | |
1856 | // 0x110000, 0x5a, | |
1857 | // 0x50000, 0x7a, | |
1858 | // 0x10000, 0x20000, | |
1859 | // 0xe0000, 0x10ffff | |
1860 | 0x41, 0xed, 0xa4, 0x80, | |
1861 | 0x61, 0xed, 0xb0, 0x80, | |
1862 | 0xf4, 0x90, 0x80, 0x80, 0x5a, | |
1863 | 0xf1, 0x90, 0x80, 0x80, 0x7a, | |
1864 | 0xf0, 0x90, 0x80, 0x80, 0xf0, 0xa0, 0x80, 0x80, | |
1865 | 0xf3, 0xa0, 0x80, 0x80, 0xf4, 0x8f, 0xbf, 0xbf | |
1866 | }; | |
1867 | static const UChar expected_utf16[] = { | |
1868 | 0x41, 0xfffd, | |
1869 | 0x61, 0xfffd, | |
1870 | 0xfffd, 0x5a, | |
1871 | 0xd900, 0xdc00, 0x7a, | |
1872 | 0xd800, 0xdc00, 0xd840, 0xdc00, | |
1873 | 0xdb40, 0xdc00, 0xdbff, 0xdfff | |
1874 | }; | |
1875 | UnicodeString from8 = UnicodeString::fromUTF8(StringPiece((const char *)utf8, (int32_t)sizeof(utf8))); | |
1876 | UnicodeString expected(FALSE, expected_utf16, LENGTHOF(expected_utf16)); | |
1877 | ||
1878 | if(from8 != expected) { | |
1879 | errln("UnicodeString::fromUTF8(StringPiece) did not create the expected string."); | |
1880 | } | |
1881 | #if U_HAVE_STD_STRING | |
1882 | std::string utf8_string((const char *)utf8, sizeof(utf8)); | |
1883 | UnicodeString from8b = UnicodeString::fromUTF8(utf8_string); | |
1884 | if(from8b != expected) { | |
1885 | errln("UnicodeString::fromUTF8(std::string) did not create the expected string."); | |
1886 | } | |
1887 | #endif | |
1888 | ||
1889 | static const UChar utf16[] = { | |
1890 | 0x41, 0xd900, 0x61, 0xdc00, 0x5a, 0xd900, 0xdc00, 0x7a, 0xd800, 0xdc00, 0xdbff, 0xdfff | |
1891 | }; | |
1892 | static const uint8_t expected_utf8[] = { | |
1893 | 0x41, 0xef, 0xbf, 0xbd, 0x61, 0xef, 0xbf, 0xbd, 0x5a, 0xf1, 0x90, 0x80, 0x80, 0x7a, | |
1894 | 0xf0, 0x90, 0x80, 0x80, 0xf4, 0x8f, 0xbf, 0xbf | |
1895 | }; | |
1896 | UnicodeString us(FALSE, utf16, LENGTHOF(utf16)); | |
1897 | ||
1898 | char buffer[64]; | |
1899 | TestCheckedArrayByteSink sink(buffer, (int32_t)sizeof(buffer)); | |
1900 | us.toUTF8(sink); | |
1901 | if( sink.NumberOfBytesWritten() != (int32_t)sizeof(expected_utf8) || | |
1902 | 0 != uprv_memcmp(buffer, expected_utf8, sizeof(expected_utf8)) | |
1903 | ) { | |
1904 | errln("UnicodeString::toUTF8() did not create the expected string."); | |
1905 | } | |
1906 | if(!sink.calledFlush) { | |
1907 | errln("UnicodeString::toUTF8(sink) did not sink.Flush()."); | |
1908 | } | |
1909 | #if U_HAVE_STD_STRING | |
1910 | // Initial contents for testing that toUTF8String() appends. | |
1911 | std::string result8 = "-->"; | |
1912 | std::string expected8 = "-->" + std::string((const char *)expected_utf8, sizeof(expected_utf8)); | |
1913 | // Use the return value just for testing. | |
1914 | std::string &result8r = us.toUTF8String(result8); | |
1915 | if(result8r != expected8 || &result8r != &result8) { | |
1916 | errln("UnicodeString::toUTF8String() did not create the expected string."); | |
1917 | } | |
1918 | #endif | |
1919 | } | |
1920 | ||
1921 | // Test if this compiler supports Return Value Optimization of unnamed temporary objects. | |
1922 | static UnicodeString wrapUChars(const UChar *uchars) { | |
1923 | return UnicodeString(TRUE, uchars, -1); | |
1924 | } | |
1925 | ||
1926 | void | |
1927 | UnicodeStringTest::TestReadOnlyAlias() { | |
1928 | UChar uchars[]={ 0x61, 0x62, 0 }; | |
1929 | UnicodeString alias(TRUE, uchars, 2); | |
1930 | if(alias.length()!=2 || alias.getBuffer()!=uchars || alias.getTerminatedBuffer()!=uchars) { | |
1931 | errln("UnicodeString read-only-aliasing constructor does not behave as expected."); | |
1932 | return; | |
1933 | } | |
1934 | alias.truncate(1); | |
1935 | if(alias.length()!=1 || alias.getBuffer()!=uchars) { | |
1936 | errln("UnicodeString(read-only-alias).truncate() did not preserve aliasing as expected."); | |
1937 | } | |
1938 | if(alias.getTerminatedBuffer()==uchars) { | |
1939 | errln("UnicodeString(read-only-alias).truncate().getTerminatedBuffer() " | |
1940 | "did not allocate and copy as expected."); | |
1941 | } | |
1942 | if(uchars[1]!=0x62) { | |
1943 | errln("UnicodeString(read-only-alias).truncate().getTerminatedBuffer() " | |
1944 | "modified the original buffer."); | |
1945 | } | |
1946 | if(1!=u_strlen(alias.getTerminatedBuffer())) { | |
1947 | errln("UnicodeString(read-only-alias).truncate().getTerminatedBuffer() " | |
1948 | "does not return a buffer terminated at the proper length."); | |
1949 | } | |
1950 | ||
1951 | alias.setTo(TRUE, uchars, 2); | |
1952 | if(alias.length()!=2 || alias.getBuffer()!=uchars || alias.getTerminatedBuffer()!=uchars) { | |
1953 | errln("UnicodeString read-only-aliasing setTo() does not behave as expected."); | |
1954 | return; | |
1955 | } | |
1956 | alias.remove(); | |
1957 | if(alias.length()!=0) { | |
1958 | errln("UnicodeString(read-only-alias).remove() did not work."); | |
1959 | } | |
1960 | if(alias.getTerminatedBuffer()==uchars) { | |
1961 | errln("UnicodeString(read-only-alias).remove().getTerminatedBuffer() " | |
1962 | "did not un-alias as expected."); | |
1963 | } | |
1964 | if(uchars[0]!=0x61) { | |
1965 | errln("UnicodeString(read-only-alias).remove().getTerminatedBuffer() " | |
1966 | "modified the original buffer."); | |
1967 | } | |
1968 | if(0!=u_strlen(alias.getTerminatedBuffer())) { | |
1969 | errln("UnicodeString.setTo(read-only-alias).remove().getTerminatedBuffer() " | |
1970 | "does not return a buffer terminated at length 0."); | |
1971 | } | |
1972 | ||
1973 | UnicodeString longString=UNICODE_STRING_SIMPLE("abcdefghijklmnopqrstuvwxyz0123456789"); | |
1974 | alias.setTo(FALSE, longString.getBuffer(), longString.length()); | |
1975 | alias.remove(0, 10); | |
1976 | if(longString.compare(10, INT32_MAX, alias)!=0 || alias.getBuffer()!=longString.getBuffer()+10) { | |
1977 | errln("UnicodeString.setTo(read-only-alias).remove(0, 10) did not preserve aliasing as expected."); | |
1978 | } | |
1979 | alias.setTo(FALSE, longString.getBuffer(), longString.length()); | |
1980 | alias.remove(27, 99); | |
1981 | if(longString.compare(0, 27, alias)!=0 || alias.getBuffer()!=longString.getBuffer()) { | |
1982 | errln("UnicodeString.setTo(read-only-alias).remove(27, 99) did not preserve aliasing as expected."); | |
1983 | } | |
1984 | alias.setTo(FALSE, longString.getBuffer(), longString.length()); | |
1985 | alias.retainBetween(6, 30); | |
1986 | if(longString.compare(6, 24, alias)!=0 || alias.getBuffer()!=longString.getBuffer()+6) { | |
1987 | errln("UnicodeString.setTo(read-only-alias).retainBetween(6, 30) did not preserve aliasing as expected."); | |
1988 | } | |
1989 | ||
1990 | UChar abc[]={ 0x61, 0x62, 0x63, 0 }; | |
1991 | UBool hasRVO= wrapUChars(abc).getBuffer()==abc; | |
1992 | ||
1993 | UnicodeString temp; | |
1994 | temp.fastCopyFrom(longString.tempSubString()); | |
1995 | if(temp!=longString || (hasRVO && temp.getBuffer()!=longString.getBuffer())) { | |
1996 | errln("UnicodeString.tempSubString() failed"); | |
1997 | } | |
1998 | temp.fastCopyFrom(longString.tempSubString(-3, 5)); | |
1999 | if(longString.compare(0, 5, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer())) { | |
2000 | errln("UnicodeString.tempSubString(-3, 5) failed"); | |
2001 | } | |
2002 | temp.fastCopyFrom(longString.tempSubString(17)); | |
2003 | if(longString.compare(17, INT32_MAX, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer()+17)) { | |
2004 | errln("UnicodeString.tempSubString(17) failed"); | |
2005 | } | |
2006 | temp.fastCopyFrom(longString.tempSubString(99)); | |
2007 | if(!temp.isEmpty()) { | |
2008 | errln("UnicodeString.tempSubString(99) failed"); | |
2009 | } | |
2010 | temp.fastCopyFrom(longString.tempSubStringBetween(6)); | |
2011 | if(longString.compare(6, INT32_MAX, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer()+6)) { | |
2012 | errln("UnicodeString.tempSubStringBetween(6) failed"); | |
2013 | } | |
2014 | temp.fastCopyFrom(longString.tempSubStringBetween(8, 18)); | |
2015 | if(longString.compare(8, 10, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer()+8)) { | |
2016 | errln("UnicodeString.tempSubStringBetween(8, 18) failed"); | |
2017 | } | |
2018 | UnicodeString bogusString; | |
2019 | bogusString.setToBogus(); | |
2020 | temp.fastCopyFrom(bogusString.tempSubStringBetween(8, 18)); | |
2021 | if(!temp.isBogus()) { | |
2022 | errln("UnicodeString.setToBogus().tempSubStringBetween(8, 18) failed"); | |
2023 | } | |
2024 | } | |
2025 | ||
2026 | void | |
2027 | UnicodeStringTest::doTestAppendable(UnicodeString &dest, Appendable &app) { | |
2028 | static const UChar cde[3]={ 0x63, 0x64, 0x65 }; | |
2029 | static const UChar fg[3]={ 0x66, 0x67, 0 }; | |
2030 | if(!app.reserveAppendCapacity(12)) { | |
2031 | errln("Appendable.reserve(12) failed"); | |
2032 | } | |
2033 | app.appendCodeUnit(0x61); | |
2034 | app.appendCodePoint(0x62); | |
2035 | app.appendCodePoint(0x50000); | |
2036 | app.appendString(cde, 3); | |
2037 | app.appendString(fg, -1); | |
2038 | UChar scratch[3]; | |
2039 | int32_t capacity=-1; | |
2040 | UChar *buffer=app.getAppendBuffer(3, 3, scratch, 3, &capacity); | |
2041 | if(capacity<3) { | |
2042 | errln("Appendable.getAppendBuffer(min=3) returned capacity=%d<3", (int)capacity); | |
2043 | return; | |
2044 | } | |
2045 | static const UChar hij[3]={ 0x68, 0x69, 0x6a }; | |
2046 | u_memcpy(buffer, hij, 3); | |
2047 | app.appendString(buffer, 3); | |
2048 | if(dest!=UNICODE_STRING_SIMPLE("ab\\U00050000cdefghij").unescape()) { | |
2049 | errln("Appendable.append(...) failed"); | |
2050 | } | |
2051 | buffer=app.getAppendBuffer(0, 3, scratch, 3, &capacity); | |
2052 | if(buffer!=NULL || capacity!=0) { | |
2053 | errln("Appendable.getAppendBuffer(min=0) failed"); | |
2054 | } | |
2055 | capacity=1; | |
2056 | buffer=app.getAppendBuffer(3, 3, scratch, 2, &capacity); | |
2057 | if(buffer!=NULL || capacity!=0) { | |
2058 | errln("Appendable.getAppendBuffer(scratch<min) failed"); | |
2059 | } | |
2060 | } | |
2061 | ||
2062 | class SimpleAppendable : public Appendable { | |
2063 | public: | |
2064 | explicit SimpleAppendable(UnicodeString &dest) : str(dest) {} | |
2065 | virtual UBool appendCodeUnit(UChar c) { str.append(c); return TRUE; } | |
2066 | SimpleAppendable &reset() { str.remove(); return *this; } | |
2067 | private: | |
2068 | UnicodeString &str; | |
2069 | }; | |
2070 | ||
2071 | void | |
2072 | UnicodeStringTest::TestAppendable() { | |
2073 | UnicodeString dest; | |
2074 | SimpleAppendable app(dest); | |
2075 | doTestAppendable(dest, app); | |
2076 | } | |
2077 | ||
2078 | void | |
2079 | UnicodeStringTest::TestUnicodeStringImplementsAppendable() { | |
2080 | UnicodeString dest; | |
2081 | UnicodeStringAppendable app(dest); | |
2082 | doTestAppendable(dest, app); | |
2083 | } | |
2084 | ||
2085 | void | |
2086 | UnicodeStringTest::TestSizeofUnicodeString() { | |
2087 | // See the comments in unistr.h near the declaration of UnicodeString's fields. | |
2088 | size_t sizeofUniStr=sizeof(UnicodeString); | |
2089 | size_t expected; | |
2090 | switch(sizeof(void *)) { | |
2091 | case 4: | |
2092 | expected=32; | |
2093 | break; | |
2094 | case 8: | |
2095 | expected=40; | |
2096 | break; | |
2097 | default: | |
2098 | logln("This platform has neither 32-bit nor 64-bit pointers."); | |
2099 | return; | |
2100 | } | |
2101 | if(expected!=sizeofUniStr) { | |
2102 | errln("sizeof(UnicodeString)=%d, expected %d", (int)sizeofUniStr, (int)expected); | |
2103 | } | |
2104 | } |