]>
Commit | Line | Data |
---|---|---|
1 | /******************************************************************** | |
2 | * COPYRIGHT: | |
3 | * Copyright (c) 1997-2012, International Business Machines Corporation and | |
4 | * others. All Rights Reserved. | |
5 | ********************************************************************/ | |
6 | ||
7 | #include "ustrtest.h" | |
8 | #include "unicode/appendable.h" | |
9 | #include "unicode/std_string.h" | |
10 | #include "unicode/unistr.h" | |
11 | #include "unicode/uchar.h" | |
12 | #include "unicode/ustring.h" | |
13 | #include "unicode/locid.h" | |
14 | #include "unicode/ucnv.h" | |
15 | #include "unicode/uenum.h" | |
16 | #include "unicode/utf16.h" | |
17 | #include "cmemory.h" | |
18 | #include "charstr.h" | |
19 | ||
20 | #if 0 | |
21 | #include "unicode/ustream.h" | |
22 | ||
23 | #include <iostream> | |
24 | using namespace std; | |
25 | ||
26 | #endif | |
27 | ||
28 | #define LENGTHOF(array) (int32_t)((sizeof(array)/sizeof((array)[0]))) | |
29 | ||
30 | UnicodeStringTest::~UnicodeStringTest() {} | |
31 | ||
32 | void UnicodeStringTest::runIndexedTest( int32_t index, UBool exec, const char* &name, char *par) | |
33 | { | |
34 | if (exec) logln("TestSuite UnicodeStringTest: "); | |
35 | switch (index) { | |
36 | case 0: | |
37 | name = "StringCaseTest"; | |
38 | if (exec) { | |
39 | logln("StringCaseTest---"); logln(""); | |
40 | StringCaseTest test; | |
41 | callTest(test, par); | |
42 | } | |
43 | break; | |
44 | case 1: name = "TestBasicManipulation"; if (exec) TestBasicManipulation(); break; | |
45 | case 2: name = "TestCompare"; if (exec) TestCompare(); break; | |
46 | case 3: name = "TestExtract"; if (exec) TestExtract(); break; | |
47 | case 4: name = "TestRemoveReplace"; if (exec) TestRemoveReplace(); break; | |
48 | case 5: name = "TestSearching"; if (exec) TestSearching(); break; | |
49 | case 6: name = "TestSpacePadding"; if (exec) TestSpacePadding(); break; | |
50 | case 7: name = "TestPrefixAndSuffix"; if (exec) TestPrefixAndSuffix(); break; | |
51 | case 8: name = "TestFindAndReplace"; if (exec) TestFindAndReplace(); break; | |
52 | case 9: name = "TestBogus"; if (exec) TestBogus(); break; | |
53 | case 10: name = "TestReverse"; if (exec) TestReverse(); break; | |
54 | case 11: name = "TestMiscellaneous"; if (exec) TestMiscellaneous(); break; | |
55 | case 12: name = "TestStackAllocation"; if (exec) TestStackAllocation(); break; | |
56 | case 13: name = "TestUnescape"; if (exec) TestUnescape(); break; | |
57 | case 14: name = "TestCountChar32"; if (exec) TestCountChar32(); break; | |
58 | case 15: name = "TestStringEnumeration"; if (exec) TestStringEnumeration(); break; | |
59 | case 16: name = "TestNameSpace"; if (exec) TestNameSpace(); break; | |
60 | case 17: name = "TestUTF32"; if (exec) TestUTF32(); break; | |
61 | case 18: name = "TestUTF8"; if (exec) TestUTF8(); break; | |
62 | case 19: name = "TestReadOnlyAlias"; if (exec) TestReadOnlyAlias(); break; | |
63 | case 20: name = "TestAppendable"; if (exec) TestAppendable(); break; | |
64 | case 21: name = "TestUnicodeStringImplementsAppendable"; if (exec) TestUnicodeStringImplementsAppendable(); break; | |
65 | case 22: name = "TestSizeofUnicodeString"; if (exec) TestSizeofUnicodeString(); break; | |
66 | case 23: name = "TestStartsWithAndEndsWithNulTerminated"; if (exec) TestStartsWithAndEndsWithNulTerminated(); break; | |
67 | ||
68 | default: name = ""; break; //needed to end loop | |
69 | } | |
70 | } | |
71 | ||
72 | void | |
73 | UnicodeStringTest::TestBasicManipulation() | |
74 | { | |
75 | UnicodeString test1("Now is the time for all men to come swiftly to the aid of the party.\n"); | |
76 | UnicodeString expectedValue; | |
77 | UnicodeString *c; | |
78 | ||
79 | c=(UnicodeString *)test1.clone(); | |
80 | test1.insert(24, "good "); | |
81 | expectedValue = "Now is the time for all good men to come swiftly to the aid of the party.\n"; | |
82 | if (test1 != expectedValue) | |
83 | errln("insert() failed: expected \"" + expectedValue + "\"\n,got \"" + test1 + "\""); | |
84 | ||
85 | c->insert(24, "good "); | |
86 | if(*c != expectedValue) { | |
87 | errln("clone()->insert() failed: expected \"" + expectedValue + "\"\n,got \"" + *c + "\""); | |
88 | } | |
89 | delete c; | |
90 | ||
91 | test1.remove(41, 8); | |
92 | expectedValue = "Now is the time for all good men to come to the aid of the party.\n"; | |
93 | if (test1 != expectedValue) | |
94 | errln("remove() failed: expected \"" + expectedValue + "\"\n,got \"" + test1 + "\""); | |
95 | ||
96 | test1.replace(58, 6, "ir country"); | |
97 | expectedValue = "Now is the time for all good men to come to the aid of their country.\n"; | |
98 | if (test1 != expectedValue) | |
99 | errln("replace() failed: expected \"" + expectedValue + "\"\n,got \"" + test1 + "\""); | |
100 | ||
101 | UChar temp[80]; | |
102 | test1.extract(0, 15, temp); | |
103 | ||
104 | UnicodeString test2(temp, 15); | |
105 | ||
106 | expectedValue = "Now is the time"; | |
107 | if (test2 != expectedValue) | |
108 | errln("extract() failed: expected \"" + expectedValue + "\"\n,got \"" + test2 + "\""); | |
109 | ||
110 | test2 += " for me to go!\n"; | |
111 | expectedValue = "Now is the time for me to go!\n"; | |
112 | if (test2 != expectedValue) | |
113 | errln("operator+=() failed: expected \"" + expectedValue + "\"\n,got \"" + test2 + "\""); | |
114 | ||
115 | if (test1.length() != 70) | |
116 | errln(UnicodeString("length() failed: expected 70, got ") + test1.length()); | |
117 | if (test2.length() != 30) | |
118 | errln(UnicodeString("length() failed: expected 30, got ") + test2.length()); | |
119 | ||
120 | UnicodeString test3; | |
121 | test3.append((UChar32)0x20402); | |
122 | if(test3 != CharsToUnicodeString("\\uD841\\uDC02")){ | |
123 | errln((UnicodeString)"append failed for UChar32, expected \"\\\\ud841\\\\udc02\", got " + prettify(test3)); | |
124 | } | |
125 | if(test3.length() != 2){ | |
126 | errln(UnicodeString("append or length failed for UChar32, expected 2, got ") + test3.length()); | |
127 | } | |
128 | test3.append((UChar32)0x0074); | |
129 | if(test3 != CharsToUnicodeString("\\uD841\\uDC02t")){ | |
130 | errln((UnicodeString)"append failed for UChar32, expected \"\\\\uD841\\\\uDC02t\", got " + prettify(test3)); | |
131 | } | |
132 | if(test3.length() != 3){ | |
133 | errln((UnicodeString)"append or length failed for UChar32, expected 2, got " + test3.length()); | |
134 | } | |
135 | ||
136 | // test some UChar32 overloads | |
137 | if( test3.setTo((UChar32)0x10330).length() != 2 || | |
138 | test3.insert(0, (UChar32)0x20100).length() != 4 || | |
139 | test3.replace(2, 2, (UChar32)0xe0061).length() != 4 || | |
140 | (test3 = (UChar32)0x14001).length() != 2 | |
141 | ) { | |
142 | errln((UnicodeString)"simple UChar32 overloads for replace, insert, setTo or = failed"); | |
143 | } | |
144 | ||
145 | { | |
146 | // test moveIndex32() | |
147 | UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape(); | |
148 | ||
149 | if( | |
150 | s.moveIndex32(2, -1)!=0 || | |
151 | s.moveIndex32(2, 1)!=4 || | |
152 | s.moveIndex32(2, 2)!=5 || | |
153 | s.moveIndex32(5, -2)!=2 || | |
154 | s.moveIndex32(0, -1)!=0 || | |
155 | s.moveIndex32(6, 1)!=6 | |
156 | ) { | |
157 | errln("UnicodeString::moveIndex32() failed"); | |
158 | } | |
159 | ||
160 | if(s.getChar32Start(1)!=0 || s.getChar32Start(2)!=2) { | |
161 | errln("UnicodeString::getChar32Start() failed"); | |
162 | } | |
163 | ||
164 | if(s.getChar32Limit(1)!=2 || s.getChar32Limit(2)!=2) { | |
165 | errln("UnicodeString::getChar32Limit() failed"); | |
166 | } | |
167 | } | |
168 | ||
169 | { | |
170 | // test new 2.2 constructors and setTo function that parallel Java's substring function. | |
171 | UnicodeString src("Hello folks how are you?"); | |
172 | UnicodeString target1("how are you?"); | |
173 | if (target1 != UnicodeString(src, 12)) { | |
174 | errln("UnicodeString(const UnicodeString&, int32_t) failed"); | |
175 | } | |
176 | UnicodeString target2("folks"); | |
177 | if (target2 != UnicodeString(src, 6, 5)) { | |
178 | errln("UnicodeString(const UnicodeString&, int32_t, int32_t) failed"); | |
179 | } | |
180 | if (target1 != target2.setTo(src, 12)) { | |
181 | errln("UnicodeString::setTo(const UnicodeString&, int32_t) failed"); | |
182 | } | |
183 | } | |
184 | ||
185 | { | |
186 | // op+ is new in ICU 2.8 | |
187 | UnicodeString s=UnicodeString("abc", "")+UnicodeString("def", "")+UnicodeString("ghi", ""); | |
188 | if(s!=UnicodeString("abcdefghi", "")) { | |
189 | errln("operator+(UniStr, UniStr) failed"); | |
190 | } | |
191 | } | |
192 | ||
193 | { | |
194 | // tests for Jitterbug 2360 | |
195 | // verify that APIs with source pointer + length accept length == -1 | |
196 | // mostly test only where modified, only few functions did not already do this | |
197 | if(UnicodeString("abc", -1, "")!=UnicodeString("abc", "")) { | |
198 | errln("UnicodeString(codepageData, dataLength, codepage) does not work with dataLength==-1"); | |
199 | } | |
200 | ||
201 | UChar buffer[10]={ 0x61, 0x62, 0x20ac, 0xd900, 0xdc05, 0, 0x62, 0xffff, 0xdbff, 0xdfff }; | |
202 | UnicodeString s, t(buffer, -1, LENGTHOF(buffer)); | |
203 | ||
204 | if(s.setTo(buffer, -1, LENGTHOF(buffer)).length()!=u_strlen(buffer)) { | |
205 | errln("UnicodeString.setTo(buffer, length, capacity) does not work with length==-1"); | |
206 | } | |
207 | if(t.length()!=u_strlen(buffer)) { | |
208 | errln("UnicodeString(buffer, length, capacity) does not work with length==-1"); | |
209 | } | |
210 | ||
211 | if(0!=s.caseCompare(buffer, -1, U_FOLD_CASE_DEFAULT)) { | |
212 | errln("UnicodeString.caseCompare(const UChar *, length, options) does not work with length==-1"); | |
213 | } | |
214 | if(0!=s.caseCompare(0, s.length(), buffer, U_FOLD_CASE_DEFAULT)) { | |
215 | errln("UnicodeString.caseCompare(start, _length, const UChar *, options) does not work"); | |
216 | } | |
217 | ||
218 | buffer[u_strlen(buffer)]=0xe4; | |
219 | UnicodeString u(buffer, -1, LENGTHOF(buffer)); | |
220 | if(s.setTo(buffer, -1, LENGTHOF(buffer)).length()!=LENGTHOF(buffer)) { | |
221 | errln("UnicodeString.setTo(buffer without NUL, length, capacity) does not work with length==-1"); | |
222 | } | |
223 | if(u.length()!=LENGTHOF(buffer)) { | |
224 | errln("UnicodeString(buffer without NUL, length, capacity) does not work with length==-1"); | |
225 | } | |
226 | ||
227 | static const char cs[]={ 0x61, (char)0xe4, (char)0x85, 0 }; | |
228 | UConverter *cnv; | |
229 | UErrorCode errorCode=U_ZERO_ERROR; | |
230 | ||
231 | cnv=ucnv_open("ISO-8859-1", &errorCode); | |
232 | UnicodeString v(cs, -1, cnv, errorCode); | |
233 | ucnv_close(cnv); | |
234 | if(v!=CharsToUnicodeString("a\\xe4\\x85")) { | |
235 | errln("UnicodeString(const char *, length, cnv, errorCode) does not work with length==-1"); | |
236 | } | |
237 | } | |
238 | ||
239 | #if U_CHARSET_IS_UTF8 | |
240 | { | |
241 | // Test the hardcoded-UTF-8 UnicodeString optimizations. | |
242 | static const uint8_t utf8[]={ 0x61, 0xC3, 0xA4, 0xC3, 0x9F, 0xE4, 0xB8, 0x80, 0 }; | |
243 | static const UChar utf16[]={ 0x61, 0xE4, 0xDF, 0x4E00 }; | |
244 | UnicodeString from8a = UnicodeString((const char *)utf8); | |
245 | UnicodeString from8b = UnicodeString((const char *)utf8, (int32_t)sizeof(utf8)-1); | |
246 | UnicodeString from16(FALSE, utf16, LENGTHOF(utf16)); | |
247 | if(from8a != from16 || from8b != from16) { | |
248 | errln("UnicodeString(const char * U_CHARSET_IS_UTF8) failed"); | |
249 | } | |
250 | char buffer[16]; | |
251 | int32_t length8=from16.extract(0, 0x7fffffff, buffer, (uint32_t)sizeof(buffer)); | |
252 | if(length8!=((int32_t)sizeof(utf8)-1) || 0!=uprv_memcmp(buffer, utf8, sizeof(utf8))) { | |
253 | errln("UnicodeString::extract(char * U_CHARSET_IS_UTF8) failed"); | |
254 | } | |
255 | length8=from16.extract(1, 2, buffer, (uint32_t)sizeof(buffer)); | |
256 | if(length8!=4 || buffer[length8]!=0 || 0!=uprv_memcmp(buffer, utf8+1, length8)) { | |
257 | errln("UnicodeString::extract(substring to char * U_CHARSET_IS_UTF8) failed"); | |
258 | } | |
259 | } | |
260 | #endif | |
261 | } | |
262 | ||
263 | void | |
264 | UnicodeStringTest::TestCompare() | |
265 | { | |
266 | UnicodeString test1("this is a test"); | |
267 | UnicodeString test2("this is a test"); | |
268 | UnicodeString test3("this is a test of the emergency broadcast system"); | |
269 | UnicodeString test4("never say, \"this is a test\"!!"); | |
270 | ||
271 | UnicodeString test5((UChar)0x5000); | |
272 | UnicodeString test6((UChar)0x5100); | |
273 | ||
274 | UChar uniChars[] = { 0x74, 0x68, 0x69, 0x73, 0x20, 0x69, 0x73, | |
275 | 0x20, 0x61, 0x20, 0x74, 0x65, 0x73, 0x74, 0 }; | |
276 | char chars[] = "this is a test"; | |
277 | ||
278 | // test operator== and operator!= | |
279 | if (test1 != test2 || test1 == test3 || test1 == test4) | |
280 | errln("operator== or operator!= failed"); | |
281 | ||
282 | // test operator> and operator< | |
283 | if (test1 > test2 || test1 < test2 || !(test1 < test3) || !(test1 > test4) || | |
284 | !(test5 < test6) | |
285 | ) { | |
286 | errln("operator> or operator< failed"); | |
287 | } | |
288 | ||
289 | // test operator>= and operator<= | |
290 | if (!(test1 >= test2) || !(test1 <= test2) || !(test1 <= test3) || !(test1 >= test4)) | |
291 | errln("operator>= or operator<= failed"); | |
292 | ||
293 | // test compare(UnicodeString) | |
294 | if (test1.compare(test2) != 0 || test1.compare(test3) >= 0 || test1.compare(test4) <= 0) | |
295 | errln("compare(UnicodeString) failed"); | |
296 | ||
297 | //test compare(offset, length, UnicodeString) | |
298 | if(test1.compare(0, 14, test2) != 0 || | |
299 | test3.compare(0, 14, test2) != 0 || | |
300 | test4.compare(12, 14, test2) != 0 || | |
301 | test3.compare(0, 18, test1) <=0 ) | |
302 | errln("compare(offset, length, UnicodeString) failes"); | |
303 | ||
304 | // test compare(UChar*) | |
305 | if (test2.compare(uniChars) != 0 || test3.compare(uniChars) <= 0 || test4.compare(uniChars) >= 0) | |
306 | errln("compare(UChar*) failed"); | |
307 | ||
308 | // test compare(char*) | |
309 | if (test2.compare(chars) != 0 || test3.compare(chars) <= 0 || test4.compare(chars) >= 0) | |
310 | errln("compare(char*) failed"); | |
311 | ||
312 | // test compare(UChar*, length) | |
313 | if (test1.compare(uniChars, 4) <= 0 || test1.compare(uniChars, 4) <= 0) | |
314 | errln("compare(UChar*, length) failed"); | |
315 | ||
316 | // test compare(thisOffset, thisLength, that, thatOffset, thatLength) | |
317 | if (test1.compare(0, 14, test2, 0, 14) != 0 | |
318 | || test1.compare(0, 14, test3, 0, 14) != 0 | |
319 | || test1.compare(0, 14, test4, 12, 14) != 0) | |
320 | errln("1. compare(thisOffset, thisLength, that, thatOffset, thatLength) failed"); | |
321 | ||
322 | if (test1.compare(10, 4, test2, 0, 4) >= 0 | |
323 | || test1.compare(10, 4, test3, 22, 9) <= 0 | |
324 | || test1.compare(10, 4, test4, 22, 4) != 0) | |
325 | errln("2. compare(thisOffset, thisLength, that, thatOffset, thatLength) failed"); | |
326 | ||
327 | // test compareBetween | |
328 | if (test1.compareBetween(0, 14, test2, 0, 14) != 0 || test1.compareBetween(0, 14, test3, 0, 14) != 0 | |
329 | || test1.compareBetween(0, 14, test4, 12, 26) != 0) | |
330 | errln("compareBetween failed"); | |
331 | ||
332 | if (test1.compareBetween(10, 14, test2, 0, 4) >= 0 || test1.compareBetween(10, 14, test3, 22, 31) <= 0 | |
333 | || test1.compareBetween(10, 14, test4, 22, 26) != 0) | |
334 | errln("compareBetween failed"); | |
335 | ||
336 | // test compare() etc. with strings that share a buffer but are not equal | |
337 | test2=test1; // share the buffer, length() too large for the stackBuffer | |
338 | test2.truncate(1); // change only the length, not the buffer | |
339 | if( test1==test2 || test1<=test2 || | |
340 | test1.compare(test2)<=0 || | |
341 | test1.compareCodePointOrder(test2)<=0 || | |
342 | test1.compareCodePointOrder(0, INT32_MAX, test2)<=0 || | |
343 | test1.compareCodePointOrder(0, INT32_MAX, test2, 0, INT32_MAX)<=0 || | |
344 | test1.compareCodePointOrderBetween(0, INT32_MAX, test2, 0, INT32_MAX)<=0 || | |
345 | test1.caseCompare(test2, U_FOLD_CASE_DEFAULT)<=0 | |
346 | ) { | |
347 | errln("UnicodeStrings that share a buffer but have different lengths compare as equal"); | |
348 | } | |
349 | ||
350 | /* test compareCodePointOrder() */ | |
351 | { | |
352 | /* these strings are in ascending order */ | |
353 | static const UChar strings[][4]={ | |
354 | { 0x61, 0 }, /* U+0061 */ | |
355 | { 0x20ac, 0xd801, 0 }, /* U+20ac U+d801 */ | |
356 | { 0x20ac, 0xd800, 0xdc00, 0 }, /* U+20ac U+10000 */ | |
357 | { 0xd800, 0 }, /* U+d800 */ | |
358 | { 0xd800, 0xff61, 0 }, /* U+d800 U+ff61 */ | |
359 | { 0xdfff, 0 }, /* U+dfff */ | |
360 | { 0xff61, 0xdfff, 0 }, /* U+ff61 U+dfff */ | |
361 | { 0xff61, 0xd800, 0xdc02, 0 }, /* U+ff61 U+10002 */ | |
362 | { 0xd800, 0xdc02, 0 }, /* U+10002 */ | |
363 | { 0xd84d, 0xdc56, 0 } /* U+23456 */ | |
364 | }; | |
365 | UnicodeString u[20]; // must be at least as long as strings[] | |
366 | int32_t i; | |
367 | ||
368 | for(i=0; i<(int32_t)(sizeof(strings)/sizeof(strings[0])); ++i) { | |
369 | u[i]=UnicodeString(TRUE, strings[i], -1); | |
370 | } | |
371 | ||
372 | for(i=0; i<(int32_t)(sizeof(strings)/sizeof(strings[0])-1); ++i) { | |
373 | if(u[i].compareCodePointOrder(u[i+1])>=0 || u[i].compareCodePointOrder(0, INT32_MAX, u[i+1].getBuffer())>=0) { | |
374 | errln("error: UnicodeString::compareCodePointOrder() fails for string %d and the following one\n", i); | |
375 | } | |
376 | } | |
377 | } | |
378 | ||
379 | /* test caseCompare() */ | |
380 | { | |
381 | static const UChar | |
382 | _mixed[]= { 0x61, 0x42, 0x131, 0x3a3, 0xdf, 0x130, 0x49, 0xfb03, 0xd93f, 0xdfff, 0 }, | |
383 | _otherDefault[]= { 0x41, 0x62, 0x131, 0x3c3, 0x73, 0x53, 0x69, 0x307, 0x69, 0x46, 0x66, 0x49, 0xd93f, 0xdfff, 0 }, | |
384 | _otherExcludeSpecialI[]={ 0x41, 0x62, 0x131, 0x3c3, 0x53, 0x73, 0x69, 0x131, 0x66, 0x46, 0x69, 0xd93f, 0xdfff, 0 }, | |
385 | _different[]= { 0x41, 0x62, 0x131, 0x3c3, 0x73, 0x53, 0x130, 0x49, 0x46, 0x66, 0x49, 0xd93f, 0xdffd, 0 }; | |
386 | ||
387 | UnicodeString | |
388 | mixed(TRUE, _mixed, -1), | |
389 | otherDefault(TRUE, _otherDefault, -1), | |
390 | otherExcludeSpecialI(TRUE, _otherExcludeSpecialI, -1), | |
391 | different(TRUE, _different, -1); | |
392 | ||
393 | int8_t result; | |
394 | ||
395 | /* test caseCompare() */ | |
396 | result=mixed.caseCompare(otherDefault, U_FOLD_CASE_DEFAULT); | |
397 | if(result!=0 || 0!=mixed.caseCompareBetween(0, INT32_MAX, otherDefault, 0, INT32_MAX, U_FOLD_CASE_DEFAULT)) { | |
398 | errln("error: mixed.caseCompare(other, default)=%ld instead of 0\n", result); | |
399 | } | |
400 | result=mixed.caseCompare(otherExcludeSpecialI, U_FOLD_CASE_EXCLUDE_SPECIAL_I); | |
401 | if(result!=0) { | |
402 | errln("error: mixed.caseCompare(otherExcludeSpecialI, U_FOLD_CASE_EXCLUDE_SPECIAL_I)=%ld instead of 0\n", result); | |
403 | } | |
404 | result=mixed.caseCompare(otherDefault, U_FOLD_CASE_EXCLUDE_SPECIAL_I); | |
405 | if(result==0 || 0==mixed.caseCompareBetween(0, INT32_MAX, otherDefault, 0, INT32_MAX, U_FOLD_CASE_EXCLUDE_SPECIAL_I)) { | |
406 | errln("error: mixed.caseCompare(other, U_FOLD_CASE_EXCLUDE_SPECIAL_I)=0 instead of !=0\n"); | |
407 | } | |
408 | ||
409 | /* test caseCompare() */ | |
410 | result=mixed.caseCompare(different, U_FOLD_CASE_DEFAULT); | |
411 | if(result<=0) { | |
412 | errln("error: mixed.caseCompare(different, default)=%ld instead of positive\n", result); | |
413 | } | |
414 | ||
415 | /* test caseCompare() - include the folded sharp s (U+00df) with different lengths */ | |
416 | result=mixed.caseCompare(1, 4, different, 1, 5, U_FOLD_CASE_DEFAULT); | |
417 | if(result!=0 || 0!=mixed.caseCompareBetween(1, 5, different, 1, 6, U_FOLD_CASE_DEFAULT)) { | |
418 | errln("error: mixed.caseCompare(mixed, 1, 4, different, 1, 5, default)=%ld instead of 0\n", result); | |
419 | } | |
420 | ||
421 | /* test caseCompare() - stop in the middle of the sharp s (U+00df) */ | |
422 | result=mixed.caseCompare(1, 4, different, 1, 4, U_FOLD_CASE_DEFAULT); | |
423 | if(result<=0) { | |
424 | errln("error: mixed.caseCompare(1, 4, different, 1, 4, default)=%ld instead of positive\n", result); | |
425 | } | |
426 | } | |
427 | ||
428 | // test that srcLength=-1 is handled in functions that | |
429 | // take input const UChar */int32_t srcLength (j785) | |
430 | { | |
431 | static const UChar u[]={ 0x61, 0x308, 0x62, 0 }; | |
432 | UnicodeString s=UNICODE_STRING("a\\u0308b", 8).unescape(); | |
433 | ||
434 | if(s.compare(u, -1)!=0 || s.compare(0, 999, u, 0, -1)!=0) { | |
435 | errln("error UnicodeString::compare(..., const UChar *, srcLength=-1) does not work"); | |
436 | } | |
437 | ||
438 | if(s.compareCodePointOrder(u, -1)!=0 || s.compareCodePointOrder(0, 999, u, 0, -1)!=0) { | |
439 | errln("error UnicodeString::compareCodePointOrder(..., const UChar *, srcLength=-1, ...) does not work"); | |
440 | } | |
441 | ||
442 | if(s.caseCompare(u, -1, U_FOLD_CASE_DEFAULT)!=0 || s.caseCompare(0, 999, u, 0, -1, U_FOLD_CASE_DEFAULT)!=0) { | |
443 | errln("error UnicodeString::caseCompare(..., const UChar *, srcLength=-1, ...) does not work"); | |
444 | } | |
445 | ||
446 | if(s.indexOf(u, 1, -1, 0, 999)!=1 || s.indexOf(u+1, -1, 0, 999)!=1 || s.indexOf(u+1, -1, 0)!=1) { | |
447 | errln("error UnicodeString::indexOf(const UChar *, srcLength=-1, ...) does not work"); | |
448 | } | |
449 | ||
450 | if(s.lastIndexOf(u, 1, -1, 0, 999)!=1 || s.lastIndexOf(u+1, -1, 0, 999)!=1 || s.lastIndexOf(u+1, -1, 0)!=1) { | |
451 | errln("error UnicodeString::lastIndexOf(const UChar *, srcLength=-1, ...) does not work"); | |
452 | } | |
453 | ||
454 | UnicodeString s2, s3; | |
455 | s2.replace(0, 0, u+1, -1); | |
456 | s3.replace(0, 0, u, 1, -1); | |
457 | if(s.compare(1, 999, s2)!=0 || s2!=s3) { | |
458 | errln("error UnicodeString::replace(..., const UChar *, srcLength=-1, ...) does not work"); | |
459 | } | |
460 | } | |
461 | } | |
462 | ||
463 | void | |
464 | UnicodeStringTest::TestExtract() | |
465 | { | |
466 | UnicodeString test1("Now is the time for all good men to come to the aid of their country.", ""); | |
467 | UnicodeString test2; | |
468 | UChar test3[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13}; | |
469 | char test4[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13}; | |
470 | UnicodeString test5; | |
471 | char test6[13] = {1, 2, 3, 4, 5, 6, 7, 8, 8, 10, 11, 12, 13}; | |
472 | ||
473 | test1.extract(11, 12, test2); | |
474 | test1.extract(11, 12, test3); | |
475 | if (test1.extract(11, 12, test4) != 12 || test4[12] != 0) { | |
476 | errln("UnicodeString.extract(char *) failed to return the correct size of destination buffer."); | |
477 | } | |
478 | ||
479 | // test proper pinning in extractBetween() | |
480 | test1.extractBetween(-3, 7, test5); | |
481 | if(test5!=UNICODE_STRING("Now is ", 7)) { | |
482 | errln("UnicodeString.extractBetween(-3, 7) did not pin properly."); | |
483 | } | |
484 | ||
485 | test1.extractBetween(11, 23, test5); | |
486 | if (test1.extract(60, 71, test6) != 9) { | |
487 | errln("UnicodeString.extract() failed to return the correct size of destination buffer for end of buffer."); | |
488 | } | |
489 | if (test1.extract(11, 12, test6) != 12) { | |
490 | errln("UnicodeString.extract() failed to return the correct size of destination buffer."); | |
491 | } | |
492 | ||
493 | // convert test4 back to Unicode for comparison | |
494 | UnicodeString test4b(test4, 12); | |
495 | ||
496 | if (test1.extract(11, 12, (char *)NULL) != 12) { | |
497 | errln("UnicodeString.extract(NULL) failed to return the correct size of destination buffer."); | |
498 | } | |
499 | if (test1.extract(11, -1, test6) != 0) { | |
500 | errln("UnicodeString.extract(-1) failed to stop reading the string."); | |
501 | } | |
502 | ||
503 | for (int32_t i = 0; i < 12; i++) { | |
504 | if (test1.charAt((int32_t)(11 + i)) != test2.charAt(i)) { | |
505 | errln(UnicodeString("extracting into a UnicodeString failed at position ") + i); | |
506 | break; | |
507 | } | |
508 | if (test1.charAt((int32_t)(11 + i)) != test3[i]) { | |
509 | errln(UnicodeString("extracting into an array of UChar failed at position ") + i); | |
510 | break; | |
511 | } | |
512 | if (((char)test1.charAt((int32_t)(11 + i))) != test4b.charAt(i)) { | |
513 | errln(UnicodeString("extracting into an array of char failed at position ") + i); | |
514 | break; | |
515 | } | |
516 | if (test1.charAt((int32_t)(11 + i)) != test5.charAt(i)) { | |
517 | errln(UnicodeString("extracting with extractBetween failed at position ") + i); | |
518 | break; | |
519 | } | |
520 | } | |
521 | ||
522 | // test preflighting and overflows with invariant conversion | |
523 | if (test1.extract(0, 10, (char *)NULL, "") != 10) { | |
524 | errln("UnicodeString.extract(0, 10, (char *)NULL, \"\") != 10"); | |
525 | } | |
526 | ||
527 | test4[2] = (char)0xff; | |
528 | if (test1.extract(0, 10, test4, 2, "") != 10) { | |
529 | errln("UnicodeString.extract(0, 10, test4, 2, \"\") != 10"); | |
530 | } | |
531 | if (test4[2] != (char)0xff) { | |
532 | errln("UnicodeString.extract(0, 10, test4, 2, \"\") overwrote test4[2]"); | |
533 | } | |
534 | ||
535 | { | |
536 | // test new, NUL-terminating extract() function | |
537 | UnicodeString s("terminate", ""); | |
538 | UChar dest[20]={ | |
539 | 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, | |
540 | 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5, 0xa5 | |
541 | }; | |
542 | UErrorCode errorCode; | |
543 | int32_t length; | |
544 | ||
545 | errorCode=U_ZERO_ERROR; | |
546 | length=s.extract((UChar *)NULL, 0, errorCode); | |
547 | if(errorCode!=U_BUFFER_OVERFLOW_ERROR || length!=s.length()) { | |
548 | errln("UnicodeString.extract(NULL, 0)==%d (%s) expected %d (U_BUFFER_OVERFLOW_ERROR)", length, s.length(), u_errorName(errorCode)); | |
549 | } | |
550 | ||
551 | errorCode=U_ZERO_ERROR; | |
552 | length=s.extract(dest, s.length()-1, errorCode); | |
553 | if(errorCode!=U_BUFFER_OVERFLOW_ERROR || length!=s.length()) { | |
554 | errln("UnicodeString.extract(dest too short)==%d (%s) expected %d (U_BUFFER_OVERFLOW_ERROR)", | |
555 | length, u_errorName(errorCode), s.length()); | |
556 | } | |
557 | ||
558 | errorCode=U_ZERO_ERROR; | |
559 | length=s.extract(dest, s.length(), errorCode); | |
560 | if(errorCode!=U_STRING_NOT_TERMINATED_WARNING || length!=s.length()) { | |
561 | errln("UnicodeString.extract(dest just right without NUL)==%d (%s) expected %d (U_STRING_NOT_TERMINATED_WARNING)", | |
562 | length, u_errorName(errorCode), s.length()); | |
563 | } | |
564 | if(dest[length-1]!=s[length-1] || dest[length]!=0xa5) { | |
565 | errln("UnicodeString.extract(dest just right without NUL) did not extract the string correctly"); | |
566 | } | |
567 | ||
568 | errorCode=U_ZERO_ERROR; | |
569 | length=s.extract(dest, s.length()+1, errorCode); | |
570 | if(errorCode!=U_ZERO_ERROR || length!=s.length()) { | |
571 | errln("UnicodeString.extract(dest large enough)==%d (%s) expected %d (U_ZERO_ERROR)", | |
572 | length, u_errorName(errorCode), s.length()); | |
573 | } | |
574 | if(dest[length-1]!=s[length-1] || dest[length]!=0 || dest[length+1]!=0xa5) { | |
575 | errln("UnicodeString.extract(dest large enough) did not extract the string correctly"); | |
576 | } | |
577 | } | |
578 | ||
579 | { | |
580 | // test new UConverter extract() and constructor | |
581 | UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape(); | |
582 | char buffer[32]; | |
583 | static const char expect[]={ | |
584 | (char)0xf0, (char)0xaf, (char)0xa6, (char)0x99, | |
585 | (char)0xf0, (char)0x9d, (char)0x85, (char)0x9f, | |
586 | (char)0xc3, (char)0x84, | |
587 | (char)0xe1, (char)0xbb, (char)0x90 | |
588 | }; | |
589 | UErrorCode errorCode=U_ZERO_ERROR; | |
590 | UConverter *cnv=ucnv_open("UTF-8", &errorCode); | |
591 | int32_t length; | |
592 | ||
593 | if(U_SUCCESS(errorCode)) { | |
594 | // test preflighting | |
595 | if( (length=s.extract(NULL, 0, cnv, errorCode))!=13 || | |
596 | errorCode!=U_BUFFER_OVERFLOW_ERROR | |
597 | ) { | |
598 | errln("UnicodeString::extract(NULL, UConverter) preflighting failed (length=%ld, %s)", | |
599 | length, u_errorName(errorCode)); | |
600 | } | |
601 | errorCode=U_ZERO_ERROR; | |
602 | if( (length=s.extract(buffer, 2, cnv, errorCode))!=13 || | |
603 | errorCode!=U_BUFFER_OVERFLOW_ERROR | |
604 | ) { | |
605 | errln("UnicodeString::extract(too small, UConverter) preflighting failed (length=%ld, %s)", | |
606 | length, u_errorName(errorCode)); | |
607 | } | |
608 | ||
609 | // try error cases | |
610 | errorCode=U_ZERO_ERROR; | |
611 | if( s.extract(NULL, 2, cnv, errorCode)==13 || U_SUCCESS(errorCode)) { | |
612 | errln("UnicodeString::extract(UConverter) succeeded with an illegal destination"); | |
613 | } | |
614 | errorCode=U_ILLEGAL_ARGUMENT_ERROR; | |
615 | if( s.extract(NULL, 0, cnv, errorCode)==13 || U_SUCCESS(errorCode)) { | |
616 | errln("UnicodeString::extract(UConverter) succeeded with a previous error code"); | |
617 | } | |
618 | errorCode=U_ZERO_ERROR; | |
619 | ||
620 | // extract for real | |
621 | if( (length=s.extract(buffer, sizeof(buffer), cnv, errorCode))!=13 || | |
622 | uprv_memcmp(buffer, expect, 13)!=0 || | |
623 | buffer[13]!=0 || | |
624 | U_FAILURE(errorCode) | |
625 | ) { | |
626 | errln("UnicodeString::extract(UConverter) conversion failed (length=%ld, %s)", | |
627 | length, u_errorName(errorCode)); | |
628 | } | |
629 | // Test again with just the converter name. | |
630 | if( (length=s.extract(0, s.length(), buffer, sizeof(buffer), "UTF-8"))!=13 || | |
631 | uprv_memcmp(buffer, expect, 13)!=0 || | |
632 | buffer[13]!=0 || | |
633 | U_FAILURE(errorCode) | |
634 | ) { | |
635 | errln("UnicodeString::extract(\"UTF-8\") conversion failed (length=%ld, %s)", | |
636 | length, u_errorName(errorCode)); | |
637 | } | |
638 | ||
639 | // try the constructor | |
640 | UnicodeString t(expect, sizeof(expect), cnv, errorCode); | |
641 | if(U_FAILURE(errorCode) || s!=t) { | |
642 | errln("UnicodeString(UConverter) conversion failed (%s)", | |
643 | u_errorName(errorCode)); | |
644 | } | |
645 | ||
646 | ucnv_close(cnv); | |
647 | } | |
648 | } | |
649 | } | |
650 | ||
651 | void | |
652 | UnicodeStringTest::TestRemoveReplace() | |
653 | { | |
654 | UnicodeString test1("The rain in Spain stays mainly on the plain"); | |
655 | UnicodeString test2("eat SPAMburgers!"); | |
656 | UChar test3[] = { 0x53, 0x50, 0x41, 0x4d, 0x4d, 0 }; | |
657 | char test4[] = "SPAM"; | |
658 | UnicodeString& test5 = test1; | |
659 | ||
660 | test1.replace(4, 4, test2, 4, 4); | |
661 | test1.replace(12, 5, test3, 4); | |
662 | test3[4] = 0; | |
663 | test1.replace(17, 4, test3); | |
664 | test1.replace(23, 4, test4); | |
665 | test1.replaceBetween(37, 42, test2, 4, 8); | |
666 | ||
667 | if (test1 != "The SPAM in SPAM SPAMs SPAMly on the SPAM") | |
668 | errln("One of the replace methods failed:\n" | |
669 | " expected \"The SPAM in SPAM SPAMs SPAMly on the SPAM\",\n" | |
670 | " got \"" + test1 + "\""); | |
671 | ||
672 | test1.remove(21, 1); | |
673 | test1.removeBetween(26, 28); | |
674 | ||
675 | if (test1 != "The SPAM in SPAM SPAM SPAM on the SPAM") | |
676 | errln("One of the remove methods failed:\n" | |
677 | " expected \"The SPAM in SPAM SPAM SPAM on the SPAM\",\n" | |
678 | " got \"" + test1 + "\""); | |
679 | ||
680 | for (int32_t i = 0; i < test1.length(); i++) { | |
681 | if (test5[i] != 0x53 && test5[i] != 0x50 && test5[i] != 0x41 && test5[i] != 0x4d && test5[i] != 0x20) { | |
682 | test1.setCharAt(i, 0x78); | |
683 | } | |
684 | } | |
685 | ||
686 | if (test1 != "xxx SPAM xx SPAM SPAM SPAM xx xxx SPAM") | |
687 | errln("One of the remove methods failed:\n" | |
688 | " expected \"xxx SPAM xx SPAM SPAM SPAM xx xxx SPAM\",\n" | |
689 | " got \"" + test1 + "\""); | |
690 | ||
691 | test1.remove(); | |
692 | if (test1.length() != 0) | |
693 | errln("Remove() failed: expected empty string, got \"" + test1 + "\""); | |
694 | } | |
695 | ||
696 | void | |
697 | UnicodeStringTest::TestSearching() | |
698 | { | |
699 | UnicodeString test1("test test ttest tetest testesteststt"); | |
700 | UnicodeString test2("test"); | |
701 | UChar testChar = 0x74; | |
702 | ||
703 | UChar32 testChar32 = 0x20402; | |
704 | UChar testData[]={ | |
705 | // 0 1 2 3 4 5 6 7 | |
706 | 0xd841, 0xdc02, 0x0071, 0xdc02, 0xd841, 0x0071, 0xd841, 0xdc02, | |
707 | ||
708 | // 8 9 10 11 12 13 14 15 | |
709 | 0x0071, 0x0072, 0xd841, 0xdc02, 0x0071, 0xd841, 0xdc02, 0x0071, | |
710 | ||
711 | // 16 17 18 19 | |
712 | 0xdc02, 0xd841, 0x0073, 0x0000 | |
713 | }; | |
714 | UnicodeString test3(testData); | |
715 | UnicodeString test4(testChar32); | |
716 | ||
717 | uint16_t occurrences = 0; | |
718 | int32_t startPos = 0; | |
719 | for ( ; | |
720 | startPos != -1 && startPos < test1.length(); | |
721 | (startPos = test1.indexOf(test2, startPos)) != -1 ? (++occurrences, startPos += 4) : 0) | |
722 | ; | |
723 | if (occurrences != 6) | |
724 | errln(UnicodeString("indexOf failed: expected to find 6 occurrences, found ") + occurrences); | |
725 | ||
726 | for ( occurrences = 0, startPos = 10; | |
727 | startPos != -1 && startPos < test1.length(); | |
728 | (startPos = test1.indexOf(test2, startPos)) != -1 ? (++occurrences, startPos += 4) : 0) | |
729 | ; | |
730 | if (occurrences != 4) | |
731 | errln(UnicodeString("indexOf with starting offset failed: " | |
732 | "expected to find 4 occurrences, found ") + occurrences); | |
733 | ||
734 | int32_t endPos = 28; | |
735 | for ( occurrences = 0, startPos = 5; | |
736 | startPos != -1 && startPos < test1.length(); | |
737 | (startPos = test1.indexOf(test2, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 4) : 0) | |
738 | ; | |
739 | if (occurrences != 4) | |
740 | errln(UnicodeString("indexOf with starting and ending offsets failed: " | |
741 | "expected to find 4 occurrences, found ") + occurrences); | |
742 | ||
743 | //using UChar32 string | |
744 | for ( startPos=0, occurrences=0; | |
745 | startPos != -1 && startPos < test3.length(); | |
746 | (startPos = test3.indexOf(test4, startPos)) != -1 ? (++occurrences, startPos += 2) : 0) | |
747 | ; | |
748 | if (occurrences != 4) | |
749 | errln((UnicodeString)"indexOf failed: expected to find 4 occurrences, found " + occurrences); | |
750 | ||
751 | for ( startPos=10, occurrences=0; | |
752 | startPos != -1 && startPos < test3.length(); | |
753 | (startPos = test3.indexOf(test4, startPos)) != -1 ? (++occurrences, startPos += 2) : 0) | |
754 | ; | |
755 | if (occurrences != 2) | |
756 | errln(UnicodeString("indexOf failed: expected to find 2 occurrences, found ") + occurrences); | |
757 | //--- | |
758 | ||
759 | for ( occurrences = 0, startPos = 0; | |
760 | startPos != -1 && startPos < test1.length(); | |
761 | (startPos = test1.indexOf(testChar, startPos)) != -1 ? (++occurrences, startPos += 1) : 0) | |
762 | ; | |
763 | if (occurrences != 16) | |
764 | errln(UnicodeString("indexOf with character failed: " | |
765 | "expected to find 16 occurrences, found ") + occurrences); | |
766 | ||
767 | for ( occurrences = 0, startPos = 10; | |
768 | startPos != -1 && startPos < test1.length(); | |
769 | (startPos = test1.indexOf(testChar, startPos)) != -1 ? (++occurrences, startPos += 1) : 0) | |
770 | ; | |
771 | if (occurrences != 12) | |
772 | errln(UnicodeString("indexOf with character & start offset failed: " | |
773 | "expected to find 12 occurrences, found ") + occurrences); | |
774 | ||
775 | for ( occurrences = 0, startPos = 5, endPos = 28; | |
776 | startPos != -1 && startPos < test1.length(); | |
777 | (startPos = test1.indexOf(testChar, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 1) : 0) | |
778 | ; | |
779 | if (occurrences != 10) | |
780 | errln(UnicodeString("indexOf with character & start & end offsets failed: " | |
781 | "expected to find 10 occurrences, found ") + occurrences); | |
782 | ||
783 | //testing for UChar32 | |
784 | UnicodeString subString; | |
785 | for( occurrences =0, startPos=0; startPos < test3.length(); startPos +=1){ | |
786 | subString.append(test3, startPos, test3.length()); | |
787 | if(subString.indexOf(testChar32) != -1 ){ | |
788 | ++occurrences; | |
789 | } | |
790 | subString.remove(); | |
791 | } | |
792 | if (occurrences != 14) | |
793 | errln((UnicodeString)"indexOf failed: expected to find 14 occurrences, found " + occurrences); | |
794 | ||
795 | for ( occurrences = 0, startPos = 0; | |
796 | startPos != -1 && startPos < test3.length(); | |
797 | (startPos = test3.indexOf(testChar32, startPos)) != -1 ? (++occurrences, startPos += 1) : 0) | |
798 | ; | |
799 | if (occurrences != 4) | |
800 | errln((UnicodeString)"indexOf failed: expected to find 4 occurrences, found " + occurrences); | |
801 | ||
802 | endPos=test3.length(); | |
803 | for ( occurrences = 0, startPos = 5; | |
804 | startPos != -1 && startPos < test3.length(); | |
805 | (startPos = test3.indexOf(testChar32, startPos, endPos - startPos)) != -1 ? (++occurrences, startPos += 1) : 0) | |
806 | ; | |
807 | if (occurrences != 3) | |
808 | errln((UnicodeString)"indexOf with character & start & end offsets failed: expected to find 2 occurrences, found " + occurrences); | |
809 | //--- | |
810 | ||
811 | if(test1.lastIndexOf(test2)!=29) { | |
812 | errln("test1.lastIndexOf(test2)!=29"); | |
813 | } | |
814 | ||
815 | if(test1.lastIndexOf(test2, 15)!=29 || test1.lastIndexOf(test2, 29)!=29 || test1.lastIndexOf(test2, 30)!=-1) { | |
816 | errln("test1.lastIndexOf(test2, start) failed"); | |
817 | } | |
818 | ||
819 | for ( occurrences = 0, startPos = 32; | |
820 | startPos != -1; | |
821 | (startPos = test1.lastIndexOf(test2, 5, startPos - 5)) != -1 ? ++occurrences : 0) | |
822 | ; | |
823 | if (occurrences != 4) | |
824 | errln(UnicodeString("lastIndexOf with starting and ending offsets failed: " | |
825 | "expected to find 4 occurrences, found ") + occurrences); | |
826 | ||
827 | for ( occurrences = 0, startPos = 32; | |
828 | startPos != -1; | |
829 | (startPos = test1.lastIndexOf(testChar, 5, startPos - 5)) != -1 ? ++occurrences : 0) | |
830 | ; | |
831 | if (occurrences != 11) | |
832 | errln(UnicodeString("lastIndexOf with character & start & end offsets failed: " | |
833 | "expected to find 11 occurrences, found ") + occurrences); | |
834 | ||
835 | //testing UChar32 | |
836 | startPos=test3.length(); | |
837 | for ( occurrences = 0; | |
838 | startPos != -1; | |
839 | (startPos = test3.lastIndexOf(testChar32, 5, startPos - 5)) != -1 ? ++occurrences : 0) | |
840 | ; | |
841 | if (occurrences != 3) | |
842 | errln((UnicodeString)"lastIndexOf with character & start & end offsets failed: expected to find 3 occurrences, found " + occurrences); | |
843 | ||
844 | ||
845 | for ( occurrences = 0, endPos = test3.length(); endPos > 0; endPos -= 1){ | |
846 | subString.remove(); | |
847 | subString.append(test3, 0, endPos); | |
848 | if(subString.lastIndexOf(testChar32) != -1 ){ | |
849 | ++occurrences; | |
850 | } | |
851 | } | |
852 | if (occurrences != 18) | |
853 | errln((UnicodeString)"indexOf failed: expected to find 18 occurrences, found " + occurrences); | |
854 | //--- | |
855 | ||
856 | // test that indexOf(UChar32) and lastIndexOf(UChar32) | |
857 | // do not find surrogate code points when they are part of matched pairs | |
858 | // (= part of supplementary code points) | |
859 | // Jitterbug 1542 | |
860 | if(test3.indexOf((UChar32)0xd841) != 4 || test3.indexOf((UChar32)0xdc02) != 3) { | |
861 | errln("error: UnicodeString::indexOf(UChar32 surrogate) finds a partial supplementary code point"); | |
862 | } | |
863 | if( UnicodeString(test3, 0, 17).lastIndexOf((UChar)0xd841, 0) != 4 || | |
864 | UnicodeString(test3, 0, 17).lastIndexOf((UChar32)0xd841, 2) != 4 || | |
865 | test3.lastIndexOf((UChar32)0xd841, 0, 17) != 4 || test3.lastIndexOf((UChar32)0xdc02, 0, 17) != 16 | |
866 | ) { | |
867 | errln("error: UnicodeString::lastIndexOf(UChar32 surrogate) finds a partial supplementary code point"); | |
868 | } | |
869 | } | |
870 | ||
871 | void | |
872 | UnicodeStringTest::TestSpacePadding() | |
873 | { | |
874 | UnicodeString test1("hello"); | |
875 | UnicodeString test2(" there"); | |
876 | UnicodeString test3("Hi! How ya doin'? Beautiful day, isn't it?"); | |
877 | UnicodeString test4; | |
878 | UBool returnVal; | |
879 | UnicodeString expectedValue; | |
880 | ||
881 | returnVal = test1.padLeading(15); | |
882 | expectedValue = " hello"; | |
883 | if (returnVal == FALSE || test1 != expectedValue) | |
884 | errln("padLeading() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\"."); | |
885 | ||
886 | returnVal = test2.padTrailing(15); | |
887 | expectedValue = " there "; | |
888 | if (returnVal == FALSE || test2 != expectedValue) | |
889 | errln("padTrailing() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\"."); | |
890 | ||
891 | expectedValue = test3; | |
892 | returnVal = test3.padTrailing(15); | |
893 | if (returnVal == TRUE || test3 != expectedValue) | |
894 | errln("padTrailing() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\"."); | |
895 | ||
896 | expectedValue = "hello"; | |
897 | test4.setTo(test1).trim(); | |
898 | ||
899 | if (test4 != expectedValue || test1 == expectedValue || test4 != expectedValue) | |
900 | errln("trim(UnicodeString&) failed"); | |
901 | ||
902 | test1.trim(); | |
903 | if (test1 != expectedValue) | |
904 | errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\"."); | |
905 | ||
906 | test2.trim(); | |
907 | expectedValue = "there"; | |
908 | if (test2 != expectedValue) | |
909 | errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\"."); | |
910 | ||
911 | test3.trim(); | |
912 | expectedValue = "Hi! How ya doin'? Beautiful day, isn't it?"; | |
913 | if (test3 != expectedValue) | |
914 | errln("trim() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\"."); | |
915 | ||
916 | returnVal = test1.truncate(15); | |
917 | expectedValue = "hello"; | |
918 | if (returnVal == TRUE || test1 != expectedValue) | |
919 | errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test1 + "\"."); | |
920 | ||
921 | returnVal = test2.truncate(15); | |
922 | expectedValue = "there"; | |
923 | if (returnVal == TRUE || test2 != expectedValue) | |
924 | errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test2 + "\"."); | |
925 | ||
926 | returnVal = test3.truncate(15); | |
927 | expectedValue = "Hi! How ya doi"; | |
928 | if (returnVal == FALSE || test3 != expectedValue) | |
929 | errln("truncate() failed: expected \"" + expectedValue + "\", got \"" + test3 + "\"."); | |
930 | } | |
931 | ||
932 | void | |
933 | UnicodeStringTest::TestPrefixAndSuffix() | |
934 | { | |
935 | UnicodeString test1("Now is the time for all good men to come to the aid of their country."); | |
936 | UnicodeString test2("Now"); | |
937 | UnicodeString test3("country."); | |
938 | UnicodeString test4("count"); | |
939 | ||
940 | if (!test1.startsWith(test2) || !test1.startsWith(test2, 0, test2.length())) { | |
941 | errln("startsWith() failed: \"" + test2 + "\" should be a prefix of \"" + test1 + "\"."); | |
942 | } | |
943 | ||
944 | if (test1.startsWith(test3) || | |
945 | test1.startsWith(test3.getBuffer(), test3.length()) || | |
946 | test1.startsWith(test3.getTerminatedBuffer(), 0, -1) | |
947 | ) { | |
948 | errln("startsWith() failed: \"" + test3 + "\" shouldn't be a prefix of \"" + test1 + "\"."); | |
949 | } | |
950 | ||
951 | if (test1.endsWith(test2)) { | |
952 | errln("endsWith() failed: \"" + test2 + "\" shouldn't be a suffix of \"" + test1 + "\"."); | |
953 | } | |
954 | ||
955 | if (!test1.endsWith(test3)) { | |
956 | errln("endsWith(test3) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\"."); | |
957 | } | |
958 | if (!test1.endsWith(test3, 0, INT32_MAX)) { | |
959 | errln("endsWith(test3, 0, INT32_MAX) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\"."); | |
960 | } | |
961 | ||
962 | if(!test1.endsWith(test3.getBuffer(), test3.length())) { | |
963 | errln("endsWith(test3.getBuffer(), test3.length()) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\"."); | |
964 | } | |
965 | if(!test1.endsWith(test3.getTerminatedBuffer(), 0, -1)) { | |
966 | errln("endsWith(test3.getTerminatedBuffer(), 0, -1) failed: \"" + test3 + "\" should be a suffix of \"" + test1 + "\"."); | |
967 | } | |
968 | ||
969 | if (!test3.startsWith(test4)) { | |
970 | errln("endsWith(test4) failed: \"" + test4 + "\" should be a prefix of \"" + test3 + "\"."); | |
971 | } | |
972 | ||
973 | if (test4.startsWith(test3)) { | |
974 | errln("startsWith(test3) failed: \"" + test3 + "\" shouldn't be a prefix of \"" + test4 + "\"."); | |
975 | } | |
976 | } | |
977 | ||
978 | void | |
979 | UnicodeStringTest::TestStartsWithAndEndsWithNulTerminated() { | |
980 | UnicodeString test("abcde"); | |
981 | const UChar ab[] = { 0x61, 0x62, 0 }; | |
982 | const UChar de[] = { 0x64, 0x65, 0 }; | |
983 | assertTrue("abcde.startsWith(ab, -1)", test.startsWith(ab, -1)); | |
984 | assertTrue("abcde.startsWith(ab, 0, -1)", test.startsWith(ab, 0, -1)); | |
985 | assertTrue("abcde.endsWith(de, -1)", test.endsWith(de, -1)); | |
986 | assertTrue("abcde.endsWith(de, 0, -1)", test.endsWith(de, 0, -1)); | |
987 | } | |
988 | ||
989 | void | |
990 | UnicodeStringTest::TestFindAndReplace() | |
991 | { | |
992 | UnicodeString test1("One potato, two potato, three potato, four\n"); | |
993 | UnicodeString test2("potato"); | |
994 | UnicodeString test3("MISSISSIPPI"); | |
995 | ||
996 | UnicodeString expectedValue; | |
997 | ||
998 | test1.findAndReplace(test2, test3); | |
999 | expectedValue = "One MISSISSIPPI, two MISSISSIPPI, three MISSISSIPPI, four\n"; | |
1000 | if (test1 != expectedValue) | |
1001 | errln("findAndReplace failed: expected \"" + expectedValue + "\", got \"" + test1 + "\"."); | |
1002 | test1.findAndReplace(2, 32, test3, test2); | |
1003 | expectedValue = "One potato, two potato, three MISSISSIPPI, four\n"; | |
1004 | if (test1 != expectedValue) | |
1005 | errln("findAndReplace failed: expected \"" + expectedValue + "\", got \"" + test1 + "\"."); | |
1006 | } | |
1007 | ||
1008 | void | |
1009 | UnicodeStringTest::TestReverse() | |
1010 | { | |
1011 | UnicodeString test("backwards words say to used I"); | |
1012 | ||
1013 | test.reverse(); | |
1014 | test.reverse(2, 4); | |
1015 | test.reverse(7, 2); | |
1016 | test.reverse(10, 3); | |
1017 | test.reverse(14, 5); | |
1018 | test.reverse(20, 9); | |
1019 | ||
1020 | if (test != "I used to say words backwards") | |
1021 | errln("reverse() failed: Expected \"I used to say words backwards\",\n got \"" | |
1022 | + test + "\""); | |
1023 | ||
1024 | test=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape(); | |
1025 | test.reverse(); | |
1026 | if(test.char32At(0)!=0x1ed0 || test.char32At(1)!=0xc4 || test.char32At(2)!=0x1d15f || test.char32At(4)!=0x2f999) { | |
1027 | errln("reverse() failed with supplementary characters"); | |
1028 | } | |
1029 | ||
1030 | // Test case for ticket #8091: | |
1031 | // UnicodeString::reverse() failed to see a lead surrogate in the middle of | |
1032 | // an odd-length string that contains no other lead surrogates. | |
1033 | test=UNICODE_STRING_SIMPLE("ab\\U0001F4A9e").unescape(); | |
1034 | UnicodeString expected=UNICODE_STRING_SIMPLE("e\\U0001F4A9ba").unescape(); | |
1035 | test.reverse(); | |
1036 | if(test!=expected) { | |
1037 | errln("reverse() failed with only lead surrogate in the middle"); | |
1038 | } | |
1039 | } | |
1040 | ||
1041 | void | |
1042 | UnicodeStringTest::TestMiscellaneous() | |
1043 | { | |
1044 | UnicodeString test1("This is a test"); | |
1045 | UnicodeString test2("This is a test"); | |
1046 | UnicodeString test3("Me too!"); | |
1047 | ||
1048 | // test getBuffer(minCapacity) and releaseBuffer() | |
1049 | test1=UnicodeString(); // make sure that it starts with its stackBuffer | |
1050 | UChar *p=test1.getBuffer(20); | |
1051 | if(test1.getCapacity()<20) { | |
1052 | errln("UnicodeString::getBuffer(20).getCapacity()<20"); | |
1053 | } | |
1054 | ||
1055 | test1.append((UChar)7); // must not be able to modify the string here | |
1056 | test1.setCharAt(3, 7); | |
1057 | test1.reverse(); | |
1058 | if( test1.length()!=0 || | |
1059 | test1.charAt(0)!=0xffff || test1.charAt(3)!=0xffff || | |
1060 | test1.getBuffer(10)!=0 || test1.getBuffer()!=0 | |
1061 | ) { | |
1062 | errln("UnicodeString::getBuffer(minCapacity) allows read or write access to the UnicodeString"); | |
1063 | } | |
1064 | ||
1065 | p[0]=1; | |
1066 | p[1]=2; | |
1067 | p[2]=3; | |
1068 | test1.releaseBuffer(3); | |
1069 | test1.append((UChar)4); | |
1070 | ||
1071 | if(test1.length()!=4 || test1.charAt(0)!=1 || test1.charAt(1)!=2 || test1.charAt(2)!=3 || test1.charAt(3)!=4) { | |
1072 | errln("UnicodeString::releaseBuffer(newLength) does not properly reallow access to the UnicodeString"); | |
1073 | } | |
1074 | ||
1075 | // test releaseBuffer() without getBuffer(minCapacity) - must not have any effect | |
1076 | test1.releaseBuffer(1); | |
1077 | if(test1.length()!=4 || test1.charAt(0)!=1 || test1.charAt(1)!=2 || test1.charAt(2)!=3 || test1.charAt(3)!=4) { | |
1078 | errln("UnicodeString::releaseBuffer(newLength) without getBuffer(minCapacity) changed the UnicodeString"); | |
1079 | } | |
1080 | ||
1081 | // test getBuffer(const) | |
1082 | const UChar *q=test1.getBuffer(), *r=test1.getBuffer(); | |
1083 | if( test1.length()!=4 || | |
1084 | q[0]!=1 || q[1]!=2 || q[2]!=3 || q[3]!=4 || | |
1085 | r[0]!=1 || r[1]!=2 || r[2]!=3 || r[3]!=4 | |
1086 | ) { | |
1087 | errln("UnicodeString::getBuffer(const) does not return a usable buffer pointer"); | |
1088 | } | |
1089 | ||
1090 | // test releaseBuffer() with a NUL-terminated buffer | |
1091 | test1.getBuffer(20)[2]=0; | |
1092 | test1.releaseBuffer(); // implicit -1 | |
1093 | if(test1.length()!=2 || test1.charAt(0)!=1 || test1.charAt(1) !=2) { | |
1094 | errln("UnicodeString::releaseBuffer(-1) does not properly set the length of the UnicodeString"); | |
1095 | } | |
1096 | ||
1097 | // test releaseBuffer() with a non-NUL-terminated buffer | |
1098 | p=test1.getBuffer(256); | |
1099 | for(int32_t i=0; i<test1.getCapacity(); ++i) { | |
1100 | p[i]=(UChar)1; // fill the buffer with all non-NUL code units | |
1101 | } | |
1102 | test1.releaseBuffer(); // implicit -1 | |
1103 | if(test1.length()!=test1.getCapacity() || test1.charAt(1)!=1 || test1.charAt(100)!=1 || test1.charAt(test1.getCapacity()-1)!=1) { | |
1104 | errln("UnicodeString::releaseBuffer(-1 but no NUL) does not properly set the length of the UnicodeString"); | |
1105 | } | |
1106 | ||
1107 | // test getTerminatedBuffer() | |
1108 | test1=UnicodeString("This is another test.", ""); | |
1109 | test2=UnicodeString("This is another test.", ""); | |
1110 | q=test1.getTerminatedBuffer(); | |
1111 | if(q[test1.length()]!=0 || test1!=test2 || test2.compare(q, -1)!=0) { | |
1112 | errln("getTerminatedBuffer()[length]!=0"); | |
1113 | } | |
1114 | ||
1115 | const UChar u[]={ 5, 6, 7, 8, 0 }; | |
1116 | test1.setTo(FALSE, u, 3); | |
1117 | q=test1.getTerminatedBuffer(); | |
1118 | if(q==u || q[0]!=5 || q[1]!=6 || q[2]!=7 || q[3]!=0) { | |
1119 | errln("UnicodeString(u[3]).getTerminatedBuffer() returns a bad buffer"); | |
1120 | } | |
1121 | ||
1122 | test1.setTo(TRUE, u, -1); | |
1123 | q=test1.getTerminatedBuffer(); | |
1124 | if(q!=u || test1.length()!=4 || q[3]!=8 || q[4]!=0) { | |
1125 | errln("UnicodeString(u[-1]).getTerminatedBuffer() returns a bad buffer"); | |
1126 | } | |
1127 | ||
1128 | test1=UNICODE_STRING("la", 2); | |
1129 | test1.append(UNICODE_STRING(" lila", 5).getTerminatedBuffer(), 0, -1); | |
1130 | if(test1!=UNICODE_STRING("la lila", 7)) { | |
1131 | errln("UnicodeString::append(const UChar *, start, length) failed"); | |
1132 | } | |
1133 | ||
1134 | test1.insert(3, UNICODE_STRING("dudum ", 6), 0, INT32_MAX); | |
1135 | if(test1!=UNICODE_STRING("la dudum lila", 13)) { | |
1136 | errln("UnicodeString::insert(start, const UniStr &, start, length) failed"); | |
1137 | } | |
1138 | ||
1139 | static const UChar ucs[]={ 0x68, 0x6d, 0x20, 0 }; | |
1140 | test1.insert(9, ucs, -1); | |
1141 | if(test1!=UNICODE_STRING("la dudum hm lila", 16)) { | |
1142 | errln("UnicodeString::insert(start, const UChar *, length) failed"); | |
1143 | } | |
1144 | ||
1145 | test1.replace(9, 2, (UChar)0x2b); | |
1146 | if(test1!=UNICODE_STRING("la dudum + lila", 15)) { | |
1147 | errln("UnicodeString::replace(start, length, UChar) failed"); | |
1148 | } | |
1149 | ||
1150 | if(test1.hasMetaData() || UnicodeString().hasMetaData()) { | |
1151 | errln("UnicodeString::hasMetaData() returns TRUE"); | |
1152 | } | |
1153 | ||
1154 | // test getTerminatedBuffer() on a truncated, shared, heap-allocated string | |
1155 | test1=UNICODE_STRING_SIMPLE("abcdefghijklmnopqrstuvwxyz0123456789."); | |
1156 | test1.truncate(36); // ensure length()<getCapacity() | |
1157 | test2=test1; // share the buffer | |
1158 | test1.truncate(5); | |
1159 | if(test1.length()!=5 || test1.getTerminatedBuffer()[5]!=0) { | |
1160 | errln("UnicodeString(shared buffer).truncate() failed"); | |
1161 | } | |
1162 | if(test2.length()!=36 || test2[5]!=0x66 || u_strlen(test2.getTerminatedBuffer())!=36) { | |
1163 | errln("UnicodeString(shared buffer).truncate().getTerminatedBuffer() " | |
1164 | "modified another copy of the string!"); | |
1165 | } | |
1166 | test1=UNICODE_STRING_SIMPLE("abcdefghijklmnopqrstuvwxyz0123456789."); | |
1167 | test1.truncate(36); // ensure length()<getCapacity() | |
1168 | test2=test1; // share the buffer | |
1169 | test1.remove(); | |
1170 | if(test1.length()!=0 || test1.getTerminatedBuffer()[0]!=0) { | |
1171 | errln("UnicodeString(shared buffer).remove() failed"); | |
1172 | } | |
1173 | if(test2.length()!=36 || test2[0]!=0x61 || u_strlen(test2.getTerminatedBuffer())!=36) { | |
1174 | errln("UnicodeString(shared buffer).remove().getTerminatedBuffer() " | |
1175 | "modified another copy of the string!"); | |
1176 | } | |
1177 | } | |
1178 | ||
1179 | void | |
1180 | UnicodeStringTest::TestStackAllocation() | |
1181 | { | |
1182 | UChar testString[] ={ | |
1183 | 0x54, 0x68, 0x69, 0x73, 0x20, 0x69, 0x73, 0x20, 0x61, 0x20, 0x63, 0x72, 0x61, 0x7a, 0x79, 0x20, 0x74, 0x65, 0x73, 0x74, 0x2e, 0 }; | |
1184 | UChar guardWord = 0x4DED; | |
1185 | UnicodeString* test = 0; | |
1186 | ||
1187 | test = new UnicodeString(testString); | |
1188 | if (*test != "This is a crazy test.") | |
1189 | errln("Test string failed to initialize properly."); | |
1190 | if (guardWord != 0x04DED) | |
1191 | errln("Test string initialization overwrote guard word!"); | |
1192 | ||
1193 | test->insert(8, "only "); | |
1194 | test->remove(15, 6); | |
1195 | if (*test != "This is only a test.") | |
1196 | errln("Manipulation of test string failed to work right."); | |
1197 | if (guardWord != 0x4DED) | |
1198 | errln("Manipulation of test string overwrote guard word!"); | |
1199 | ||
1200 | // we have to deinitialize and release the backing store by calling the destructor | |
1201 | // explicitly, since we can't overload operator delete | |
1202 | delete test; | |
1203 | ||
1204 | UChar workingBuffer[] = { | |
1205 | 0x4e, 0x6f, 0x77, 0x20, 0x69, 0x73, 0x20, 0x74, 0x68, 0x65, 0x20, 0x74, 0x69, 0x6d, 0x65, 0x20, | |
1206 | 0x66, 0x6f, 0x72, 0x20, 0x61, 0x6c, 0x6c, 0x20, 0x6d, 0x65, 0x6e, 0x20, 0x74, 0x6f, 0x20, | |
1207 | 0x63, 0x6f, 0x6d, 0x65, 0xffff, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | |
1208 | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | |
1209 | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }; | |
1210 | UChar guardWord2 = 0x4DED; | |
1211 | ||
1212 | test = new UnicodeString(workingBuffer, 35, 100); | |
1213 | if (*test != "Now is the time for all men to come") | |
1214 | errln("Stack-allocated backing store failed to initialize correctly."); | |
1215 | if (guardWord2 != 0x4DED) | |
1216 | errln("Stack-allocated backing store overwrote guard word!"); | |
1217 | ||
1218 | test->insert(24, "good "); | |
1219 | if (*test != "Now is the time for all good men to come") | |
1220 | errln("insert() on stack-allocated UnicodeString didn't work right"); | |
1221 | if (guardWord2 != 0x4DED) | |
1222 | errln("insert() on stack-allocated UnicodeString overwrote guard word!"); | |
1223 | ||
1224 | if (workingBuffer[24] != 0x67) | |
1225 | errln("insert() on stack-allocated UnicodeString didn't affect backing store"); | |
1226 | ||
1227 | *test += " to the aid of their country."; | |
1228 | if (*test != "Now is the time for all good men to come to the aid of their country.") | |
1229 | errln("Stack-allocated UnicodeString overflow didn't work"); | |
1230 | if (guardWord2 != 0x4DED) | |
1231 | errln("Stack-allocated UnicodeString overflow overwrote guard word!"); | |
1232 | ||
1233 | *test = "ha!"; | |
1234 | if (*test != "ha!") | |
1235 | errln("Assignment to stack-allocated UnicodeString didn't work"); | |
1236 | if (workingBuffer[0] != 0x4e) | |
1237 | errln("Change to UnicodeString after overflow are still affecting original buffer"); | |
1238 | if (guardWord2 != 0x4DED) | |
1239 | errln("Change to UnicodeString after overflow overwrote guard word!"); | |
1240 | ||
1241 | // test read-only aliasing with setTo() | |
1242 | workingBuffer[0] = 0x20ac; | |
1243 | workingBuffer[1] = 0x125; | |
1244 | workingBuffer[2] = 0; | |
1245 | test->setTo(TRUE, workingBuffer, 2); | |
1246 | if(test->length() != 2 || test->charAt(0) != 0x20ac || test->charAt(1) != 0x125) { | |
1247 | errln("UnicodeString.setTo(readonly alias) does not alias correctly"); | |
1248 | } | |
1249 | ||
1250 | UnicodeString *c=(UnicodeString *)test->clone(); | |
1251 | ||
1252 | workingBuffer[1] = 0x109; | |
1253 | if(test->charAt(1) != 0x109) { | |
1254 | errln("UnicodeString.setTo(readonly alias) made a copy: did not see change in buffer"); | |
1255 | } | |
1256 | ||
1257 | if(c->length() != 2 || c->charAt(1) != 0x125) { | |
1258 | errln("clone(alias) did not copy the buffer"); | |
1259 | } | |
1260 | delete c; | |
1261 | ||
1262 | test->setTo(TRUE, workingBuffer, -1); | |
1263 | if(test->length() != 2 || test->charAt(0) != 0x20ac || test->charAt(1) != 0x109) { | |
1264 | errln("UnicodeString.setTo(readonly alias, length -1) does not alias correctly"); | |
1265 | } | |
1266 | ||
1267 | test->setTo(FALSE, workingBuffer, -1); | |
1268 | if(!test->isBogus()) { | |
1269 | errln("UnicodeString.setTo(unterminated readonly alias, length -1) does not result in isBogus()"); | |
1270 | } | |
1271 | ||
1272 | delete test; | |
1273 | ||
1274 | test=new UnicodeString(); | |
1275 | UChar buffer[]={0x0061, 0x0062, 0x20ac, 0x0043, 0x0042, 0x0000}; | |
1276 | test->setTo(buffer, 4, 10); | |
1277 | if(test->length() !=4 || test->charAt(0) != 0x0061 || test->charAt(1) != 0x0062 || | |
1278 | test->charAt(2) != 0x20ac || test->charAt(3) != 0x0043){ | |
1279 | errln((UnicodeString)"UnicodeString.setTo(UChar*, length, capacity) does not work correctly\n" + prettify(*test)); | |
1280 | } | |
1281 | delete test; | |
1282 | ||
1283 | ||
1284 | // test the UChar32 constructor | |
1285 | UnicodeString c32Test((UChar32)0x10ff2a); | |
1286 | if( c32Test.length() != U16_LENGTH(0x10ff2a) || | |
1287 | c32Test.char32At(c32Test.length() - 1) != 0x10ff2a | |
1288 | ) { | |
1289 | errln("The UnicodeString(UChar32) constructor does not work with a 0x10ff2a filler"); | |
1290 | } | |
1291 | ||
1292 | // test the (new) capacity constructor | |
1293 | UnicodeString capTest(5, (UChar32)0x2a, 5); | |
1294 | if( capTest.length() != 5 * U16_LENGTH(0x2a) || | |
1295 | capTest.char32At(0) != 0x2a || | |
1296 | capTest.char32At(4) != 0x2a | |
1297 | ) { | |
1298 | errln("The UnicodeString capacity constructor does not work with an ASCII filler"); | |
1299 | } | |
1300 | ||
1301 | capTest = UnicodeString(5, (UChar32)0x10ff2a, 5); | |
1302 | if( capTest.length() != 5 * U16_LENGTH(0x10ff2a) || | |
1303 | capTest.char32At(0) != 0x10ff2a || | |
1304 | capTest.char32At(4) != 0x10ff2a | |
1305 | ) { | |
1306 | errln("The UnicodeString capacity constructor does not work with a 0x10ff2a filler"); | |
1307 | } | |
1308 | ||
1309 | capTest = UnicodeString(5, (UChar32)0, 0); | |
1310 | if(capTest.length() != 0) { | |
1311 | errln("The UnicodeString capacity constructor does not work with a 0x10ff2a filler"); | |
1312 | } | |
1313 | } | |
1314 | ||
1315 | /** | |
1316 | * Test the unescape() function. | |
1317 | */ | |
1318 | void UnicodeStringTest::TestUnescape(void) { | |
1319 | UnicodeString IN("abc\\u4567 \\n\\r \\U00101234xyz\\x1\\x{5289}\\x1b", -1, US_INV); | |
1320 | UnicodeString OUT("abc"); | |
1321 | OUT.append((UChar)0x4567); | |
1322 | OUT.append(" "); | |
1323 | OUT.append((UChar)0xA); | |
1324 | OUT.append((UChar)0xD); | |
1325 | OUT.append(" "); | |
1326 | OUT.append((UChar32)0x00101234); | |
1327 | OUT.append("xyz"); | |
1328 | OUT.append((UChar32)1).append((UChar32)0x5289).append((UChar)0x1b); | |
1329 | UnicodeString result = IN.unescape(); | |
1330 | if (result != OUT) { | |
1331 | errln("FAIL: " + prettify(IN) + ".unescape() -> " + | |
1332 | prettify(result) + ", expected " + | |
1333 | prettify(OUT)); | |
1334 | } | |
1335 | ||
1336 | // test that an empty string is returned in case of an error | |
1337 | if (!UNICODE_STRING("wrong \\u sequence", 17).unescape().isEmpty()) { | |
1338 | errln("FAIL: unescaping of a string with an illegal escape sequence did not return an empty string"); | |
1339 | } | |
1340 | } | |
1341 | ||
1342 | /* test code point counting functions --------------------------------------- */ | |
1343 | ||
1344 | /* reference implementation of UnicodeString::hasMoreChar32Than() */ | |
1345 | static int32_t | |
1346 | _refUnicodeStringHasMoreChar32Than(const UnicodeString &s, int32_t start, int32_t length, int32_t number) { | |
1347 | int32_t count=s.countChar32(start, length); | |
1348 | return count>number; | |
1349 | } | |
1350 | ||
1351 | /* compare the real function against the reference */ | |
1352 | void | |
1353 | UnicodeStringTest::_testUnicodeStringHasMoreChar32Than(const UnicodeString &s, int32_t start, int32_t length, int32_t number) { | |
1354 | if(s.hasMoreChar32Than(start, length, number)!=_refUnicodeStringHasMoreChar32Than(s, start, length, number)) { | |
1355 | errln("hasMoreChar32Than(%d, %d, %d)=%hd is wrong\n", | |
1356 | start, length, number, s.hasMoreChar32Than(start, length, number)); | |
1357 | } | |
1358 | } | |
1359 | ||
1360 | void | |
1361 | UnicodeStringTest::TestCountChar32(void) { | |
1362 | { | |
1363 | UnicodeString s=UNICODE_STRING("\\U0002f999\\U0001d15f\\u00c4\\u1ed0", 32).unescape(); | |
1364 | ||
1365 | // test countChar32() | |
1366 | // note that this also calls and tests u_countChar32(length>=0) | |
1367 | if( | |
1368 | s.countChar32()!=4 || | |
1369 | s.countChar32(1)!=4 || | |
1370 | s.countChar32(2)!=3 || | |
1371 | s.countChar32(2, 3)!=2 || | |
1372 | s.countChar32(2, 0)!=0 | |
1373 | ) { | |
1374 | errln("UnicodeString::countChar32() failed"); | |
1375 | } | |
1376 | ||
1377 | // NUL-terminate the string buffer and test u_countChar32(length=-1) | |
1378 | const UChar *buffer=s.getTerminatedBuffer(); | |
1379 | if( | |
1380 | u_countChar32(buffer, -1)!=4 || | |
1381 | u_countChar32(buffer+1, -1)!=4 || | |
1382 | u_countChar32(buffer+2, -1)!=3 || | |
1383 | u_countChar32(buffer+3, -1)!=3 || | |
1384 | u_countChar32(buffer+4, -1)!=2 || | |
1385 | u_countChar32(buffer+5, -1)!=1 || | |
1386 | u_countChar32(buffer+6, -1)!=0 | |
1387 | ) { | |
1388 | errln("u_countChar32(length=-1) failed"); | |
1389 | } | |
1390 | ||
1391 | // test u_countChar32() with bad input | |
1392 | if(u_countChar32(NULL, 5)!=0 || u_countChar32(buffer, -2)!=0) { | |
1393 | errln("u_countChar32(bad input) failed (returned non-zero counts)"); | |
1394 | } | |
1395 | } | |
1396 | ||
1397 | /* test data and variables for hasMoreChar32Than() */ | |
1398 | static const UChar str[]={ | |
1399 | 0x61, 0x62, 0xd800, 0xdc00, | |
1400 | 0xd801, 0xdc01, 0x63, 0xd802, | |
1401 | 0x64, 0xdc03, 0x65, 0x66, | |
1402 | 0xd804, 0xdc04, 0xd805, 0xdc05, | |
1403 | 0x67 | |
1404 | }; | |
1405 | UnicodeString string(str, LENGTHOF(str)); | |
1406 | int32_t start, length, number; | |
1407 | ||
1408 | /* test hasMoreChar32Than() */ | |
1409 | for(length=string.length(); length>=0; --length) { | |
1410 | for(start=0; start<=length; ++start) { | |
1411 | for(number=-1; number<=((length-start)+2); ++number) { | |
1412 | _testUnicodeStringHasMoreChar32Than(string, start, length-start, number); | |
1413 | } | |
1414 | } | |
1415 | } | |
1416 | ||
1417 | /* test hasMoreChar32Than() with pinning */ | |
1418 | for(start=-1; start<=string.length()+1; ++start) { | |
1419 | for(number=-1; number<=((string.length()-start)+2); ++number) { | |
1420 | _testUnicodeStringHasMoreChar32Than(string, start, 0x7fffffff, number); | |
1421 | } | |
1422 | } | |
1423 | ||
1424 | /* test hasMoreChar32Than() with a bogus string */ | |
1425 | string.setToBogus(); | |
1426 | for(length=-1; length<=1; ++length) { | |
1427 | for(start=-1; start<=length; ++start) { | |
1428 | for(number=-1; number<=((length-start)+2); ++number) { | |
1429 | _testUnicodeStringHasMoreChar32Than(string, start, length-start, number); | |
1430 | } | |
1431 | } | |
1432 | } | |
1433 | } | |
1434 | ||
1435 | void | |
1436 | UnicodeStringTest::TestBogus() { | |
1437 | UnicodeString test1("This is a test"); | |
1438 | UnicodeString test2("This is a test"); | |
1439 | UnicodeString test3("Me too!"); | |
1440 | ||
1441 | // test isBogus() and setToBogus() | |
1442 | if (test1.isBogus() || test2.isBogus() || test3.isBogus()) { | |
1443 | errln("A string returned TRUE for isBogus()!"); | |
1444 | } | |
1445 | ||
1446 | // NULL pointers are treated like empty strings | |
1447 | // use other illegal arguments to make a bogus string | |
1448 | test3.setTo(FALSE, test1.getBuffer(), -2); | |
1449 | if(!test3.isBogus()) { | |
1450 | errln("A bogus string returned FALSE for isBogus()!"); | |
1451 | } | |
1452 | if (test1.hashCode() != test2.hashCode() || test1.hashCode() == test3.hashCode()) { | |
1453 | errln("hashCode() failed"); | |
1454 | } | |
1455 | if(test3.getBuffer()!=0 || test3.getBuffer(20)!=0 || test3.getTerminatedBuffer()!=0) { | |
1456 | errln("bogus.getBuffer()!=0"); | |
1457 | } | |
1458 | if (test1.indexOf(test3) != -1) { | |
1459 | errln("bogus.indexOf() != -1"); | |
1460 | } | |
1461 | if (test1.lastIndexOf(test3) != -1) { | |
1462 | errln("bogus.lastIndexOf() != -1"); | |
1463 | } | |
1464 | if (test1.caseCompare(test3, U_FOLD_CASE_DEFAULT) != 1 || test3.caseCompare(test1, U_FOLD_CASE_DEFAULT) != -1) { | |
1465 | errln("caseCompare() doesn't work with bogus strings"); | |
1466 | } | |
1467 | if (test1.compareCodePointOrder(test3) != 1 || test3.compareCodePointOrder(test1) != -1) { | |
1468 | errln("compareCodePointOrder() doesn't work with bogus strings"); | |
1469 | } | |
1470 | ||
1471 | // verify that non-assignment modifications fail and do not revive a bogus string | |
1472 | test3.setToBogus(); | |
1473 | test3.append((UChar)0x61); | |
1474 | if(!test3.isBogus() || test3.getBuffer()!=0) { | |
1475 | errln("bogus.append('a') worked but must not"); | |
1476 | } | |
1477 | ||
1478 | test3.setToBogus(); | |
1479 | test3.findAndReplace(UnicodeString((UChar)0x61), test2); | |
1480 | if(!test3.isBogus() || test3.getBuffer()!=0) { | |
1481 | errln("bogus.findAndReplace() worked but must not"); | |
1482 | } | |
1483 | ||
1484 | test3.setToBogus(); | |
1485 | test3.trim(); | |
1486 | if(!test3.isBogus() || test3.getBuffer()!=0) { | |
1487 | errln("bogus.trim() revived bogus but must not"); | |
1488 | } | |
1489 | ||
1490 | test3.setToBogus(); | |
1491 | test3.remove(1); | |
1492 | if(!test3.isBogus() || test3.getBuffer()!=0) { | |
1493 | errln("bogus.remove(1) revived bogus but must not"); | |
1494 | } | |
1495 | ||
1496 | test3.setToBogus(); | |
1497 | if(!test3.setCharAt(0, 0x62).isBogus() || !test3.isEmpty()) { | |
1498 | errln("bogus.setCharAt(0, 'b') worked but must not"); | |
1499 | } | |
1500 | ||
1501 | test3.setToBogus(); | |
1502 | if(test3.truncate(1) || !test3.isBogus() || !test3.isEmpty()) { | |
1503 | errln("bogus.truncate(1) revived bogus but must not"); | |
1504 | } | |
1505 | ||
1506 | // verify that assignments revive a bogus string | |
1507 | test3.setToBogus(); | |
1508 | if(!test3.isBogus() || (test3=test1).isBogus() || test3!=test1) { | |
1509 | errln("bogus.operator=() failed"); | |
1510 | } | |
1511 | ||
1512 | test3.setToBogus(); | |
1513 | if(!test3.isBogus() || test3.fastCopyFrom(test1).isBogus() || test3!=test1) { | |
1514 | errln("bogus.fastCopyFrom() failed"); | |
1515 | } | |
1516 | ||
1517 | test3.setToBogus(); | |
1518 | if(!test3.isBogus() || test3.setTo(test1).isBogus() || test3!=test1) { | |
1519 | errln("bogus.setTo(UniStr) failed"); | |
1520 | } | |
1521 | ||
1522 | test3.setToBogus(); | |
1523 | if(!test3.isBogus() || test3.setTo(test1, 0).isBogus() || test3!=test1) { | |
1524 | errln("bogus.setTo(UniStr, 0) failed"); | |
1525 | } | |
1526 | ||
1527 | test3.setToBogus(); | |
1528 | if(!test3.isBogus() || test3.setTo(test1, 0, 0x7fffffff).isBogus() || test3!=test1) { | |
1529 | errln("bogus.setTo(UniStr, 0, len) failed"); | |
1530 | } | |
1531 | ||
1532 | test3.setToBogus(); | |
1533 | if(!test3.isBogus() || test3.setTo(test1.getBuffer(), test1.length()).isBogus() || test3!=test1) { | |
1534 | errln("bogus.setTo(const UChar *, len) failed"); | |
1535 | } | |
1536 | ||
1537 | test3.setToBogus(); | |
1538 | if(!test3.isBogus() || test3.setTo((UChar)0x2028).isBogus() || test3!=UnicodeString((UChar)0x2028)) { | |
1539 | errln("bogus.setTo(UChar) failed"); | |
1540 | } | |
1541 | ||
1542 | test3.setToBogus(); | |
1543 | if(!test3.isBogus() || test3.setTo((UChar32)0x1d157).isBogus() || test3!=UnicodeString((UChar32)0x1d157)) { | |
1544 | errln("bogus.setTo(UChar32) failed"); | |
1545 | } | |
1546 | ||
1547 | test3.setToBogus(); | |
1548 | if(!test3.isBogus() || test3.setTo(FALSE, test1.getBuffer(), test1.length()).isBogus() || test3!=test1) { | |
1549 | errln("bogus.setTo(readonly alias) failed"); | |
1550 | } | |
1551 | ||
1552 | // writable alias to another string's buffer: very bad idea, just convenient for this test | |
1553 | test3.setToBogus(); | |
1554 | if(!test3.isBogus() || test3.setTo((UChar *)test1.getBuffer(), test1.length(), test1.getCapacity()).isBogus() || test3!=test1) { | |
1555 | errln("bogus.setTo(writable alias) failed"); | |
1556 | } | |
1557 | ||
1558 | // verify simple, documented ways to turn a bogus string into an empty one | |
1559 | test3.setToBogus(); | |
1560 | if(!test3.isBogus() || (test3=UnicodeString()).isBogus() || !test3.isEmpty()) { | |
1561 | errln("bogus.operator=(UnicodeString()) failed"); | |
1562 | } | |
1563 | ||
1564 | test3.setToBogus(); | |
1565 | if(!test3.isBogus() || test3.setTo(UnicodeString()).isBogus() || !test3.isEmpty()) { | |
1566 | errln("bogus.setTo(UnicodeString()) failed"); | |
1567 | } | |
1568 | ||
1569 | test3.setToBogus(); | |
1570 | if(test3.remove().isBogus() || test3.getBuffer()==0 || !test3.isEmpty()) { | |
1571 | errln("bogus.remove() failed"); | |
1572 | } | |
1573 | ||
1574 | test3.setToBogus(); | |
1575 | if(test3.remove(0, INT32_MAX).isBogus() || test3.getBuffer()==0 || !test3.isEmpty()) { | |
1576 | errln("bogus.remove(0, INT32_MAX) failed"); | |
1577 | } | |
1578 | ||
1579 | test3.setToBogus(); | |
1580 | if(test3.truncate(0) || test3.isBogus() || !test3.isEmpty()) { | |
1581 | errln("bogus.truncate(0) failed"); | |
1582 | } | |
1583 | ||
1584 | test3.setToBogus(); | |
1585 | if(!test3.isBogus() || test3.setTo((UChar32)-1).isBogus() || !test3.isEmpty()) { | |
1586 | errln("bogus.setTo((UChar32)-1) failed"); | |
1587 | } | |
1588 | ||
1589 | static const UChar nul=0; | |
1590 | ||
1591 | test3.setToBogus(); | |
1592 | if(!test3.isBogus() || test3.setTo(&nul, 0).isBogus() || !test3.isEmpty()) { | |
1593 | errln("bogus.setTo(&nul, 0) failed"); | |
1594 | } | |
1595 | ||
1596 | test3.setToBogus(); | |
1597 | if(!test3.isBogus() || test3.getBuffer()!=0) { | |
1598 | errln("setToBogus() failed to make a string bogus"); | |
1599 | } | |
1600 | ||
1601 | test3.setToBogus(); | |
1602 | if(test1.isBogus() || !(test1=test3).isBogus()) { | |
1603 | errln("normal=bogus failed to make the left string bogus"); | |
1604 | } | |
1605 | ||
1606 | // test that NULL primitive input string values are treated like | |
1607 | // empty strings, not errors (bogus) | |
1608 | test2.setTo((UChar32)0x10005); | |
1609 | if(test2.insert(1, NULL, 1).length()!=2) { | |
1610 | errln("UniStr.insert(...NULL...) should not modify the string but does"); | |
1611 | } | |
1612 | ||
1613 | UErrorCode errorCode=U_ZERO_ERROR; | |
1614 | UnicodeString | |
1615 | test4((const UChar *)NULL), | |
1616 | test5(TRUE, (const UChar *)NULL, 1), | |
1617 | test6((UChar *)NULL, 5, 5), | |
1618 | test7((const char *)NULL, 3, NULL, errorCode); | |
1619 | if(test4.isBogus() || test5.isBogus() || test6.isBogus() || test7.isBogus()) { | |
1620 | errln("a constructor set to bogus for a NULL input string, should be empty"); | |
1621 | } | |
1622 | ||
1623 | test4.setTo(NULL, 3); | |
1624 | test5.setTo(TRUE, (const UChar *)NULL, 1); | |
1625 | test6.setTo((UChar *)NULL, 5, 5); | |
1626 | if(test4.isBogus() || test5.isBogus() || test6.isBogus()) { | |
1627 | errln("a setTo() set to bogus for a NULL input string, should be empty"); | |
1628 | } | |
1629 | ||
1630 | // test that bogus==bogus<any | |
1631 | if(test1!=test3 || test1.compare(test3)!=0) { | |
1632 | errln("bogus==bogus failed"); | |
1633 | } | |
1634 | ||
1635 | test2.remove(); | |
1636 | if(test1>=test2 || !(test2>test1) || test1.compare(test2)>=0 || !(test2.compare(test1)>0)) { | |
1637 | errln("bogus<empty failed"); | |
1638 | } | |
1639 | } | |
1640 | ||
1641 | // StringEnumeration ------------------------------------------------------- *** | |
1642 | // most of StringEnumeration is tested elsewhere | |
1643 | // this test improves code coverage | |
1644 | ||
1645 | static const char *const | |
1646 | testEnumStrings[]={ | |
1647 | "a", | |
1648 | "b", | |
1649 | "c", | |
1650 | "this is a long string which helps us test some buffer limits", | |
1651 | "eeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeee" | |
1652 | }; | |
1653 | ||
1654 | class TestEnumeration : public StringEnumeration { | |
1655 | public: | |
1656 | TestEnumeration() : i(0) {} | |
1657 | ||
1658 | virtual int32_t count(UErrorCode& /*status*/) const { | |
1659 | return LENGTHOF(testEnumStrings); | |
1660 | } | |
1661 | ||
1662 | virtual const UnicodeString *snext(UErrorCode &status) { | |
1663 | if(U_SUCCESS(status) && i<LENGTHOF(testEnumStrings)) { | |
1664 | unistr=UnicodeString(testEnumStrings[i++], ""); | |
1665 | return &unistr; | |
1666 | } | |
1667 | ||
1668 | return NULL; | |
1669 | } | |
1670 | ||
1671 | virtual void reset(UErrorCode& /*status*/) { | |
1672 | i=0; | |
1673 | } | |
1674 | ||
1675 | static inline UClassID getStaticClassID() { | |
1676 | return (UClassID)&fgClassID; | |
1677 | } | |
1678 | virtual UClassID getDynamicClassID() const { | |
1679 | return getStaticClassID(); | |
1680 | } | |
1681 | ||
1682 | private: | |
1683 | static const char fgClassID; | |
1684 | ||
1685 | int32_t i, length; | |
1686 | }; | |
1687 | ||
1688 | const char TestEnumeration::fgClassID=0; | |
1689 | ||
1690 | void | |
1691 | UnicodeStringTest::TestStringEnumeration() { | |
1692 | UnicodeString s; | |
1693 | TestEnumeration ten; | |
1694 | int32_t i, length; | |
1695 | UErrorCode status; | |
1696 | ||
1697 | const UChar *pu; | |
1698 | const char *pc; | |
1699 | ||
1700 | // test the next() default implementation and ensureCharsCapacity() | |
1701 | for(i=0; i<LENGTHOF(testEnumStrings); ++i) { | |
1702 | status=U_ZERO_ERROR; | |
1703 | pc=ten.next(&length, status); | |
1704 | s=UnicodeString(testEnumStrings[i], ""); | |
1705 | if(U_FAILURE(status) || pc==NULL || length!=s.length() || UnicodeString(pc, length, "")!=s) { | |
1706 | errln("StringEnumeration.next(%d) failed", i); | |
1707 | } | |
1708 | } | |
1709 | status=U_ZERO_ERROR; | |
1710 | if(ten.next(&length, status)!=NULL) { | |
1711 | errln("StringEnumeration.next(done)!=NULL"); | |
1712 | } | |
1713 | ||
1714 | // test the unext() default implementation | |
1715 | ten.reset(status); | |
1716 | for(i=0; i<LENGTHOF(testEnumStrings); ++i) { | |
1717 | status=U_ZERO_ERROR; | |
1718 | pu=ten.unext(&length, status); | |
1719 | s=UnicodeString(testEnumStrings[i], ""); | |
1720 | if(U_FAILURE(status) || pu==NULL || length!=s.length() || UnicodeString(TRUE, pu, length)!=s) { | |
1721 | errln("StringEnumeration.unext(%d) failed", i); | |
1722 | } | |
1723 | } | |
1724 | status=U_ZERO_ERROR; | |
1725 | if(ten.unext(&length, status)!=NULL) { | |
1726 | errln("StringEnumeration.unext(done)!=NULL"); | |
1727 | } | |
1728 | ||
1729 | // test that the default clone() implementation works, and returns NULL | |
1730 | if(ten.clone()!=NULL) { | |
1731 | errln("StringEnumeration.clone()!=NULL"); | |
1732 | } | |
1733 | ||
1734 | // test that uenum_openFromStringEnumeration() works | |
1735 | // Need a heap allocated string enumeration because it is adopted by the UEnumeration. | |
1736 | StringEnumeration *newTen = new TestEnumeration; | |
1737 | status=U_ZERO_ERROR; | |
1738 | UEnumeration *uten = uenum_openFromStringEnumeration(newTen, &status); | |
1739 | if (uten==NULL || U_FAILURE(status)) { | |
1740 | errln("fail at file %s, line %d, UErrorCode is %s\n", __FILE__, __LINE__, u_errorName(status)); | |
1741 | return; | |
1742 | } | |
1743 | ||
1744 | // test uenum_next() | |
1745 | for(i=0; i<LENGTHOF(testEnumStrings); ++i) { | |
1746 | status=U_ZERO_ERROR; | |
1747 | pc=uenum_next(uten, &length, &status); | |
1748 | if(U_FAILURE(status) || pc==NULL || strcmp(pc, testEnumStrings[i]) != 0) { | |
1749 | errln("File %s, line %d, StringEnumeration.next(%d) failed", __FILE__, __LINE__, i); | |
1750 | } | |
1751 | } | |
1752 | status=U_ZERO_ERROR; | |
1753 | if(uenum_next(uten, &length, &status)!=NULL) { | |
1754 | errln("File %s, line %d, uenum_next(done)!=NULL"); | |
1755 | } | |
1756 | ||
1757 | // test the uenum_unext() | |
1758 | uenum_reset(uten, &status); | |
1759 | for(i=0; i<LENGTHOF(testEnumStrings); ++i) { | |
1760 | status=U_ZERO_ERROR; | |
1761 | pu=uenum_unext(uten, &length, &status); | |
1762 | s=UnicodeString(testEnumStrings[i], ""); | |
1763 | if(U_FAILURE(status) || pu==NULL || length!=s.length() || UnicodeString(TRUE, pu, length)!=s) { | |
1764 | errln("File %s, Line %d, uenum_unext(%d) failed", __FILE__, __LINE__, i); | |
1765 | } | |
1766 | } | |
1767 | status=U_ZERO_ERROR; | |
1768 | if(uenum_unext(uten, &length, &status)!=NULL) { | |
1769 | errln("File %s, Line %d, uenum_unext(done)!=NULL" __FILE__, __LINE__); | |
1770 | } | |
1771 | ||
1772 | uenum_close(uten); | |
1773 | } | |
1774 | ||
1775 | /* | |
1776 | * Namespace test, to make sure that macros like UNICODE_STRING include the | |
1777 | * namespace qualifier. | |
1778 | * | |
1779 | * Define a (bogus) UnicodeString class in another namespace and check for ambiguity. | |
1780 | */ | |
1781 | namespace bogus { | |
1782 | class UnicodeString { | |
1783 | public: | |
1784 | enum EInvariant { kInvariant }; | |
1785 | UnicodeString() : i(1) {} | |
1786 | UnicodeString(UBool /*isTerminated*/, const UChar * /*text*/, int32_t textLength) : i(textLength) {} | |
1787 | UnicodeString(const char * /*src*/, int32_t length, enum EInvariant /*inv*/ | |
1788 | ) : i(length) {} | |
1789 | private: | |
1790 | int32_t i; | |
1791 | }; | |
1792 | } | |
1793 | ||
1794 | void | |
1795 | UnicodeStringTest::TestNameSpace() { | |
1796 | // Provoke name collision unless the UnicodeString macros properly | |
1797 | // qualify the icu::UnicodeString class. | |
1798 | using namespace bogus; | |
1799 | ||
1800 | // Use all UnicodeString macros from unistr.h. | |
1801 | icu::UnicodeString s1=icu::UnicodeString("abc", 3, US_INV); | |
1802 | icu::UnicodeString s2=UNICODE_STRING("def", 3); | |
1803 | icu::UnicodeString s3=UNICODE_STRING_SIMPLE("ghi"); | |
1804 | ||
1805 | // Make sure the compiler does not optimize away instantiation of s1, s2, s3. | |
1806 | icu::UnicodeString s4=s1+s2+s3; | |
1807 | if(s4.length()!=9) { | |
1808 | errln("Something wrong with UnicodeString::operator+()."); | |
1809 | } | |
1810 | } | |
1811 | ||
1812 | void | |
1813 | UnicodeStringTest::TestUTF32() { | |
1814 | // Input string length US_STACKBUF_SIZE to cause overflow of the | |
1815 | // initially chosen fStackBuffer due to supplementary characters. | |
1816 | static const UChar32 utf32[] = { | |
1817 | 0x41, 0xd900, 0x61, 0xdc00, -1, 0x110000, 0x5a, 0x50000, 0x7a, | |
1818 | 0x10000, 0x20000, 0xe0000, 0x10ffff | |
1819 | }; | |
1820 | static const UChar expected_utf16[] = { | |
1821 | 0x41, 0xfffd, 0x61, 0xfffd, 0xfffd, 0xfffd, 0x5a, 0xd900, 0xdc00, 0x7a, | |
1822 | 0xd800, 0xdc00, 0xd840, 0xdc00, 0xdb40, 0xdc00, 0xdbff, 0xdfff | |
1823 | }; | |
1824 | UnicodeString from32 = UnicodeString::fromUTF32(utf32, LENGTHOF(utf32)); | |
1825 | UnicodeString expected(FALSE, expected_utf16, LENGTHOF(expected_utf16)); | |
1826 | if(from32 != expected) { | |
1827 | errln("UnicodeString::fromUTF32() did not create the expected string."); | |
1828 | } | |
1829 | ||
1830 | static const UChar utf16[] = { | |
1831 | 0x41, 0xd900, 0x61, 0xdc00, 0x5a, 0xd900, 0xdc00, 0x7a, 0xd800, 0xdc00, 0xdbff, 0xdfff | |
1832 | }; | |
1833 | static const UChar32 expected_utf32[] = { | |
1834 | 0x41, 0xfffd, 0x61, 0xfffd, 0x5a, 0x50000, 0x7a, 0x10000, 0x10ffff | |
1835 | }; | |
1836 | UChar32 result32[16]; | |
1837 | UErrorCode errorCode = U_ZERO_ERROR; | |
1838 | int32_t length32 = | |
1839 | UnicodeString(FALSE, utf16, LENGTHOF(utf16)). | |
1840 | toUTF32(result32, LENGTHOF(result32), errorCode); | |
1841 | if( length32 != LENGTHOF(expected_utf32) || | |
1842 | 0 != uprv_memcmp(result32, expected_utf32, length32*4) || | |
1843 | result32[length32] != 0 | |
1844 | ) { | |
1845 | errln("UnicodeString::toUTF32() did not create the expected string."); | |
1846 | } | |
1847 | } | |
1848 | ||
1849 | class TestCheckedArrayByteSink : public CheckedArrayByteSink { | |
1850 | public: | |
1851 | TestCheckedArrayByteSink(char* outbuf, int32_t capacity) | |
1852 | : CheckedArrayByteSink(outbuf, capacity), calledFlush(FALSE) {} | |
1853 | virtual void Flush() { calledFlush = TRUE; } | |
1854 | UBool calledFlush; | |
1855 | }; | |
1856 | ||
1857 | void | |
1858 | UnicodeStringTest::TestUTF8() { | |
1859 | static const uint8_t utf8[] = { | |
1860 | // Code points: | |
1861 | // 0x41, 0xd900, | |
1862 | // 0x61, 0xdc00, | |
1863 | // 0x110000, 0x5a, | |
1864 | // 0x50000, 0x7a, | |
1865 | // 0x10000, 0x20000, | |
1866 | // 0xe0000, 0x10ffff | |
1867 | 0x41, 0xed, 0xa4, 0x80, | |
1868 | 0x61, 0xed, 0xb0, 0x80, | |
1869 | 0xf4, 0x90, 0x80, 0x80, 0x5a, | |
1870 | 0xf1, 0x90, 0x80, 0x80, 0x7a, | |
1871 | 0xf0, 0x90, 0x80, 0x80, 0xf0, 0xa0, 0x80, 0x80, | |
1872 | 0xf3, 0xa0, 0x80, 0x80, 0xf4, 0x8f, 0xbf, 0xbf | |
1873 | }; | |
1874 | static const UChar expected_utf16[] = { | |
1875 | 0x41, 0xfffd, | |
1876 | 0x61, 0xfffd, | |
1877 | 0xfffd, 0x5a, | |
1878 | 0xd900, 0xdc00, 0x7a, | |
1879 | 0xd800, 0xdc00, 0xd840, 0xdc00, | |
1880 | 0xdb40, 0xdc00, 0xdbff, 0xdfff | |
1881 | }; | |
1882 | UnicodeString from8 = UnicodeString::fromUTF8(StringPiece((const char *)utf8, (int32_t)sizeof(utf8))); | |
1883 | UnicodeString expected(FALSE, expected_utf16, LENGTHOF(expected_utf16)); | |
1884 | ||
1885 | if(from8 != expected) { | |
1886 | errln("UnicodeString::fromUTF8(StringPiece) did not create the expected string."); | |
1887 | } | |
1888 | #if U_HAVE_STD_STRING | |
1889 | std::string utf8_string((const char *)utf8, sizeof(utf8)); | |
1890 | UnicodeString from8b = UnicodeString::fromUTF8(utf8_string); | |
1891 | if(from8b != expected) { | |
1892 | errln("UnicodeString::fromUTF8(std::string) did not create the expected string."); | |
1893 | } | |
1894 | #endif | |
1895 | ||
1896 | static const UChar utf16[] = { | |
1897 | 0x41, 0xd900, 0x61, 0xdc00, 0x5a, 0xd900, 0xdc00, 0x7a, 0xd800, 0xdc00, 0xdbff, 0xdfff | |
1898 | }; | |
1899 | static const uint8_t expected_utf8[] = { | |
1900 | 0x41, 0xef, 0xbf, 0xbd, 0x61, 0xef, 0xbf, 0xbd, 0x5a, 0xf1, 0x90, 0x80, 0x80, 0x7a, | |
1901 | 0xf0, 0x90, 0x80, 0x80, 0xf4, 0x8f, 0xbf, 0xbf | |
1902 | }; | |
1903 | UnicodeString us(FALSE, utf16, LENGTHOF(utf16)); | |
1904 | ||
1905 | char buffer[64]; | |
1906 | TestCheckedArrayByteSink sink(buffer, (int32_t)sizeof(buffer)); | |
1907 | us.toUTF8(sink); | |
1908 | if( sink.NumberOfBytesWritten() != (int32_t)sizeof(expected_utf8) || | |
1909 | 0 != uprv_memcmp(buffer, expected_utf8, sizeof(expected_utf8)) | |
1910 | ) { | |
1911 | errln("UnicodeString::toUTF8() did not create the expected string."); | |
1912 | } | |
1913 | if(!sink.calledFlush) { | |
1914 | errln("UnicodeString::toUTF8(sink) did not sink.Flush()."); | |
1915 | } | |
1916 | #if U_HAVE_STD_STRING | |
1917 | // Initial contents for testing that toUTF8String() appends. | |
1918 | std::string result8 = "-->"; | |
1919 | std::string expected8 = "-->" + std::string((const char *)expected_utf8, sizeof(expected_utf8)); | |
1920 | // Use the return value just for testing. | |
1921 | std::string &result8r = us.toUTF8String(result8); | |
1922 | if(result8r != expected8 || &result8r != &result8) { | |
1923 | errln("UnicodeString::toUTF8String() did not create the expected string."); | |
1924 | } | |
1925 | #endif | |
1926 | } | |
1927 | ||
1928 | // Test if this compiler supports Return Value Optimization of unnamed temporary objects. | |
1929 | static UnicodeString wrapUChars(const UChar *uchars) { | |
1930 | return UnicodeString(TRUE, uchars, -1); | |
1931 | } | |
1932 | ||
1933 | void | |
1934 | UnicodeStringTest::TestReadOnlyAlias() { | |
1935 | UChar uchars[]={ 0x61, 0x62, 0 }; | |
1936 | UnicodeString alias(TRUE, uchars, 2); | |
1937 | if(alias.length()!=2 || alias.getBuffer()!=uchars || alias.getTerminatedBuffer()!=uchars) { | |
1938 | errln("UnicodeString read-only-aliasing constructor does not behave as expected."); | |
1939 | return; | |
1940 | } | |
1941 | alias.truncate(1); | |
1942 | if(alias.length()!=1 || alias.getBuffer()!=uchars) { | |
1943 | errln("UnicodeString(read-only-alias).truncate() did not preserve aliasing as expected."); | |
1944 | } | |
1945 | if(alias.getTerminatedBuffer()==uchars) { | |
1946 | errln("UnicodeString(read-only-alias).truncate().getTerminatedBuffer() " | |
1947 | "did not allocate and copy as expected."); | |
1948 | } | |
1949 | if(uchars[1]!=0x62) { | |
1950 | errln("UnicodeString(read-only-alias).truncate().getTerminatedBuffer() " | |
1951 | "modified the original buffer."); | |
1952 | } | |
1953 | if(1!=u_strlen(alias.getTerminatedBuffer())) { | |
1954 | errln("UnicodeString(read-only-alias).truncate().getTerminatedBuffer() " | |
1955 | "does not return a buffer terminated at the proper length."); | |
1956 | } | |
1957 | ||
1958 | alias.setTo(TRUE, uchars, 2); | |
1959 | if(alias.length()!=2 || alias.getBuffer()!=uchars || alias.getTerminatedBuffer()!=uchars) { | |
1960 | errln("UnicodeString read-only-aliasing setTo() does not behave as expected."); | |
1961 | return; | |
1962 | } | |
1963 | alias.remove(); | |
1964 | if(alias.length()!=0) { | |
1965 | errln("UnicodeString(read-only-alias).remove() did not work."); | |
1966 | } | |
1967 | if(alias.getTerminatedBuffer()==uchars) { | |
1968 | errln("UnicodeString(read-only-alias).remove().getTerminatedBuffer() " | |
1969 | "did not un-alias as expected."); | |
1970 | } | |
1971 | if(uchars[0]!=0x61) { | |
1972 | errln("UnicodeString(read-only-alias).remove().getTerminatedBuffer() " | |
1973 | "modified the original buffer."); | |
1974 | } | |
1975 | if(0!=u_strlen(alias.getTerminatedBuffer())) { | |
1976 | errln("UnicodeString.setTo(read-only-alias).remove().getTerminatedBuffer() " | |
1977 | "does not return a buffer terminated at length 0."); | |
1978 | } | |
1979 | ||
1980 | UnicodeString longString=UNICODE_STRING_SIMPLE("abcdefghijklmnopqrstuvwxyz0123456789"); | |
1981 | alias.setTo(FALSE, longString.getBuffer(), longString.length()); | |
1982 | alias.remove(0, 10); | |
1983 | if(longString.compare(10, INT32_MAX, alias)!=0 || alias.getBuffer()!=longString.getBuffer()+10) { | |
1984 | errln("UnicodeString.setTo(read-only-alias).remove(0, 10) did not preserve aliasing as expected."); | |
1985 | } | |
1986 | alias.setTo(FALSE, longString.getBuffer(), longString.length()); | |
1987 | alias.remove(27, 99); | |
1988 | if(longString.compare(0, 27, alias)!=0 || alias.getBuffer()!=longString.getBuffer()) { | |
1989 | errln("UnicodeString.setTo(read-only-alias).remove(27, 99) did not preserve aliasing as expected."); | |
1990 | } | |
1991 | alias.setTo(FALSE, longString.getBuffer(), longString.length()); | |
1992 | alias.retainBetween(6, 30); | |
1993 | if(longString.compare(6, 24, alias)!=0 || alias.getBuffer()!=longString.getBuffer()+6) { | |
1994 | errln("UnicodeString.setTo(read-only-alias).retainBetween(6, 30) did not preserve aliasing as expected."); | |
1995 | } | |
1996 | ||
1997 | UChar abc[]={ 0x61, 0x62, 0x63, 0 }; | |
1998 | UBool hasRVO= wrapUChars(abc).getBuffer()==abc; | |
1999 | ||
2000 | UnicodeString temp; | |
2001 | temp.fastCopyFrom(longString.tempSubString()); | |
2002 | if(temp!=longString || (hasRVO && temp.getBuffer()!=longString.getBuffer())) { | |
2003 | errln("UnicodeString.tempSubString() failed"); | |
2004 | } | |
2005 | temp.fastCopyFrom(longString.tempSubString(-3, 5)); | |
2006 | if(longString.compare(0, 5, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer())) { | |
2007 | errln("UnicodeString.tempSubString(-3, 5) failed"); | |
2008 | } | |
2009 | temp.fastCopyFrom(longString.tempSubString(17)); | |
2010 | if(longString.compare(17, INT32_MAX, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer()+17)) { | |
2011 | errln("UnicodeString.tempSubString(17) failed"); | |
2012 | } | |
2013 | temp.fastCopyFrom(longString.tempSubString(99)); | |
2014 | if(!temp.isEmpty()) { | |
2015 | errln("UnicodeString.tempSubString(99) failed"); | |
2016 | } | |
2017 | temp.fastCopyFrom(longString.tempSubStringBetween(6)); | |
2018 | if(longString.compare(6, INT32_MAX, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer()+6)) { | |
2019 | errln("UnicodeString.tempSubStringBetween(6) failed"); | |
2020 | } | |
2021 | temp.fastCopyFrom(longString.tempSubStringBetween(8, 18)); | |
2022 | if(longString.compare(8, 10, temp)!=0 || (hasRVO && temp.getBuffer()!=longString.getBuffer()+8)) { | |
2023 | errln("UnicodeString.tempSubStringBetween(8, 18) failed"); | |
2024 | } | |
2025 | UnicodeString bogusString; | |
2026 | bogusString.setToBogus(); | |
2027 | temp.fastCopyFrom(bogusString.tempSubStringBetween(8, 18)); | |
2028 | if(!temp.isBogus()) { | |
2029 | errln("UnicodeString.setToBogus().tempSubStringBetween(8, 18) failed"); | |
2030 | } | |
2031 | } | |
2032 | ||
2033 | void | |
2034 | UnicodeStringTest::doTestAppendable(UnicodeString &dest, Appendable &app) { | |
2035 | static const UChar cde[3]={ 0x63, 0x64, 0x65 }; | |
2036 | static const UChar fg[3]={ 0x66, 0x67, 0 }; | |
2037 | if(!app.reserveAppendCapacity(12)) { | |
2038 | errln("Appendable.reserve(12) failed"); | |
2039 | } | |
2040 | app.appendCodeUnit(0x61); | |
2041 | app.appendCodePoint(0x62); | |
2042 | app.appendCodePoint(0x50000); | |
2043 | app.appendString(cde, 3); | |
2044 | app.appendString(fg, -1); | |
2045 | UChar scratch[3]; | |
2046 | int32_t capacity=-1; | |
2047 | UChar *buffer=app.getAppendBuffer(3, 3, scratch, 3, &capacity); | |
2048 | if(capacity<3) { | |
2049 | errln("Appendable.getAppendBuffer(min=3) returned capacity=%d<3", (int)capacity); | |
2050 | return; | |
2051 | } | |
2052 | static const UChar hij[3]={ 0x68, 0x69, 0x6a }; | |
2053 | u_memcpy(buffer, hij, 3); | |
2054 | app.appendString(buffer, 3); | |
2055 | if(dest!=UNICODE_STRING_SIMPLE("ab\\U00050000cdefghij").unescape()) { | |
2056 | errln("Appendable.append(...) failed"); | |
2057 | } | |
2058 | buffer=app.getAppendBuffer(0, 3, scratch, 3, &capacity); | |
2059 | if(buffer!=NULL || capacity!=0) { | |
2060 | errln("Appendable.getAppendBuffer(min=0) failed"); | |
2061 | } | |
2062 | capacity=1; | |
2063 | buffer=app.getAppendBuffer(3, 3, scratch, 2, &capacity); | |
2064 | if(buffer!=NULL || capacity!=0) { | |
2065 | errln("Appendable.getAppendBuffer(scratch<min) failed"); | |
2066 | } | |
2067 | } | |
2068 | ||
2069 | class SimpleAppendable : public Appendable { | |
2070 | public: | |
2071 | explicit SimpleAppendable(UnicodeString &dest) : str(dest) {} | |
2072 | virtual UBool appendCodeUnit(UChar c) { str.append(c); return TRUE; } | |
2073 | SimpleAppendable &reset() { str.remove(); return *this; } | |
2074 | private: | |
2075 | UnicodeString &str; | |
2076 | }; | |
2077 | ||
2078 | void | |
2079 | UnicodeStringTest::TestAppendable() { | |
2080 | UnicodeString dest; | |
2081 | SimpleAppendable app(dest); | |
2082 | doTestAppendable(dest, app); | |
2083 | } | |
2084 | ||
2085 | void | |
2086 | UnicodeStringTest::TestUnicodeStringImplementsAppendable() { | |
2087 | UnicodeString dest; | |
2088 | UnicodeStringAppendable app(dest); | |
2089 | doTestAppendable(dest, app); | |
2090 | } | |
2091 | ||
2092 | void | |
2093 | UnicodeStringTest::TestSizeofUnicodeString() { | |
2094 | // See the comments in unistr.h near the declaration of UnicodeString's fields. | |
2095 | size_t sizeofUniStr=sizeof(UnicodeString); | |
2096 | size_t expected; | |
2097 | switch(sizeof(void *)) { | |
2098 | case 4: | |
2099 | expected=32; | |
2100 | break; | |
2101 | case 8: | |
2102 | expected=40; | |
2103 | break; | |
2104 | default: | |
2105 | logln("This platform has neither 32-bit nor 64-bit pointers."); | |
2106 | return; | |
2107 | } | |
2108 | if(expected!=sizeofUniStr) { | |
2109 | errln("sizeof(UnicodeString)=%d, expected %d", (int)sizeofUniStr, (int)expected); | |
2110 | } | |
2111 | } |