]>
Commit | Line | Data |
---|---|---|
b75a7d8f A |
1 | /******************************************************************** |
2 | * COPYRIGHT: | |
2ca993e8 | 3 | * Copyright (c) 1997-2016, International Business Machines Corporation and |
b75a7d8f A |
4 | * others. All Rights Reserved. |
5 | ********************************************************************/ | |
6 | //=============================================================================== | |
7 | // | |
57a6839d | 8 | // File apicoll.cpp |
b75a7d8f A |
9 | // |
10 | // | |
11 | // | |
12 | // Created by: Helena Shih | |
13 | // | |
14 | // Modification History: | |
15 | // | |
16 | // Date Name Description | |
17 | // 2/5/97 aliu Added streamIn and streamOut methods. Added | |
18 | // constructor which reads RuleBasedCollator object from | |
19 | // a binary file. Added writeToFile method which streams | |
20 | // RuleBasedCollator out to a binary file. The streamIn | |
21 | // and streamOut methods use istream and ostream objects | |
22 | // in binary mode. | |
23 | // 6/30/97 helena Added tests for CollationElementIterator::setText, getOffset | |
24 | // setOffset and DecompositionIterator::getOffset, setOffset. | |
25 | // DecompositionIterator is made public so add class scope | |
26 | // testing. | |
27 | // 02/10/98 damiba Added test for compare(UnicodeString&, UnicodeString&, int32_t) | |
28 | //=============================================================================== | |
29 | ||
30 | #include "unicode/utypes.h" | |
31 | ||
32 | #if !UCONFIG_NO_COLLATION | |
33 | ||
729e4ab9 | 34 | #include "unicode/localpointer.h" |
b75a7d8f A |
35 | #include "unicode/coll.h" |
36 | #include "unicode/tblcoll.h" | |
37 | #include "unicode/coleitr.h" | |
38 | #include "unicode/sortkey.h" | |
39 | #include "apicoll.h" | |
40 | #include "unicode/chariter.h" | |
41 | #include "unicode/schriter.h" | |
42 | #include "unicode/ustring.h" | |
73c04bcf | 43 | #include "unicode/ucol.h" |
b75a7d8f A |
44 | |
45 | #include "sfwdchit.h" | |
46 | #include "cmemory.h" | |
73c04bcf | 47 | #include <stdlib.h> |
b75a7d8f A |
48 | |
49 | void | |
50 | CollationAPITest::doAssert(UBool condition, const char *message) | |
51 | { | |
52 | if (!condition) { | |
53 | errln(UnicodeString("ERROR : ") + message); | |
54 | } | |
55 | } | |
56 | ||
b75a7d8f A |
57 | // Collator Class Properties |
58 | // ctor, dtor, createInstance, compare, getStrength/setStrength | |
59 | // getDecomposition/setDecomposition, getDisplayName | |
60 | void | |
61 | CollationAPITest::TestProperty(/* char* par */) | |
62 | { | |
63 | UErrorCode success = U_ZERO_ERROR; | |
64 | Collator *col = 0; | |
65 | /* | |
729e4ab9 A |
66 | * Expected version of the English collator. |
67 | * Currently, the major/minor version numbers change when the builder code | |
68 | * changes, | |
69 | * number 2 is from the tailoring data version and | |
70 | * number 3 is the UCA version. | |
71 | * This changes with every UCA version change, and the expected value | |
72 | * needs to be adjusted. | |
73 | * Same in cintltst/capitst.c. | |
74 | */ | |
75 | UVersionInfo currVersionArray = {0x31, 0xC0, 0x05, 0x2A}; // from ICU 4.4/UCA 5.2 | |
b75a7d8f | 76 | UVersionInfo versionArray; |
b75a7d8f A |
77 | |
78 | logln("The property tests begin : "); | |
79 | logln("Test ctors : "); | |
80 | col = Collator::createInstance(Locale::getEnglish(), success); | |
729e4ab9 A |
81 | if (U_FAILURE(success)){ |
82 | errcheckln(success, "Default Collator creation failed. - %s", u_errorName(success)); | |
83 | return; | |
84 | } | |
b75a7d8f | 85 | |
729e4ab9 A |
86 | StringEnumeration* kwEnum = col->getKeywordValuesForLocale("", Locale::getEnglish(),true,success); |
87 | if (U_FAILURE(success)){ | |
88 | errcheckln(success, "Get Keyword Values for Locale failed. - %s", u_errorName(success)); | |
b75a7d8f A |
89 | return; |
90 | } | |
729e4ab9 | 91 | delete kwEnum; |
b75a7d8f A |
92 | |
93 | col->getVersion(versionArray); | |
729e4ab9 A |
94 | // Check for a version greater than some value rather than equality |
95 | // so that we need not update the expected version each time. | |
96 | if (uprv_memcmp(versionArray, currVersionArray, 4)<0) { | |
97 | errln("Testing Collator::getVersion() - unexpected result: %02x.%02x.%02x.%02x", | |
98 | versionArray[0], versionArray[1], versionArray[2], versionArray[3]); | |
99 | } else { | |
100 | logln("Collator::getVersion() result: %02x.%02x.%02x.%02x", | |
b75a7d8f | 101 | versionArray[0], versionArray[1], versionArray[2], versionArray[3]); |
b75a7d8f A |
102 | } |
103 | ||
104 | doAssert((col->compare("ab", "abc") == Collator::LESS), "ab < abc comparison failed"); | |
105 | doAssert((col->compare("ab", "AB") == Collator::LESS), "ab < AB comparison failed"); | |
106 | doAssert((col->compare("blackbird", "black-bird") == Collator::GREATER), "black-bird > blackbird comparison failed"); | |
107 | doAssert((col->compare("black bird", "black-bird") == Collator::LESS), "black bird > black-bird comparison failed"); | |
108 | doAssert((col->compare("Hello", "hello") == Collator::GREATER), "Hello > hello comparison failed"); | |
729e4ab9 | 109 | doAssert((col->compare("","",success) == UCOL_EQUAL), "Comparison between empty strings failed"); |
b75a7d8f | 110 | |
729e4ab9 A |
111 | doAssert((col->compareUTF8("\x61\x62\xc3\xa4", "\x61\x62\xc3\x9f", success) == UCOL_LESS), "ab a-umlaut < ab sharp-s UTF-8 comparison failed"); |
112 | success = U_ZERO_ERROR; | |
113 | { | |
114 | UnicodeString abau=UNICODE_STRING_SIMPLE("\\x61\\x62\\xe4").unescape(); | |
115 | UnicodeString abss=UNICODE_STRING_SIMPLE("\\x61\\x62\\xdf").unescape(); | |
116 | UCharIterator abauIter, abssIter; | |
117 | uiter_setReplaceable(&abauIter, &abau); | |
118 | uiter_setReplaceable(&abssIter, &abss); | |
119 | doAssert((col->compare(abauIter, abssIter, success) == UCOL_LESS), "ab a-umlaut < ab sharp-s UCharIterator comparison failed"); | |
120 | success = U_ZERO_ERROR; | |
121 | } | |
b75a7d8f A |
122 | |
123 | /*start of update [Bertrand A. D. 02/10/98]*/ | |
124 | doAssert((col->compare("ab", "abc", 2) == Collator::EQUAL), "ab = abc with length 2 comparison failed"); | |
125 | doAssert((col->compare("ab", "AB", 2) == Collator::LESS), "ab < AB with length 2 comparison failed"); | |
126 | doAssert((col->compare("ab", "Aa", 1) == Collator::LESS), "ab < Aa with length 1 comparison failed"); | |
127 | doAssert((col->compare("ab", "Aa", 2) == Collator::GREATER), "ab > Aa with length 2 comparison failed"); | |
128 | doAssert((col->compare("black-bird", "blackbird", 5) == Collator::EQUAL), "black-bird = blackbird with length of 5 comparison failed"); | |
129 | doAssert((col->compare("black bird", "black-bird", 10) == Collator::LESS), "black bird < black-bird with length 10 comparison failed"); | |
130 | doAssert((col->compare("Hello", "hello", 5) == Collator::GREATER), "Hello > hello with length 5 comparison failed"); | |
131 | /*end of update [Bertrand A. D. 02/10/98]*/ | |
132 | ||
133 | ||
134 | logln("Test ctors ends."); | |
135 | logln("testing Collator::getStrength() method ..."); | |
136 | doAssert((col->getStrength() == Collator::TERTIARY), "collation object has the wrong strength"); | |
137 | doAssert((col->getStrength() != Collator::PRIMARY), "collation object's strength is primary difference"); | |
138 | ||
139 | ||
140 | logln("testing Collator::setStrength() method ..."); | |
141 | col->setStrength(Collator::SECONDARY); | |
142 | doAssert((col->getStrength() != Collator::TERTIARY), "collation object's strength is secondary difference"); | |
143 | doAssert((col->getStrength() != Collator::PRIMARY), "collation object's strength is primary difference"); | |
144 | doAssert((col->getStrength() == Collator::SECONDARY), "collation object has the wrong strength"); | |
145 | ||
146 | UnicodeString name; | |
147 | ||
148 | logln("Get display name for the US English collation in German : "); | |
149 | logln(Collator::getDisplayName(Locale::getUS(), Locale::getGerman(), name)); | |
150 | doAssert((name == UnicodeString("Englisch (Vereinigte Staaten)")), "getDisplayName failed"); | |
151 | ||
152 | logln("Get display name for the US English collation in English : "); | |
153 | logln(Collator::getDisplayName(Locale::getUS(), Locale::getEnglish(), name)); | |
154 | doAssert((name == UnicodeString("English (United States)")), "getDisplayName failed"); | |
155 | #if 0 | |
156 | // weiv : this test is bogus if we're running on any machine that has different default locale than English. | |
157 | // Therefore, it is banned! | |
158 | logln("Get display name for the US English in default locale language : "); | |
159 | logln(Collator::getDisplayName(Locale::US, name)); | |
160 | doAssert((name == UnicodeString("English (United States)")), "getDisplayName failed if this is an English machine"); | |
161 | #endif | |
162 | delete col; col = 0; | |
163 | RuleBasedCollator *rcol = (RuleBasedCollator *)Collator::createInstance("da_DK", | |
164 | success); | |
b331163b A |
165 | if (U_FAILURE(success)) { |
166 | errcheckln(success, "Collator::createInstance(\"da_DK\") failed - %s", u_errorName(success)); | |
167 | return; | |
168 | } | |
169 | const UnicodeString &daRules = rcol->getRules(); | |
170 | if(daRules.isEmpty()) { | |
171 | dataerrln("missing da_DK tailoring rule string"); | |
172 | } else { | |
173 | doAssert(daRules.indexOf("aa") >= 0, "da_DK rules do not contain 'aa'"); | |
174 | } | |
b75a7d8f A |
175 | delete rcol; |
176 | ||
177 | col = Collator::createInstance(Locale::getFrench(), success); | |
178 | if (U_FAILURE(success)) | |
179 | { | |
180 | errln("Creating French collation failed."); | |
181 | return; | |
182 | } | |
183 | ||
184 | col->setStrength(Collator::PRIMARY); | |
185 | logln("testing Collator::getStrength() method again ..."); | |
186 | doAssert((col->getStrength() != Collator::TERTIARY), "collation object has the wrong strength"); | |
187 | doAssert((col->getStrength() == Collator::PRIMARY), "collation object's strength is not primary difference"); | |
188 | ||
189 | logln("testing French Collator::setStrength() method ..."); | |
190 | col->setStrength(Collator::TERTIARY); | |
191 | doAssert((col->getStrength() == Collator::TERTIARY), "collation object's strength is not tertiary difference"); | |
192 | doAssert((col->getStrength() != Collator::PRIMARY), "collation object's strength is primary difference"); | |
193 | doAssert((col->getStrength() != Collator::SECONDARY), "collation object's strength is secondary difference"); | |
b331163b | 194 | delete col; |
b75a7d8f A |
195 | |
196 | logln("Create junk collation: "); | |
197 | Locale abcd("ab", "CD", ""); | |
198 | success = U_ZERO_ERROR; | |
199 | Collator *junk = 0; | |
200 | junk = Collator::createInstance(abcd, success); | |
201 | ||
202 | if (U_FAILURE(success)) | |
203 | { | |
204 | errln("Junk collation creation failed, should at least return default."); | |
b75a7d8f A |
205 | return; |
206 | } | |
207 | ||
b331163b A |
208 | doAssert(((RuleBasedCollator *)junk)->getRules().isEmpty(), |
209 | "The root collation should be returned for an unsupported language."); | |
729e4ab9 | 210 | Collator *frCol = Collator::createInstance(Locale::getCanadaFrench(), success); |
b75a7d8f A |
211 | if (U_FAILURE(success)) |
212 | { | |
729e4ab9 | 213 | errln("Creating fr_CA collator failed."); |
46f4442e | 214 | delete junk; |
b75a7d8f A |
215 | return; |
216 | } | |
217 | ||
46f4442e A |
218 | // If the default locale isn't French, the French and non-French collators |
219 | // should be different | |
729e4ab9 A |
220 | if (frCol->getLocale(ULOC_ACTUAL_LOCALE, success) != Locale::getCanadaFrench()) { |
221 | doAssert((*frCol != *junk), "The junk is the same as the fr_CA collator."); | |
46f4442e | 222 | } |
b75a7d8f | 223 | Collator *aFrCol = frCol->clone(); |
729e4ab9 | 224 | doAssert((*frCol == *aFrCol), "The cloning of a fr_CA collator failed."); |
b75a7d8f A |
225 | logln("Collator property test ended."); |
226 | ||
b75a7d8f A |
227 | delete frCol; |
228 | delete aFrCol; | |
229 | delete junk; | |
b75a7d8f A |
230 | } |
231 | ||
232 | void | |
233 | CollationAPITest::TestRuleBasedColl() | |
234 | { | |
235 | RuleBasedCollator *col1, *col2, *col3, *col4; | |
236 | UErrorCode status = U_ZERO_ERROR; | |
237 | ||
238 | UnicodeString ruleset1("&9 < a, A < b, B < c, C; ch, cH, Ch, CH < d, D, e, E"); | |
239 | UnicodeString ruleset2("&9 < a, A < b, B < c, C < d, D, e, E"); | |
240 | ||
241 | col1 = new RuleBasedCollator(ruleset1, status); | |
242 | if (U_FAILURE(status)) { | |
729e4ab9 | 243 | errcheckln(status, "RuleBased Collator creation failed. - %s", u_errorName(status)); |
b75a7d8f A |
244 | return; |
245 | } | |
246 | else { | |
247 | logln("PASS: RuleBased Collator creation passed\n"); | |
248 | } | |
249 | ||
250 | status = U_ZERO_ERROR; | |
251 | col2 = new RuleBasedCollator(ruleset2, status); | |
252 | if (U_FAILURE(status)) { | |
253 | errln("RuleBased Collator creation failed.\n"); | |
254 | return; | |
255 | } | |
256 | else { | |
257 | logln("PASS: RuleBased Collator creation passed\n"); | |
258 | } | |
259 | ||
260 | status = U_ZERO_ERROR; | |
261 | Locale locale("aa", "AA"); | |
262 | col3 = (RuleBasedCollator *)Collator::createInstance(locale, status); | |
263 | if (U_FAILURE(status)) { | |
264 | errln("Fallback Collator creation failed.: %s\n"); | |
265 | return; | |
266 | } | |
267 | else { | |
268 | logln("PASS: Fallback Collator creation passed\n"); | |
269 | } | |
270 | delete col3; | |
271 | ||
272 | status = U_ZERO_ERROR; | |
273 | col3 = (RuleBasedCollator *)Collator::createInstance(status); | |
274 | if (U_FAILURE(status)) { | |
275 | errln("Default Collator creation failed.: %s\n"); | |
276 | return; | |
277 | } | |
278 | else { | |
279 | logln("PASS: Default Collator creation passed\n"); | |
280 | } | |
281 | ||
282 | UnicodeString rule1 = col1->getRules(); | |
283 | UnicodeString rule2 = col2->getRules(); | |
284 | UnicodeString rule3 = col3->getRules(); | |
285 | ||
286 | doAssert(rule1 != rule2, "Default collator getRules failed"); | |
287 | doAssert(rule2 != rule3, "Default collator getRules failed"); | |
288 | doAssert(rule1 != rule3, "Default collator getRules failed"); | |
289 | ||
290 | col4 = new RuleBasedCollator(rule2, status); | |
291 | if (U_FAILURE(status)) { | |
292 | errln("RuleBased Collator creation failed.\n"); | |
293 | return; | |
294 | } | |
295 | ||
296 | UnicodeString rule4 = col4->getRules(); | |
297 | doAssert(rule2 == rule4, "Default collator getRules failed"); | |
298 | int32_t length4 = 0; | |
299 | uint8_t *clonedrule4 = col4->cloneRuleData(length4, status); | |
300 | if (U_FAILURE(status)) { | |
301 | errln("Cloned rule data failed.\n"); | |
302 | return; | |
303 | } | |
304 | ||
305 | // free(clonedrule4); BAD API!!!! | |
306 | uprv_free(clonedrule4); | |
307 | ||
308 | ||
309 | delete col1; | |
310 | delete col2; | |
311 | delete col3; | |
312 | delete col4; | |
313 | } | |
314 | ||
315 | void | |
316 | CollationAPITest::TestRules() | |
317 | { | |
318 | RuleBasedCollator *coll; | |
319 | UErrorCode status = U_ZERO_ERROR; | |
320 | UnicodeString rules; | |
321 | ||
322 | coll = (RuleBasedCollator *)Collator::createInstance(Locale::getEnglish(), status); | |
323 | if (U_FAILURE(status)) { | |
729e4ab9 | 324 | errcheckln(status, "English Collator creation failed. - %s", u_errorName(status)); |
b75a7d8f A |
325 | return; |
326 | } | |
327 | else { | |
328 | logln("PASS: RuleBased Collator creation passed\n"); | |
329 | } | |
330 | ||
331 | coll->getRules(UCOL_TAILORING_ONLY, rules); | |
729e4ab9 A |
332 | if (rules.length() != 0x00) { |
333 | errln("English tailored rules failed - length is 0x%x expected 0x%x", rules.length(), 0x00); | |
b75a7d8f A |
334 | } |
335 | ||
336 | coll->getRules(UCOL_FULL_RULES, rules); | |
337 | if (rules.length() < 0) { | |
338 | errln("English full rules failed"); | |
339 | } | |
340 | delete coll; | |
341 | } | |
342 | ||
343 | void | |
344 | CollationAPITest::TestDecomposition() { | |
345 | UErrorCode status = U_ZERO_ERROR; | |
346 | Collator *en_US = Collator::createInstance("en_US", status), | |
347 | *el_GR = Collator::createInstance("el_GR", status), | |
348 | *vi_VN = Collator::createInstance("vi_VN", status); | |
349 | ||
350 | if (U_FAILURE(status)) { | |
729e4ab9 | 351 | errcheckln(status, "ERROR: collation creation failed. - %s", u_errorName(status)); |
b75a7d8f A |
352 | return; |
353 | } | |
354 | ||
355 | /* there is no reason to have canonical decomposition in en_US OR default locale */ | |
356 | if (vi_VN->getAttribute(UCOL_NORMALIZATION_MODE, status) != UCOL_ON) | |
357 | { | |
374ca955 | 358 | errln("ERROR: vi_VN collation did not have canonical decomposition for normalization!\n"); |
b75a7d8f A |
359 | } |
360 | ||
361 | if (el_GR->getAttribute(UCOL_NORMALIZATION_MODE, status) != UCOL_ON) | |
362 | { | |
374ca955 | 363 | errln("ERROR: el_GR collation did not have canonical decomposition for normalization!\n"); |
b75a7d8f A |
364 | } |
365 | ||
366 | if (en_US->getAttribute(UCOL_NORMALIZATION_MODE, status) != UCOL_OFF) | |
367 | { | |
374ca955 | 368 | errln("ERROR: en_US collation had canonical decomposition for normalization!\n"); |
b75a7d8f A |
369 | } |
370 | ||
371 | delete en_US; | |
372 | delete el_GR; | |
373 | delete vi_VN; | |
374 | } | |
375 | ||
376 | void | |
377 | CollationAPITest::TestSafeClone() { | |
378 | static const int CLONETEST_COLLATOR_COUNT = 3; | |
379 | Collator *someCollators [CLONETEST_COLLATOR_COUNT]; | |
380 | Collator *col; | |
381 | UErrorCode err = U_ZERO_ERROR; | |
382 | int index; | |
383 | ||
384 | UnicodeString test1("abCda"); | |
385 | UnicodeString test2("abcda"); | |
386 | ||
387 | /* one default collator & two complex ones */ | |
388 | someCollators[0] = Collator::createInstance("en_US", err); | |
389 | someCollators[1] = Collator::createInstance("ko", err); | |
390 | someCollators[2] = Collator::createInstance("ja_JP", err); | |
391 | if(U_FAILURE(err)) { | |
729e4ab9 | 392 | errcheckln(err, "Couldn't instantiate collators. Error: %s", u_errorName(err)); |
b75a7d8f A |
393 | delete someCollators[0]; |
394 | delete someCollators[1]; | |
395 | delete someCollators[2]; | |
396 | return; | |
397 | } | |
398 | ||
399 | /* change orig & clone & make sure they are independent */ | |
400 | ||
401 | for (index = 0; index < CLONETEST_COLLATOR_COUNT; index++) | |
402 | { | |
403 | col = someCollators[index]->safeClone(); | |
404 | if (col == 0) { | |
405 | errln("SafeClone of collator should not return null\n"); | |
406 | break; | |
407 | } | |
408 | col->setStrength(Collator::TERTIARY); | |
409 | someCollators[index]->setStrength(Collator::PRIMARY); | |
410 | col->setAttribute(UCOL_CASE_LEVEL, UCOL_OFF, err); | |
411 | someCollators[index]->setAttribute(UCOL_CASE_LEVEL, UCOL_OFF, err); | |
412 | ||
413 | doAssert(col->greater(test1, test2), "Result should be \"abCda\" >>> \"abcda\" "); | |
414 | doAssert(someCollators[index]->equals(test1, test2), "Result should be \"abcda\" == \"abCda\""); | |
415 | delete col; | |
416 | delete someCollators[index]; | |
417 | } | |
418 | } | |
419 | ||
420 | void | |
421 | CollationAPITest::TestHashCode(/* char* par */) | |
422 | { | |
423 | logln("hashCode tests begin."); | |
424 | UErrorCode success = U_ZERO_ERROR; | |
425 | Collator *col1 = 0; | |
426 | col1 = Collator::createInstance(Locale::getEnglish(), success); | |
427 | if (U_FAILURE(success)) | |
428 | { | |
729e4ab9 | 429 | errcheckln(success, "Default collation creation failed. - %s", u_errorName(success)); |
b75a7d8f A |
430 | return; |
431 | } | |
432 | ||
433 | Collator *col2 = 0; | |
434 | Locale dk("da", "DK", ""); | |
435 | col2 = Collator::createInstance(dk, success); | |
436 | if (U_FAILURE(success)) | |
437 | { | |
438 | errln("Danish collation creation failed."); | |
439 | return; | |
440 | } | |
441 | ||
442 | Collator *col3 = 0; | |
443 | col3 = Collator::createInstance(Locale::getEnglish(), success); | |
444 | if (U_FAILURE(success)) | |
445 | { | |
446 | errln("2nd default collation creation failed."); | |
447 | return; | |
448 | } | |
449 | ||
450 | logln("Collator::hashCode() testing ..."); | |
451 | ||
452 | doAssert(col1->hashCode() != col2->hashCode(), "Hash test1 result incorrect" ); | |
453 | doAssert(!(col1->hashCode() == col2->hashCode()), "Hash test2 result incorrect" ); | |
454 | doAssert(col1->hashCode() == col3->hashCode(), "Hash result not equal" ); | |
455 | ||
456 | logln("hashCode tests end."); | |
457 | delete col1; | |
458 | delete col2; | |
459 | ||
460 | UnicodeString test1("Abcda"); | |
461 | UnicodeString test2("abcda"); | |
462 | ||
463 | CollationKey sortk1, sortk2, sortk3; | |
464 | UErrorCode status = U_ZERO_ERROR; | |
465 | ||
466 | col3->getCollationKey(test1, sortk1, status); | |
467 | col3->getCollationKey(test2, sortk2, status); | |
468 | col3->getCollationKey(test2, sortk3, status); | |
469 | ||
470 | doAssert(sortk1.hashCode() != sortk2.hashCode(), "Hash test1 result incorrect"); | |
471 | doAssert(sortk2.hashCode() == sortk3.hashCode(), "Hash result not equal" ); | |
472 | ||
473 | delete col3; | |
474 | } | |
475 | ||
476 | //---------------------------------------------------------------------------- | |
477 | // CollationKey -- Tests the CollationKey methods | |
478 | // | |
479 | void | |
480 | CollationAPITest::TestCollationKey(/* char* par */) | |
481 | { | |
482 | logln("testing CollationKey begins..."); | |
483 | Collator *col = 0; | |
484 | UErrorCode success=U_ZERO_ERROR; | |
485 | col = Collator::createInstance(Locale::getEnglish(), success); | |
486 | if (U_FAILURE(success)) | |
487 | { | |
729e4ab9 | 488 | errcheckln(success, "Default collation creation failed. - %s", u_errorName(success)); |
b75a7d8f A |
489 | return; |
490 | } | |
491 | col->setStrength(Collator::TERTIARY); | |
492 | ||
493 | CollationKey sortk1, sortk2; | |
494 | UnicodeString test1("Abcda"), test2("abcda"); | |
495 | UErrorCode key1Status = U_ZERO_ERROR, key2Status = U_ZERO_ERROR; | |
496 | ||
497 | logln("Testing weird arguments"); | |
57a6839d A |
498 | // No string vs. empty string vs. completely-ignorable string: |
499 | // See ICU ticket #10495. | |
500 | CollationKey sortkNone; | |
b75a7d8f | 501 | int32_t length; |
57a6839d A |
502 | sortkNone.getByteArray(length); |
503 | doAssert(!sortkNone.isBogus() && length == 0, | |
504 | "Default-constructed collation key should be empty"); | |
505 | CollationKey sortkEmpty; | |
506 | col->getCollationKey(NULL, 0, sortkEmpty, key1Status); | |
507 | // key gets reset here | |
508 | const uint8_t* byteArrayEmpty = sortkEmpty.getByteArray(length); | |
509 | doAssert(sortkEmpty.isBogus() == FALSE && length == 3 && | |
510 | byteArrayEmpty[0] == 1 && byteArrayEmpty[1] == 1 && byteArrayEmpty[2] == 0, | |
511 | "Empty string should return a collation key with empty levels"); | |
512 | doAssert(sortkNone.compareTo(sortkEmpty) == Collator::LESS, | |
513 | "Expected no collation key < collation key for empty string"); | |
514 | doAssert(sortkEmpty.compareTo(sortkNone) == Collator::GREATER, | |
515 | "Expected collation key for empty string > no collation key"); | |
516 | ||
517 | CollationKey sortkIgnorable; | |
518 | // Most control codes and CGJ are completely ignorable. | |
519 | // A string with only completely ignorables must compare equal to an empty string. | |
520 | col->getCollationKey(UnicodeString((UChar)1).append((UChar)0x34f), sortkIgnorable, key1Status); | |
521 | sortkIgnorable.getByteArray(length); | |
522 | doAssert(!sortkIgnorable.isBogus() && length == 3, | |
523 | "Completely ignorable string should return a collation key with empty levels"); | |
524 | doAssert(sortkIgnorable.compareTo(sortkEmpty) == Collator::EQUAL, | |
525 | "Completely ignorable string should compare equal to empty string"); | |
526 | ||
b75a7d8f A |
527 | // bogus key returned here |
528 | key1Status = U_ILLEGAL_ARGUMENT_ERROR; | |
529 | col->getCollationKey(NULL, 0, sortk1, key1Status); | |
51004dcb | 530 | doAssert(sortk1.isBogus() && (sortk1.getByteArray(length), length) == 0, |
b75a7d8f A |
531 | "Error code should return bogus collation key"); |
532 | ||
533 | key1Status = U_ZERO_ERROR; | |
534 | logln("Use tertiary comparison level testing ...."); | |
535 | ||
536 | col->getCollationKey(test1, sortk1, key1Status); | |
57a6839d A |
537 | if (U_FAILURE(key1Status)) { |
538 | errln("getCollationKey(Abcda) failed - %s", u_errorName(key1Status)); | |
539 | return; | |
540 | } | |
b75a7d8f A |
541 | doAssert((sortk1.compareTo(col->getCollationKey(test2, sortk2, key2Status))) |
542 | == Collator::GREATER, | |
543 | "Result should be \"Abcda\" >>> \"abcda\""); | |
544 | ||
57a6839d | 545 | CollationKey sortk3(sortk2), sortkNew; |
b75a7d8f A |
546 | |
547 | sortkNew = sortk1; | |
548 | doAssert((sortk1 != sortk2), "The sort keys should be different"); | |
549 | doAssert((sortk1.hashCode() != sortk2.hashCode()), "sort key hashCode() failed"); | |
550 | doAssert((sortk2 == sortk3), "The sort keys should be the same"); | |
551 | doAssert((sortk1 == sortkNew), "The sort keys assignment failed"); | |
552 | doAssert((sortk1.hashCode() == sortkNew.hashCode()), "sort key hashCode() failed"); | |
553 | doAssert((sortkNew != sortk3), "The sort keys should be different"); | |
554 | doAssert(sortk1.compareTo(sortk3) == Collator::GREATER, "Result should be \"Abcda\" >>> \"abcda\""); | |
555 | doAssert(sortk2.compareTo(sortk3) == Collator::EQUAL, "Result should be \"abcda\" == \"abcda\""); | |
556 | doAssert(sortkEmpty.compareTo(sortk1) == Collator::LESS, "Result should be (empty key) <<< \"Abcda\""); | |
557 | doAssert(sortk1.compareTo(sortkEmpty) == Collator::GREATER, "Result should be \"Abcda\" >>> (empty key)"); | |
558 | doAssert(sortkEmpty.compareTo(sortkEmpty) == Collator::EQUAL, "Result should be (empty key) == (empty key)"); | |
559 | doAssert(sortk1.compareTo(sortk3, success) == UCOL_GREATER, "Result should be \"Abcda\" >>> \"abcda\""); | |
560 | doAssert(sortk2.compareTo(sortk3, success) == UCOL_EQUAL, "Result should be \"abcda\" == \"abcda\""); | |
561 | doAssert(sortkEmpty.compareTo(sortk1, success) == UCOL_LESS, "Result should be (empty key) <<< \"Abcda\""); | |
562 | doAssert(sortk1.compareTo(sortkEmpty, success) == UCOL_GREATER, "Result should be \"Abcda\" >>> (empty key)"); | |
563 | doAssert(sortkEmpty.compareTo(sortkEmpty, success) == UCOL_EQUAL, "Result should be (empty key) == (empty key)"); | |
564 | ||
565 | int32_t cnt1, cnt2, cnt3, cnt4; | |
566 | ||
567 | const uint8_t* byteArray1 = sortk1.getByteArray(cnt1); | |
568 | const uint8_t* byteArray2 = sortk2.getByteArray(cnt2); | |
569 | ||
b75a7d8f A |
570 | const uint8_t* byteArray3 = 0; |
571 | byteArray3 = sortk1.getByteArray(cnt3); | |
572 | ||
573 | const uint8_t* byteArray4 = 0; | |
574 | byteArray4 = sortk2.getByteArray(cnt4); | |
575 | ||
576 | CollationKey sortk4(byteArray1, cnt1), sortk5(byteArray2, cnt2); | |
577 | CollationKey sortk6(byteArray3, cnt3), sortk7(byteArray4, cnt4); | |
578 | ||
b75a7d8f A |
579 | doAssert(sortk1.compareTo(sortk4) == Collator::EQUAL, "CollationKey::toByteArray(sortk1) Failed."); |
580 | doAssert(sortk2.compareTo(sortk5) == Collator::EQUAL, "CollationKey::toByteArray(sortk2) Failed."); | |
581 | doAssert(sortk4.compareTo(sortk5) == Collator::GREATER, "sortk4 >>> sortk5 Failed"); | |
582 | doAssert(sortk1.compareTo(sortk6) == Collator::EQUAL, "CollationKey::getByteArray(sortk1) Failed."); | |
583 | doAssert(sortk2.compareTo(sortk7) == Collator::EQUAL, "CollationKey::getByteArray(sortk2) Failed."); | |
584 | doAssert(sortk6.compareTo(sortk7) == Collator::GREATER, "sortk6 >>> sortk7 Failed"); | |
585 | ||
586 | logln("Equality tests : "); | |
587 | doAssert(sortk1 == sortk4, "sortk1 == sortk4 Failed."); | |
588 | doAssert(sortk2 == sortk5, "sortk2 == sortk5 Failed."); | |
589 | doAssert(sortk1 != sortk5, "sortk1 != sortk5 Failed."); | |
590 | doAssert(sortk1 == sortk6, "sortk1 == sortk6 Failed."); | |
591 | doAssert(sortk2 == sortk7, "sortk2 == sortk7 Failed."); | |
592 | doAssert(sortk1 != sortk7, "sortk1 != sortk7 Failed."); | |
593 | ||
594 | byteArray1 = 0; | |
595 | byteArray2 = 0; | |
596 | ||
597 | sortk3 = sortk1; | |
598 | doAssert(sortk1 == sortk3, "sortk1 = sortk3 assignment Failed."); | |
599 | doAssert(sortk2 != sortk3, "sortk2 != sortk3 Failed."); | |
600 | logln("testing sortkey ends..."); | |
601 | ||
602 | col->setStrength(Collator::SECONDARY); | |
603 | doAssert(col->getCollationKey(test1, sortk1, key1Status).compareTo( | |
604 | col->getCollationKey(test2, sortk2, key2Status)) | |
605 | == Collator::EQUAL, | |
606 | "Result should be \"Abcda\" == \"abcda\""); | |
607 | delete col; | |
608 | } | |
609 | ||
610 | //---------------------------------------------------------------------------- | |
611 | // Tests the CollatorElementIterator class. | |
612 | // ctor, RuleBasedCollator::createCollationElementIterator(), operator==, operator!= | |
613 | // | |
614 | void | |
615 | CollationAPITest::TestElemIter(/* char* par */) | |
616 | { | |
617 | logln("testing sortkey begins..."); | |
618 | Collator *col = 0; | |
619 | UErrorCode success = U_ZERO_ERROR; | |
620 | col = Collator::createInstance(Locale::getEnglish(), success); | |
621 | if (U_FAILURE(success)) | |
622 | { | |
729e4ab9 | 623 | errcheckln(success, "Default collation creation failed. - %s", u_errorName(success)); |
b75a7d8f A |
624 | return; |
625 | } | |
626 | ||
627 | UnicodeString testString1("XFILE What subset of all possible test cases has the highest probability of detecting the most errors?"); | |
628 | UnicodeString testString2("Xf_ile What subset of all possible test cases has the lowest probability of detecting the least errors?"); | |
629 | logln("Constructors and comparison testing...."); | |
630 | CollationElementIterator *iterator1 = ((RuleBasedCollator*)col)->createCollationElementIterator(testString1); | |
631 | ||
632 | CharacterIterator *chariter=new StringCharacterIterator(testString1); | |
633 | CollationElementIterator *coliter=((RuleBasedCollator*)col)->createCollationElementIterator(*chariter); | |
634 | ||
635 | // copy ctor | |
636 | CollationElementIterator *iterator2 = ((RuleBasedCollator*)col)->createCollationElementIterator(testString1); | |
637 | CollationElementIterator *iterator3 = ((RuleBasedCollator*)col)->createCollationElementIterator(testString2); | |
638 | ||
639 | int32_t offset = iterator1->getOffset(); | |
640 | if (offset != 0) { | |
641 | errln("Error in getOffset for collation element iterator\n"); | |
642 | return; | |
643 | } | |
644 | iterator1->setOffset(6, success); | |
645 | if (U_FAILURE(success)) { | |
646 | errln("Error in setOffset for collation element iterator\n"); | |
647 | return; | |
648 | } | |
649 | iterator1->setOffset(0, success); | |
650 | int32_t order1, order2, order3; | |
651 | doAssert((*iterator1 == *iterator2), "The two iterators should be the same"); | |
652 | doAssert((*iterator1 != *iterator3), "The two iterators should be different"); | |
653 | ||
654 | doAssert((*coliter == *iterator1), "The two iterators should be the same"); | |
655 | doAssert((*coliter == *iterator2), "The two iterators should be the same"); | |
656 | doAssert((*coliter != *iterator3), "The two iterators should be different"); | |
657 | ||
658 | order1 = iterator1->next(success); | |
659 | if (U_FAILURE(success)) | |
660 | { | |
661 | errln("Somehow ran out of memory stepping through the iterator."); | |
662 | return; | |
663 | } | |
664 | ||
665 | doAssert((*iterator1 != *iterator2), "The first iterator advance failed"); | |
666 | order2 = iterator2->getOffset(); | |
667 | doAssert((order1 != order2), "The order result should not be the same"); | |
668 | order2 = iterator2->next(success); | |
669 | if (U_FAILURE(success)) | |
670 | { | |
671 | errln("Somehow ran out of memory stepping through the iterator."); | |
672 | return; | |
673 | } | |
674 | ||
675 | doAssert((*iterator1 == *iterator2), "The second iterator advance failed"); | |
676 | doAssert((order1 == order2), "The order result should be the same"); | |
677 | order3 = iterator3->next(success); | |
678 | if (U_FAILURE(success)) | |
679 | { | |
680 | errln("Somehow ran out of memory stepping through the iterator."); | |
681 | return; | |
682 | } | |
683 | ||
684 | doAssert((CollationElementIterator::primaryOrder(order1) == | |
685 | CollationElementIterator::primaryOrder(order3)), "The primary orders should be the same"); | |
686 | doAssert((CollationElementIterator::secondaryOrder(order1) == | |
687 | CollationElementIterator::secondaryOrder(order3)), "The secondary orders should be the same"); | |
688 | doAssert((CollationElementIterator::tertiaryOrder(order1) == | |
689 | CollationElementIterator::tertiaryOrder(order3)), "The tertiary orders should be the same"); | |
690 | ||
691 | order1 = iterator1->next(success); order3 = iterator3->next(success); | |
692 | if (U_FAILURE(success)) | |
693 | { | |
694 | errln("Somehow ran out of memory stepping through the iterator."); | |
695 | return; | |
696 | } | |
697 | ||
698 | doAssert((CollationElementIterator::primaryOrder(order1) == | |
699 | CollationElementIterator::primaryOrder(order3)), "The primary orders should be identical"); | |
700 | doAssert((CollationElementIterator::tertiaryOrder(order1) != | |
701 | CollationElementIterator::tertiaryOrder(order3)), "The tertiary orders should be different"); | |
702 | ||
703 | order1 = iterator1->next(success); | |
704 | order3 = iterator3->next(success); | |
705 | /* NO! Secondary orders of two CEs are not related, especially in the case of '_' vs 'I' */ | |
706 | /* | |
707 | doAssert((CollationElementIterator::secondaryOrder(order1) != | |
708 | CollationElementIterator::secondaryOrder(order3)), "The secondary orders should not be the same"); | |
709 | */ | |
710 | doAssert((order1 != CollationElementIterator::NULLORDER), "Unexpected end of iterator reached"); | |
711 | ||
712 | iterator1->reset(); iterator2->reset(); iterator3->reset(); | |
713 | order1 = iterator1->next(success); | |
714 | if (U_FAILURE(success)) | |
715 | { | |
716 | errln("Somehow ran out of memory stepping through the iterator."); | |
717 | return; | |
718 | } | |
719 | ||
720 | doAssert((*iterator1 != *iterator2), "The first iterator advance failed"); | |
721 | ||
722 | order2 = iterator2->next(success); | |
723 | if (U_FAILURE(success)) | |
724 | { | |
725 | errln("Somehow ran out of memory stepping through the iterator."); | |
726 | return; | |
727 | } | |
728 | ||
729 | doAssert((*iterator1 == *iterator2), "The second iterator advance failed"); | |
730 | doAssert((order1 == order2), "The order result should be the same"); | |
731 | ||
732 | order3 = iterator3->next(success); | |
733 | if (U_FAILURE(success)) | |
734 | { | |
735 | errln("Somehow ran out of memory stepping through the iterator."); | |
736 | return; | |
737 | } | |
738 | ||
739 | doAssert((CollationElementIterator::primaryOrder(order1) == | |
740 | CollationElementIterator::primaryOrder(order3)), "The primary orders should be the same"); | |
741 | doAssert((CollationElementIterator::secondaryOrder(order1) == | |
742 | CollationElementIterator::secondaryOrder(order3)), "The secondary orders should be the same"); | |
743 | doAssert((CollationElementIterator::tertiaryOrder(order1) == | |
744 | CollationElementIterator::tertiaryOrder(order3)), "The tertiary orders should be the same"); | |
745 | ||
746 | order1 = iterator1->next(success); order2 = iterator2->next(success); order3 = iterator3->next(success); | |
747 | if (U_FAILURE(success)) | |
748 | { | |
749 | errln("Somehow ran out of memory stepping through the iterator."); | |
750 | return; | |
751 | } | |
752 | ||
753 | doAssert((CollationElementIterator::primaryOrder(order1) == | |
754 | CollationElementIterator::primaryOrder(order3)), "The primary orders should be identical"); | |
755 | doAssert((CollationElementIterator::tertiaryOrder(order1) != | |
756 | CollationElementIterator::tertiaryOrder(order3)), "The tertiary orders should be different"); | |
757 | ||
758 | order1 = iterator1->next(success); order3 = iterator3->next(success); | |
759 | if (U_FAILURE(success)) | |
760 | { | |
761 | errln("Somehow ran out of memory stepping through the iterator."); | |
762 | return; | |
763 | } | |
764 | ||
765 | /* NO! Secondary orders of two CEs are not related, especially in the case of '_' vs 'I' */ | |
766 | /* | |
767 | doAssert((CollationElementIterator::secondaryOrder(order1) != | |
768 | CollationElementIterator::secondaryOrder(order3)), "The secondary orders should not be the same"); | |
769 | */ | |
770 | doAssert((order1 != CollationElementIterator::NULLORDER), "Unexpected end of iterator reached"); | |
771 | doAssert((*iterator2 != *iterator3), "The iterators should be different"); | |
772 | ||
773 | ||
774 | //test error values | |
775 | success=U_UNSUPPORTED_ERROR; | |
776 | Collator *colerror=NULL; | |
777 | colerror=Collator::createInstance(Locale::getEnglish(), success); | |
778 | if (colerror != 0 || success == U_ZERO_ERROR){ | |
779 | errln("Error: createInstance(UErrorCode != U_ZERO_ERROR) should just return and not create an instance\n"); | |
780 | } | |
781 | int32_t position=coliter->previous(success); | |
782 | if(position != CollationElementIterator::NULLORDER){ | |
783 | errln((UnicodeString)"Expected NULLORDER got" + position); | |
784 | } | |
785 | coliter->reset(); | |
786 | coliter->setText(*chariter, success); | |
787 | if(!U_FAILURE(success)){ | |
788 | errln("Expeceted error"); | |
789 | } | |
790 | iterator1->setText((UnicodeString)"hello there", success); | |
791 | if(!U_FAILURE(success)){ | |
792 | errln("Expeceted error"); | |
793 | } | |
794 | ||
795 | delete chariter; | |
796 | delete coliter; | |
797 | delete iterator1; | |
798 | delete iterator2; | |
799 | delete iterator3; | |
800 | delete col; | |
801 | ||
802 | ||
803 | ||
804 | logln("testing CollationElementIterator ends..."); | |
805 | } | |
806 | ||
807 | // Test RuleBasedCollator ctor, dtor, operator==, operator!=, clone, copy, and getRules | |
808 | void | |
809 | CollationAPITest::TestOperators(/* char* par */) | |
810 | { | |
811 | UErrorCode success = U_ZERO_ERROR; | |
57a6839d A |
812 | UnicodeString ruleset1("&9 < a, A < b, B < c, C; ch, cH, Ch, CH < d, D, e, E"); |
813 | UnicodeString ruleset2("&9 < a, A < b, B < c, C < d, D, e, E"); | |
b75a7d8f A |
814 | RuleBasedCollator *col1 = new RuleBasedCollator(ruleset1, success); |
815 | if (U_FAILURE(success)) { | |
729e4ab9 | 816 | errcheckln(success, "RuleBasedCollator creation failed. - %s", u_errorName(success)); |
b75a7d8f A |
817 | return; |
818 | } | |
819 | success = U_ZERO_ERROR; | |
820 | RuleBasedCollator *col2 = new RuleBasedCollator(ruleset2, success); | |
821 | if (U_FAILURE(success)) { | |
822 | errln("The RuleBasedCollator constructor failed when building with the 2nd rule set."); | |
823 | return; | |
824 | } | |
825 | logln("The operator tests begin : "); | |
826 | logln("testing operator==, operator!=, clone methods ..."); | |
827 | doAssert((*col1 != *col2), "The two different table collations compared equal"); | |
828 | *col1 = *col2; | |
829 | doAssert((*col1 == *col2), "Collator objects not equal after assignment (operator=)"); | |
830 | ||
831 | success = U_ZERO_ERROR; | |
832 | Collator *col3 = Collator::createInstance(Locale::getEnglish(), success); | |
833 | if (U_FAILURE(success)) { | |
834 | errln("Default collation creation failed."); | |
835 | return; | |
836 | } | |
837 | doAssert((*col1 != *col3), "The two different table collations compared equal"); | |
838 | Collator* col4 = col1->clone(); | |
839 | Collator* col5 = col3->clone(); | |
840 | doAssert((*col1 == *col4), "Cloned collation objects not equal"); | |
841 | doAssert((*col3 != *col4), "Two different table collations compared equal"); | |
842 | doAssert((*col3 == *col5), "Cloned collation objects not equal"); | |
843 | doAssert((*col4 != *col5), "Two cloned collations compared equal"); | |
844 | ||
845 | const UnicodeString& defRules = ((RuleBasedCollator*)col3)->getRules(); | |
846 | RuleBasedCollator* col6 = new RuleBasedCollator(defRules, success); | |
847 | if (U_FAILURE(success)) { | |
848 | errln("Creating default collation with rules failed."); | |
849 | return; | |
850 | } | |
851 | doAssert((((RuleBasedCollator*)col3)->getRules() == col6->getRules()), "Default collator getRules failed"); | |
852 | ||
853 | success = U_ZERO_ERROR; | |
854 | RuleBasedCollator *col7 = new RuleBasedCollator(ruleset2, Collator::TERTIARY, success); | |
855 | if (U_FAILURE(success)) { | |
856 | errln("The RuleBasedCollator constructor failed when building with the 2nd rule set with tertiary strength."); | |
857 | return; | |
858 | } | |
859 | success = U_ZERO_ERROR; | |
860 | RuleBasedCollator *col8 = new RuleBasedCollator(ruleset2, UCOL_OFF, success); | |
861 | if (U_FAILURE(success)) { | |
862 | errln("The RuleBasedCollator constructor failed when building with the 2nd rule set with Normalizer::NO_OP."); | |
863 | return; | |
864 | } | |
865 | success = U_ZERO_ERROR; | |
866 | RuleBasedCollator *col9 = new RuleBasedCollator(ruleset2, Collator::PRIMARY, UCOL_ON, success); | |
867 | if (U_FAILURE(success)) { | |
868 | errln("The RuleBasedCollator constructor failed when building with the 2nd rule set with tertiary strength and Normalizer::NO_OP."); | |
869 | return; | |
870 | } | |
871 | // doAssert((*col7 == *col8), "The two equal table collations compared different"); | |
872 | doAssert((*col7 != *col9), "The two different table collations compared equal"); | |
873 | doAssert((*col8 != *col9), "The two different table collations compared equal"); | |
874 | ||
875 | logln("operator tests ended."); | |
876 | delete col1; | |
877 | delete col2; | |
878 | delete col3; | |
879 | delete col4; | |
880 | delete col5; | |
881 | delete col6; | |
882 | delete col7; | |
883 | delete col8; | |
884 | delete col9; | |
885 | } | |
886 | ||
887 | // test clone and copy | |
888 | void | |
889 | CollationAPITest::TestDuplicate(/* char* par */) | |
890 | { | |
891 | UErrorCode status = U_ZERO_ERROR; | |
892 | Collator *col1 = Collator::createInstance(Locale::getEnglish(), status); | |
893 | if (U_FAILURE(status)) { | |
894 | logln("Default collator creation failed."); | |
895 | return; | |
896 | } | |
897 | Collator *col2 = col1->clone(); | |
898 | doAssert((*col1 == *col2), "Cloned object is not equal to the orginal"); | |
57a6839d A |
899 | UnicodeString ruleset("&9 < a, A < b, B < c, C < d, D, e, E"); |
900 | RuleBasedCollator *col3 = new RuleBasedCollator(ruleset, status); | |
73c04bcf A |
901 | if (U_FAILURE(status)) { |
902 | logln("Collation tailoring failed."); | |
903 | return; | |
904 | } | |
57a6839d A |
905 | doAssert((*col1 != *col3), "Cloned object is equal to some dummy"); |
906 | *col3 = *((RuleBasedCollator*)col1); | |
907 | doAssert((*col1 == *col3), "Copied object is not equal to the orginal"); | |
73c04bcf A |
908 | |
909 | UCollationResult res; | |
910 | UnicodeString first((UChar)0x0061); | |
911 | UnicodeString second((UChar)0x0062); | |
912 | UnicodeString copiedEnglishRules(((RuleBasedCollator*)col1)->getRules()); | |
913 | ||
b75a7d8f | 914 | delete col1; |
73c04bcf A |
915 | |
916 | // Try using the cloned collators after deleting the original data | |
917 | res = col2->compare(first, second, status); | |
918 | if(res != UCOL_LESS) { | |
919 | errln("a should be less then b after tailoring"); | |
920 | } | |
921 | if (((RuleBasedCollator*)col2)->getRules() != copiedEnglishRules) { | |
922 | errln(UnicodeString("English rule difference. ") | |
923 | + copiedEnglishRules + UnicodeString("\ngetRules=") + ((RuleBasedCollator*)col2)->getRules()); | |
924 | } | |
925 | res = col3->compare(first, second, status); | |
926 | if(res != UCOL_LESS) { | |
927 | errln("a should be less then b after tailoring"); | |
928 | } | |
929 | if (col3->getRules() != copiedEnglishRules) { | |
930 | errln(UnicodeString("English rule difference. ") | |
931 | + copiedEnglishRules + UnicodeString("\ngetRules=") + col3->getRules()); | |
932 | } | |
933 | ||
b75a7d8f A |
934 | delete col2; |
935 | delete col3; | |
936 | } | |
937 | ||
938 | void | |
939 | CollationAPITest::TestCompare(/* char* par */) | |
940 | { | |
941 | logln("The compare tests begin : "); | |
942 | Collator *col = 0; | |
943 | UErrorCode success = U_ZERO_ERROR; | |
944 | col = Collator::createInstance(Locale::getEnglish(), success); | |
945 | if (U_FAILURE(success)) { | |
729e4ab9 | 946 | errcheckln(success, "Default collation creation failed. - %s", u_errorName(success)); |
b75a7d8f A |
947 | return; |
948 | } | |
949 | UnicodeString test1("Abcda"), test2("abcda"); | |
950 | logln("Use tertiary comparison level testing ...."); | |
951 | ||
952 | doAssert((!col->equals(test1, test2) ), "Result should be \"Abcda\" != \"abcda\""); | |
953 | doAssert((col->greater(test1, test2) ), "Result should be \"Abcda\" >>> \"abcda\""); | |
954 | doAssert((col->greaterOrEqual(test1, test2) ), "Result should be \"Abcda\" >>> \"abcda\""); | |
955 | ||
956 | col->setStrength(Collator::SECONDARY); | |
957 | logln("Use secondary comparison level testing ...."); | |
958 | ||
959 | doAssert((col->equals(test1, test2) ), "Result should be \"Abcda\" == \"abcda\""); | |
960 | doAssert((!col->greater(test1, test2) ), "Result should be \"Abcda\" == \"abcda\""); | |
961 | doAssert((col->greaterOrEqual(test1, test2) ), "Result should be \"Abcda\" == \"abcda\""); | |
962 | ||
963 | col->setStrength(Collator::PRIMARY); | |
964 | logln("Use primary comparison level testing ...."); | |
965 | ||
966 | doAssert((col->equals(test1, test2) ), "Result should be \"Abcda\" == \"abcda\""); | |
967 | doAssert((!col->greater(test1, test2) ), "Result should be \"Abcda\" == \"abcda\""); | |
968 | doAssert((col->greaterOrEqual(test1, test2) ), "Result should be \"Abcda\" == \"abcda\""); | |
969 | ||
970 | // Test different APIs | |
971 | const UChar* t1 = test1.getBuffer(); | |
972 | int32_t t1Len = test1.length(); | |
973 | const UChar* t2 = test2.getBuffer(); | |
974 | int32_t t2Len = test2.length(); | |
975 | ||
976 | doAssert((col->compare(test1, test2) == Collator::EQUAL), "Problem"); | |
977 | doAssert((col->compare(test1, test2, success) == UCOL_EQUAL), "Problem"); | |
978 | doAssert((col->compare(t1, t1Len, t2, t2Len) == Collator::EQUAL), "Problem"); | |
979 | doAssert((col->compare(t1, t1Len, t2, t2Len, success) == UCOL_EQUAL), "Problem"); | |
980 | doAssert((col->compare(test1, test2, t1Len) == Collator::EQUAL), "Problem"); | |
981 | doAssert((col->compare(test1, test2, t1Len, success) == UCOL_EQUAL), "Problem"); | |
982 | ||
983 | col->setAttribute(UCOL_STRENGTH, UCOL_TERTIARY, success); | |
984 | doAssert((col->compare(test1, test2) == Collator::GREATER), "Problem"); | |
985 | doAssert((col->compare(test1, test2, success) == UCOL_GREATER), "Problem"); | |
986 | doAssert((col->compare(t1, t1Len, t2, t2Len) == Collator::GREATER), "Problem"); | |
987 | doAssert((col->compare(t1, t1Len, t2, t2Len, success) == UCOL_GREATER), "Problem"); | |
988 | doAssert((col->compare(test1, test2, t1Len) == Collator::GREATER), "Problem"); | |
989 | doAssert((col->compare(test1, test2, t1Len, success) == UCOL_GREATER), "Problem"); | |
990 | ||
991 | ||
992 | ||
993 | logln("The compare tests end."); | |
994 | delete col; | |
995 | } | |
996 | ||
997 | void | |
998 | CollationAPITest::TestGetAll(/* char* par */) | |
999 | { | |
46f4442e A |
1000 | int32_t count1, count2; |
1001 | UErrorCode status = U_ZERO_ERROR; | |
1002 | ||
1003 | logln("Trying Collator::getAvailableLocales(int&)"); | |
1004 | ||
1005 | const Locale* list = Collator::getAvailableLocales(count1); | |
1006 | for (int32_t i = 0; i < count1; ++i) { | |
1007 | UnicodeString dispName; | |
1008 | logln(UnicodeString("Locale name: ") | |
1009 | + UnicodeString(list[i].getName()) | |
1010 | + UnicodeString(" , the display name is : ") | |
1011 | + UnicodeString(list[i].getDisplayName(dispName))); | |
1012 | } | |
1013 | ||
1014 | if (count1 == 0 || list == NULL) { | |
729e4ab9 | 1015 | dataerrln("getAvailableLocales(int&) returned an empty list"); |
46f4442e A |
1016 | } |
1017 | ||
1018 | logln("Trying Collator::getAvailableLocales()"); | |
1019 | StringEnumeration* localeEnum = Collator::getAvailableLocales(); | |
1020 | const UnicodeString* locStr; | |
1021 | const char *locCStr; | |
1022 | count2 = 0; | |
1023 | ||
1024 | if (localeEnum == NULL) { | |
729e4ab9 | 1025 | dataerrln("getAvailableLocales() returned NULL"); |
46f4442e A |
1026 | return; |
1027 | } | |
1028 | ||
1029 | while ((locStr = localeEnum->snext(status)) != NULL) | |
1030 | { | |
1031 | logln(UnicodeString("Locale name is: ") + *locStr); | |
1032 | count2++; | |
1033 | } | |
1034 | if (count1 != count2) { | |
1035 | errln("getAvailableLocales(int&) returned %d and getAvailableLocales() returned %d", count1, count2); | |
1036 | } | |
1037 | ||
1038 | logln("Trying Collator::getAvailableLocales() clone"); | |
1039 | count1 = 0; | |
1040 | StringEnumeration* localeEnum2 = localeEnum->clone(); | |
1041 | localeEnum2->reset(status); | |
1042 | while ((locCStr = localeEnum2->next(NULL, status)) != NULL) | |
1043 | { | |
1044 | logln(UnicodeString("Locale name is: ") + UnicodeString(locCStr)); | |
1045 | count1++; | |
1046 | } | |
1047 | if (count1 != count2) { | |
1048 | errln("getAvailableLocales(3rd time) returned %d and getAvailableLocales(2nd time) returned %d", count1, count2); | |
1049 | } | |
1050 | if (localeEnum->count(status) != count1) { | |
1051 | errln("localeEnum->count() returned %d and getAvailableLocales() returned %d", localeEnum->count(status), count1); | |
b75a7d8f | 1052 | } |
46f4442e A |
1053 | delete localeEnum; |
1054 | delete localeEnum2; | |
b75a7d8f A |
1055 | } |
1056 | ||
1057 | void CollationAPITest::TestSortKey() | |
1058 | { | |
1059 | UErrorCode status = U_ZERO_ERROR; | |
1060 | /* | |
1061 | this is supposed to open default date format, but later on it treats | |
1062 | it like it is "en_US" | |
1063 | - very bad if you try to run the tests on machine where default | |
1064 | locale is NOT "en_US" | |
1065 | */ | |
1066 | Collator *col = Collator::createInstance(Locale::getEnglish(), status); | |
1067 | if (U_FAILURE(status)) { | |
729e4ab9 | 1068 | errcheckln(status, "ERROR: Default collation creation failed.: %s\n", u_errorName(status)); |
b75a7d8f A |
1069 | return; |
1070 | } | |
1071 | ||
1072 | if (col->getStrength() != Collator::TERTIARY) | |
1073 | { | |
1074 | errln("ERROR: default collation did not have UCOL_DEFAULT_STRENGTH !\n"); | |
1075 | } | |
1076 | ||
1077 | /* Need to use identical strength */ | |
1078 | col->setAttribute(UCOL_STRENGTH, UCOL_IDENTICAL, status); | |
1079 | ||
b75a7d8f A |
1080 | UChar test1[6] = {0x41, 0x62, 0x63, 0x64, 0x61, 0}, |
1081 | test2[6] = {0x61, 0x62, 0x63, 0x64, 0x61, 0}, | |
1082 | test3[6] = {0x61, 0x62, 0x63, 0x64, 0x61, 0}; | |
1083 | ||
1084 | uint8_t sortkey1[64]; | |
1085 | uint8_t sortkey2[64]; | |
1086 | uint8_t sortkey3[64]; | |
1087 | ||
1088 | logln("Use tertiary comparison level testing ....\n"); | |
1089 | ||
1090 | CollationKey key1; | |
1091 | col->getCollationKey(test1, u_strlen(test1), key1, status); | |
1092 | ||
1093 | CollationKey key2; | |
1094 | col->getCollationKey(test2, u_strlen(test2), key2, status); | |
1095 | ||
1096 | CollationKey key3; | |
1097 | col->getCollationKey(test3, u_strlen(test3), key3, status); | |
1098 | ||
1099 | doAssert(key1.compareTo(key2) == Collator::GREATER, | |
1100 | "Result should be \"Abcda\" > \"abcda\""); | |
1101 | doAssert(key2.compareTo(key1) == Collator::LESS, | |
1102 | "Result should be \"abcda\" < \"Abcda\""); | |
1103 | doAssert(key2.compareTo(key3) == Collator::EQUAL, | |
1104 | "Result should be \"abcda\" == \"abcda\""); | |
1105 | ||
729e4ab9 | 1106 | // Clone the key2 sortkey for later. |
b75a7d8f | 1107 | int32_t keylength = 0; |
729e4ab9 A |
1108 | const uint8_t *key2primary_alias = key2.getByteArray(keylength); |
1109 | LocalArray<uint8_t> key2primary(new uint8_t[keylength]); | |
1110 | memcpy(key2primary.getAlias(), key2primary_alias, keylength); | |
b75a7d8f A |
1111 | |
1112 | col->getSortKey(test1, sortkey1, 64); | |
1113 | col->getSortKey(test2, sortkey2, 64); | |
1114 | col->getSortKey(test3, sortkey3, 64); | |
1115 | ||
1116 | const uint8_t *tempkey = key1.getByteArray(keylength); | |
1117 | doAssert(memcmp(tempkey, sortkey1, keylength) == 0, | |
1118 | "Test1 string should have the same collation key and sort key"); | |
1119 | tempkey = key2.getByteArray(keylength); | |
1120 | doAssert(memcmp(tempkey, sortkey2, keylength) == 0, | |
1121 | "Test2 string should have the same collation key and sort key"); | |
1122 | tempkey = key3.getByteArray(keylength); | |
1123 | doAssert(memcmp(tempkey, sortkey3, keylength) == 0, | |
1124 | "Test3 string should have the same collation key and sort key"); | |
1125 | ||
1126 | col->getSortKey(test1, 5, sortkey1, 64); | |
1127 | col->getSortKey(test2, 5, sortkey2, 64); | |
1128 | col->getSortKey(test3, 5, sortkey3, 64); | |
1129 | ||
1130 | tempkey = key1.getByteArray(keylength); | |
1131 | doAssert(memcmp(tempkey, sortkey1, keylength) == 0, | |
1132 | "Test1 string should have the same collation key and sort key"); | |
1133 | tempkey = key2.getByteArray(keylength); | |
1134 | doAssert(memcmp(tempkey, sortkey2, keylength) == 0, | |
1135 | "Test2 string should have the same collation key and sort key"); | |
1136 | tempkey = key3.getByteArray(keylength); | |
1137 | doAssert(memcmp(tempkey, sortkey3, keylength) == 0, | |
1138 | "Test3 string should have the same collation key and sort key"); | |
1139 | ||
1140 | UnicodeString strtest1(test1); | |
1141 | col->getSortKey(strtest1, sortkey1, 64); | |
1142 | UnicodeString strtest2(test2); | |
1143 | col->getSortKey(strtest2, sortkey2, 64); | |
1144 | UnicodeString strtest3(test3); | |
1145 | col->getSortKey(strtest3, sortkey3, 64); | |
1146 | ||
1147 | tempkey = key1.getByteArray(keylength); | |
1148 | doAssert(memcmp(tempkey, sortkey1, keylength) == 0, | |
1149 | "Test1 string should have the same collation key and sort key"); | |
1150 | tempkey = key2.getByteArray(keylength); | |
1151 | doAssert(memcmp(tempkey, sortkey2, keylength) == 0, | |
1152 | "Test2 string should have the same collation key and sort key"); | |
1153 | tempkey = key3.getByteArray(keylength); | |
1154 | doAssert(memcmp(tempkey, sortkey3, keylength) == 0, | |
1155 | "Test3 string should have the same collation key and sort key"); | |
1156 | ||
1157 | logln("Use secondary comparision level testing ...\n"); | |
1158 | col->setStrength(Collator::SECONDARY); | |
1159 | ||
1160 | col->getCollationKey(test1, u_strlen(test1), key1, status); | |
1161 | col->getCollationKey(test2, u_strlen(test2), key2, status); | |
1162 | col->getCollationKey(test3, u_strlen(test3), key3, status); | |
1163 | ||
1164 | doAssert(key1.compareTo(key2) == Collator::EQUAL, | |
1165 | "Result should be \"Abcda\" == \"abcda\""); | |
1166 | doAssert(key2.compareTo(key3) == Collator::EQUAL, | |
1167 | "Result should be \"abcda\" == \"abcda\""); | |
1168 | ||
1169 | tempkey = key2.getByteArray(keylength); | |
729e4ab9 A |
1170 | doAssert(memcmp(tempkey, key2primary.getAlias(), keylength - 1) == 0, |
1171 | "Binary format for 'abcda' sortkey different for secondary strength!"); | |
b75a7d8f A |
1172 | |
1173 | col->getSortKey(test1, sortkey1, 64); | |
1174 | col->getSortKey(test2, sortkey2, 64); | |
1175 | col->getSortKey(test3, sortkey3, 64); | |
1176 | ||
1177 | tempkey = key1.getByteArray(keylength); | |
1178 | doAssert(memcmp(tempkey, sortkey1, keylength) == 0, | |
1179 | "Test1 string should have the same collation key and sort key"); | |
1180 | tempkey = key2.getByteArray(keylength); | |
1181 | doAssert(memcmp(tempkey, sortkey2, keylength) == 0, | |
1182 | "Test2 string should have the same collation key and sort key"); | |
1183 | tempkey = key3.getByteArray(keylength); | |
1184 | doAssert(memcmp(tempkey, sortkey3, keylength) == 0, | |
1185 | "Test3 string should have the same collation key and sort key"); | |
1186 | ||
1187 | col->getSortKey(test1, 5, sortkey1, 64); | |
1188 | col->getSortKey(test2, 5, sortkey2, 64); | |
1189 | col->getSortKey(test3, 5, sortkey3, 64); | |
1190 | ||
1191 | tempkey = key1.getByteArray(keylength); | |
1192 | doAssert(memcmp(tempkey, sortkey1, keylength) == 0, | |
1193 | "Test1 string should have the same collation key and sort key"); | |
1194 | tempkey = key2.getByteArray(keylength); | |
1195 | doAssert(memcmp(tempkey, sortkey2, keylength) == 0, | |
1196 | "Test2 string should have the same collation key and sort key"); | |
1197 | tempkey = key3.getByteArray(keylength); | |
1198 | doAssert(memcmp(tempkey, sortkey3, keylength) == 0, | |
1199 | "Test3 string should have the same collation key and sort key"); | |
1200 | ||
1201 | col->getSortKey(strtest1, sortkey1, 64); | |
1202 | col->getSortKey(strtest2, sortkey2, 64); | |
1203 | col->getSortKey(strtest3, sortkey3, 64); | |
1204 | ||
1205 | tempkey = key1.getByteArray(keylength); | |
1206 | doAssert(memcmp(tempkey, sortkey1, keylength) == 0, | |
1207 | "Test1 string should have the same collation key and sort key"); | |
1208 | tempkey = key2.getByteArray(keylength); | |
1209 | doAssert(memcmp(tempkey, sortkey2, keylength) == 0, | |
1210 | "Test2 string should have the same collation key and sort key"); | |
1211 | tempkey = key3.getByteArray(keylength); | |
1212 | doAssert(memcmp(tempkey, sortkey3, keylength) == 0, | |
1213 | "Test3 string should have the same collation key and sort key"); | |
1214 | ||
1215 | logln("testing sortkey ends..."); | |
1216 | delete col; | |
1217 | } | |
1218 | ||
4388f060 A |
1219 | void CollationAPITest::TestSortKeyOverflow() { |
1220 | IcuTestErrorCode errorCode(*this, "TestSortKeyOverflow()"); | |
1221 | LocalPointer<Collator> col(Collator::createInstance(Locale::getEnglish(), errorCode)); | |
1222 | if (errorCode.logDataIfFailureAndReset("Collator::createInstance(English) failed")) { | |
1223 | return; | |
1224 | } | |
1225 | col->setAttribute(UCOL_STRENGTH, UCOL_PRIMARY, errorCode); | |
1226 | UChar i_and_phi[] = { 0x438, 0x3c6 }; // Cyrillic small i & Greek small phi. | |
1227 | // The sort key should be 6 bytes: | |
1228 | // 2 bytes for the Cyrillic i, 1 byte for the primary-compression terminator, | |
1229 | // 2 bytes for the Greek phi, and 1 byte for the NUL terminator. | |
1230 | uint8_t sortKey[12]; | |
b331163b | 1231 | int32_t length = col->getSortKey(i_and_phi, 2, sortKey, UPRV_LENGTHOF(sortKey)); |
4388f060 A |
1232 | uint8_t sortKey2[12]; |
1233 | for (int32_t capacity = 0; capacity < length; ++capacity) { | |
b331163b | 1234 | uprv_memset(sortKey2, 2, UPRV_LENGTHOF(sortKey2)); |
4388f060 A |
1235 | int32_t length2 = col->getSortKey(i_and_phi, 2, sortKey2, capacity); |
1236 | if (length2 != length || 0 != uprv_memcmp(sortKey, sortKey2, capacity)) { | |
1237 | errln("getSortKey(i_and_phi, capacity=%d) failed to write proper prefix", capacity); | |
1238 | } else if (sortKey2[capacity] != 2 || sortKey2[capacity + 1] != 2) { | |
1239 | errln("getSortKey(i_and_phi, capacity=%d) wrote beyond capacity", capacity); | |
1240 | } | |
1241 | } | |
1242 | ||
1243 | // Now try to break getCollationKey(). | |
1244 | // Internally, it always starts with a large stack buffer. | |
1245 | // Since we cannot control the initial capacity, we throw an increasing number | |
1246 | // of characters at it, with the problematic part at the end. | |
1247 | const int32_t longCapacity = 2000; | |
1248 | // Each 'a' in the prefix should result in one primary sort key byte. | |
1249 | // For i_and_phi we expect 6 bytes, then the NUL terminator. | |
1250 | const int32_t maxPrefixLength = longCapacity - 6 - 1; | |
1251 | LocalArray<uint8_t> longSortKey(new uint8_t[longCapacity]); | |
1252 | UnicodeString s(FALSE, i_and_phi, 2); | |
1253 | for (int32_t prefixLength = 0; prefixLength < maxPrefixLength; ++prefixLength) { | |
1254 | length = col->getSortKey(s, longSortKey.getAlias(), longCapacity); | |
1255 | CollationKey collKey; | |
1256 | col->getCollationKey(s, collKey, errorCode); | |
1257 | int32_t collKeyLength; | |
1258 | const uint8_t *collSortKey = collKey.getByteArray(collKeyLength); | |
1259 | if (collKeyLength != length || 0 != uprv_memcmp(longSortKey.getAlias(), collSortKey, length)) { | |
1260 | errln("getCollationKey(prefix[%d]+i_and_phi) failed to write proper sort key", prefixLength); | |
1261 | } | |
1262 | ||
1263 | // Insert an 'a' to match ++prefixLength. | |
1264 | s.insert(prefixLength, (UChar)0x61); | |
1265 | } | |
1266 | } | |
1267 | ||
b75a7d8f A |
1268 | void CollationAPITest::TestMaxExpansion() |
1269 | { | |
1270 | UErrorCode status = U_ZERO_ERROR; | |
1271 | UChar ch = 0; | |
374ca955 | 1272 | UChar32 unassigned = 0xEFFFD; |
b75a7d8f A |
1273 | uint32_t sorder = 0; |
1274 | uint32_t temporder = 0; | |
1275 | ||
1276 | UnicodeString rule("&a < ab < c/aba < d < z < ch"); | |
1277 | RuleBasedCollator coll(rule, status); | |
1278 | if(U_FAILURE(status)) { | |
729e4ab9 | 1279 | errcheckln(status, "Collator creation failed with error %s", u_errorName(status)); |
b75a7d8f A |
1280 | return; |
1281 | } | |
1282 | UnicodeString str(ch); | |
1283 | CollationElementIterator *iter = | |
1284 | coll.createCollationElementIterator(str); | |
1285 | ||
1286 | while (ch < 0xFFFF && U_SUCCESS(status)) { | |
1287 | int count = 1; | |
1288 | uint32_t order; | |
1289 | int32_t size = 0; | |
1290 | ||
1291 | ch ++; | |
1292 | ||
1293 | str.setCharAt(0, ch); | |
1294 | iter->setText(str, status); | |
1295 | order = iter->previous(status); | |
1296 | ||
1297 | /* thai management */ | |
1298 | if (order == 0) | |
1299 | order = iter->previous(status); | |
1300 | ||
57a6839d | 1301 | while (U_SUCCESS(status) && iter->previous(status) != CollationElementIterator::NULLORDER) { |
b75a7d8f A |
1302 | count ++; |
1303 | } | |
1304 | ||
1305 | size = coll.getMaxExpansion(order); | |
1306 | if (U_FAILURE(status) || size < count) { | |
729e4ab9 A |
1307 | errln("Failure at codepoint U+%04X, maximum expansion count %d < %d", |
1308 | ch, size, count); | |
b75a7d8f A |
1309 | } |
1310 | } | |
1311 | ||
1312 | /* testing for exact max expansion */ | |
729e4ab9 | 1313 | int32_t size; |
b75a7d8f A |
1314 | ch = 0; |
1315 | while (ch < 0x61) { | |
1316 | uint32_t order; | |
b75a7d8f A |
1317 | str.setCharAt(0, ch); |
1318 | iter->setText(str, status); | |
1319 | order = iter->previous(status); | |
1320 | size = coll.getMaxExpansion(order); | |
1321 | if (U_FAILURE(status) || size != 1) { | |
729e4ab9 A |
1322 | errln("Failure at codepoint U+%04X, maximum expansion count %d < %d", |
1323 | ch, size, 1); | |
b75a7d8f A |
1324 | } |
1325 | ch ++; | |
1326 | } | |
1327 | ||
1328 | ch = 0x63; | |
1329 | str.setTo(ch); | |
1330 | iter->setText(str, status); | |
1331 | temporder = iter->previous(status); | |
729e4ab9 A |
1332 | size = coll.getMaxExpansion(temporder); |
1333 | if (U_FAILURE(status) || size != 3) { | |
1334 | errln("Failure at codepoint U+%04X, CE %08x, maximum expansion count %d != %d", | |
1335 | ch, temporder, size, 3); | |
b75a7d8f A |
1336 | } |
1337 | ||
1338 | ch = 0x64; | |
1339 | str.setTo(ch); | |
1340 | iter->setText(str, status); | |
1341 | temporder = iter->previous(status); | |
729e4ab9 A |
1342 | size = coll.getMaxExpansion(temporder); |
1343 | if (U_FAILURE(status) || size != 1) { | |
1344 | errln("Failure at codepoint U+%04X, CE %08x, maximum expansion count %d != %d", | |
1345 | ch, temporder, size, 1); | |
b75a7d8f A |
1346 | } |
1347 | ||
374ca955 | 1348 | str.setTo(unassigned); |
b75a7d8f A |
1349 | iter->setText(str, status); |
1350 | sorder = iter->previous(status); | |
729e4ab9 A |
1351 | size = coll.getMaxExpansion(sorder); |
1352 | if (U_FAILURE(status) || size != 2) { | |
1353 | errln("Failure at supplementary codepoints, maximum expansion count %d < %d", | |
1354 | size, 2); | |
b75a7d8f A |
1355 | } |
1356 | ||
1357 | /* testing jamo */ | |
1358 | ch = 0x1165; | |
1359 | str.setTo(ch); | |
1360 | iter->setText(str, status); | |
1361 | temporder = iter->previous(status); | |
729e4ab9 A |
1362 | size = coll.getMaxExpansion(temporder); |
1363 | if (U_FAILURE(status) || size > 3) { | |
1364 | errln("Failure at codepoint U+%04X, maximum expansion count %d > %d", | |
1365 | ch, size, 3); | |
b75a7d8f A |
1366 | } |
1367 | ||
1368 | delete iter; | |
1369 | ||
1370 | /* testing special jamo &a<\u1160 */ | |
1371 | rule = CharsToUnicodeString("\\u0026\\u0071\\u003c\\u1165\\u002f\\u0071\\u0071\\u0071\\u0071"); | |
1372 | ||
1373 | RuleBasedCollator jamocoll(rule, status); | |
1374 | iter = jamocoll.createCollationElementIterator(str); | |
1375 | temporder = iter->previous(status); | |
729e4ab9 A |
1376 | size = iter->getMaxExpansion(temporder); |
1377 | if (U_FAILURE(status) || size != 6) { | |
1378 | errln("Failure at codepoint U+%04X, maximum expansion count %d > %d", | |
1379 | ch, size, 5); | |
b75a7d8f A |
1380 | } |
1381 | ||
1382 | delete iter; | |
1383 | } | |
1384 | ||
1385 | void CollationAPITest::TestDisplayName() | |
1386 | { | |
1387 | UErrorCode error = U_ZERO_ERROR; | |
1388 | Collator *coll = Collator::createInstance("en_US", error); | |
1389 | if (U_FAILURE(error)) { | |
729e4ab9 | 1390 | errcheckln(error, "Failure creating english collator - %s", u_errorName(error)); |
b75a7d8f A |
1391 | return; |
1392 | } | |
1393 | UnicodeString name; | |
1394 | UnicodeString result; | |
1395 | coll->getDisplayName(Locale::getCanadaFrench(), result); | |
1396 | Locale::getCanadaFrench().getDisplayName(name); | |
1397 | if (result.compare(name)) { | |
1398 | errln("Failure getting the correct name for locale en_US"); | |
1399 | } | |
1400 | ||
1401 | coll->getDisplayName(Locale::getSimplifiedChinese(), result); | |
1402 | Locale::getSimplifiedChinese().getDisplayName(name); | |
1403 | if (result.compare(name)) { | |
1404 | errln("Failure getting the correct name for locale zh_SG"); | |
1405 | } | |
1406 | delete coll; | |
1407 | } | |
1408 | ||
1409 | void CollationAPITest::TestAttribute() | |
1410 | { | |
1411 | UErrorCode error = U_ZERO_ERROR; | |
1412 | Collator *coll = Collator::createInstance(error); | |
1413 | ||
1414 | if (U_FAILURE(error)) { | |
729e4ab9 | 1415 | errcheckln(error, "Creation of default collator failed - %s", u_errorName(error)); |
b75a7d8f A |
1416 | return; |
1417 | } | |
1418 | ||
1419 | coll->setAttribute(UCOL_FRENCH_COLLATION, UCOL_OFF, error); | |
1420 | if (coll->getAttribute(UCOL_FRENCH_COLLATION, error) != UCOL_OFF || | |
1421 | U_FAILURE(error)) { | |
1422 | errln("Setting and retrieving of the french collation failed"); | |
1423 | } | |
1424 | ||
1425 | coll->setAttribute(UCOL_FRENCH_COLLATION, UCOL_ON, error); | |
1426 | if (coll->getAttribute(UCOL_FRENCH_COLLATION, error) != UCOL_ON || | |
1427 | U_FAILURE(error)) { | |
1428 | errln("Setting and retrieving of the french collation failed"); | |
1429 | } | |
1430 | ||
1431 | coll->setAttribute(UCOL_ALTERNATE_HANDLING, UCOL_SHIFTED, error); | |
1432 | if (coll->getAttribute(UCOL_ALTERNATE_HANDLING, error) != UCOL_SHIFTED || | |
1433 | U_FAILURE(error)) { | |
1434 | errln("Setting and retrieving of the alternate handling failed"); | |
1435 | } | |
1436 | ||
1437 | coll->setAttribute(UCOL_ALTERNATE_HANDLING, UCOL_NON_IGNORABLE, error); | |
1438 | if (coll->getAttribute(UCOL_ALTERNATE_HANDLING, error) != UCOL_NON_IGNORABLE || | |
1439 | U_FAILURE(error)) { | |
1440 | errln("Setting and retrieving of the alternate handling failed"); | |
1441 | } | |
1442 | ||
1443 | coll->setAttribute(UCOL_CASE_FIRST, UCOL_LOWER_FIRST, error); | |
1444 | if (coll->getAttribute(UCOL_CASE_FIRST, error) != UCOL_LOWER_FIRST || | |
1445 | U_FAILURE(error)) { | |
1446 | errln("Setting and retrieving of the case first attribute failed"); | |
1447 | } | |
1448 | ||
1449 | coll->setAttribute(UCOL_CASE_FIRST, UCOL_UPPER_FIRST, error); | |
1450 | if (coll->getAttribute(UCOL_CASE_FIRST, error) != UCOL_UPPER_FIRST || | |
1451 | U_FAILURE(error)) { | |
1452 | errln("Setting and retrieving of the case first attribute failed"); | |
1453 | } | |
1454 | ||
1455 | coll->setAttribute(UCOL_CASE_LEVEL, UCOL_ON, error); | |
1456 | if (coll->getAttribute(UCOL_CASE_LEVEL, error) != UCOL_ON || | |
1457 | U_FAILURE(error)) { | |
1458 | errln("Setting and retrieving of the case level attribute failed"); | |
1459 | } | |
1460 | ||
1461 | coll->setAttribute(UCOL_CASE_LEVEL, UCOL_OFF, error); | |
1462 | if (coll->getAttribute(UCOL_CASE_LEVEL, error) != UCOL_OFF || | |
1463 | U_FAILURE(error)) { | |
1464 | errln("Setting and retrieving of the case level attribute failed"); | |
1465 | } | |
1466 | ||
1467 | coll->setAttribute(UCOL_NORMALIZATION_MODE, UCOL_ON, error); | |
1468 | if (coll->getAttribute(UCOL_NORMALIZATION_MODE, error) != UCOL_ON || | |
1469 | U_FAILURE(error)) { | |
1470 | errln("Setting and retrieving of the normalization on/off attribute failed"); | |
1471 | } | |
1472 | ||
1473 | coll->setAttribute(UCOL_NORMALIZATION_MODE, UCOL_OFF, error); | |
1474 | if (coll->getAttribute(UCOL_NORMALIZATION_MODE, error) != UCOL_OFF || | |
1475 | U_FAILURE(error)) { | |
1476 | errln("Setting and retrieving of the normalization on/off attribute failed"); | |
1477 | } | |
1478 | ||
1479 | coll->setAttribute(UCOL_STRENGTH, UCOL_PRIMARY, error); | |
1480 | if (coll->getAttribute(UCOL_STRENGTH, error) != UCOL_PRIMARY || | |
1481 | U_FAILURE(error)) { | |
1482 | errln("Setting and retrieving of the collation strength failed"); | |
1483 | } | |
1484 | ||
1485 | coll->setAttribute(UCOL_STRENGTH, UCOL_SECONDARY, error); | |
1486 | if (coll->getAttribute(UCOL_STRENGTH, error) != UCOL_SECONDARY || | |
1487 | U_FAILURE(error)) { | |
1488 | errln("Setting and retrieving of the collation strength failed"); | |
1489 | } | |
1490 | ||
1491 | coll->setAttribute(UCOL_STRENGTH, UCOL_TERTIARY, error); | |
1492 | if (coll->getAttribute(UCOL_STRENGTH, error) != UCOL_TERTIARY || | |
1493 | U_FAILURE(error)) { | |
1494 | errln("Setting and retrieving of the collation strength failed"); | |
1495 | } | |
1496 | ||
1497 | coll->setAttribute(UCOL_STRENGTH, UCOL_QUATERNARY, error); | |
1498 | if (coll->getAttribute(UCOL_STRENGTH, error) != UCOL_QUATERNARY || | |
1499 | U_FAILURE(error)) { | |
1500 | errln("Setting and retrieving of the collation strength failed"); | |
1501 | } | |
1502 | ||
1503 | coll->setAttribute(UCOL_STRENGTH, UCOL_IDENTICAL, error); | |
1504 | if (coll->getAttribute(UCOL_STRENGTH, error) != UCOL_IDENTICAL || | |
1505 | U_FAILURE(error)) { | |
1506 | errln("Setting and retrieving of the collation strength failed"); | |
1507 | } | |
1508 | ||
1509 | delete coll; | |
1510 | } | |
1511 | ||
1512 | void CollationAPITest::TestVariableTopSetting() { | |
1513 | UErrorCode status = U_ZERO_ERROR; | |
1514 | ||
1515 | UChar vt[256] = { 0 }; | |
1516 | ||
57a6839d A |
1517 | // Use the root collator, not the default collator. |
1518 | // This test fails with en_US_POSIX which tailors the dollar sign after 'A'. | |
1519 | Collator *coll = Collator::createInstance(Locale::getRoot(), status); | |
b75a7d8f A |
1520 | if(U_FAILURE(status)) { |
1521 | delete coll; | |
729e4ab9 | 1522 | errcheckln(status, "Collator creation failed with error %s", u_errorName(status)); |
b75a7d8f A |
1523 | return; |
1524 | } | |
1525 | ||
1526 | uint32_t oldVarTop = coll->getVariableTop(status); | |
1527 | ||
57a6839d A |
1528 | // ICU 53+: The character must be in a supported reordering group, |
1529 | // and the variable top is pinned to the end of that group. | |
b75a7d8f A |
1530 | vt[0] = 0x0041; |
1531 | ||
57a6839d A |
1532 | (void)coll->setVariableTop(vt, 1, status); |
1533 | if(status != U_ILLEGAL_ARGUMENT_ERROR) { | |
1534 | errln("setVariableTop(letter) did not detect illegal argument - %s", u_errorName(status)); | |
1535 | } | |
1536 | ||
1537 | status = U_ZERO_ERROR; | |
1538 | vt[0] = 0x24; // dollar sign (currency symbol) | |
b75a7d8f | 1539 | uint32_t newVarTop = coll->setVariableTop(vt, 1, status); |
b331163b A |
1540 | if(U_FAILURE(status)) { |
1541 | errln("setVariableTop(dollar sign) failed: %s", u_errorName(status)); | |
1542 | return; | |
1543 | } | |
57a6839d A |
1544 | if(newVarTop != coll->getVariableTop(status)) { |
1545 | errln("setVariableTop(dollar sign) != following getVariableTop()"); | |
b75a7d8f A |
1546 | } |
1547 | ||
57a6839d A |
1548 | UnicodeString dollar((UChar)0x24); |
1549 | UnicodeString euro((UChar)0x20AC); | |
1550 | uint32_t newVarTop2 = coll->setVariableTop(euro, status); | |
1551 | assertEquals("setVariableTop(Euro sign) == following getVariableTop()", | |
1552 | (int64_t)newVarTop2, (int64_t)coll->getVariableTop(status)); | |
1553 | assertEquals("setVariableTop(Euro sign) == setVariableTop(dollar sign) (should pin to top of currency group)", | |
1554 | (int64_t)newVarTop2, (int64_t)newVarTop); | |
1555 | ||
1556 | coll->setAttribute(UCOL_ALTERNATE_HANDLING, UCOL_SHIFTED, status); | |
1557 | assertEquals("empty==dollar", UCOL_EQUAL, coll->compare(UnicodeString(), dollar)); | |
1558 | assertEquals("empty==euro", UCOL_EQUAL, coll->compare(UnicodeString(), euro)); | |
1559 | assertEquals("dollar<zero", UCOL_LESS, coll->compare(dollar, UnicodeString((UChar)0x30))); | |
1560 | ||
b75a7d8f A |
1561 | coll->setVariableTop(oldVarTop, status); |
1562 | ||
1563 | uint32_t newerVarTop = coll->setVariableTop(UnicodeString(vt, 1), status); | |
1564 | ||
57a6839d | 1565 | if(newVarTop != newerVarTop) { |
b75a7d8f A |
1566 | errln("Didn't set vartop properly from UnicodeString!\n"); |
1567 | } | |
1568 | ||
1569 | delete coll; | |
1570 | ||
1571 | } | |
1572 | ||
57a6839d A |
1573 | void CollationAPITest::TestMaxVariable() { |
1574 | UErrorCode errorCode = U_ZERO_ERROR; | |
1575 | LocalPointer<Collator> coll(Collator::createInstance(Locale::getRoot(), errorCode)); | |
1576 | if(U_FAILURE(errorCode)) { | |
1577 | errcheckln(errorCode, "Collator creation failed with error %s", u_errorName(errorCode)); | |
1578 | return; | |
1579 | } | |
1580 | ||
1581 | (void)coll->setMaxVariable(UCOL_REORDER_CODE_OTHERS, errorCode); | |
1582 | if(errorCode != U_ILLEGAL_ARGUMENT_ERROR) { | |
1583 | errln("setMaxVariable(others) did not detect illegal argument - %s", u_errorName(errorCode)); | |
1584 | } | |
1585 | ||
1586 | errorCode = U_ZERO_ERROR; | |
1587 | (void)coll->setMaxVariable(UCOL_REORDER_CODE_CURRENCY, errorCode); | |
1588 | ||
1589 | if(UCOL_REORDER_CODE_CURRENCY != coll->getMaxVariable()) { | |
1590 | errln("setMaxVariable(currency) != following getMaxVariable()"); | |
1591 | } | |
1592 | ||
1593 | coll->setAttribute(UCOL_ALTERNATE_HANDLING, UCOL_SHIFTED, errorCode); | |
1594 | assertEquals("empty==dollar", UCOL_EQUAL, coll->compare(UnicodeString(), UnicodeString((UChar)0x24))); | |
1595 | assertEquals("empty==euro", UCOL_EQUAL, coll->compare(UnicodeString(), UnicodeString((UChar)0x20AC))); | |
1596 | assertEquals("dollar<zero", UCOL_LESS, coll->compare(UnicodeString((UChar)0x24), UnicodeString((UChar)0x30))); | |
1597 | } | |
1598 | ||
b75a7d8f A |
1599 | void CollationAPITest::TestGetLocale() { |
1600 | UErrorCode status = U_ZERO_ERROR; | |
1601 | const char *rules = "&a<x<y<z"; | |
1602 | UChar rlz[256] = {0}; | |
1603 | ||
57a6839d A |
1604 | Collator *coll = Collator::createInstance("root", status); |
1605 | if(U_FAILURE(status)) { | |
1606 | dataerrln("Failed to open collator for \"root\" with %s", u_errorName(status)); | |
1607 | return; | |
1608 | } | |
1609 | Locale locale = coll->getLocale(ULOC_ACTUAL_LOCALE, status); | |
1610 | if(locale != Locale::getRoot()) { | |
1611 | errln("Collator::createInstance(\"root\").getLocale(actual) != Locale::getRoot(); " | |
1612 | "getLocale().getName() = \"%s\"", | |
1613 | locale.getName()); | |
1614 | } | |
1615 | delete coll; | |
1616 | ||
1617 | coll = Collator::createInstance("", status); | |
1618 | if(U_FAILURE(status)) { | |
1619 | dataerrln("Failed to open collator for \"\" with %s", u_errorName(status)); | |
1620 | return; | |
1621 | } | |
1622 | locale = coll->getLocale(ULOC_ACTUAL_LOCALE, status); | |
1623 | if(locale != Locale::getRoot()) { | |
1624 | errln("Collator::createInstance(\"\").getLocale(actual) != Locale::getRoot(); " | |
1625 | "getLocale().getName() = \"%s\"", | |
1626 | locale.getName()); | |
1627 | } | |
1628 | delete coll; | |
b75a7d8f A |
1629 | |
1630 | int32_t i = 0; | |
1631 | ||
1632 | static const struct { | |
1633 | const char* requestedLocale; | |
1634 | const char* validLocale; | |
1635 | const char* actualLocale; | |
1636 | } testStruct[] = { | |
57a6839d A |
1637 | // Note: Locale::getRoot().getName() == "" not "root". |
1638 | { "de_DE", "de", "" }, | |
1639 | { "sr_RS", "sr_Cyrl_RS", "sr" }, | |
1640 | { "en_US_CALIFORNIA", "en_US", "" }, | |
1641 | { "fr_FR_NONEXISTANT", "fr", "" }, | |
1642 | // pinyin is the default, therefore suppressed. | |
1643 | { "zh_CN", "zh_Hans_CN", "zh" }, | |
1644 | // zh_Hant has default=stroke but the data is in zh. | |
1645 | { "zh_TW", "zh_Hant_TW", "zh@collation=stroke" }, | |
1646 | { "zh_TW@collation=pinyin", "zh_Hant_TW@collation=pinyin", "zh" }, | |
1647 | { "zh_CN@collation=stroke", "zh_Hans_CN@collation=stroke", "zh@collation=stroke" } | |
b75a7d8f A |
1648 | }; |
1649 | ||
1650 | u_unescape(rules, rlz, 256); | |
1651 | ||
1652 | /* test opening collators for different locales */ | |
2ca993e8 | 1653 | for(i = 0; i<UPRV_LENGTHOF(testStruct); i++) { |
b75a7d8f A |
1654 | status = U_ZERO_ERROR; |
1655 | coll = Collator::createInstance(testStruct[i].requestedLocale, status); | |
1656 | if(U_FAILURE(status)) { | |
57a6839d | 1657 | errln("Failed to open collator for %s with %s", testStruct[i].requestedLocale, u_errorName(status)); |
b75a7d8f A |
1658 | delete coll; |
1659 | continue; | |
1660 | } | |
57a6839d A |
1661 | // The requested locale may be the same as the valid locale, |
1662 | // or may not be supported at all. See ticket #10477. | |
b75a7d8f | 1663 | locale = coll->getLocale(ULOC_REQUESTED_LOCALE, status); |
b331163b A |
1664 | if(U_SUCCESS(status) && |
1665 | locale != testStruct[i].requestedLocale && locale != testStruct[i].validLocale) { | |
57a6839d A |
1666 | errln("[Coll %s]: Error in requested locale, expected %s or %s, got %s", |
1667 | testStruct[i].requestedLocale, | |
1668 | testStruct[i].requestedLocale, testStruct[i].validLocale, locale.getName()); | |
b75a7d8f | 1669 | } |
b331163b | 1670 | status = U_ZERO_ERROR; |
b75a7d8f A |
1671 | locale = coll->getLocale(ULOC_VALID_LOCALE, status); |
1672 | if(locale != testStruct[i].validLocale) { | |
57a6839d A |
1673 | errln("[Coll %s]: Error in valid locale, expected %s, got %s", |
1674 | testStruct[i].requestedLocale, testStruct[i].validLocale, locale.getName()); | |
b75a7d8f A |
1675 | } |
1676 | locale = coll->getLocale(ULOC_ACTUAL_LOCALE, status); | |
1677 | if(locale != testStruct[i].actualLocale) { | |
57a6839d A |
1678 | errln("[Coll %s]: Error in actual locale, expected %s, got %s", |
1679 | testStruct[i].requestedLocale, testStruct[i].actualLocale, locale.getName()); | |
1680 | } | |
1681 | // If we open a collator for the actual locale, we should get an equivalent one again. | |
1682 | LocalPointer<Collator> coll2(Collator::createInstance(locale, status)); | |
1683 | if(U_FAILURE(status)) { | |
1684 | errln("Failed to open collator for actual locale \"%s\" with %s", | |
1685 | locale.getName(), u_errorName(status)); | |
1686 | } else { | |
1687 | Locale actual2 = coll2->getLocale(ULOC_ACTUAL_LOCALE, status); | |
1688 | if(actual2 != locale) { | |
1689 | errln("[Coll actual \"%s\"]: Error in actual locale, got different one: \"%s\"", | |
1690 | locale.getName(), actual2.getName()); | |
1691 | } | |
1692 | if(*coll2 != *coll) { | |
1693 | errln("[Coll actual \"%s\"]: Got different collator than before", locale.getName()); | |
1694 | } | |
b75a7d8f A |
1695 | } |
1696 | delete coll; | |
1697 | } | |
1698 | ||
b331163b | 1699 | /* completely non-existent locale for collator should get a root collator */ |
b75a7d8f | 1700 | { |
b331163b | 1701 | LocalPointer<Collator> coll(Collator::createInstance("blahaha", status)); |
b75a7d8f | 1702 | if(U_FAILURE(status)) { |
57a6839d | 1703 | errln("Failed to open collator with %s", u_errorName(status)); |
b75a7d8f A |
1704 | return; |
1705 | } | |
b331163b A |
1706 | Locale valid = coll->getLocale(ULOC_VALID_LOCALE, status); |
1707 | const char *name = valid.getName(); | |
1708 | if(*name != 0 && strcmp(name, "root") != 0) { | |
1709 | errln("Valid locale for nonexisting-locale collator is \"%s\" not root", name); | |
b75a7d8f | 1710 | } |
b331163b A |
1711 | Locale actual = coll->getLocale(ULOC_ACTUAL_LOCALE, status); |
1712 | name = actual.getName(); | |
1713 | if(*name != 0 && strcmp(name, "root") != 0) { | |
1714 | errln("Actual locale for nonexisting-locale collator is \"%s\" not root", name); | |
b75a7d8f | 1715 | } |
b75a7d8f A |
1716 | } |
1717 | ||
1718 | ||
1719 | ||
1720 | /* collator instantiated from rules should have all three locales NULL */ | |
1721 | coll = new RuleBasedCollator(rlz, status); | |
1722 | locale = coll->getLocale(ULOC_REQUESTED_LOCALE, status); | |
b331163b | 1723 | if(U_SUCCESS(status) && !locale.isBogus()) { |
57a6839d | 1724 | errln("For collator instantiated from rules, requested locale %s is not bogus", locale.getName()); |
b75a7d8f | 1725 | } |
b331163b | 1726 | status = U_ZERO_ERROR; |
b75a7d8f A |
1727 | locale = coll->getLocale(ULOC_VALID_LOCALE, status); |
1728 | if(!locale.isBogus()) { | |
57a6839d | 1729 | errln("For collator instantiated from rules, valid locale %s is not bogus", locale.getName()); |
b75a7d8f A |
1730 | } |
1731 | locale = coll->getLocale(ULOC_ACTUAL_LOCALE, status); | |
1732 | if(!locale.isBogus()) { | |
57a6839d | 1733 | errln("For collator instantiated from rules, actual locale %s is not bogus", locale.getName()); |
b75a7d8f A |
1734 | } |
1735 | delete coll; | |
1736 | } | |
1737 | ||
1738 | struct teststruct { | |
1739 | const char *original; | |
1740 | uint8_t key[256]; | |
1741 | }; | |
1742 | ||
1743 | ||
1744 | ||
1745 | U_CDECL_BEGIN | |
1746 | static int U_CALLCONV | |
1747 | compare_teststruct(const void *string1, const void *string2) { | |
1748 | return(strcmp((const char *)((struct teststruct *)string1)->key, (const char *)((struct teststruct *)string2)->key)); | |
1749 | } | |
1750 | U_CDECL_END | |
1751 | ||
1752 | ||
1753 | void CollationAPITest::TestBounds(void) { | |
1754 | UErrorCode status = U_ZERO_ERROR; | |
1755 | ||
1756 | Collator *coll = Collator::createInstance(Locale("sh"), status); | |
1757 | if(U_FAILURE(status)) { | |
1758 | delete coll; | |
729e4ab9 | 1759 | errcheckln(status, "Collator creation failed with %s", u_errorName(status)); |
b75a7d8f A |
1760 | return; |
1761 | } | |
1762 | ||
1763 | uint8_t sortkey[512], lower[512], upper[512]; | |
1764 | UChar buffer[512]; | |
1765 | ||
46f4442e | 1766 | static const char * const test[] = { |
b75a7d8f A |
1767 | "John Smith", |
1768 | "JOHN SMITH", | |
1769 | "john SMITH", | |
1770 | "j\\u00F6hn sm\\u00EFth", | |
1771 | "J\\u00F6hn Sm\\u00EFth", | |
1772 | "J\\u00D6HN SM\\u00CFTH", | |
1773 | "john smithsonian", | |
1774 | "John Smithsonian" | |
1775 | }; | |
1776 | ||
46f4442e | 1777 | struct teststruct tests[] = { |
b75a7d8f A |
1778 | {"\\u010CAKI MIHALJ", {0}}, |
1779 | {"\\u010CAKI MIHALJ", {0}}, | |
1780 | {"\\u010CAKI PIRO\\u0160KA", {0}}, | |
1781 | {"\\u010CABAI ANDRIJA", {0}}, | |
1782 | {"\\u010CABAI LAJO\\u0160", {0}}, | |
1783 | {"\\u010CABAI MARIJA", {0}}, | |
1784 | {"\\u010CABAI STEVAN", {0}}, | |
1785 | {"\\u010CABAI STEVAN", {0}}, | |
1786 | {"\\u010CABARKAPA BRANKO", {0}}, | |
1787 | {"\\u010CABARKAPA MILENKO", {0}}, | |
1788 | {"\\u010CABARKAPA MIROSLAV", {0}}, | |
1789 | {"\\u010CABARKAPA SIMO", {0}}, | |
1790 | {"\\u010CABARKAPA STANKO", {0}}, | |
1791 | {"\\u010CABARKAPA TAMARA", {0}}, | |
1792 | {"\\u010CABARKAPA TOMA\\u0160", {0}}, | |
1793 | {"\\u010CABDARI\\u0106 NIKOLA", {0}}, | |
1794 | {"\\u010CABDARI\\u0106 ZORICA", {0}}, | |
1795 | {"\\u010CABI NANDOR", {0}}, | |
1796 | {"\\u010CABOVI\\u0106 MILAN", {0}}, | |
1797 | {"\\u010CABRADI AGNEZIJA", {0}}, | |
1798 | {"\\u010CABRADI IVAN", {0}}, | |
1799 | {"\\u010CABRADI JELENA", {0}}, | |
1800 | {"\\u010CABRADI LJUBICA", {0}}, | |
1801 | {"\\u010CABRADI STEVAN", {0}}, | |
1802 | {"\\u010CABRDA MARTIN", {0}}, | |
1803 | {"\\u010CABRILO BOGDAN", {0}}, | |
1804 | {"\\u010CABRILO BRANISLAV", {0}}, | |
1805 | {"\\u010CABRILO LAZAR", {0}}, | |
1806 | {"\\u010CABRILO LJUBICA", {0}}, | |
1807 | {"\\u010CABRILO SPASOJA", {0}}, | |
1808 | {"\\u010CADE\\u0160 ZDENKA", {0}}, | |
1809 | {"\\u010CADESKI BLAGOJE", {0}}, | |
1810 | {"\\u010CADOVSKI VLADIMIR", {0}}, | |
1811 | {"\\u010CAGLJEVI\\u0106 TOMA", {0}}, | |
1812 | {"\\u010CAGOROVI\\u0106 VLADIMIR", {0}}, | |
1813 | {"\\u010CAJA VANKA", {0}}, | |
1814 | {"\\u010CAJI\\u0106 BOGOLJUB", {0}}, | |
1815 | {"\\u010CAJI\\u0106 BORISLAV", {0}}, | |
1816 | {"\\u010CAJI\\u0106 RADOSLAV", {0}}, | |
1817 | {"\\u010CAK\\u0160IRAN MILADIN", {0}}, | |
1818 | {"\\u010CAKAN EUGEN", {0}}, | |
1819 | {"\\u010CAKAN EVGENIJE", {0}}, | |
1820 | {"\\u010CAKAN IVAN", {0}}, | |
1821 | {"\\u010CAKAN JULIJAN", {0}}, | |
1822 | {"\\u010CAKAN MIHAJLO", {0}}, | |
1823 | {"\\u010CAKAN STEVAN", {0}}, | |
1824 | {"\\u010CAKAN VLADIMIR", {0}}, | |
1825 | {"\\u010CAKAN VLADIMIR", {0}}, | |
1826 | {"\\u010CAKAN VLADIMIR", {0}}, | |
1827 | {"\\u010CAKARA ANA", {0}}, | |
1828 | {"\\u010CAKAREVI\\u0106 MOMIR", {0}}, | |
1829 | {"\\u010CAKAREVI\\u0106 NEDELJKO", {0}}, | |
1830 | {"\\u010CAKI \\u0160ANDOR", {0}}, | |
1831 | {"\\u010CAKI AMALIJA", {0}}, | |
1832 | {"\\u010CAKI ANDRA\\u0160", {0}}, | |
1833 | {"\\u010CAKI LADISLAV", {0}}, | |
1834 | {"\\u010CAKI LAJO\\u0160", {0}}, | |
1835 | {"\\u010CAKI LASLO", {0}} | |
1836 | }; | |
1837 | ||
1838 | ||
1839 | ||
1840 | int32_t i = 0, j = 0, k = 0, buffSize = 0, skSize = 0, lowerSize = 0, upperSize = 0; | |
2ca993e8 | 1841 | int32_t arraySize = UPRV_LENGTHOF(tests); |
b75a7d8f | 1842 | |
57a6839d A |
1843 | (void)lowerSize; // Suppress unused variable warnings. |
1844 | (void)upperSize; | |
1845 | ||
b75a7d8f A |
1846 | for(i = 0; i<arraySize; i++) { |
1847 | buffSize = u_unescape(tests[i].original, buffer, 512); | |
1848 | skSize = coll->getSortKey(buffer, buffSize, tests[i].key, 512); | |
1849 | } | |
1850 | ||
1851 | qsort(tests, arraySize, sizeof(struct teststruct), compare_teststruct); | |
1852 | ||
1853 | for(i = 0; i < arraySize-1; i++) { | |
1854 | for(j = i+1; j < arraySize; j++) { | |
1855 | lowerSize = coll->getBound(tests[i].key, -1, UCOL_BOUND_LOWER, 1, lower, 512, status); | |
1856 | upperSize = coll->getBound(tests[j].key, -1, UCOL_BOUND_UPPER, 1, upper, 512, status); | |
1857 | for(k = i; k <= j; k++) { | |
1858 | if(strcmp((const char *)lower, (const char *)tests[k].key) > 0) { | |
1859 | errln("Problem with lower! j = %i (%s vs %s)", k, tests[k].original, tests[i].original); | |
1860 | } | |
1861 | if(strcmp((const char *)upper, (const char *)tests[k].key) <= 0) { | |
1862 | errln("Problem with upper! j = %i (%s vs %s)", k, tests[k].original, tests[j].original); | |
1863 | } | |
1864 | } | |
1865 | } | |
1866 | } | |
1867 | ||
1868 | ||
2ca993e8 | 1869 | for(i = 0; i<UPRV_LENGTHOF(test); i++) { |
b75a7d8f A |
1870 | buffSize = u_unescape(test[i], buffer, 512); |
1871 | skSize = coll->getSortKey(buffer, buffSize, sortkey, 512); | |
1872 | lowerSize = ucol_getBound(sortkey, skSize, UCOL_BOUND_LOWER, 1, lower, 512, &status); | |
1873 | upperSize = ucol_getBound(sortkey, skSize, UCOL_BOUND_UPPER_LONG, 1, upper, 512, &status); | |
2ca993e8 | 1874 | for(j = i+1; j<UPRV_LENGTHOF(test); j++) { |
b75a7d8f A |
1875 | buffSize = u_unescape(test[j], buffer, 512); |
1876 | skSize = coll->getSortKey(buffer, buffSize, sortkey, 512); | |
1877 | if(strcmp((const char *)lower, (const char *)sortkey) > 0) { | |
1878 | errln("Problem with lower! i = %i, j = %i (%s vs %s)", i, j, test[i], test[j]); | |
1879 | } | |
1880 | if(strcmp((const char *)upper, (const char *)sortkey) <= 0) { | |
1881 | errln("Problem with upper! i = %i, j = %i (%s vs %s)", i, j, test[i], test[j]); | |
1882 | } | |
1883 | } | |
1884 | } | |
1885 | delete coll; | |
1886 | } | |
1887 | ||
1888 | ||
1889 | void CollationAPITest::TestGetTailoredSet() | |
1890 | { | |
1891 | struct { | |
1892 | const char *rules; | |
1893 | const char *tests[20]; | |
1894 | int32_t testsize; | |
1895 | } setTest[] = { | |
1896 | { "&a < \\u212b", { "\\u212b", "A\\u030a", "\\u00c5" }, 3}, | |
1897 | { "& S < \\u0161 <<< \\u0160", { "\\u0161", "s\\u030C", "\\u0160", "S\\u030C" }, 4} | |
1898 | }; | |
1899 | ||
57a6839d | 1900 | int32_t i = 0, j = 0; |
b75a7d8f A |
1901 | UErrorCode status = U_ZERO_ERROR; |
1902 | ||
b75a7d8f A |
1903 | UnicodeString buff; |
1904 | UnicodeSet *set = NULL; | |
1905 | ||
b331163b | 1906 | for(i = 0; i < UPRV_LENGTHOF(setTest); i++) { |
57a6839d A |
1907 | buff = UnicodeString(setTest[i].rules, -1, US_INV).unescape(); |
1908 | RuleBasedCollator coll(buff, status); | |
b75a7d8f | 1909 | if(U_SUCCESS(status)) { |
57a6839d A |
1910 | set = coll.getTailoredSet(status); |
1911 | if(set->size() < setTest[i].testsize) { | |
1912 | errln("Tailored set size smaller (%d) than expected (%d)", set->size(), setTest[i].testsize); | |
b75a7d8f | 1913 | } |
57a6839d A |
1914 | for(j = 0; j < setTest[i].testsize; j++) { |
1915 | buff = UnicodeString(setTest[i].tests[j], -1, US_INV).unescape(); | |
b75a7d8f A |
1916 | if(!set->contains(buff)) { |
1917 | errln("Tailored set doesn't contain %s... It should", setTest[i].tests[j]); | |
1918 | } | |
1919 | } | |
1920 | delete set; | |
1921 | } else { | |
729e4ab9 | 1922 | errcheckln(status, "Couldn't open collator with rules %s - %s", setTest[i].rules, u_errorName(status)); |
b75a7d8f | 1923 | } |
b75a7d8f A |
1924 | } |
1925 | } | |
1926 | ||
1927 | void CollationAPITest::TestUClassID() | |
1928 | { | |
1929 | char id = *((char *)RuleBasedCollator::getStaticClassID()); | |
1930 | if (id != 0) { | |
1931 | errln("Static class id for RuleBasedCollator should be 0"); | |
1932 | } | |
1933 | UErrorCode status = U_ZERO_ERROR; | |
1934 | RuleBasedCollator *coll | |
1935 | = (RuleBasedCollator *)Collator::createInstance(status); | |
1936 | if(U_FAILURE(status)) { | |
1937 | delete coll; | |
729e4ab9 | 1938 | errcheckln(status, "Collator creation failed with %s", u_errorName(status)); |
b75a7d8f A |
1939 | return; |
1940 | } | |
1941 | id = *((char *)coll->getDynamicClassID()); | |
1942 | if (id != 0) { | |
1943 | errln("Dynamic class id for RuleBasedCollator should be 0"); | |
1944 | } | |
1945 | id = *((char *)CollationKey::getStaticClassID()); | |
1946 | if (id != 0) { | |
1947 | errln("Static class id for CollationKey should be 0"); | |
1948 | } | |
1949 | CollationKey *key = new CollationKey(); | |
1950 | id = *((char *)key->getDynamicClassID()); | |
1951 | if (id != 0) { | |
1952 | errln("Dynamic class id for CollationKey should be 0"); | |
1953 | } | |
1954 | id = *((char *)CollationElementIterator::getStaticClassID()); | |
1955 | if (id != 0) { | |
1956 | errln("Static class id for CollationElementIterator should be 0"); | |
1957 | } | |
1958 | UnicodeString str("testing"); | |
1959 | CollationElementIterator *iter = coll->createCollationElementIterator(str); | |
1960 | id = *((char *)iter->getDynamicClassID()); | |
1961 | if (id != 0) { | |
1962 | errln("Dynamic class id for CollationElementIterator should be 0"); | |
1963 | } | |
1964 | delete key; | |
1965 | delete iter; | |
1966 | delete coll; | |
1967 | } | |
1968 | ||
1969 | class TestCollator : public Collator | |
1970 | { | |
1971 | public: | |
1972 | virtual Collator* clone(void) const; | |
1973 | ||
51004dcb | 1974 | using Collator::compare; |
b75a7d8f A |
1975 | |
1976 | virtual UCollationResult compare(const UnicodeString& source, | |
1977 | const UnicodeString& target, | |
1978 | UErrorCode& status) const; | |
1979 | virtual UCollationResult compare(const UnicodeString& source, | |
1980 | const UnicodeString& target, | |
1981 | int32_t length, | |
1982 | UErrorCode& status) const; | |
1983 | virtual UCollationResult compare(const UChar* source, | |
1984 | int32_t sourceLength, | |
1985 | const UChar* target, | |
1986 | int32_t targetLength, | |
1987 | UErrorCode& status) const; | |
1988 | virtual CollationKey& getCollationKey(const UnicodeString& source, | |
1989 | CollationKey& key, | |
1990 | UErrorCode& status) const; | |
1991 | virtual CollationKey& getCollationKey(const UChar*source, | |
1992 | int32_t sourceLength, | |
1993 | CollationKey& key, | |
1994 | UErrorCode& status) const; | |
1995 | virtual int32_t hashCode(void) const; | |
51004dcb | 1996 | virtual Locale getLocale(ULocDataLocaleType type, UErrorCode& status) const; |
b75a7d8f A |
1997 | virtual ECollationStrength getStrength(void) const; |
1998 | virtual void setStrength(ECollationStrength newStrength); | |
1999 | virtual UClassID getDynamicClassID(void) const; | |
2000 | virtual void getVersion(UVersionInfo info) const; | |
2001 | virtual void setAttribute(UColAttribute attr, UColAttributeValue value, | |
2002 | UErrorCode &status); | |
2003 | virtual UColAttributeValue getAttribute(UColAttribute attr, | |
51004dcb | 2004 | UErrorCode &status) const; |
b75a7d8f A |
2005 | virtual uint32_t setVariableTop(const UChar *varTop, int32_t len, |
2006 | UErrorCode &status); | |
51004dcb | 2007 | virtual uint32_t setVariableTop(const UnicodeString &varTop, |
b75a7d8f | 2008 | UErrorCode &status); |
51004dcb | 2009 | virtual void setVariableTop(uint32_t varTop, UErrorCode &status); |
b75a7d8f | 2010 | virtual uint32_t getVariableTop(UErrorCode &status) const; |
b75a7d8f A |
2011 | virtual int32_t getSortKey(const UnicodeString& source, |
2012 | uint8_t* result, | |
2013 | int32_t resultLength) const; | |
2014 | virtual int32_t getSortKey(const UChar*source, int32_t sourceLength, | |
2015 | uint8_t*result, int32_t resultLength) const; | |
2016 | virtual UnicodeSet *getTailoredSet(UErrorCode &status) const; | |
51004dcb A |
2017 | virtual UBool operator==(const Collator& other) const; |
2018 | // Collator::operator!= calls !Collator::operator== which works for all subclasses. | |
46f4442e | 2019 | virtual void setLocales(const Locale& requestedLocale, const Locale& validLocale, const Locale& actualLocale); |
b75a7d8f A |
2020 | TestCollator() : Collator() {}; |
2021 | TestCollator(UCollationStrength collationStrength, | |
2022 | UNormalizationMode decompositionMode) : Collator(collationStrength, decompositionMode) {}; | |
2023 | }; | |
2024 | ||
51004dcb A |
2025 | inline UBool TestCollator::operator==(const Collator& other) const { |
2026 | // TestCollator has no fields, so we test for identity. | |
2027 | return this == &other; | |
b75a7d8f | 2028 | |
51004dcb A |
2029 | // Normally, subclasses should do something like the following: |
2030 | // if (this == &other) { return TRUE; } | |
2031 | // if (!Collator::operator==(other)) { return FALSE; } // not the same class | |
2032 | // | |
2033 | // const TestCollator &o = (const TestCollator&)other; | |
2034 | // (compare this vs. o's subclass fields) | |
2035 | } | |
b75a7d8f A |
2036 | |
2037 | Collator* TestCollator::clone() const | |
2038 | { | |
2039 | return new TestCollator(); | |
2040 | } | |
2041 | ||
2042 | UCollationResult TestCollator::compare(const UnicodeString& source, | |
2043 | const UnicodeString& target, | |
2044 | UErrorCode& status) const | |
2045 | { | |
2046 | if(U_SUCCESS(status)) { | |
2047 | return UCollationResult(source.compare(target)); | |
2048 | } else { | |
2049 | return UCOL_EQUAL; | |
2050 | } | |
2051 | } | |
2052 | ||
2053 | UCollationResult TestCollator::compare(const UnicodeString& source, | |
2054 | const UnicodeString& target, | |
2055 | int32_t length, | |
2056 | UErrorCode& status) const | |
2057 | { | |
2058 | if(U_SUCCESS(status)) { | |
2059 | return UCollationResult(source.compare(0, length, target)); | |
2060 | } else { | |
2061 | return UCOL_EQUAL; | |
2062 | } | |
2063 | } | |
2064 | ||
2065 | UCollationResult TestCollator::compare(const UChar* source, | |
2066 | int32_t sourceLength, | |
2067 | const UChar* target, | |
2068 | int32_t targetLength, | |
2069 | UErrorCode& status) const | |
2070 | { | |
2071 | UnicodeString s(source, sourceLength); | |
2072 | UnicodeString t(target, targetLength); | |
2073 | return compare(s, t, status); | |
2074 | } | |
2075 | ||
2076 | CollationKey& TestCollator::getCollationKey(const UnicodeString& source, | |
2077 | CollationKey& key, | |
2078 | UErrorCode& status) const | |
2079 | { | |
2080 | char temp[100]; | |
2081 | int length = 100; | |
2082 | length = source.extract(temp, length, NULL, status); | |
2083 | temp[length] = 0; | |
2084 | CollationKey tempkey((uint8_t*)temp, length); | |
2085 | key = tempkey; | |
2086 | return key; | |
2087 | } | |
2088 | ||
2089 | CollationKey& TestCollator::getCollationKey(const UChar*source, | |
2090 | int32_t sourceLength, | |
2091 | CollationKey& key, | |
2092 | UErrorCode& status) const | |
2093 | { | |
2094 | //s tack allocation used since collationkey does not keep the unicodestring | |
2095 | UnicodeString str(source, sourceLength); | |
2096 | return getCollationKey(str, key, status); | |
2097 | } | |
2098 | ||
2099 | int32_t TestCollator::getSortKey(const UnicodeString& source, uint8_t* result, | |
2100 | int32_t resultLength) const | |
2101 | { | |
2102 | UErrorCode status = U_ZERO_ERROR; | |
2103 | int32_t length = source.extract((char *)result, resultLength, NULL, | |
2104 | status); | |
2105 | result[length] = 0; | |
2106 | return length; | |
2107 | } | |
2108 | ||
2109 | int32_t TestCollator::getSortKey(const UChar*source, int32_t sourceLength, | |
2110 | uint8_t*result, int32_t resultLength) const | |
2111 | { | |
2112 | UnicodeString str(source, sourceLength); | |
2113 | return getSortKey(str, result, resultLength); | |
2114 | } | |
2115 | ||
2116 | int32_t TestCollator::hashCode() const | |
2117 | { | |
2118 | return 0; | |
2119 | } | |
2120 | ||
51004dcb | 2121 | Locale TestCollator::getLocale(ULocDataLocaleType type, UErrorCode& status) const |
b75a7d8f A |
2122 | { |
2123 | // api not used, this is to make the compiler happy | |
2124 | if (U_FAILURE(status)) { | |
57a6839d | 2125 | (void)type; |
b75a7d8f A |
2126 | } |
2127 | return NULL; | |
2128 | } | |
2129 | ||
2130 | Collator::ECollationStrength TestCollator::getStrength() const | |
2131 | { | |
2132 | return TERTIARY; | |
2133 | } | |
2134 | ||
2135 | void TestCollator::setStrength(Collator::ECollationStrength newStrength) | |
2136 | { | |
2137 | // api not used, this is to make the compiler happy | |
57a6839d | 2138 | (void)newStrength; |
b75a7d8f A |
2139 | } |
2140 | ||
2141 | UClassID TestCollator::getDynamicClassID(void) const | |
2142 | { | |
2143 | return 0; | |
2144 | } | |
2145 | ||
2146 | void TestCollator::getVersion(UVersionInfo info) const | |
2147 | { | |
2148 | // api not used, this is to make the compiler happy | |
2149 | memset(info, 0, U_MAX_VERSION_LENGTH); | |
2150 | } | |
2151 | ||
57a6839d A |
2152 | void TestCollator::setAttribute(UColAttribute /*attr*/, UColAttributeValue /*value*/, |
2153 | UErrorCode & /*status*/) | |
b75a7d8f | 2154 | { |
b75a7d8f A |
2155 | } |
2156 | ||
2157 | UColAttributeValue TestCollator::getAttribute(UColAttribute attr, | |
51004dcb | 2158 | UErrorCode &status) const |
b75a7d8f A |
2159 | { |
2160 | // api not used, this is to make the compiler happy | |
2161 | if (U_FAILURE(status) || attr == UCOL_ATTRIBUTE_COUNT) { | |
2162 | return UCOL_OFF; | |
2163 | } | |
2164 | return UCOL_DEFAULT; | |
2165 | } | |
2166 | ||
2167 | uint32_t TestCollator::setVariableTop(const UChar *varTop, int32_t len, | |
2168 | UErrorCode &status) | |
2169 | { | |
2170 | // api not used, this is to make the compiler happy | |
2171 | if (U_SUCCESS(status) && (varTop == 0 || len < -1)) { | |
2172 | status = U_ILLEGAL_ARGUMENT_ERROR; | |
2173 | } | |
2174 | return 0; | |
2175 | } | |
2176 | ||
51004dcb | 2177 | uint32_t TestCollator::setVariableTop(const UnicodeString &varTop, |
b75a7d8f A |
2178 | UErrorCode &status) |
2179 | { | |
2180 | // api not used, this is to make the compiler happy | |
2181 | if (U_SUCCESS(status) && varTop.length() == 0) { | |
2182 | status = U_ILLEGAL_ARGUMENT_ERROR; | |
2183 | } | |
2184 | return 0; | |
2185 | } | |
2186 | ||
51004dcb | 2187 | void TestCollator::setVariableTop(uint32_t varTop, UErrorCode &status) |
b75a7d8f A |
2188 | { |
2189 | // api not used, this is to make the compiler happy | |
2190 | if (U_SUCCESS(status) && varTop == 0) { | |
2191 | status = U_ILLEGAL_ARGUMENT_ERROR; | |
2192 | } | |
2193 | } | |
2194 | ||
2195 | uint32_t TestCollator::getVariableTop(UErrorCode &status) const | |
2196 | { | |
2197 | ||
2198 | // api not used, this is to make the compiler happy | |
2199 | if (U_SUCCESS(status)) { | |
2200 | return 0; | |
2201 | } | |
2202 | return (uint32_t)(0xFFFFFFFFu); | |
2203 | } | |
2204 | ||
b75a7d8f A |
2205 | UnicodeSet * TestCollator::getTailoredSet(UErrorCode &status) const |
2206 | { | |
2207 | return Collator::getTailoredSet(status); | |
2208 | } | |
2209 | ||
46f4442e | 2210 | void TestCollator::setLocales(const Locale& requestedLocale, const Locale& validLocale, const Locale& actualLocale) |
b75a7d8f | 2211 | { |
46f4442e | 2212 | Collator::setLocales(requestedLocale, validLocale, actualLocale); |
b75a7d8f A |
2213 | } |
2214 | ||
2215 | ||
2216 | void CollationAPITest::TestSubclass() | |
2217 | { | |
2218 | TestCollator col1; | |
2219 | TestCollator col2; | |
51004dcb | 2220 | doAssert(col1 != col2, "2 instances of TestCollator should be different"); |
b75a7d8f A |
2221 | if (col1.hashCode() != col2.hashCode()) { |
2222 | errln("Every TestCollator has the same hashcode"); | |
2223 | } | |
2224 | UnicodeString abc("abc", 3); | |
2225 | UnicodeString bcd("bcd", 3); | |
2226 | if (col1.compare(abc, bcd) != abc.compare(bcd)) { | |
2227 | errln("TestCollator compare should be the same as the default " | |
2228 | "string comparison"); | |
2229 | } | |
2230 | CollationKey key; | |
2231 | UErrorCode status = U_ZERO_ERROR; | |
2232 | col1.getCollationKey(abc, key, status); | |
2233 | int32_t length = 0; | |
2234 | const char* bytes = (const char *)key.getByteArray(length); | |
2235 | UnicodeString keyarray(bytes, length, NULL, status); | |
2236 | if (abc != keyarray) { | |
2237 | errln("TestCollator collationkey API is returning wrong values"); | |
2238 | } | |
2239 | ||
2240 | UnicodeSet expectedset(0, 0x10FFFF); | |
2241 | UnicodeSet *defaultset = col1.getTailoredSet(status); | |
2242 | if (!defaultset->containsAll(expectedset) | |
2243 | || !expectedset.containsAll(*defaultset)) { | |
2244 | errln("Error: expected default tailoring to be 0 to 0x10ffff"); | |
2245 | } | |
2246 | delete defaultset; | |
2247 | ||
2248 | // use base class implementation | |
2249 | Locale loc1 = Locale::getGermany(); | |
2250 | Locale loc2 = Locale::getFrance(); | |
46f4442e | 2251 | col1.setLocales(loc1, loc2, loc2); // default implementation has no effect |
b75a7d8f A |
2252 | |
2253 | UnicodeString displayName; | |
2254 | col1.getDisplayName(loc1, loc2, displayName); // de_DE collator in fr_FR locale | |
2255 | ||
2256 | TestCollator col3(UCOL_TERTIARY, UNORM_NONE); | |
2257 | UnicodeString a("a"); | |
2258 | UnicodeString b("b"); | |
2259 | Collator::EComparisonResult result = Collator::EComparisonResult(a.compare(b)); | |
2260 | if(col1.compare(a, b) != result) { | |
2261 | errln("Collator doesn't give default result"); | |
2262 | } | |
2263 | if(col1.compare(a, b, 1) != result) { | |
2264 | errln("Collator doesn't give default result"); | |
2265 | } | |
2266 | if(col1.compare(a.getBuffer(), a.length(), b.getBuffer(), b.length()) != result) { | |
2267 | errln("Collator doesn't give default result"); | |
2268 | } | |
2269 | } | |
2270 | ||
374ca955 A |
2271 | void CollationAPITest::TestNULLCharTailoring() |
2272 | { | |
2273 | UErrorCode status = U_ZERO_ERROR; | |
2274 | UChar buf[256] = {0}; | |
2275 | int32_t len = u_unescape("&a < '\\u0000'", buf, 256); | |
2276 | UnicodeString first((UChar)0x0061); | |
2277 | UnicodeString second((UChar)0); | |
2278 | RuleBasedCollator *coll = new RuleBasedCollator(UnicodeString(buf, len), status); | |
2279 | if(U_FAILURE(status)) { | |
729e4ab9 A |
2280 | delete coll; |
2281 | errcheckln(status, "Failed to open collator - %s", u_errorName(status)); | |
2282 | return; | |
374ca955 A |
2283 | } |
2284 | UCollationResult res = coll->compare(first, second, status); | |
2285 | if(res != UCOL_LESS) { | |
2286 | errln("a should be less then NULL after tailoring"); | |
2287 | } | |
2288 | delete coll; | |
2289 | } | |
2290 | ||
73c04bcf A |
2291 | void CollationAPITest::TestClone() { |
2292 | logln("\ninit c0"); | |
2293 | UErrorCode status = U_ZERO_ERROR; | |
2294 | RuleBasedCollator* c0 = (RuleBasedCollator*)Collator::createInstance(status); | |
46f4442e A |
2295 | |
2296 | if (U_FAILURE(status)) { | |
729e4ab9 | 2297 | errcheckln(status, "Collator::CreateInstance(status) failed with %s", u_errorName(status)); |
46f4442e A |
2298 | return; |
2299 | } | |
2300 | ||
73c04bcf A |
2301 | c0->setStrength(Collator::TERTIARY); |
2302 | dump("c0", c0, status); | |
2303 | ||
2304 | logln("\ninit c1"); | |
2305 | RuleBasedCollator* c1 = (RuleBasedCollator*)Collator::createInstance(status); | |
2306 | c1->setStrength(Collator::TERTIARY); | |
2307 | UColAttributeValue val = c1->getAttribute(UCOL_CASE_FIRST, status); | |
2308 | if(val == UCOL_LOWER_FIRST){ | |
2309 | c1->setAttribute(UCOL_CASE_FIRST, UCOL_UPPER_FIRST, status); | |
2310 | }else{ | |
2311 | c1->setAttribute(UCOL_CASE_FIRST, UCOL_LOWER_FIRST, status); | |
2312 | } | |
2313 | dump("c0", c0, status); | |
2314 | dump("c1", c1, status); | |
2315 | ||
2316 | logln("\ninit c2"); | |
2317 | RuleBasedCollator* c2 = (RuleBasedCollator*)c1->clone(); | |
2318 | val = c2->getAttribute(UCOL_CASE_FIRST, status); | |
2319 | if(val == UCOL_LOWER_FIRST){ | |
2320 | c2->setAttribute(UCOL_CASE_FIRST, UCOL_UPPER_FIRST, status); | |
2321 | }else{ | |
2322 | c2->setAttribute(UCOL_CASE_FIRST, UCOL_LOWER_FIRST, status); | |
2323 | } | |
2324 | if(U_FAILURE(status)){ | |
2325 | errln("set and get attributes of collator failed. %s\n", u_errorName(status)); | |
2326 | return; | |
2327 | } | |
2328 | dump("c0", c0, status); | |
2329 | dump("c1", c1, status); | |
2330 | dump("c2", c2, status); | |
2331 | if(*c1 == *c2){ | |
2332 | errln("The cloned objects refer to same data"); | |
2333 | } | |
2334 | delete c0; | |
2335 | delete c1; | |
2336 | delete c2; | |
2337 | } | |
2338 | ||
57a6839d A |
2339 | void CollationAPITest::TestCloneBinary() { |
2340 | IcuTestErrorCode errorCode(*this, "TestCloneBinary"); | |
2341 | LocalPointer<Collator> root(Collator::createInstance(Locale::getRoot(), errorCode)); | |
2342 | LocalPointer<Collator> coll(Collator::createInstance("de@collation=phonebook", errorCode)); | |
2343 | if(errorCode.logDataIfFailureAndReset("Collator::createInstance(de@collation=phonebook)")) { | |
2344 | return; | |
2345 | } | |
2346 | RuleBasedCollator *rbRoot = dynamic_cast<RuleBasedCollator *>(root.getAlias()); | |
2347 | RuleBasedCollator *rbc = dynamic_cast<RuleBasedCollator *>(coll.getAlias()); | |
2348 | if(rbRoot == NULL || rbc == NULL) { | |
2349 | infoln("root or de@collation=phonebook is not a RuleBasedCollator"); | |
2350 | return; | |
2351 | } | |
2352 | rbc->setAttribute(UCOL_STRENGTH, UCOL_PRIMARY, errorCode); | |
2353 | UnicodeString uUmlaut((UChar)0xfc); | |
2354 | UnicodeString ue = UNICODE_STRING_SIMPLE("ue"); | |
2355 | assertEquals("rbc/primary: u-umlaut==ue", UCOL_EQUAL, rbc->compare(uUmlaut, ue, errorCode)); | |
2356 | uint8_t bin[25000]; | |
b331163b | 2357 | int32_t binLength = rbc->cloneBinary(bin, UPRV_LENGTHOF(bin), errorCode); |
57a6839d A |
2358 | if(errorCode.logDataIfFailureAndReset("rbc->cloneBinary()")) { |
2359 | return; | |
2360 | } | |
2361 | logln("rbc->cloneBinary() -> %d bytes", (int)binLength); | |
2362 | ||
2363 | RuleBasedCollator rbc2(bin, binLength, rbRoot, errorCode); | |
2364 | if(errorCode.logDataIfFailureAndReset("RuleBasedCollator(rbc binary)")) { | |
2365 | return; | |
2366 | } | |
2367 | assertEquals("rbc2.strength==primary", UCOL_PRIMARY, rbc2.getAttribute(UCOL_STRENGTH, errorCode)); | |
2368 | assertEquals("rbc2: u-umlaut==ue", UCOL_EQUAL, rbc2.compare(uUmlaut, ue, errorCode)); | |
2369 | assertTrue("rbc==rbc2", *rbc == rbc2); | |
2370 | uint8_t bin2[25000]; | |
b331163b | 2371 | int32_t bin2Length = rbc2.cloneBinary(bin2, UPRV_LENGTHOF(bin2), errorCode); |
57a6839d A |
2372 | assertEquals("len(rbc binary)==len(rbc2 binary)", binLength, bin2Length); |
2373 | assertTrue("rbc binary==rbc2 binary", binLength == bin2Length && memcmp(bin, bin2, binLength) == 0); | |
b331163b A |
2374 | |
2375 | RuleBasedCollator rbc3(bin, -1, rbRoot, errorCode); | |
2376 | if(errorCode.logDataIfFailureAndReset("RuleBasedCollator(rbc binary, length<0)")) { | |
2377 | return; | |
2378 | } | |
2379 | assertEquals("rbc3.strength==primary", UCOL_PRIMARY, rbc3.getAttribute(UCOL_STRENGTH, errorCode)); | |
2380 | assertEquals("rbc3: u-umlaut==ue", UCOL_EQUAL, rbc3.compare(uUmlaut, ue, errorCode)); | |
2381 | assertTrue("rbc==rbc3", *rbc == rbc3); | |
57a6839d A |
2382 | } |
2383 | ||
2384 | void CollationAPITest::TestIterNumeric() { | |
2385 | // Regression test for ticket #9915. | |
2386 | // The collation code sometimes masked the continuation marker away | |
2387 | // but later tested the result for isContinuation(). | |
2388 | // This test case failed because the third bytes of the computed numeric-collation primaries | |
2389 | // were permutated with the script reordering table. | |
2390 | // It should have been possible to reproduce this with the root collator | |
2391 | // and characters with appropriate 3-byte primary weights. | |
2392 | // The effectiveness of this test depends completely on the collation elements | |
2393 | // and on the implementation code. | |
2394 | IcuTestErrorCode errorCode(*this, "TestIterNumeric"); | |
2395 | RuleBasedCollator coll(UnicodeString("[reorder Hang Hani]"), errorCode); | |
2396 | if(errorCode.logDataIfFailureAndReset("RuleBasedCollator constructor")) { | |
2397 | return; | |
2398 | } | |
2399 | coll.setAttribute(UCOL_NUMERIC_COLLATION, UCOL_ON, errorCode); | |
2400 | UCharIterator iter40, iter72; | |
2401 | uiter_setUTF8(&iter40, "\x34\x30", 2); | |
2402 | uiter_setUTF8(&iter72, "\x37\x32", 2); | |
2403 | UCollationResult result = coll.compare(iter40, iter72, errorCode); | |
2404 | assertEquals("40<72", (int32_t)UCOL_LESS, (int32_t)result); | |
2405 | } | |
2406 | ||
b331163b A |
2407 | void CollationAPITest::TestBadKeywords() { |
2408 | // Test locale IDs with errors. | |
2409 | // Valid locale IDs are tested via data-driven tests. | |
2410 | UErrorCode errorCode = U_ZERO_ERROR; | |
2411 | Locale bogusLocale(Locale::getRoot()); | |
2412 | bogusLocale.setToBogus(); | |
2413 | LocalPointer<Collator> coll(Collator::createInstance(bogusLocale, errorCode)); | |
2414 | if(errorCode != U_ILLEGAL_ARGUMENT_ERROR) { | |
2415 | errln("Collator::createInstance(bogus locale) did not fail as expected - %s", | |
2416 | u_errorName(errorCode)); | |
2417 | } | |
2418 | ||
2419 | // Unknown value. | |
2420 | const char *localeID = "it-u-ks-xyz"; | |
2421 | errorCode = U_ZERO_ERROR; | |
2422 | coll.adoptInstead(Collator::createInstance(localeID, errorCode)); | |
2423 | if(errorCode != U_ILLEGAL_ARGUMENT_ERROR) { | |
2424 | dataerrln("Collator::createInstance(%s) did not fail as expected - %s", | |
2425 | localeID, u_errorName(errorCode)); | |
2426 | } | |
2427 | ||
2428 | // Unsupported attributes. | |
2429 | localeID = "it@colHiraganaQuaternary=true"; | |
2430 | errorCode = U_ZERO_ERROR; | |
2431 | coll.adoptInstead(Collator::createInstance(localeID, errorCode)); | |
2432 | if(errorCode != U_UNSUPPORTED_ERROR) { | |
2433 | if (errorCode == U_FILE_ACCESS_ERROR) { | |
2434 | dataerrln("Collator::createInstance(it@colHiraganaQuaternary=true) : %s", u_errorName(errorCode)); | |
2435 | } else { | |
2436 | errln("Collator::createInstance(%s) did not fail as expected - %s", | |
2437 | localeID, u_errorName(errorCode)); | |
2438 | } | |
2439 | } | |
2440 | ||
2441 | localeID = "it-u-vt-u24"; | |
2442 | errorCode = U_ZERO_ERROR; | |
2443 | coll.adoptInstead(Collator::createInstance(localeID, errorCode)); | |
2444 | if(errorCode != U_UNSUPPORTED_ERROR) { | |
2445 | if (errorCode == U_ILLEGAL_ARGUMENT_ERROR || errorCode == U_FILE_ACCESS_ERROR) { | |
2446 | dataerrln("Collator::createInstance(it-u-vt-u24) : %s", u_errorName(errorCode)); | |
2447 | } else { | |
2448 | errln("Collator::createInstance(%s) did not fail as expected - %s", | |
2449 | localeID, u_errorName(errorCode)); | |
2450 | } | |
2451 | } | |
2452 | } | |
2453 | ||
73c04bcf A |
2454 | void CollationAPITest::dump(UnicodeString msg, RuleBasedCollator* c, UErrorCode& status) { |
2455 | const char* bigone = "One"; | |
2456 | const char* littleone = "one"; | |
2457 | ||
2458 | logln(msg + " " + c->compare(bigone, littleone) + | |
2459 | " s: " + c->getStrength() + | |
2460 | " u: " + c->getAttribute(UCOL_CASE_FIRST, status)); | |
2461 | } | |
b75a7d8f A |
2462 | void CollationAPITest::runIndexedTest( int32_t index, UBool exec, const char* &name, char* /*par */) |
2463 | { | |
2464 | if (exec) logln("TestSuite CollationAPITest: "); | |
4388f060 A |
2465 | TESTCASE_AUTO_BEGIN; |
2466 | TESTCASE_AUTO(TestProperty); | |
2467 | TESTCASE_AUTO(TestOperators); | |
2468 | TESTCASE_AUTO(TestDuplicate); | |
2469 | TESTCASE_AUTO(TestCompare); | |
2470 | TESTCASE_AUTO(TestHashCode); | |
2471 | TESTCASE_AUTO(TestCollationKey); | |
2472 | TESTCASE_AUTO(TestElemIter); | |
2473 | TESTCASE_AUTO(TestGetAll); | |
2474 | TESTCASE_AUTO(TestRuleBasedColl); | |
2475 | TESTCASE_AUTO(TestDecomposition); | |
2476 | TESTCASE_AUTO(TestSafeClone); | |
2477 | TESTCASE_AUTO(TestSortKey); | |
2478 | TESTCASE_AUTO(TestSortKeyOverflow); | |
2479 | TESTCASE_AUTO(TestMaxExpansion); | |
2480 | TESTCASE_AUTO(TestDisplayName); | |
2481 | TESTCASE_AUTO(TestAttribute); | |
2482 | TESTCASE_AUTO(TestVariableTopSetting); | |
57a6839d | 2483 | TESTCASE_AUTO(TestMaxVariable); |
4388f060 A |
2484 | TESTCASE_AUTO(TestRules); |
2485 | TESTCASE_AUTO(TestGetLocale); | |
2486 | TESTCASE_AUTO(TestBounds); | |
2487 | TESTCASE_AUTO(TestGetTailoredSet); | |
2488 | TESTCASE_AUTO(TestUClassID); | |
2489 | TESTCASE_AUTO(TestSubclass); | |
2490 | TESTCASE_AUTO(TestNULLCharTailoring); | |
2491 | TESTCASE_AUTO(TestClone); | |
57a6839d A |
2492 | TESTCASE_AUTO(TestCloneBinary); |
2493 | TESTCASE_AUTO(TestIterNumeric); | |
b331163b | 2494 | TESTCASE_AUTO(TestBadKeywords); |
4388f060 | 2495 | TESTCASE_AUTO_END; |
b75a7d8f A |
2496 | } |
2497 | ||
2498 | #endif /* #if !UCONFIG_NO_COLLATION */ |