git.saurik.com Git - apple/icu.git/blame_incremental - icuSources/test/cintltst/custrtst.c

... / ...

Commit	Line	Data
	1	/*
	2	******************************************************************************
	3	*
	4	* Copyright (C) 2002-2006, International Business Machines
	5	* Corporation and others. All Rights Reserved.
	6	*
	7	******************************************************************************
	8	* file name: custrtst.c
	9	* encoding: US-ASCII
	10	* tab size: 8 (not used)
	11	* indentation:4
	12	*
	13	* created on: 2002oct09
	14	* created by: Markus W. Scherer
	15	*
	16	* Tests of ustring.h Unicode string API functions.
	17	*/
	18
	19	#include "unicode/ustring.h"
	20	#include "unicode/ucnv.h"
	21	#include "unicode/uiter.h"
	22	#include "cintltst.h"
	23	#include <string.h>
	24
	25	#define LENGTHOF(array) (sizeof(array)/sizeof((array)[0]))
	26
	/*
	 * Get the sign of an integer: -1, 0 or +1.
	 * The zero test uses the argument as given; the sign is taken from its
	 * value converted to int32_t. The result is computed with a comparison
	 * rather than by right-shifting a possibly negative value, which is
	 * implementation-defined in C.
	 * Note: the argument is evaluated twice.
	 */
	#define _SIGN(value) ((value)==0 ? 0 : ((int32_t)(value)<0 ? -1 : 1))
	29
	30	/* test setup --------------------------------------------------------------- */
	31
	32	static void setUpDataTable(void);
	33	static void TestStringCopy(void);
	34	static void TestStringFunctions(void);
	35	static void TestStringSearching(void);
	36	static void TestSurrogateSearching(void);
	37	static void TestUnescape(void);
	38	static void TestCountChar32(void);
	39	static void TestUCharIterator(void);
	40	static void TestUNormIterator(void);
	41	static void TestBadUNormIterator(void);
	42
	43	void addUStringTest(TestNode** root);
	44
	45	void addUStringTest(TestNode** root)
	46	{
	47	addTest(root, &TestStringCopy, "tsutil/custrtst/TestStringCopy");
	48	addTest(root, &TestStringFunctions, "tsutil/custrtst/TestStringFunctions");
	49	addTest(root, &TestStringSearching, "tsutil/custrtst/TestStringSearching");
	50	addTest(root, &TestSurrogateSearching, "tsutil/custrtst/TestSurrogateSearching");
	51	addTest(root, &TestUnescape, "tsutil/custrtst/TestUnescape");
	52	addTest(root, &TestCountChar32, "tsutil/custrtst/TestCountChar32");
	53	addTest(root, &TestUCharIterator, "tsutil/custrtst/TestUCharIterator");
	54	addTest(root, &TestUNormIterator, "tsutil/custrtst/TestUNormIterator");
	55	addTest(root, &TestBadUNormIterator, "tsutil/custrtst/TestBadUNormIterator");
	56	}
	57
	58	/* test data for TestStringFunctions ---------------------------------------- */
	59
	60	UChar*** dataTable = NULL;
	61
	62	static const char* raw[3][4] = {
	63
	64	/* First String */
	65	{ "English_", "French_", "Croatian_", "English_"},
	66	/* Second String */
	67	{ "United States", "France", "Croatia", "Unites States"},
	68
	69	/* Concatenated string */
	70	{ "English_United States", "French_France", "Croatian_Croatia", "English_United States"}
	71	};
	72
	73	static void setUpDataTable()
	74	{
	75	int32_t i,j;
	76	if(dataTable == NULL) {
	77	dataTable = (UChar*)calloc(sizeof(UChar),3);
	78
	79	for (i = 0; i < 3; i++) {
	80	dataTable[i] = (UChar*)calloc(sizeof(UChar),4);
	81	for (j = 0; j < 4; j++){
	82	dataTable[i][j] = (UChar) malloc(sizeof(UChar)(strlen(raw[i][j])+1));
	83	u_uastrcpy(dataTable[i][j],raw[i][j]);
	84	}
	85	}
	86	}
	87	}
	88
	89	static void cleanUpDataTable()
	90	{
	91	int32_t i,j;
	92	if(dataTable != NULL) {
	93	for (i=0; i<3; i++) {
	94	for(j = 0; j<4; j++) {
	95	free(dataTable[i][j]);
	96	}
	97	free(dataTable[i]);
	98	}
	99	free(dataTable);
	100	}
	101	dataTable = NULL;
	102	}
	103
	104	/Tests for u_strcat(),u_strcmp(), u_strlen(), u_strcpy(),u_strncat(),u_strncmp(),u_strncpy, u_uastrcpy(),u_austrcpy(), u_uastrncpy(); /
	105	static void TestStringFunctions()
	106	{
	107	int32_t i,j,k;
	108	UChar temp[512];
	109	UChar nullTemp[512];
	110	char test[512];
	111	char tempOut[512];
	112
	113	setUpDataTable();
	114
	115	log_verbose("Testing u_strlen()\n");
	116	if( u_strlen(dataTable[0][0])!= u_strlen(dataTable[0][3]) \|\| u_strlen(dataTable[0][0]) == u_strlen(dataTable[0][2]))
	117	log_err("There is an error in u_strlen()");
	118
	119	log_verbose("Testing u_memcpy() and u_memcmp()\n");
	120
	121	for(i=0;i<3;++i)
	122	{
	123	for(j=0;j<4;++j)
	124	{
	125	log_verbose("Testing %s\n", u_austrcpy(tempOut, dataTable[i][j]));
	126	temp[0] = 0;
	127	temp[7] = 0xA4; /* Mark the end */
	128	u_memcpy(temp,dataTable[i][j], 7);
	129
	130	if(temp[7] != 0xA4)
	131	log_err("an error occured in u_memcpy()\n");
	132	if(u_memcmp(temp, dataTable[i][j], 7)!=0)
	133	log_err("an error occured in u_memcpy() or u_memcmp()\n");
	134	}
	135	}
	136	if(u_memcmp(dataTable[0][0], dataTable[1][1], 7)==0)
	137	log_err("an error occured in u_memcmp()\n");
	138
	139	log_verbose("Testing u_memset()\n");
	140	nullTemp[0] = 0;
	141	nullTemp[7] = 0;
	142	u_memset(nullTemp, 0xa4, 7);
	143	for (i = 0; i < 7; i++) {
	144	if(nullTemp[i] != 0xa4) {
	145	log_err("an error occured in u_memset()\n");
	146	}
	147	}
	148	if(nullTemp[7] != 0) {
	149	log_err("u_memset() went too far\n");
	150	}
	151
	152	u_memset(nullTemp, 0, 7);
	153	nullTemp[7] = 0xa4;
	154	temp[7] = 0;
	155	u_memcpy(temp,nullTemp, 7);
	156	if(u_memcmp(temp, nullTemp, 7)!=0 \|\| temp[7]!=0)
	157	log_err("an error occured in u_memcpy() or u_memcmp()\n");
	158
	159
	160	log_verbose("Testing u_memmove()\n");
	161	for (i = 0; i < 7; i++) {
	162	temp[i] = (UChar)i;
	163	}
	164	u_memmove(temp + 1, temp, 7);
	165	if(temp[0] != 0) {
	166	log_err("an error occured in u_memmove()\n");
	167	}
	168	for (i = 1; i <= 7; i++) {
	169	if(temp[i] != (i - 1)) {
	170	log_err("an error occured in u_memmove()\n");
	171	}
	172	}
	173
	174	log_verbose("Testing u_strcpy() and u_strcmp()\n");
	175
	176	for(i=0;i<3;++i)
	177	{
	178	for(j=0;j<4;++j)
	179	{
	180	log_verbose("Testing %s\n", u_austrcpy(tempOut, dataTable[i][j]));
	181	temp[0] = 0;
	182	u_strcpy(temp,dataTable[i][j]);
	183
	184	if(u_strcmp(temp,dataTable[i][j])!=0)
	185	log_err("something threw an error in u_strcpy() or u_strcmp()\n");
	186	}
	187	}
	188	if(u_strcmp(dataTable[0][0], dataTable[1][1])==0)
	189	log_err("an error occured in u_memcmp()\n");
	190
	191	log_verbose("testing u_strcat()\n");
	192	i=0;
	193	for(j=0; j<2;++j)
	194	{
	195	u_uastrcpy(temp, "");
	196	u_strcpy(temp,dataTable[i][j]);
	197	u_strcat(temp,dataTable[i+1][j]);
	198	if(u_strcmp(temp,dataTable[i+2][j])!=0)
	199	log_err("something threw an error in u_strcat()\n");
	200
	201	}
	202	log_verbose("Testing u_strncmp()\n");
	203	for(i=0,j=0;j<4; ++j)
	204	{
	205	k=u_strlen(dataTable[i][j]);
	206	if(u_strncmp(dataTable[i][j],dataTable[i+2][j],k)!=0)
	207	log_err("Something threw an error in u_strncmp\n");
	208	}
	209	if(u_strncmp(dataTable[0][0], dataTable[1][1], 7)==0)
	210	log_err("an error occured in u_memcmp()\n");
	211
	212
	213	log_verbose("Testing u_strncat\n");
	214	for(i=0,j=0;j<4; ++j)
	215	{
	216	k=u_strlen(dataTable[i][j]);
	217
	218	u_uastrcpy(temp,"");
	219
	220	if(u_strcmp(u_strncat(temp,dataTable[i+2][j],k),dataTable[i][j])!=0)
	221	log_err("something threw an error in u_strncat or u_uastrcpy()\n");
	222
	223	}
	224
	225	log_verbose("Testing u_strncpy() and u_uastrcpy()\n");
	226	for(i=2,j=0;j<4; ++j)
	227	{
	228	k=u_strlen(dataTable[i][j]);
	229	u_strncpy(temp, dataTable[i][j],k);
	230	temp[k] = 0xa4;
	231
	232	if(u_strncmp(temp, dataTable[i][j],k)!=0)
	233	log_err("something threw an error in u_strncpy()\n");
	234
	235	if(temp[k] != 0xa4)
	236	log_err("something threw an error in u_strncpy()\n");
	237
	238	u_memset(temp, 0x3F, (sizeof(temp) / sizeof(UChar)) - 1);
	239	u_uastrncpy(temp, raw[i][j], k-1);
	240	if(u_strncmp(temp, dataTable[i][j],k-1)!=0)
	241	log_err("something threw an error in u_uastrncpy(k-1)\n");
	242
	243	if(temp[k-1] != 0x3F)
	244	log_err("something threw an error in u_uastrncpy(k-1)\n");
	245
	246	u_memset(temp, 0x3F, (sizeof(temp) / sizeof(UChar)) - 1);
	247	u_uastrncpy(temp, raw[i][j], k+1);
	248	if(u_strcmp(temp, dataTable[i][j])!=0)
	249	log_err("something threw an error in u_uastrncpy(k+1)\n");
	250
	251	if(temp[k] != 0)
	252	log_err("something threw an error in u_uastrncpy(k+1)\n");
	253
	254	u_memset(temp, 0x3F, (sizeof(temp) / sizeof(UChar)) - 1);
	255	u_uastrncpy(temp, raw[i][j], k);
	256	if(u_strncmp(temp, dataTable[i][j], k)!=0)
	257	log_err("something threw an error in u_uastrncpy(k)\n");
	258
	259	if(temp[k] != 0x3F)
	260	log_err("something threw an error in u_uastrncpy(k)\n");
	261	}
	262
	263	log_verbose("Testing u_strchr() and u_memchr()\n");
	264
	265	for(i=2,j=0;j<4;j++)
	266	{
	267	UChar saveVal = dataTable[i][j][0];
	268	UChar *findPtr = u_strchr(dataTable[i][j], 0x005F);
	269	int32_t dataSize = (int32_t)(u_strlen(dataTable[i][j]) + 1);
	270
	271	log_verbose("%s ", u_austrcpy(tempOut, findPtr));
	272
	273	if (findPtr == NULL \|\| *findPtr != 0x005F) {
	274	log_err("u_strchr can't find '_' in the string\n");
	275	}
	276
	277	findPtr = u_strchr32(dataTable[i][j], 0x005F);
	278	if (findPtr == NULL \|\| *findPtr != 0x005F) {
	279	log_err("u_strchr32 can't find '_' in the string\n");
	280	}
	281
	282	findPtr = u_strchr(dataTable[i][j], 0);
	283	if (findPtr != (&(dataTable[i][j][dataSize - 1]))) {
	284	log_err("u_strchr can't find NULL in the string\n");
	285	}
	286
	287	findPtr = u_strchr32(dataTable[i][j], 0);
	288	if (findPtr != (&(dataTable[i][j][dataSize - 1]))) {
	289	log_err("u_strchr32 can't find NULL in the string\n");
	290	}
	291
	292	findPtr = u_memchr(dataTable[i][j], 0, dataSize);
	293	if (findPtr != (&(dataTable[i][j][dataSize - 1]))) {
	294	log_err("u_memchr can't find NULL in the string\n");
	295	}
	296
	297	findPtr = u_memchr32(dataTable[i][j], 0, dataSize);
	298	if (findPtr != (&(dataTable[i][j][dataSize - 1]))) {
	299	log_err("u_memchr32 can't find NULL in the string\n");
	300	}
	301
	302	dataTable[i][j][0] = 0;
	303	/* Make sure we skip over the NULL termination */
	304	findPtr = u_memchr(dataTable[i][j], 0x005F, dataSize);
	305	if (findPtr == NULL \|\| *findPtr != 0x005F) {
	306	log_err("u_memchr can't find '_' in the string\n");
	307	}
	308
	309	findPtr = u_memchr32(dataTable[i][j], 0x005F, dataSize);
	310	if (findPtr == NULL \|\| *findPtr != 0x005F) {
	311	log_err("u_memchr32 can't find '_' in the string\n");
	312	}
	313	findPtr = u_memchr32(dataTable[i][j], 0xFFFD, dataSize);
	314	if (findPtr != NULL) {
	315	log_err("Should have found NULL when the character is not there.\n");
	316	}
	317	dataTable[i][j][0] = saveVal; /* Put it back for the other tests */
	318	}
	319
	320	/*
	321	* test that u_strchr32()
	322	* does not find surrogate code points when they are part of matched pairs
	323	* (= part of supplementary code points)
	324	* Jitterbug 1542
	325	*/
	326	{
	327	static const UChar s[]={
	328	/* 0 1 2 3 4 5 6 7 8 9 */
	329	0x0061, 0xd841, 0xdc02, 0xd841, 0x0062, 0xdc02, 0xd841, 0xdc02, 0x0063, 0
	330	};
	331
	332	if(u_strchr32(s, 0xd841)!=(s+3) \|\| u_strchr32(s, 0xdc02)!=(s+5)) {
	333	log_err("error: u_strchr32(surrogate) finds a partial supplementary code point\n");
	334	}
	335	if(u_memchr32(s, 0xd841, 9)!=(s+3) \|\| u_memchr32(s, 0xdc02, 9)!=(s+5)) {
	336	log_err("error: u_memchr32(surrogate) finds a partial supplementary code point\n");
	337	}
	338	}
	339
	340	log_verbose("Testing u_austrcpy()");
	341	u_austrcpy(test,dataTable[0][0]);
	342	if(strcmp(test,raw[0][0])!=0)
	343	log_err("There is an error in u_austrcpy()");
	344
	345
	346	log_verbose("Testing u_strtok_r()");
	347	{
	348	const char tokString[] = " , 1 2 3 AHHHHH! 5.5 6 7 , 8\n";
	349	const char *tokens[] = {",", "1", "2", "3", "AHHHHH!", "5.5", "6", "7", "8\n"};
	350	UChar delimBuf[sizeof(test)];
	351	UChar currTokenBuf[sizeof(tokString)];
	352	UChar *state;
	353	uint32_t currToken = 0;
	354	UChar *ptr;
	355
	356	u_uastrcpy(temp, tokString);
	357	u_uastrcpy(delimBuf, " ");
	358
	359	ptr = u_strtok_r(temp, delimBuf, &state);
	360	u_uastrcpy(delimBuf, " ,");
	361	while (ptr != NULL) {
	362	u_uastrcpy(currTokenBuf, tokens[currToken]);
	363	if (u_strcmp(ptr, currTokenBuf) != 0) {
	364	log_err("u_strtok_r mismatch at %d. Got: %s, Expected: %s\n", currToken, ptr, tokens[currToken]);
	365	}
	366	ptr = u_strtok_r(NULL, delimBuf, &state);
	367	currToken++;
	368	}
	369
	370	if (currToken != sizeof(tokens)/sizeof(tokens[0])) {
	371	log_err("Didn't get correct number of tokens\n");
	372	}
	373	state = delimBuf; /* Give it an "invalid" saveState */
	374	u_uastrcpy(currTokenBuf, "");
	375	if (u_strtok_r(currTokenBuf, delimBuf, &state) != NULL) {
	376	log_err("Didn't get NULL for empty string\n");
	377	}
	378	if (state != NULL) {
	379	log_err("State should be NULL for empty string\n");
	380	}
	381	state = delimBuf; /* Give it an "invalid" saveState */
	382	u_uastrcpy(currTokenBuf, ", ,");
	383	if (u_strtok_r(currTokenBuf, delimBuf, &state) != NULL) {
	384	log_err("Didn't get NULL for a string of delimiters\n");
	385	}
	386	if (state != NULL) {
	387	log_err("State should be NULL for a string of delimiters\n");
	388	}
	389
	390	state = delimBuf; /* Give it an "invalid" saveState */
	391	u_uastrcpy(currTokenBuf, "q, ,");
	392	if (u_strtok_r(currTokenBuf, delimBuf, &state) == NULL) {
	393	log_err("Got NULL for a string that does not begin with delimiters\n");
	394	}
	395	if (u_strtok_r(NULL, delimBuf, &state) != NULL) {
	396	log_err("Didn't get NULL for a string that ends in delimiters\n");
	397	}
	398	if (state != NULL) {
	399	log_err("State should be NULL for empty string\n");
	400	}
	401
	402	state = delimBuf; /* Give it an "invalid" saveState */
	403	u_uastrcpy(currTokenBuf, tokString);
	404	u_uastrcpy(temp, tokString);
	405	u_uastrcpy(delimBuf, "q"); /* Give it a delimiter that it can't find. */
	406	ptr = u_strtok_r(currTokenBuf, delimBuf, &state);
	407	if (ptr == NULL \|\| u_strcmp(ptr, temp) != 0) {
	408	log_err("Should have recieved the same string when there are no delimiters\n");
	409	}
	410	if (u_strtok_r(NULL, delimBuf, &state) != NULL) {
	411	log_err("Should not have found another token in a one token string\n");
	412	}
	413	}
	414
	415	/* test u_strcmpCodePointOrder() */
	416	{
	417	/* these strings are in ascending order */
	418	static const UChar strings[][4]={
	419	{ 0x61, 0 }, /* U+0061 */
	420	{ 0x20ac, 0xd801, 0 }, /* U+20ac U+d801 */
	421	{ 0x20ac, 0xd800, 0xdc00, 0 }, /* U+20ac U+10000 */
	422	{ 0xd800, 0 }, /* U+d800 */
	423	{ 0xd800, 0xff61, 0 }, /* U+d800 U+ff61 */
	424	{ 0xdfff, 0 }, /* U+dfff */
	425	{ 0xff61, 0xdfff, 0 }, /* U+ff61 U+dfff */
	426	{ 0xff61, 0xd800, 0xdc02, 0 }, /* U+ff61 U+10002 */
	427	{ 0xd800, 0xdc02, 0 }, /* U+10002 */
	428	{ 0xd84d, 0xdc56, 0 } /* U+23456 */
	429	};
	430
	431	UCharIterator iter1, iter2;
	432	int32_t len1, len2, r1, r2;
	433
	434	for(i=0; i<(sizeof(strings)/sizeof(strings[0])-1); ++i) {
	435	if(u_strcmpCodePointOrder(strings[i], strings[i+1])>=0) {
	436	log_err("error: u_strcmpCodePointOrder() fails for string %d and the following one\n", i);
	437	}
	438	if(u_strncmpCodePointOrder(strings[i], strings[i+1], 10)>=0) {
	439	log_err("error: u_strncmpCodePointOrder() fails for string %d and the following one\n", i);
	440	}
	441
	442	/* There are at least 2 UChars in each string - verify that strncmp()==memcmp(). */
	443	if(u_strncmpCodePointOrder(strings[i], strings[i+1], 2)!=u_memcmpCodePointOrder(strings[i], strings[i+1], 2)) {
	444	log_err("error: u_strncmpCodePointOrder(2)!=u_memcmpCodePointOrder(2) for string %d and the following one\n", i);
	445	}
	446
	447	/* test u_strCompare(TRUE) */
	448	len1=u_strlen(strings[i]);
	449	len2=u_strlen(strings[i+1]);
	450	if( u_strCompare(strings[i], -1, strings[i+1], -1, TRUE)>=0 \|\|
	451	u_strCompare(strings[i], -1, strings[i+1], len2, TRUE)>=0 \|\|
	452	u_strCompare(strings[i], len1, strings[i+1], -1, TRUE)>=0 \|\|
	453	u_strCompare(strings[i], len1, strings[i+1], len2, TRUE)>=0
	454	) {
	455	log_err("error: u_strCompare(code point order) fails for string %d and the following one\n", i);
	456	}
	457
	458	/* test u_strCompare(FALSE) */
	459	r1=u_strCompare(strings[i], -1, strings[i+1], -1, FALSE);
	460	r2=u_strcmp(strings[i], strings[i+1]);
	461	if(_SIGN(r1)!=_SIGN(r2)) {
	462	log_err("error: u_strCompare(code unit order)!=u_strcmp() for string %d and the following one\n", i);
	463	}
	464
	465	/* test u_strCompareIter() */
	466	uiter_setString(&iter1, strings[i], len1);
	467	uiter_setString(&iter2, strings[i+1], len2);
	468	if(u_strCompareIter(&iter1, &iter2, TRUE)>=0) {
	469	log_err("error: u_strCompareIter(code point order) fails for string %d and the following one\n", i);
	470	}
	471	r1=u_strCompareIter(&iter1, &iter2, FALSE);
	472	if(_SIGN(r1)!=_SIGN(u_strcmp(strings[i], strings[i+1]))) {
	473	log_err("error: u_strCompareIter(code unit order)!=u_strcmp() for string %d and the following one\n", i);
	474	}
	475	}
	476	}
	477
	478	cleanUpDataTable();
	479	}
	480
	481	static void TestStringSearching()
	482	{
	483	const UChar testString[] = {0x0061, 0x0062, 0x0063, 0x0064, 0x0064, 0x0061, 0};
	484	const UChar testSurrogateString[] = {0xdbff, 0x0061, 0x0062, 0xdbff, 0xdfff, 0x0063, 0x0064, 0x0064, 0xdbff, 0xdfff, 0xdb00, 0xdf00, 0x0061, 0};
	485	const UChar surrMatchSet1[] = {0xdbff, 0xdfff, 0};
	486	const UChar surrMatchSet2[] = {0x0061, 0x0062, 0xdbff, 0xdfff, 0};
	487	const UChar surrMatchSet3[] = {0xdb00, 0xdf00, 0xdbff, 0xdfff, 0};
	488	const UChar surrMatchSet4[] = {0x0000};
	489	const UChar surrMatchSetBad[] = {0xdbff, 0x0061, 0};
	490	const UChar surrMatchSetBad2[] = {0x0061, 0xdbff, 0};
	491	const UChar surrMatchSetBad3[] = {0xdbff, 0x0061, 0x0062, 0xdbff, 0xdfff, 0}; /* has partial surrogate */
	492	const UChar
	493	empty[] = { 0 },
	494	a[] = { 0x61, 0 },
	495	ab[] = { 0x61, 0x62, 0 },
	496	ba[] = { 0x62, 0x61, 0 },
	497	abcd[] = { 0x61, 0x62, 0x63, 0x64, 0 },
	498	cd[] = { 0x63, 0x64, 0 },
	499	dc[] = { 0x64, 0x63, 0 },
	500	cdh[] = { 0x63, 0x64, 0x68, 0 },
	501	f[] = { 0x66, 0 },
	502	fg[] = { 0x66, 0x67, 0 },
	503	gf[] = { 0x67, 0x66, 0 };
	504
	505	log_verbose("Testing u_strpbrk()");
	506
	507	if (u_strpbrk(testString, a) != &testString[0]) {
	508	log_err("u_strpbrk couldn't find first letter a.\n");
	509	}
	510	if (u_strpbrk(testString, dc) != &testString[2]) {
	511	log_err("u_strpbrk couldn't find d or c.\n");
	512	}
	513	if (u_strpbrk(testString, cd) != &testString[2]) {
	514	log_err("u_strpbrk couldn't find c or d.\n");
	515	}
	516	if (u_strpbrk(testString, cdh) != &testString[2]) {
	517	log_err("u_strpbrk couldn't find c, d or h.\n");
	518	}
	519	if (u_strpbrk(testString, f) != NULL) {
	520	log_err("u_strpbrk didn't return NULL for \"f\".\n");
	521	}
	522	if (u_strpbrk(testString, fg) != NULL) {
	523	log_err("u_strpbrk didn't return NULL for \"fg\".\n");
	524	}
	525	if (u_strpbrk(testString, gf) != NULL) {
	526	log_err("u_strpbrk didn't return NULL for \"gf\".\n");
	527	}
	528	if (u_strpbrk(testString, empty) != NULL) {
	529	log_err("u_strpbrk didn't return NULL for \"\".\n");
	530	}
	531
	532	log_verbose("Testing u_strpbrk() with surrogates");
	533
	534	if (u_strpbrk(testSurrogateString, a) != &testSurrogateString[1]) {
	535	log_err("u_strpbrk couldn't find first letter a.\n");
	536	}
	537	if (u_strpbrk(testSurrogateString, dc) != &testSurrogateString[5]) {
	538	log_err("u_strpbrk couldn't find d or c.\n");
	539	}
	540	if (u_strpbrk(testSurrogateString, cd) != &testSurrogateString[5]) {
	541	log_err("u_strpbrk couldn't find c or d.\n");
	542	}
	543	if (u_strpbrk(testSurrogateString, cdh) != &testSurrogateString[5]) {
	544	log_err("u_strpbrk couldn't find c, d or h.\n");
	545	}
	546	if (u_strpbrk(testSurrogateString, f) != NULL) {
	547	log_err("u_strpbrk didn't return NULL for \"f\".\n");
	548	}
	549	if (u_strpbrk(testSurrogateString, fg) != NULL) {
	550	log_err("u_strpbrk didn't return NULL for \"fg\".\n");
	551	}
	552	if (u_strpbrk(testSurrogateString, gf) != NULL) {
	553	log_err("u_strpbrk didn't return NULL for \"gf\".\n");
	554	}
	555	if (u_strpbrk(testSurrogateString, surrMatchSet1) != &testSurrogateString[3]) {
	556	log_err("u_strpbrk couldn't find \"0xdbff, 0xdfff\".\n");
	557	}
	558	if (u_strpbrk(testSurrogateString, surrMatchSet2) != &testSurrogateString[1]) {
	559	log_err("u_strpbrk couldn't find \"0xdbff, a, b, 0xdbff, 0xdfff\".\n");
	560	}
	561	if (u_strpbrk(testSurrogateString, surrMatchSet3) != &testSurrogateString[3]) {
	562	log_err("u_strpbrk couldn't find \"0xdb00, 0xdf00, 0xdbff, 0xdfff\".\n");
	563	}
	564	if (u_strpbrk(testSurrogateString, surrMatchSet4) != NULL) {
	565	log_err("u_strpbrk should have returned NULL for empty string.\n");
	566	}
	567	if (u_strpbrk(testSurrogateString, surrMatchSetBad) != &testSurrogateString[0]) {
	568	log_err("u_strpbrk should have found bad surrogate.\n");
	569	}
	570
	571	log_verbose("Testing u_strcspn()");
	572
	573	if (u_strcspn(testString, a) != 0) {
	574	log_err("u_strcspn couldn't find first letter a.\n");
	575	}
	576	if (u_strcspn(testString, dc) != 2) {
	577	log_err("u_strcspn couldn't find d or c.\n");
	578	}
	579	if (u_strcspn(testString, cd) != 2) {
	580	log_err("u_strcspn couldn't find c or d.\n");
	581	}
	582	if (u_strcspn(testString, cdh) != 2) {
	583	log_err("u_strcspn couldn't find c, d or h.\n");
	584	}
	585	if (u_strcspn(testString, f) != u_strlen(testString)) {
	586	log_err("u_strcspn didn't return NULL for \"f\".\n");
	587	}
	588	if (u_strcspn(testString, fg) != u_strlen(testString)) {
	589	log_err("u_strcspn didn't return NULL for \"fg\".\n");
	590	}
	591	if (u_strcspn(testString, gf) != u_strlen(testString)) {
	592	log_err("u_strcspn didn't return NULL for \"gf\".\n");
	593	}
	594
	595	log_verbose("Testing u_strcspn() with surrogates");
	596
	597	if (u_strcspn(testSurrogateString, a) != 1) {
	598	log_err("u_strcspn couldn't find first letter a.\n");
	599	}
	600	if (u_strcspn(testSurrogateString, dc) != 5) {
	601	log_err("u_strcspn couldn't find d or c.\n");
	602	}
	603	if (u_strcspn(testSurrogateString, cd) != 5) {
	604	log_err("u_strcspn couldn't find c or d.\n");
	605	}
	606	if (u_strcspn(testSurrogateString, cdh) != 5) {
	607	log_err("u_strcspn couldn't find c, d or h.\n");
	608	}
	609	if (u_strcspn(testSurrogateString, f) != u_strlen(testSurrogateString)) {
	610	log_err("u_strcspn didn't return NULL for \"f\".\n");
	611	}
	612	if (u_strcspn(testSurrogateString, fg) != u_strlen(testSurrogateString)) {
	613	log_err("u_strcspn didn't return NULL for \"fg\".\n");
	614	}
	615	if (u_strcspn(testSurrogateString, gf) != u_strlen(testSurrogateString)) {
	616	log_err("u_strcspn didn't return NULL for \"gf\".\n");
	617	}
	618	if (u_strcspn(testSurrogateString, surrMatchSet1) != 3) {
	619	log_err("u_strcspn couldn't find \"0xdbff, 0xdfff\".\n");
	620	}
	621	if (u_strcspn(testSurrogateString, surrMatchSet2) != 1) {
	622	log_err("u_strcspn couldn't find \"a, b, 0xdbff, 0xdfff\".\n");
	623	}
	624	if (u_strcspn(testSurrogateString, surrMatchSet3) != 3) {
	625	log_err("u_strcspn couldn't find \"0xdb00, 0xdf00, 0xdbff, 0xdfff\".\n");
	626	}
	627	if (u_strcspn(testSurrogateString, surrMatchSet4) != u_strlen(testSurrogateString)) {
	628	log_err("u_strcspn should have returned strlen for empty string.\n");
	629	}
	630
	631
	632	log_verbose("Testing u_strspn()");
	633
	634	if (u_strspn(testString, a) != 1) {
	635	log_err("u_strspn couldn't skip first letter a.\n");
	636	}
	637	if (u_strspn(testString, ab) != 2) {
	638	log_err("u_strspn couldn't skip a or b.\n");
	639	}
	640	if (u_strspn(testString, ba) != 2) {
	641	log_err("u_strspn couldn't skip a or b.\n");
	642	}
	643	if (u_strspn(testString, f) != 0) {
	644	log_err("u_strspn didn't return 0 for \"f\".\n");
	645	}
	646	if (u_strspn(testString, dc) != 0) {
	647	log_err("u_strspn couldn't find first letter a (skip d or c).\n");
	648	}
	649	if (u_strspn(testString, abcd) != u_strlen(testString)) {
	650	log_err("u_strspn couldn't skip over the whole string.\n");
	651	}
	652	if (u_strspn(testString, empty) != 0) {
	653	log_err("u_strspn should have returned 0 for empty string.\n");
	654	}
	655
	656	log_verbose("Testing u_strspn() with surrogates");
	657	if (u_strspn(testSurrogateString, surrMatchSetBad) != 2) {
	658	log_err("u_strspn couldn't skip 0xdbff or a.\n");
	659	}
	660	if (u_strspn(testSurrogateString, surrMatchSetBad2) != 2) {
	661	log_err("u_strspn couldn't skip 0xdbff or a.\n");
	662	}
	663	if (u_strspn(testSurrogateString, f) != 0) {
	664	log_err("u_strspn couldn't skip d or c (skip first letter).\n");
	665	}
	666	if (u_strspn(testSurrogateString, dc) != 0) {
	667	log_err("u_strspn couldn't skip d or c (skip first letter).\n");
	668	}
	669	if (u_strspn(testSurrogateString, cd) != 0) {
	670	log_err("u_strspn couldn't skip d or c (skip first letter).\n");
	671	}
	672	if (u_strspn(testSurrogateString, testSurrogateString) != u_strlen(testSurrogateString)) {
	673	log_err("u_strspn couldn't skip whole string.\n");
	674	}
	675	if (u_strspn(testSurrogateString, surrMatchSet1) != 0) {
	676	log_err("u_strspn couldn't skip \"0xdbff, 0xdfff\" (get first letter).\n");
	677	}
	678	if (u_strspn(testSurrogateString, surrMatchSetBad3) != 5) {
	679	log_err("u_strspn couldn't skip \"0xdbff, a, b, 0xdbff, 0xdfff\".\n");
	680	}
	681	if (u_strspn(testSurrogateString, surrMatchSet4) != 0) {
	682	log_err("u_strspn should have returned 0 for empty string.\n");
	683	}
	684	}
	685
	686	/*
	687	* All binary Unicode string searches should behave the same for equivalent input.
	688	* See Jitterbug 2145.
	689	* There are some new functions, too - just test them all.
	690	*/
	691	static void
	692	TestSurrogateSearching() {
	693	static const UChar s[]={
	694	/* 0 1 2 3 4 5 6 7 8 9 10 11 */
	695	0x61, 0xd801, 0xdc02, 0x61, 0xdc02, 0x61, 0xd801, 0x61, 0xd801, 0xdc02, 0x61, 0
	696	}, sub_a[]={
	697	0x61, 0
	698	}, sub_b[]={
	699	0x62, 0
	700	}, sub_lead[]={
	701	0xd801, 0
	702	}, sub_trail[]={
	703	0xdc02, 0
	704	}, sub_supp[]={
	705	0xd801, 0xdc02, 0
	706	}, sub_supp2[]={
	707	0xd801, 0xdc03, 0
	708	}, sub_a_lead[]={
	709	0x61, 0xd801, 0
	710	}, sub_trail_a[]={
	711	0xdc02, 0x61, 0
	712	}, sub_aba[]={
	713	0x61, 0x62, 0x61, 0
	714	};
	715	static const UChar a=0x61, b=0x62, lead=0xd801, trail=0xdc02, nul=0;
	716	static const UChar32 supp=0x10402, supp2=0x10403, ill=0x123456;
	717
	718	const UChar first, last;
	719
	720	/* search for NUL code point: find end of string */
	721	first=s+u_strlen(s);
	722
	723	if(
	724	first!=u_strchr(s, nul) \|\|
	725	first!=u_strchr32(s, nul) \|\|
	726	first!=u_memchr(s, nul, LENGTHOF(s)) \|\|
	727	first!=u_memchr32(s, nul, LENGTHOF(s)) \|\|
	728	first!=u_strrchr(s, nul) \|\|
	729	first!=u_strrchr32(s, nul) \|\|
	730	first!=u_memrchr(s, nul, LENGTHOF(s)) \|\|
	731	first!=u_memrchr32(s, nul, LENGTHOF(s))
	732	) {
	733	log_err("error: one of the u_str[\|mem][r]chr[32](s, nul) does not find the terminator of s\n");
	734	}
	735
	736	/* search for empty substring: find beginning of string */
	737	if(
	738	s!=u_strstr(s, &nul) \|\|
	739	s!=u_strFindFirst(s, -1, &nul, -1) \|\|
	740	s!=u_strFindFirst(s, -1, &nul, 0) \|\|
	741	s!=u_strFindFirst(s, LENGTHOF(s), &nul, -1) \|\|
	742	s!=u_strFindFirst(s, LENGTHOF(s), &nul, 0) \|\|
	743	s!=u_strrstr(s, &nul) \|\|
	744	s!=u_strFindLast(s, -1, &nul, -1) \|\|
	745	s!=u_strFindLast(s, -1, &nul, 0) \|\|
	746	s!=u_strFindLast(s, LENGTHOF(s), &nul, -1) \|\|
	747	s!=u_strFindLast(s, LENGTHOF(s), &nul, 0)
	748	) {
	749	log_err("error: one of the u_str[str etc](s, \"\") does not find s itself\n");
	750	}
	751
	752	/* find 'a' in s[1..10[ */
	753	first=s+3;
	754	last=s+7;
	755	if(
	756	first!=u_strchr(s+1, a) \|\|
	757	first!=u_strchr32(s+1, a) \|\|
	758	first!=u_memchr(s+1, a, 9) \|\|
	759	first!=u_memchr32(s+1, a, 9) \|\|
	760	first!=u_strstr(s+1, sub_a) \|\|
	761	first!=u_strFindFirst(s+1, -1, sub_a, -1) \|\|
	762	first!=u_strFindFirst(s+1, -1, &a, 1) \|\|
	763	first!=u_strFindFirst(s+1, 9, sub_a, -1) \|\|
	764	first!=u_strFindFirst(s+1, 9, &a, 1) \|\|
	765	(s+10)!=u_strrchr(s+1, a) \|\|
	766	(s+10)!=u_strrchr32(s+1, a) \|\|
	767	last!=u_memrchr(s+1, a, 9) \|\|
	768	last!=u_memrchr32(s+1, a, 9) \|\|
	769	(s+10)!=u_strrstr(s+1, sub_a) \|\|
	770	(s+10)!=u_strFindLast(s+1, -1, sub_a, -1) \|\|
	771	(s+10)!=u_strFindLast(s+1, -1, &a, 1) \|\|
	772	last!=u_strFindLast(s+1, 9, sub_a, -1) \|\|
	773	last!=u_strFindLast(s+1, 9, &a, 1)
	774	) {
	775	log_err("error: one of the u_str[chr etc]('a') does not find the correct place\n");
	776	}
	777
	778	/* do not find 'b' in s[1..10[ */
	779	if(
	780	NULL!=u_strchr(s+1, b) \|\|
	781	NULL!=u_strchr32(s+1, b) \|\|
	782	NULL!=u_memchr(s+1, b, 9) \|\|
	783	NULL!=u_memchr32(s+1, b, 9) \|\|
	784	NULL!=u_strstr(s+1, sub_b) \|\|
	785	NULL!=u_strFindFirst(s+1, -1, sub_b, -1) \|\|
	786	NULL!=u_strFindFirst(s+1, -1, &b, 1) \|\|
	787	NULL!=u_strFindFirst(s+1, 9, sub_b, -1) \|\|
	788	NULL!=u_strFindFirst(s+1, 9, &b, 1) \|\|
	789	NULL!=u_strrchr(s+1, b) \|\|
	790	NULL!=u_strrchr32(s+1, b) \|\|
	791	NULL!=u_memrchr(s+1, b, 9) \|\|
	792	NULL!=u_memrchr32(s+1, b, 9) \|\|
	793	NULL!=u_strrstr(s+1, sub_b) \|\|
	794	NULL!=u_strFindLast(s+1, -1, sub_b, -1) \|\|
	795	NULL!=u_strFindLast(s+1, -1, &b, 1) \|\|
	796	NULL!=u_strFindLast(s+1, 9, sub_b, -1) \|\|
	797	NULL!=u_strFindLast(s+1, 9, &b, 1)
	798	) {
	799	log_err("error: one of the u_str[chr etc]('b') incorrectly finds something\n");
	800	}
	801
	802	/* do not find a non-code point in s[1..10[ */
	803	if(
	804	NULL!=u_strchr32(s+1, ill) \|\|
	805	NULL!=u_memchr32(s+1, ill, 9) \|\|
	806	NULL!=u_strrchr32(s+1, ill) \|\|
	807	NULL!=u_memrchr32(s+1, ill, 9)
	808	) {
	809	log_err("error: one of the u_str[chr etc](illegal code point) incorrectly finds something\n");
	810	}
	811
	812	/* find U+d801 in s[1..10[ */
	813	first=s+6;
	814	if(
	815	first!=u_strchr(s+1, lead) \|\|
	816	first!=u_strchr32(s+1, lead) \|\|
	817	first!=u_memchr(s+1, lead, 9) \|\|
	818	first!=u_memchr32(s+1, lead, 9) \|\|
	819	first!=u_strstr(s+1, sub_lead) \|\|
	820	first!=u_strFindFirst(s+1, -1, sub_lead, -1) \|\|
	821	first!=u_strFindFirst(s+1, -1, &lead, 1) \|\|
	822	first!=u_strFindFirst(s+1, 9, sub_lead, -1) \|\|
	823	first!=u_strFindFirst(s+1, 9, &lead, 1) \|\|
	824	first!=u_strrchr(s+1, lead) \|\|
	825	first!=u_strrchr32(s+1, lead) \|\|
	826	first!=u_memrchr(s+1, lead, 9) \|\|
	827	first!=u_memrchr32(s+1, lead, 9) \|\|
	828	first!=u_strrstr(s+1, sub_lead) \|\|
	829	first!=u_strFindLast(s+1, -1, sub_lead, -1) \|\|
	830	first!=u_strFindLast(s+1, -1, &lead, 1) \|\|
	831	first!=u_strFindLast(s+1, 9, sub_lead, -1) \|\|
	832	first!=u_strFindLast(s+1, 9, &lead, 1)
	833	) {
	834	log_err("error: one of the u_str[chr etc](U+d801) does not find the correct place\n");
	835	}
	836
	837	/* find U+dc02 in s[1..10[ */
	838	first=s+4;
	839	if(
	840	first!=u_strchr(s+1, trail) \|\|
	841	first!=u_strchr32(s+1, trail) \|\|
	842	first!=u_memchr(s+1, trail, 9) \|\|
	843	first!=u_memchr32(s+1, trail, 9) \|\|
	844	first!=u_strstr(s+1, sub_trail) \|\|
	845	first!=u_strFindFirst(s+1, -1, sub_trail, -1) \|\|
	846	first!=u_strFindFirst(s+1, -1, &trail, 1) \|\|
	847	first!=u_strFindFirst(s+1, 9, sub_trail, -1) \|\|
	848	first!=u_strFindFirst(s+1, 9, &trail, 1) \|\|
	849	first!=u_strrchr(s+1, trail) \|\|
	850	first!=u_strrchr32(s+1, trail) \|\|
	851	first!=u_memrchr(s+1, trail, 9) \|\|
	852	first!=u_memrchr32(s+1, trail, 9) \|\|
	853	first!=u_strrstr(s+1, sub_trail) \|\|
	854	first!=u_strFindLast(s+1, -1, sub_trail, -1) \|\|
	855	first!=u_strFindLast(s+1, -1, &trail, 1) \|\|
	856	first!=u_strFindLast(s+1, 9, sub_trail, -1) \|\|
	857	first!=u_strFindLast(s+1, 9, &trail, 1)
	858	) {
	859	log_err("error: one of the u_str[chr etc](U+dc02) does not find the correct place\n");
	860	}
	861
	862	/* find U+10402 in s[1..10[ */
	863	first=s+1;
	864	last=s+8;
	865	if(
	866	first!=u_strchr32(s+1, supp) \|\|
	867	first!=u_memchr32(s+1, supp, 9) \|\|
	868	first!=u_strstr(s+1, sub_supp) \|\|
	869	first!=u_strFindFirst(s+1, -1, sub_supp, -1) \|\|
	870	first!=u_strFindFirst(s+1, -1, sub_supp, 2) \|\|
	871	first!=u_strFindFirst(s+1, 9, sub_supp, -1) \|\|
	872	first!=u_strFindFirst(s+1, 9, sub_supp, 2) \|\|
	873	last!=u_strrchr32(s+1, supp) \|\|
	874	last!=u_memrchr32(s+1, supp, 9) \|\|
	875	last!=u_strrstr(s+1, sub_supp) \|\|
	876	last!=u_strFindLast(s+1, -1, sub_supp, -1) \|\|
	877	last!=u_strFindLast(s+1, -1, sub_supp, 2) \|\|
	878	last!=u_strFindLast(s+1, 9, sub_supp, -1) \|\|
	879	last!=u_strFindLast(s+1, 9, sub_supp, 2)
	880	) {
	881	log_err("error: one of the u_str[chr etc](U+10402) does not find the correct place\n");
	882	}
	883
	884	/* do not find U+10402 in a single UChar */
	885	if(
	886	NULL!=u_memchr32(s+1, supp, 1) \|\|
	887	NULL!=u_strFindFirst(s+1, 1, sub_supp, -1) \|\|
	888	NULL!=u_strFindFirst(s+1, 1, sub_supp, 2) \|\|
	889	NULL!=u_memrchr32(s+1, supp, 1) \|\|
	890	NULL!=u_strFindLast(s+1, 1, sub_supp, -1) \|\|
	891	NULL!=u_strFindLast(s+1, 1, sub_supp, 2) \|\|
	892	NULL!=u_memrchr32(s+2, supp, 1) \|\|
	893	NULL!=u_strFindLast(s+2, 1, sub_supp, -1) \|\|
	894	NULL!=u_strFindLast(s+2, 1, sub_supp, 2)
	895	) {
	896	log_err("error: one of the u_str[chr etc](U+10402) incorrectly finds a supplementary c.p. in a single UChar\n");
	897	}
	898
	899	/* do not find U+10403 in s[1..10[ */
	900	if(
	901	NULL!=u_strchr32(s+1, supp2) \|\|
	902	NULL!=u_memchr32(s+1, supp2, 9) \|\|
	903	NULL!=u_strstr(s+1, sub_supp2) \|\|
	904	NULL!=u_strFindFirst(s+1, -1, sub_supp2, -1) \|\|
	905	NULL!=u_strFindFirst(s+1, -1, sub_supp2, 2) \|\|
	906	NULL!=u_strFindFirst(s+1, 9, sub_supp2, -1) \|\|
	907	NULL!=u_strFindFirst(s+1, 9, sub_supp2, 2) \|\|
	908	NULL!=u_strrchr32(s+1, supp2) \|\|
	909	NULL!=u_memrchr32(s+1, supp2, 9) \|\|
	910	NULL!=u_strrstr(s+1, sub_supp2) \|\|
	911	NULL!=u_strFindLast(s+1, -1, sub_supp2, -1) \|\|
	912	NULL!=u_strFindLast(s+1, -1, sub_supp2, 2) \|\|
	913	NULL!=u_strFindLast(s+1, 9, sub_supp2, -1) \|\|
	914	NULL!=u_strFindLast(s+1, 9, sub_supp2, 2)
	915	) {
	916	log_err("error: one of the u_str[chr etc](U+10403) incorrectly finds something\n");
	917	}
	918
	919	/* find <0061 d801> in s[1..10[ */
	920	first=s+5;
	921	if(
	922	first!=u_strstr(s+1, sub_a_lead) \|\|
	923	first!=u_strFindFirst(s+1, -1, sub_a_lead, -1) \|\|
	924	first!=u_strFindFirst(s+1, -1, sub_a_lead, 2) \|\|
	925	first!=u_strFindFirst(s+1, 9, sub_a_lead, -1) \|\|
	926	first!=u_strFindFirst(s+1, 9, sub_a_lead, 2) \|\|
	927	first!=u_strrstr(s+1, sub_a_lead) \|\|
	928	first!=u_strFindLast(s+1, -1, sub_a_lead, -1) \|\|
	929	first!=u_strFindLast(s+1, -1, sub_a_lead, 2) \|\|
	930	first!=u_strFindLast(s+1, 9, sub_a_lead, -1) \|\|
	931	first!=u_strFindLast(s+1, 9, sub_a_lead, 2)
	932	) {
	933	log_err("error: one of the u_str[str etc](<0061 d801>) does not find the correct place\n");
	934	}
	935
	936	/* find <dc02 0061> in s[1..10[ */
	937	first=s+4;
	938	if(
	939	first!=u_strstr(s+1, sub_trail_a) \|\|
	940	first!=u_strFindFirst(s+1, -1, sub_trail_a, -1) \|\|
	941	first!=u_strFindFirst(s+1, -1, sub_trail_a, 2) \|\|
	942	first!=u_strFindFirst(s+1, 9, sub_trail_a, -1) \|\|
	943	first!=u_strFindFirst(s+1, 9, sub_trail_a, 2) \|\|
	944	first!=u_strrstr(s+1, sub_trail_a) \|\|
	945	first!=u_strFindLast(s+1, -1, sub_trail_a, -1) \|\|
	946	first!=u_strFindLast(s+1, -1, sub_trail_a, 2) \|\|
	947	first!=u_strFindLast(s+1, 9, sub_trail_a, -1) \|\|
	948	first!=u_strFindLast(s+1, 9, sub_trail_a, 2)
	949	) {
	950	log_err("error: one of the u_str[str etc](<dc02 0061>) does not find the correct place\n");
	951	}
	952
	953	/* do not find "aba" in s[1..10[ */
	954	if(
	955	NULL!=u_strstr(s+1, sub_aba) \|\|
	956	NULL!=u_strFindFirst(s+1, -1, sub_aba, -1) \|\|
	957	NULL!=u_strFindFirst(s+1, -1, sub_aba, 3) \|\|
	958	NULL!=u_strFindFirst(s+1, 9, sub_aba, -1) \|\|
	959	NULL!=u_strFindFirst(s+1, 9, sub_aba, 3) \|\|
	960	NULL!=u_strrstr(s+1, sub_aba) \|\|
	961	NULL!=u_strFindLast(s+1, -1, sub_aba, -1) \|\|
	962	NULL!=u_strFindLast(s+1, -1, sub_aba, 3) \|\|
	963	NULL!=u_strFindLast(s+1, 9, sub_aba, -1) \|\|
	964	NULL!=u_strFindLast(s+1, 9, sub_aba, 3)
	965	) {
	966	log_err("error: one of the u_str[str etc](\"aba\") incorrectly finds something\n");
	967	}
	968	}
	969
	970	static void TestStringCopy()
	971	{
	972	UChar temp[40];
	973	UChar *result=0;
	974	UChar subString[5];
	975	UChar uchars[]={0x61, 0x62, 0x63, 0x00};
	976	char charOut[40];
	977	char chars[]="abc"; /* needs default codepage */
	978
	979	log_verbose("Testing u_uastrncpy() and u_uastrcpy()");
	980
	981	u_uastrcpy(temp, "abc");
	982	if(u_strcmp(temp, uchars) != 0) {
	983	log_err("There is an error in u_uastrcpy() Expected %s Got %s\n", austrdup(uchars), austrdup(temp));
	984	}
	985
	986	temp[0] = 0xFB; /* load garbage into it */
	987	temp[1] = 0xFB;
	988	temp[2] = 0xFB;
	989	temp[3] = 0xFB;
	990
	991	u_uastrncpy(temp, "abcabcabc", 3);
	992	if(u_strncmp(uchars, temp, 3) != 0){
	993	log_err("There is an error in u_uastrncpy() Expected %s Got %s\n", austrdup(uchars), austrdup(temp));
	994	}
	995	if(temp[3] != 0xFB) {
	996	log_err("u_uastrncpy wrote past it's bounds. Expected undisturbed byte at 3\n");
	997	}
	998
	999	charOut[0] = (char)0x7B; /* load garbage into it */
	1000	charOut[1] = (char)0x7B;
	1001	charOut[2] = (char)0x7B;
	1002	charOut[3] = (char)0x7B;
	1003
	1004	temp[0] = 0x0061;
	1005	temp[1] = 0x0062;
	1006	temp[2] = 0x0063;
	1007	temp[3] = 0x0061;
	1008	temp[4] = 0x0062;
	1009	temp[5] = 0x0063;
	1010	temp[6] = 0x0000;
	1011
	1012	u_austrncpy(charOut, temp, 3);
	1013	if(strncmp(chars, charOut, 3) != 0){
	1014	log_err("There is an error in u_austrncpy() Expected %s Got %s\n", austrdup(uchars), austrdup(temp));
	1015	}
	1016	if(charOut[3] != (char)0x7B) {
	1017	log_err("u_austrncpy wrote past it's bounds. Expected undisturbed byte at 3\n");
	1018	}
	1019
	1020	/Testing u_strchr()/
	1021	log_verbose("Testing u_strchr\n");
	1022	temp[0]=0x42;
	1023	temp[1]=0x62;
	1024	temp[2]=0x62;
	1025	temp[3]=0x63;
	1026	temp[4]=0xd841;
	1027	temp[5]=0xd841;
	1028	temp[6]=0xdc02;
	1029	temp[7]=0;
	1030	result=u_strchr(temp, (UChar)0x62);
	1031	if(result != temp+1){
	1032	log_err("There is an error in u_strchr() Expected match at position 1 Got %ld (pointer 0x%lx)\n", result-temp, result);
	1033	}
	1034	/Testing u_strstr()/
	1035	log_verbose("Testing u_strstr\n");
	1036	subString[0]=0x62;
	1037	subString[1]=0x63;
	1038	subString[2]=0;
	1039	result=u_strstr(temp, subString);
	1040	if(result != temp+2){
	1041	log_err("There is an error in u_strstr() Expected match at position 2 Got %ld (pointer 0x%lx)\n", result-temp, result);
	1042	}
	1043	result=u_strstr(temp, subString+2); /* subString+2 is an empty string */
	1044	if(result != temp){
	1045	log_err("There is an error in u_strstr() Expected match at position 0 Got %ld (pointer 0x%lx)\n", result-temp, result);
	1046	}
	1047	result=u_strstr(subString, temp);
	1048	if(result != NULL){
	1049	log_err("There is an error in u_strstr() Expected NULL \"not found\" Got non-NULL \"found\" result\n");
	1050	}
	1051
	1052	/Testing u_strchr32/
	1053	log_verbose("Testing u_strchr32\n");
	1054	result=u_strchr32(temp, (UChar32)0x62);
	1055	if(result != temp+1){
	1056	log_err("There is an error in u_strchr32() Expected match at position 1 Got %ld (pointer 0x%lx)\n", result-temp, result);
	1057	}
	1058	result=u_strchr32(temp, (UChar32)0xfb);
	1059	if(result != NULL){
	1060	log_err("There is an error in u_strchr32() Expected NULL \"not found\" Got non-NULL \"found\" result\n");
	1061	}
	1062	result=u_strchr32(temp, (UChar32)0x20402);
	1063	if(result != temp+5){
	1064	log_err("There is an error in u_strchr32() Expected match at position 5 Got %ld (pointer 0x%lx)\n", result-temp, result);
	1065	}
	1066
	1067	temp[7]=0xfc00;
	1068	result=u_memchr32(temp, (UChar32)0x20402, 7);
	1069	if(result != temp+5){
	1070	log_err("There is an error in u_memchr32() Expected match at position 5 Got %ld (pointer 0x%lx)\n", result-temp, result);
	1071	}
	1072	result=u_memchr32(temp, (UChar32)0x20402, 6);
	1073	if(result != NULL){
	1074	log_err("There is an error in u_memchr32() Expected no match Got %ld (pointer 0x%lx)\n", result-temp, result);
	1075	}
	1076	result=u_memchr32(temp, (UChar32)0x20402, 1);
	1077	if(result != NULL){
	1078	log_err("There is an error in u_memchr32() Expected no match Got %ld (pointer 0x%lx)\n", result-temp, result);
	1079	}
	1080	result=u_memchr32(temp, (UChar32)0xfc00, 8);
	1081	if(result != temp+7){
	1082	log_err("There is an error in u_memchr32() Expected match at position 7 Got %ld (pointer 0x%lx)\n", result-temp, result);
	1083	}
	1084	}
	1085
	1086	/* test u_unescape() and u_unescapeAt() ------------------------------------- */
	1087
	1088	static void
	1089	TestUnescape() {
	1090	static UChar buffer[200];
	1091
	1092	static const char* input =
	1093	"Sch\\u00f6nes Auto: \\u20ac 11240.\\fPrivates Zeichen: \\U00102345\\e\\cC\\n \\x1b\\x{263a}";
	1094
	1095	static const UChar expect[]={
	1096	0x53, 0x63, 0x68, 0xf6, 0x6e, 0x65, 0x73, 0x20, 0x41, 0x75, 0x74, 0x6f, 0x3a, 0x20,
	1097	0x20ac, 0x20, 0x31, 0x31, 0x32, 0x34, 0x30, 0x2e, 0x0c,
	1098	0x50, 0x72, 0x69, 0x76, 0x61, 0x74, 0x65, 0x73, 0x20,
	1099	0x5a, 0x65, 0x69, 0x63, 0x68, 0x65, 0x6e, 0x3a, 0x20, 0xdbc8, 0xdf45, 0x1b, 0x03, 0x0a, 0x20, 0x1b, 0x263A, 0
	1100	};
	1101	static const int32_t explength = sizeof(expect)/sizeof(expect[0])-1;
	1102	int32_t length;
	1103
	1104	/* test u_unescape() */
	1105	length=u_unescape(input, buffer, sizeof(buffer)/sizeof(buffer[0]));
	1106	if(length!=explength \|\| u_strcmp(buffer, expect)!=0) {
	1107	log_err("failure in u_unescape(): length %d!=%d and/or incorrect result string\n", length,
	1108	explength);
	1109	}
	1110
	1111	/* try preflighting */
	1112	length=u_unescape(input, NULL, sizeof(buffer)/sizeof(buffer[0]));
	1113	if(length!=explength \|\| u_strcmp(buffer, expect)!=0) {
	1114	log_err("failure in u_unescape(preflighting): length %d!=%d\n", length, explength);
	1115	}
	1116
	1117	/* ### TODO: test u_unescapeAt() */
	1118	}
	1119
	1120	/* test code point counting functions --------------------------------------- */
	1121
	1122	/* reference implementation of u_strHasMoreChar32Than() */
	1123	static int32_t
	1124	_refStrHasMoreChar32Than(const UChar *s, int32_t length, int32_t number) {
	1125	int32_t count=u_countChar32(s, length);
	1126	return count>number;
	1127	}
	1128
	1129	/* compare the real function against the reference */
	1130	static void
	1131	_testStrHasMoreChar32Than(const UChar *s, int32_t i, int32_t length, int32_t number) {
	1132	if(u_strHasMoreChar32Than(s, length, number)!=_refStrHasMoreChar32Than(s, length, number)) {
	1133	log_err("u_strHasMoreChar32Than(s+%d, %d, %d)=%hd is wrong\n",
	1134	i, length, number, u_strHasMoreChar32Than(s, length, number));
	1135	}
	1136	}
	1137
	1138	static void
	1139	TestCountChar32() {
	1140	static const UChar string[]={
	1141	0x61, 0x62, 0xd800, 0xdc00,
	1142	0xd801, 0xdc01, 0x63, 0xd802,
	1143	0x64, 0xdc03, 0x65, 0x66,
	1144	0xd804, 0xdc04, 0xd805, 0xdc05,
	1145	0x67
	1146	};
	1147	UChar buffer[100];
	1148	int32_t i, length, number;
	1149
	1150	/* test u_strHasMoreChar32Than() with length>=0 */
	1151	length=LENGTHOF(string);
	1152	while(length>=0) {
	1153	for(i=0; i<=length; ++i) {
	1154	for(number=-1; number<=((length-i)+2); ++number) {
	1155	_testStrHasMoreChar32Than(string+i, i, length-i, number);
	1156	}
	1157	}
	1158	--length;
	1159	}
	1160
	1161	/* test u_strHasMoreChar32Than() with NUL-termination (length=-1) */
	1162	length=LENGTHOF(string);
	1163	u_memcpy(buffer, string, length);
	1164	while(length>=0) {
	1165	buffer[length]=0;
	1166	for(i=0; i<=length; ++i) {
	1167	for(number=-1; number<=((length-i)+2); ++number) {
	1168	_testStrHasMoreChar32Than(string+i, i, -1, number);
	1169	}
	1170	}
	1171	--length;
	1172	}
	1173
	1174	/* test u_strHasMoreChar32Than() with NULL string (bad input) */
	1175	for(length=-1; length<=1; ++length) {
	1176	for(i=0; i<=length; ++i) {
	1177	for(number=-2; number<=2; ++number) {
	1178	_testStrHasMoreChar32Than(NULL, 0, length, number);
	1179	}
	1180	}
	1181	}
	1182	}
	1183
	1184	/* UCharIterator ------------------------------------------------------------ */
	1185
	1186	/*
	1187	* Compare results from two iterators, should be same.
	1188	* Assume that the text is not empty and that
	1189	* iteration start==0 and iteration limit==length.
	1190	*/
	1191	static void
	1192	compareIterators(UCharIterator iter1, const char n1,
	1193	UCharIterator iter2, const char n2) {
	1194	int32_t i, pos1, pos2, middle, length;
	1195	UChar32 c1, c2;
	1196
	1197	/* compare lengths */
	1198	length=iter1->getIndex(iter1, UITER_LENGTH);
	1199	pos2=iter2->getIndex(iter2, UITER_LENGTH);
	1200	if(length!=pos2) {
	1201	log_err("%s->getIndex(length)=%d != %d=%s->getIndex(length)\n", n1, length, pos2, n2);
	1202	return;
	1203	}
	1204
	1205	/* set into the middle */
	1206	middle=length/2;
	1207
	1208	pos1=iter1->move(iter1, middle, UITER_ZERO);
	1209	if(pos1!=middle) {
	1210	log_err("%s->move(from 0 to middle %d)=%d does not move to the middle\n", n1, middle, pos1);
	1211	return;
	1212	}
	1213
	1214	pos2=iter2->move(iter2, middle, UITER_ZERO);
	1215	if(pos2!=middle) {
	1216	log_err("%s->move(from 0 to middle %d)=%d does not move to the middle\n", n2, middle, pos2);
	1217	return;
	1218	}
	1219
	1220	/* test current() */
	1221	c1=iter1->current(iter1);
	1222	c2=iter2->current(iter2);
	1223	if(c1!=c2) {
	1224	log_err("%s->current()=U+%04x != U+%04x=%s->current() at middle=%d\n", n1, c1, c2, n2, middle);
	1225	return;
	1226	}
	1227
	1228	/* move forward 3 UChars */
	1229	for(i=0; i<3; ++i) {
	1230	c1=iter1->next(iter1);
	1231	c2=iter2->next(iter2);
	1232	if(c1!=c2) {
	1233	log_err("%s->next()=U+%04x != U+%04x=%s->next() at %d (started in middle)\n", n1, c1, c2, n2, iter1->getIndex(iter1, UITER_CURRENT));
	1234	return;
	1235	}
	1236	}
	1237
	1238	/* move backward 5 UChars */
	1239	for(i=0; i<5; ++i) {
	1240	c1=iter1->previous(iter1);
	1241	c2=iter2->previous(iter2);
	1242	if(c1!=c2) {
	1243	log_err("%s->previous()=U+%04x != U+%04x=%s->previous() at %d (started in middle)\n", n1, c1, c2, n2, iter1->getIndex(iter1, UITER_CURRENT));
	1244	return;
	1245	}
	1246	}
	1247
	1248	/* iterate forward from the beginning */
	1249	pos1=iter1->move(iter1, 0, UITER_START);
	1250	if(pos1<0) {
	1251	log_err("%s->move(start) failed\n", n1);
	1252	return;
	1253	}
	1254	if(!iter1->hasNext(iter1)) {
	1255	log_err("%s->hasNext() at the start returns FALSE\n", n1);
	1256	return;
	1257	}
	1258
	1259	pos2=iter2->move(iter2, 0, UITER_START);
	1260	if(pos2<0) {
	1261	log_err("%s->move(start) failed\n", n2);
	1262	return;
	1263	}
	1264	if(!iter2->hasNext(iter2)) {
	1265	log_err("%s->hasNext() at the start returns FALSE\n", n2);
	1266	return;
	1267	}
	1268
	1269	do {
	1270	c1=iter1->next(iter1);
	1271	c2=iter2->next(iter2);
	1272	if(c1!=c2) {
	1273	log_err("%s->next()=U+%04x != U+%04x=%s->next() at %d\n", n1, c1, c2, n2, iter1->getIndex(iter1, UITER_CURRENT));
	1274	return;
	1275	}
	1276	} while(c1>=0);
	1277
	1278	if(iter1->hasNext(iter1)) {
	1279	log_err("%s->hasNext() at the end returns TRUE\n", n1);
	1280	return;
	1281	}
	1282	if(iter2->hasNext(iter2)) {
	1283	log_err("%s->hasNext() at the end returns TRUE\n", n2);
	1284	return;
	1285	}
	1286
	1287	/* back to the middle */
	1288	pos1=iter1->move(iter1, middle, UITER_ZERO);
	1289	if(pos1!=middle) {
	1290	log_err("%s->move(from end to middle %d)=%d does not move to the middle\n", n1, middle, pos1);
	1291	return;
	1292	}
	1293
	1294	pos2=iter2->move(iter2, middle, UITER_ZERO);
	1295	if(pos2!=middle) {
	1296	log_err("%s->move(from end to middle %d)=%d does not move to the middle\n", n2, middle, pos2);
	1297	return;
	1298	}
	1299
	1300	/* move to index 1 */
	1301	pos1=iter1->move(iter1, 1, UITER_ZERO);
	1302	if(pos1!=1) {
	1303	log_err("%s->move(from middle %d to 1)=%d does not move to 1\n", n1, middle, pos1);
	1304	return;
	1305	}
	1306
	1307	pos2=iter2->move(iter2, 1, UITER_ZERO);
	1308	if(pos2!=1) {
	1309	log_err("%s->move(from middle %d to 1)=%d does not move to 1\n", n2, middle, pos2);
	1310	return;
	1311	}
	1312
	1313	/* iterate backward from the end */
	1314	pos1=iter1->move(iter1, 0, UITER_LIMIT);
	1315	if(pos1<0) {
	1316	log_err("%s->move(limit) failed\n", n1);
	1317	return;
	1318	}
	1319	if(!iter1->hasPrevious(iter1)) {
	1320	log_err("%s->hasPrevious() at the end returns FALSE\n", n1);
	1321	return;
	1322	}
	1323
	1324	pos2=iter2->move(iter2, 0, UITER_LIMIT);
	1325	if(pos2<0) {
	1326	log_err("%s->move(limit) failed\n", n2);
	1327	return;
	1328	}
	1329	if(!iter2->hasPrevious(iter2)) {
	1330	log_err("%s->hasPrevious() at the end returns FALSE\n", n2);
	1331	return;
	1332	}
	1333
	1334	do {
	1335	c1=iter1->previous(iter1);
	1336	c2=iter2->previous(iter2);
	1337	if(c1!=c2) {
	1338	log_err("%s->previous()=U+%04x != U+%04x=%s->previous() at %d\n", n1, c1, c2, n2, iter1->getIndex(iter1, UITER_CURRENT));
	1339	return;
	1340	}
	1341	} while(c1>=0);
	1342
	1343	if(iter1->hasPrevious(iter1)) {
	1344	log_err("%s->hasPrevious() at the start returns TRUE\n", n1);
	1345	return;
	1346	}
	1347	if(iter2->hasPrevious(iter2)) {
	1348	log_err("%s->hasPrevious() at the start returns TRUE\n", n2);
	1349	return;
	1350	}
	1351	}
	1352
	1353	/*
	1354	* Test the iterator's getState() and setState() functions.
	1355	* iter1 and iter2 must be set up for the same iterator type and the same string
	1356	* but may be physically different structs (different addresses).
	1357	*
	1358	* Assume that the text is not empty and that
	1359	* iteration start==0 and iteration limit==length.
	1360	* It must be 2<=middle<=length-2.
	1361	*/
	1362	static void
	1363	testIteratorState(UCharIterator iter1, UCharIterator iter2, const char *n, int32_t middle) {
	1364	UChar32 u[4];
	1365
	1366	UErrorCode errorCode;
	1367	UChar32 c;
	1368	uint32_t state;
	1369	int32_t i, j;
	1370
	1371	/* get four UChars from the middle of the string */
	1372	iter1->move(iter1, middle-2, UITER_ZERO);
	1373	for(i=0; i<4; ++i) {
	1374	c=iter1->next(iter1);
	1375	if(c<0) {
	1376	/* the test violates the assumptions, see comment above */
	1377	log_err("test error: %s[%d]=%d\n", n, middle-2+i, c);
	1378	return;
	1379	}
	1380	u[i]=c;
	1381	}
	1382
	1383	/* move to the middle and get the state */
	1384	iter1->move(iter1, -2, UITER_CURRENT);
	1385	state=uiter_getState(iter1);
	1386
	1387	/* set the state into the second iterator and compare the results */
	1388	errorCode=U_ZERO_ERROR;
	1389	uiter_setState(iter2, state, &errorCode);
	1390	if(U_FAILURE(errorCode)) {
	1391	log_err("%s->setState(0x%x) failed: %s\n", n, state, u_errorName(errorCode));
	1392	return;
	1393	}
	1394
	1395	c=iter2->current(iter2);
	1396	if(c!=u[2]) {
	1397	log_err("%s->current(at %d)=U+%04x!=U+%04x\n", n, middle, c, u[2]);
	1398	}
	1399
	1400	c=iter2->previous(iter2);
	1401	if(c!=u[1]) {
	1402	log_err("%s->previous(at %d)=U+%04x!=U+%04x\n", n, middle-1, c, u[1]);
	1403	}
	1404
	1405	iter2->move(iter2, 2, UITER_CURRENT);
	1406	c=iter2->next(iter2);
	1407	if(c!=u[3]) {
	1408	log_err("%s->next(at %d)=U+%04x!=U+%04x\n", n, middle+1, c, u[3]);
	1409	}
	1410
	1411	iter2->move(iter2, -3, UITER_CURRENT);
	1412	c=iter2->previous(iter2);
	1413	if(c!=u[0]) {
	1414	log_err("%s->previous(at %d)=U+%04x!=U+%04x\n", n, middle-2, c, u[0]);
	1415	}
	1416
	1417	/* move the second iterator back to the middle */
	1418	iter2->move(iter2, 1, UITER_CURRENT);
	1419	iter2->next(iter2);
	1420
	1421	/* check that both are in the middle */
	1422	i=iter1->getIndex(iter1, UITER_CURRENT);
	1423	j=iter2->getIndex(iter2, UITER_CURRENT);
	1424	if(i!=middle) {
	1425	log_err("%s->getIndex(current)=%d!=%d as expected\n", n, i, middle);
	1426	}
	1427	if(i!=j) {
	1428	log_err("%s->getIndex(current)=%d!=%d after setState()\n", n, j, i);
	1429	}
	1430
	1431	/* compare lengths */
	1432	i=iter1->getIndex(iter1, UITER_LENGTH);
	1433	j=iter2->getIndex(iter2, UITER_LENGTH);
	1434	if(i!=j) {
	1435	log_err("%s->getIndex(length)=%d!=%d before/after setState()\n", n, i, j);
	1436	}
	1437	}
	1438
	1439	static void
	1440	TestUCharIterator() {
	1441	static const UChar text[]={
	1442	0x61, 0x62, 0x63, 0xd801, 0xdffd, 0x78, 0x79, 0x7a, 0
	1443	};
	1444	char bytes[40];
	1445
	1446	UCharIterator iter, iter1, iter2;
	1447	UConverter *cnv;
	1448	UErrorCode errorCode;
	1449	int32_t length;
	1450
	1451	/* simple API/code coverage - test NOOP UCharIterator */
	1452	uiter_setString(&iter, NULL, 0);
	1453	if( iter.current(&iter)!=-1 \|\| iter.next(&iter)!=-1 \|\| iter.previous(&iter)!=-1 \|\|
	1454	iter.move(&iter, 1, UITER_CURRENT) \|\| iter.getIndex(&iter, UITER_CURRENT)!=0 \|\|
	1455	iter.hasNext(&iter) \|\| iter.hasPrevious(&iter)
	1456	) {
	1457	log_err("NOOP UCharIterator behaves unexpectedly\n");
	1458	}
	1459
	1460	/* test get/set state */
	1461	length=LENGTHOF(text)-1;
	1462	uiter_setString(&iter1, text, -1);
	1463	uiter_setString(&iter2, text, length);
	1464	testIteratorState(&iter1, &iter2, "UTF16IteratorState", length/2);
	1465	testIteratorState(&iter1, &iter2, "UTF16IteratorStatePlus1", length/2+1);
	1466
	1467	/* compare the same string between UTF-16 and UTF-8 UCharIterators ------ */
	1468	errorCode=U_ZERO_ERROR;
	1469	u_strToUTF8(bytes, sizeof(bytes), &length, text, -1, &errorCode);
	1470	if(U_FAILURE(errorCode)) {
	1471	log_err("u_strToUTF8() failed, %s\n", u_errorName(errorCode));
	1472	return;
	1473	}
	1474
	1475	uiter_setString(&iter1, text, -1);
	1476	uiter_setUTF8(&iter2, bytes, length);
	1477	compareIterators(&iter1, "UTF16Iterator", &iter2, "UTF8Iterator");
	1478
	1479	/* try again with length=-1 */
	1480	uiter_setUTF8(&iter2, bytes, -1);
	1481	compareIterators(&iter1, "UTF16Iterator", &iter2, "UTF8Iterator_1");
	1482
	1483	/* test get/set state */
	1484	length=LENGTHOF(text)-1;
	1485	uiter_setUTF8(&iter1, bytes, -1);
	1486	testIteratorState(&iter1, &iter2, "UTF8IteratorState", length/2);
	1487	testIteratorState(&iter1, &iter2, "UTF8IteratorStatePlus1", length/2+1);
	1488
	1489	/* compare the same string between UTF-16 and UTF-16BE UCharIterators --- */
	1490	errorCode=U_ZERO_ERROR;
	1491	cnv=ucnv_open("UTF-16BE", &errorCode);
	1492	length=ucnv_fromUChars(cnv, bytes, sizeof(bytes), text, -1, &errorCode);
	1493	ucnv_close(cnv);
	1494	if(U_FAILURE(errorCode)) {
	1495	log_err("ucnv_fromUChars(UTF-16BE) failed, %s\n", u_errorName(errorCode));
	1496	return;
	1497	}
	1498
	1499	/* terminate with a _pair_ of 0 bytes - a UChar NUL in UTF-16BE (length is known to be ok) */
	1500	bytes[length]=bytes[length+1]=0;
	1501
	1502	uiter_setString(&iter1, text, -1);
	1503	uiter_setUTF16BE(&iter2, bytes, length);
	1504	compareIterators(&iter1, "UTF16Iterator", &iter2, "UTF16BEIterator");
	1505
	1506	/* try again with length=-1 */
	1507	uiter_setUTF16BE(&iter2, bytes, -1);
	1508	compareIterators(&iter1, "UTF16Iterator", &iter2, "UTF16BEIterator_1");
	1509
	1510	/* try again after moving the bytes up one, and with length=-1 */
	1511	memmove(bytes+1, bytes, length+2);
	1512	uiter_setUTF16BE(&iter2, bytes+1, -1);
	1513	compareIterators(&iter1, "UTF16Iterator", &iter2, "UTF16BEIteratorMoved1");
	1514
	1515	/* ### TODO test other iterators: CharacterIterator, Replaceable */
	1516	}
	1517
	1518	#if UCONFIG_NO_COLLATION
	1519
	/* Placeholder used when UCONFIG_NO_COLLATION is set: there is nothing to test. */
	static void
	TestUNormIterator(void)
	{
	}
	1524
	/* Placeholder used when UCONFIG_NO_COLLATION is set: nothing to test here either. */
	static void
	TestBadUNormIterator(void)
	{
	}
	1529
	1530	#else
	1531
	1532	#include "unicode/unorm.h"
	1533	#include "unorm_it.h"
	1534
	1535	/*
	1536	* Compare results from two iterators, should be same.
	1537	* Assume that the text is not empty and that
	1538	* iteration start==0 and iteration limit==length.
	1539	*
	1540	* Modified version of compareIterators() but does not assume that indexes
	1541	* are available.
	1542	*/
	1543	static void
	1544	compareIterNoIndexes(UCharIterator iter1, const char n1,
	1545	UCharIterator iter2, const char n2,
	1546	int32_t middle) {
	1547	uint32_t state;
	1548	int32_t i;
	1549	UChar32 c1, c2;
	1550	UErrorCode errorCode;
	1551
	1552	/* code coverage for unorm_it.c/unormIteratorGetIndex() */
	1553	if(
	1554	iter2->getIndex(iter2, UITER_START)!=0 \|\|
	1555	iter2->getIndex(iter2, UITER_LENGTH)!=UITER_UNKNOWN_INDEX
	1556	) {
	1557	log_err("UNormIterator.getIndex() failed\n");
	1558	}
	1559
	1560	/* set into the middle */
	1561	iter1->move(iter1, middle, UITER_ZERO);
	1562	iter2->move(iter2, middle, UITER_ZERO);
	1563
	1564	/* test current() */
	1565	c1=iter1->current(iter1);
	1566	c2=iter2->current(iter2);
	1567	if(c1!=c2) {
	1568	log_err("%s->current()=U+%04x != U+%04x=%s->current() at middle=%d\n", n1, c1, c2, n2, middle);
	1569	return;
	1570	}
	1571
	1572	/* move forward 3 UChars */
	1573	for(i=0; i<3; ++i) {
	1574	c1=iter1->next(iter1);
	1575	c2=iter2->next(iter2);
	1576	if(c1!=c2) {
	1577	log_err("%s->next()=U+%04x != U+%04x=%s->next() at %d (started in middle)\n", n1, c1, c2, n2, iter1->getIndex(iter1, UITER_CURRENT));
	1578	return;
	1579	}
	1580	}
	1581
	1582	/* move backward 5 UChars */
	1583	for(i=0; i<5; ++i) {
	1584	c1=iter1->previous(iter1);
	1585	c2=iter2->previous(iter2);
	1586	if(c1!=c2) {
	1587	log_err("%s->previous()=U+%04x != U+%04x=%s->previous() at %d (started in middle)\n", n1, c1, c2, n2, iter1->getIndex(iter1, UITER_CURRENT));
	1588	return;
	1589	}
	1590	}
	1591
	1592	/* iterate forward from the beginning */
	1593	iter1->move(iter1, 0, UITER_START);
	1594	if(!iter1->hasNext(iter1)) {
	1595	log_err("%s->hasNext() at the start returns FALSE\n", n1);
	1596	return;
	1597	}
	1598
	1599	iter2->move(iter2, 0, UITER_START);
	1600	if(!iter2->hasNext(iter2)) {
	1601	log_err("%s->hasNext() at the start returns FALSE\n", n2);
	1602	return;
	1603	}
	1604
	1605	do {
	1606	c1=iter1->next(iter1);
	1607	c2=iter2->next(iter2);
	1608	if(c1!=c2) {
	1609	log_err("%s->next()=U+%04x != U+%04x=%s->next() at %d\n", n1, c1, c2, n2, iter1->getIndex(iter1, UITER_CURRENT));
	1610	return;
	1611	}
	1612	} while(c1>=0);
	1613
	1614	if(iter1->hasNext(iter1)) {
	1615	log_err("%s->hasNext() at the end returns TRUE\n", n1);
	1616	return;
	1617	}
	1618	if(iter2->hasNext(iter2)) {
	1619	log_err("%s->hasNext() at the end returns TRUE\n", n2);
	1620	return;
	1621	}
	1622
	1623	/* iterate backward */
	1624	do {
	1625	c1=iter1->previous(iter1);
	1626	c2=iter2->previous(iter2);
	1627	if(c1!=c2) {
	1628	log_err("%s->previous()=U+%04x != U+%04x=%s->previous() at %d\n", n1, c1, c2, n2, iter1->getIndex(iter1, UITER_CURRENT));
	1629	return;
	1630	}
	1631	} while(c1>=0);
	1632
	1633	/* back to the middle */
	1634	iter1->move(iter1, middle, UITER_ZERO);
	1635	iter2->move(iter2, middle, UITER_ZERO);
	1636
	1637	/* try get/set state */
	1638	while((state=uiter_getState(iter2))==UITER_NO_STATE) {
	1639	if(!iter2->hasNext(iter2)) {
	1640	log_err("%s has no known state from middle=%d to the end\n", n2, middle);
	1641	return;
	1642	}
	1643	iter2->next(iter2);
	1644	}
	1645
	1646	errorCode=U_ZERO_ERROR;
	1647
	1648	c2=iter2->current(iter2);
	1649	iter2->move(iter2, 0, UITER_ZERO);
	1650	uiter_setState(iter2, state, &errorCode);
	1651	c1=iter2->current(iter2);
	1652	if(U_FAILURE(errorCode) \|\| c1!=c2) {
	1653	log_err("%s->current() differs across get/set state, U+%04x vs. U+%04x\n", n2, c2, c1);
	1654	return;
	1655	}
	1656
	1657	c2=iter2->previous(iter2);
	1658	iter2->move(iter2, 0, UITER_ZERO);
	1659	uiter_setState(iter2, state, &errorCode);
	1660	c1=iter2->previous(iter2);
	1661	if(U_FAILURE(errorCode) \|\| c1!=c2) {
	1662	log_err("%s->previous() differs across get/set state, U+%04x vs. U+%04x\n", n2, c2, c1);
	1663	return;
	1664	}
	1665
	1666	/* iterate backward from the end */
	1667	iter1->move(iter1, 0, UITER_LIMIT);
	1668	if(!iter1->hasPrevious(iter1)) {
	1669	log_err("%s->hasPrevious() at the end returns FALSE\n", n1);
	1670	return;
	1671	}
	1672
	1673	iter2->move(iter2, 0, UITER_LIMIT);
	1674	if(!iter2->hasPrevious(iter2)) {
	1675	log_err("%s->hasPrevious() at the end returns FALSE\n", n2);
	1676	return;
	1677	}
	1678
	1679	do {
	1680	c1=iter1->previous(iter1);
	1681	c2=iter2->previous(iter2);
	1682	if(c1!=c2) {
	1683	log_err("%s->previous()=U+%04x != U+%04x=%s->previous() at %d\n", n1, c1, c2, n2, iter1->getIndex(iter1, UITER_CURRENT));
	1684	return;
	1685	}
	1686	} while(c1>=0);
	1687
	1688	if(iter1->hasPrevious(iter1)) {
	1689	log_err("%s->hasPrevious() at the start returns TRUE\n", n1);
	1690	return;
	1691	}
	1692	if(iter2->hasPrevious(iter2)) {
	1693	log_err("%s->hasPrevious() at the start returns TRUE\n", n2);
	1694	return;
	1695	}
	1696	}
	1697
	1698	/* n2 must have a digit 1 at the end, will be incremented with the normalization mode */
	1699	static void
	1700	testUNormIteratorWithText(const UChar *text, int32_t textLength, int32_t middle,
	1701	const char name1, const char n2) {
	1702	UChar buffer[600];
	1703	char name2[40];
	1704
	1705	UCharIterator iter1, iter2, *iter;
	1706	UNormIterator *uni;
	1707
	1708	UNormalizationMode mode;
	1709	UErrorCode errorCode;
	1710	int32_t length;
	1711
	1712	/* open a normalizing iterator */
	1713	errorCode=U_ZERO_ERROR;
	1714	uni=unorm_openIter(NULL, 0, &errorCode);
	1715	if(U_FAILURE(errorCode)) {
	1716	log_err("unorm_openIter() fails: %s\n", u_errorName(errorCode));
	1717	return;
	1718	}
	1719
	1720	/* set iterator 2 to the original text */
	1721	uiter_setString(&iter2, text, textLength);
	1722
	1723	strcpy(name2, n2);
	1724
	1725	/* test the normalizing iterator for each mode */
	1726	for(mode=UNORM_NONE; mode<UNORM_MODE_COUNT; ++mode) {
	1727	length=unorm_normalize(text, textLength, mode, 0, buffer, LENGTHOF(buffer), &errorCode);
	1728	if(U_FAILURE(errorCode)) {
	1729	log_err("unorm_normalize(mode %d) failed: %s\n", mode, u_errorName(errorCode));
	1730	break;
	1731	}
	1732
	1733	/* set iterator 1 to the normalized text */
	1734	uiter_setString(&iter1, buffer, length);
	1735
	1736	/* set the normalizing iterator to use iter2 */
	1737	iter=unorm_setIter(uni, &iter2, mode, &errorCode);
	1738	if(U_FAILURE(errorCode)) {
	1739	log_err("unorm_setIter(mode %d) failed: %s\n", mode, u_errorName(errorCode));
	1740	break;
	1741	}
	1742
	1743	compareIterNoIndexes(&iter1, name1, iter, name2, middle);
	1744	++name2[strlen(name2)-1];
	1745	}
	1746
	1747	unorm_closeIter(uni);
	1748	}
	1749
	1750	static void
	1751	TestUNormIterator() {
	1752	static const UChar text[]={ /* must contain <00C5 0327> see u_strchr() below */
	1753	0x61, /* 'a' */
	1754	0xe4, 0x61, 0x308, /* variations of 'a'+umlaut */
	1755	0xc5, 0x327, 0x41, 0x30a, 0x327, 0x41, 0x327, 0x30a, /* variations of 'A'+ring+cedilla */
	1756	0xfb03, 0xfb00, 0x69, 0x66, 0x66, 0x69, 0x66, 0xfb01 /* variations of 'ffi' */
	1757	};
	1758	static const UChar surrogateText[]={
	1759	0x6e, 0xd900, 0x6a, 0xdc00, 0xd900, 0xdc00, 0x61
	1760	};
	1761
	1762	UChar longText[600];
	1763	int32_t i, middle, length;
	1764
	1765	length=LENGTHOF(text);
	1766	testUNormIteratorWithText(text, length, length/2, "UCharIter", "UNormIter1");
	1767	testUNormIteratorWithText(text, length, length, "UCharIterEnd", "UNormIterEnd1");
	1768
	1769	/* test again, this time with an insane string to cause internal buffer overflows */
	1770	middle=(int32_t)(u_strchr(text, 0x327)-text); /* see comment at text[] */
	1771	memcpy(longText, text, middle*U_SIZEOF_UCHAR);
	1772	for(i=0; i<150; ++i) {
	1773	longText[middle+i]=0x30a; /* insert many rings between 'A-ring' and cedilla */
	1774	}
	1775	memcpy(longText+middle+i, text+middle, (LENGTHOF(text)-middle)*U_SIZEOF_UCHAR);
	1776	length=LENGTHOF(text)+i;
	1777
	1778	/* append another copy of this string for more overflows */
	1779	memcpy(longText+length, longText, length*U_SIZEOF_UCHAR);
	1780	length*=2;
	1781
	1782	/* the first test of the following two starts at length/4, inside the sea of combining rings */
	1783	testUNormIteratorWithText(longText, length, length/4, "UCharIterLong", "UNormIterLong1");
	1784	testUNormIteratorWithText(longText, length, length, "UCharIterLongEnd", "UNormIterLongEnd1");
	1785
	1786	length=LENGTHOF(surrogateText);
	1787	testUNormIteratorWithText(surrogateText, length, length/4, "UCharIterSurr", "UNormIterSurr1");
	1788	testUNormIteratorWithText(surrogateText, length, length, "UCharIterSurrEnd", "UNormIterSurrEnd1");
	1789	}
	1790
	1791	static void
	1792	TestBadUNormIterator(void) {
	1793	#if !UCONFIG_NO_NORMALIZATION
	1794	UErrorCode status = U_ILLEGAL_ESCAPE_SEQUENCE;
	1795	UNormIterator *uni;
	1796
	1797	unorm_setIter(NULL, NULL, UNORM_NONE, &status);
	1798	if (status != U_ILLEGAL_ESCAPE_SEQUENCE) {
	1799	log_err("unorm_setIter changed the error code to: %s\n", u_errorName(status));
	1800	}
	1801	status = U_ZERO_ERROR;
	1802	unorm_setIter(NULL, NULL, UNORM_NONE, &status);
	1803	if (status != U_ILLEGAL_ARGUMENT_ERROR) {
	1804	log_err("unorm_setIter didn't react correctly to bad arguments: %s\n", u_errorName(status));
	1805	}
	1806	status = U_ZERO_ERROR;
	1807	uni=unorm_openIter(NULL, 0, &status);
	1808	if(U_FAILURE(status)) {
	1809	log_err("unorm_openIter() fails: %s\n", u_errorName(status));
	1810	return;
	1811	}
	1812	unorm_setIter(uni, NULL, UNORM_NONE, &status);
	1813	unorm_closeIter(uni);
	1814	#endif
	1815	}
	1816
	1817	#endif