[apple/icu.git] / icuSources / common / usetiter.cpp

// © 2016 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
/*
**********************************************************************
* Copyright (c) 2002-2006, International Business Machines
* Corporation and others.  All Rights Reserved.
**********************************************************************
*/
#include "unicode/usetiter.h"
#include "unicode/uniset.h"
#include "unicode/unistr.h"
#include "uvector.h"

U_NAMESPACE_BEGIN

UOBJECT_DEFINE_RTTI_IMPLEMENTATION(UnicodeSetIterator)

/**
 * Constructs an iterator positioned at the start of the given set.
 * @param uSet the set to iterate over. Only its address is stored, so the
 *             set must stay alive for as long as this iterator refers to it.
 */
UnicodeSetIterator::UnicodeSetIterator(const UnicodeSet& uSet)
        : cpString(NULL) {
    // reset(uSet) records the set and sets up the iteration indices.
    reset(uSet);
}

/**
 * Constructs an iterator that is not yet attached to any set.
 * Until reset(const UnicodeSet&) is called, the indices describe an empty
 * iteration, so next() and nextRange() return FALSE.
 */
UnicodeSetIterator::UnicodeSetIterator()
        : set(NULL), cpString(NULL) {
    // With set == NULL, reset() configures an empty iteration.
    reset();
}

/**
 * Destroys the iterator and frees cpString, the scratch string that
 * getString() allocates on demand. The iterated set is not touched.
 */
UnicodeSetIterator::~UnicodeSetIterator() {
    // cpString is NULL if getString() never allocated it; delete of NULL is a no-op.
    delete cpString;
}

/**
 * Advances to the next single element of the set.
 *
 * Code points are produced first, range by range in the order the set
 * reports its ranges; once every range is exhausted, the set's strings are
 * produced in index order.
 *
 * @return TRUE if an element was produced, FALSE when the iteration is over.
 * On TRUE, if codepoint == IS_STRING the element is the string pointed to by
 * the string field; otherwise it is the single code point in codepoint.
 * <br>Callers should treat codepointEnd as undefined after this call (the
 * implementation sets it equal to codepoint for a code point result and
 * leaves it unchanged for a string result).
 */
UBool UnicodeSetIterator::next() {
    if (nextElement > endElement) {
        // The current range is used up.
        if (range >= endRange) {
            // No further ranges either: continue with the strings, if any.
            if (nextString >= stringCount) {
                return FALSE;
            }
            codepoint = (UChar32)IS_STRING; // signal that value is actually a string
            string = (const UnicodeString*) set->strings->elementAt(nextString++);
            return TRUE;
        }
        // Move on to the following range and emit its first code point below.
        loadRange(++range);
    }

    codepointEnd = nextElement;
    codepoint = nextElement;
    ++nextElement;
    string = NULL;
    return TRUE;
}

/**
 * Advances to the next range of code points, or to the next string.
 *
 * Ranges are produced first, in the order the set reports them; once every
 * range is exhausted, the set's strings are produced in index order. If part
 * of the current range was already consumed (for example by next()), only
 * the remaining part of that range is returned.
 *
 * @return TRUE if an element was produced, FALSE when the iteration is over.
 * On TRUE, if codepoint == IS_STRING the element is the string pointed to by
 * the string field; otherwise it is the inclusive range
 * <codepoint, codepointEnd>.
 * <br>For a string result codepointEnd is left unchanged and should be
 * treated as undefined.
 */
UBool UnicodeSetIterator::nextRange() {
    // Cleared up front, so it is NULL even when FALSE is returned.
    string = NULL;

    if (nextElement > endElement) {
        // The current range is used up.
        if (range >= endRange) {
            // No further ranges either: continue with the strings, if any.
            if (nextString >= stringCount) {
                return FALSE;
            }
            codepoint = (UChar32)IS_STRING; // signal that value is actually a string
            string = (const UnicodeString*) set->strings->elementAt(nextString++);
            return TRUE;
        }
        // Move on to the following range and report it below.
        loadRange(++range);
    }

    // Report everything left in the current range and mark it consumed.
    codepoint = nextElement;
    codepointEnd = endElement;
    nextElement = endElement + 1;
    return TRUE;
}

/**
 *@param set the set to iterate over. This allows reuse of the iterator.
 */
void UnicodeSetIterator::reset(const UnicodeSet& uSet) {
    this->set = &uSet;
    reset();
}

/**
 * Resets to the start, to allow the iteration to start over again.
 */
void UnicodeSetIterator::reset() {
    if (set == NULL) {
        // Set up indices to empty iteration
        endRange = -1;
        stringCount = 0;
    } else {
        endRange = set->getRangeCount() - 1;
        stringCount = set->stringsSize();
    }
    range = 0;
    endElement = -1;
    nextElement = 0;            
    if (endRange >= 0) {
        loadRange(range);
    }
    nextString = 0;
    string = NULL;
}

/**
 * Makes the range with the given index the current range by copying its
 * bounds from the set into nextElement and endElement.
 * Dereferences set without a NULL check.
 * @param iRange index of the range to load
 */
void UnicodeSetIterator::loadRange(int32_t iRange) {
    const UnicodeSet& source = *set;
    nextElement = source.getRangeStart(iRange);
    endElement = source.getRangeEnd(iRange);
}


/**
 * Returns the current element as a string.
 *
 * If the current element is a string, that string (owned by the set) is
 * returned. If it is a code point, the iterator-owned scratch string
 * cpString is set to that single code point and returned; the result is
 * cached in the string field until next(), nextRange() or reset() clears it.
 *
 * If there is no current string although codepoint == IS_STRING (reset()
 * clears the string field but leaves codepoint untouched, so this happens
 * when reset() follows a string element), an empty string is returned
 * instead of dereferencing NULL.
 *
 * @return a reference to the current string; it is owned by the set or by
 *         this iterator, never by the caller.
 */
const UnicodeString& UnicodeSetIterator::getString()  {
    if (string == NULL) {
        // Allocate the scratch string on first use; it is freed in the destructor.
        if (cpString == NULL) {
            cpString = new UnicodeString();
        }
        if (cpString != NULL) {
            if (codepoint != (UChar32)IS_STRING) {
                cpString->setTo((UChar32)codepoint);
            } else {
                // No current element to convert: hand back an empty string.
                cpString->remove();
            }
        }
        // NOTE(review): if the allocation above failed, cpString is still NULL
        // and the dereference below remains invalid; there is no fallback
        // object available here.
        string = cpString;
    }
    return *string;
}

U_NAMESPACE_END

//eof
Commit	Line	Data
f3c0d7a5 A	1	// © 2016 and later: Unicode, Inc. and others.
f3c0d7a5 A	2	// License & terms of use: http://www.unicode.org/copyright.html
b75a7d8f A	3	/*
b75a7d8f A	4	**********************************************************************
73c04bcf	5	* Copyright (c) 2002-2006, International Business Machines
b75a7d8f A	6	* Corporation and others. All Rights Reserved.
b75a7d8f A	7	**********************************************************************
b75a7d8f A	8	*/
	9	#include "unicode/usetiter.h"
	10	#include "unicode/uniset.h"
	11	#include "unicode/unistr.h"
	12	#include "uvector.h"
	13
	14	U_NAMESPACE_BEGIN
	15
374ca955	16	UOBJECT_DEFINE_RTTI_IMPLEMENTATION(UnicodeSetIterator)
b75a7d8f A	17
	18	/**
	19	* Create an iterator
	20	* @param set set to iterate over
	21	*/
	22	UnicodeSetIterator::UnicodeSetIterator(const UnicodeSet& uSet) {
73c04bcf	23	cpString = NULL;
b75a7d8f A	24	reset(uSet);
	25	}
	26
	27	/**
	28	* Create an iterator. Convenience for when the contents are to be set later.
	29	*/
	30	UnicodeSetIterator::UnicodeSetIterator() {
	31	this->set = NULL;
73c04bcf	32	cpString = NULL;
b75a7d8f A	33	reset();
	34	}
	35
	36	UnicodeSetIterator::~UnicodeSetIterator() {
73c04bcf	37	delete cpString;
b75a7d8f A	38	}
	39
	40	/**
	41	* Returns the next element in the set.
	42	* @return true if there was another element in the set.
	43	* if so, if codepoint == IS_STRING, the value is a string in the string field
	44	* else the value is a single code point in the codepoint field.
	45	* <br>You are guaranteed that the codepoints are in sorted order, and the strings are in sorted order,
	46	* and that all code points are returned before any strings are returned.
	47	* <br>Note also that the codepointEnd is undefined after calling this method.
	48	*/
	49	UBool UnicodeSetIterator::next() {
	50	if (nextElement <= endElement) {
	51	codepoint = codepointEnd = nextElement++;
73c04bcf	52	string = NULL;
b75a7d8f A	53	return TRUE;
	54	}
	55	if (range < endRange) {
	56	loadRange(++range);
	57	codepoint = codepointEnd = nextElement++;
73c04bcf	58	string = NULL;
b75a7d8f A	59	return TRUE;
	60	}
	61
	62	if (nextString >= stringCount) return FALSE;
	63	codepoint = (UChar32)IS_STRING; // signal that value is actually a string
	64	string = (const UnicodeString*) set->strings->elementAt(nextString++);
	65	return TRUE;
	66	}
	67
	68	/**
	69	* @return true if there was another element in the set.
	70	* if so, if codepoint == IS_STRING, the value is a string in the string field
	71	* else the value is a range of codepoints in the <codepoint, codepointEnd> fields.
	72	* <br>Note that the codepoints are in sorted order, and the strings are in sorted order,
	73	* and that all code points are returned before any strings are returned.
	74	* <br>You are guaranteed that the ranges are in sorted order, and the strings are in sorted order,
	75	* and that all ranges are returned before any strings are returned.
	76	* <br>You are also guaranteed that ranges are disjoint and non-contiguous.
	77	* <br>Note also that the codepointEnd is undefined after calling this method.
	78	*/
	79	UBool UnicodeSetIterator::nextRange() {
73c04bcf	80	string = NULL;
b75a7d8f A	81	if (nextElement <= endElement) {
	82	codepointEnd = endElement;
	83	codepoint = nextElement;
	84	nextElement = endElement+1;
	85	return TRUE;
	86	}
	87	if (range < endRange) {
	88	loadRange(++range);
	89	codepointEnd = endElement;
	90	codepoint = nextElement;
	91	nextElement = endElement+1;
	92	return TRUE;
	93	}
	94
	95	if (nextString >= stringCount) return FALSE;
	96	codepoint = (UChar32)IS_STRING; // signal that value is actually a string
	97	string = (const UnicodeString*) set->strings->elementAt(nextString++);
	98	return TRUE;
	99	}
	100
	101	/**
	102	*@param set the set to iterate over. This allows reuse of the iterator.
	103	*/
	104	void UnicodeSetIterator::reset(const UnicodeSet& uSet) {
	105	this->set = &uSet;
	106	reset();
	107	}
	108
	109	/**
	110	* Resets to the start, to allow the iteration to start over again.
	111	*/
	112	void UnicodeSetIterator::reset() {
	113	if (set == NULL) {
	114	// Set up indices to empty iteration
	115	endRange = -1;
	116	stringCount = 0;
	117	} else {
	118	endRange = set->getRangeCount() - 1;
3d1f044b	119	stringCount = set->stringsSize();
b75a7d8f A	120	}
	121	range = 0;
	122	endElement = -1;
	123	nextElement = 0;
	124	if (endRange >= 0) {
	125	loadRange(range);
	126	}
	127	nextString = 0;
73c04bcf	128	string = NULL;
b75a7d8f A	129	}
	130
	131	void UnicodeSetIterator::loadRange(int32_t iRange) {
	132	nextElement = set->getRangeStart(iRange);
	133	endElement = set->getRangeEnd(iRange);
	134	}
	135
73c04bcf A	136
	137	const UnicodeString& UnicodeSetIterator::getString() {
	138	if (string==NULL && codepoint!=(UChar32)IS_STRING) {
	139	if (cpString == NULL) {
	140	cpString = new UnicodeString();
	141	}
	142	if (cpString != NULL) {
	143	cpString->setTo((UChar32)codepoint);
	144	}
	145	string = cpString;
	146	}
	147	return *string;
	148	}
	149
b75a7d8f A	150	U_NAMESPACE_END
	151
	152	//eof