]>
Commit | Line | Data |
---|---|---|
b75a7d8f A |
1 | /* |
2 | ********************************************************************** | |
73c04bcf | 3 | * Copyright (C) 1998-2005, International Business Machines |
b75a7d8f A |
4 | * Corporation and others. All Rights Reserved. |
5 | ********************************************************************** | |
6 | */ | |
7 | ||
8 | #ifndef UCHRITER_H | |
9 | #define UCHRITER_H | |
10 | ||
11 | #include "unicode/utypes.h" | |
12 | #include "unicode/chariter.h" | |
13 | ||
73c04bcf A |
14 | /** |
15 | * \file | |
16 | * \brief C++ API: UChar Character Iterator | |
17 | */ | |
18 | ||
b75a7d8f A |
19 | U_NAMESPACE_BEGIN |
20 | ||
21 | /** | |
22 | * A concrete subclass of CharacterIterator that iterates over the | |
23 | * characters (code units or code points) in a UChar array. | |
24 | * It's possible not only to create an | |
25 | * iterator that iterates over an entire UChar array, but also to | |
26 | * create one that iterates over only a subrange of a UChar array | |
27 | * (iterators over different subranges of the same UChar array don't | |
28 | * compare equal). | |
29 | * @see CharacterIterator | |
30 | * @see ForwardCharacterIterator | |
31 | * @stable ICU 2.0 | |
32 | */ | |
33 | class U_COMMON_API UCharCharacterIterator : public CharacterIterator { | |
34 | public: | |
35 | /** | |
36 | * Create an iterator over the UChar array referred to by "textPtr". | |
37 | * The iteration range is 0 to <code>length-1</code>. | |
38 | * text is only aliased, not adopted (the | |
39 | * destructor will not delete it). | |
40 | * @param textPtr The UChar array to be iterated over | |
41 | * @param length The length of the UChar array | |
42 | * @stable ICU 2.0 | |
43 | */ | |
44 | UCharCharacterIterator(const UChar* textPtr, int32_t length); | |
45 | ||
46 | /** | |
47 | * Create an iterator over the UChar array referred to by "textPtr". | |
48 | * The iteration range is 0 to <code>length-1</code>. | |
49 | * text is only aliased, not adopted (the | |
50 | * destructor will not delete it). | |
51 | * The starting | |
52 | * position is specified by "position". If "position" is outside the valid | |
53 | * iteration range, the behavior of this object is undefined. | |
54 | * @param textPtr The UChar array to be iteratd over | |
55 | * @param length The length of the UChar array | |
56 | * @param position The starting position of the iteration | |
57 | * @stable ICU 2.0 | |
58 | */ | |
59 | UCharCharacterIterator(const UChar* textPtr, int32_t length, | |
60 | int32_t position); | |
61 | ||
62 | /** | |
63 | * Create an iterator over the UChar array referred to by "textPtr". | |
64 | * The iteration range is 0 to <code>end-1</code>. | |
65 | * text is only aliased, not adopted (the | |
66 | * destructor will not delete it). | |
67 | * The starting | |
68 | * position is specified by "position". If begin and end do not | |
69 | * form a valid iteration range or "position" is outside the valid | |
70 | * iteration range, the behavior of this object is undefined. | |
71 | * @param textPtr The UChar array to be iterated over | |
72 | * @param length The length of the UChar array | |
73 | * @param textBegin The begin position of the iteration range | |
74 | * @param textEnd The end position of the iteration range | |
75 | * @param position The starting position of the iteration | |
76 | * @stable ICU 2.0 | |
77 | */ | |
78 | UCharCharacterIterator(const UChar* textPtr, int32_t length, | |
79 | int32_t textBegin, | |
80 | int32_t textEnd, | |
81 | int32_t position); | |
82 | ||
83 | /** | |
84 | * Copy constructor. The new iterator iterates over the same range | |
85 | * of the same string as "that", and its initial position is the | |
374ca955 | 86 | * same as "that"'s current position. |
b75a7d8f A |
87 | * @param that The UCharCharacterIterator to be copied |
88 | * @stable ICU 2.0 | |
89 | */ | |
90 | UCharCharacterIterator(const UCharCharacterIterator& that); | |
91 | ||
92 | /** | |
374ca955 | 93 | * Destructor. |
b75a7d8f A |
94 | * @stable ICU 2.0 |
95 | */ | |
374ca955 | 96 | virtual ~UCharCharacterIterator(); |
b75a7d8f A |
97 | |
98 | /** | |
99 | * Assignment operator. *this is altered to iterate over the sane | |
100 | * range of the same string as "that", and refers to the same | |
374ca955 | 101 | * character within that string as "that" does. |
b75a7d8f | 102 | * @param that The object to be copied |
374ca955 | 103 | * @return the newly created object |
b75a7d8f A |
104 | * @stable ICU 2.0 |
105 | */ | |
106 | UCharCharacterIterator& | |
107 | operator=(const UCharCharacterIterator& that); | |
108 | ||
109 | /** | |
110 | * Returns true if the iterators iterate over the same range of the | |
374ca955 | 111 | * same string and are pointing at the same character. |
b75a7d8f A |
112 | * @param that The ForwardCharacterIterator used to be compared for equality |
113 | * @return true if the iterators iterate over the same range of the | |
114 | * same string and are pointing at the same character. | |
115 | * @stable ICU 2.0 | |
116 | */ | |
117 | virtual UBool operator==(const ForwardCharacterIterator& that) const; | |
118 | ||
119 | /** | |
374ca955 | 120 | * Generates a hash code for this iterator. |
b75a7d8f A |
121 | * @return the hash code. |
122 | * @stable ICU 2.0 | |
123 | */ | |
124 | virtual int32_t hashCode(void) const; | |
125 | ||
126 | /** | |
127 | * Returns a new UCharCharacterIterator referring to the same | |
128 | * character in the same range of the same string as this one. The | |
374ca955 | 129 | * caller must delete the new iterator. |
b75a7d8f A |
130 | * @return the CharacterIterator newly created |
131 | * @stable ICU 2.0 | |
132 | */ | |
133 | virtual CharacterIterator* clone(void) const; | |
374ca955 | 134 | |
b75a7d8f A |
135 | /** |
136 | * Sets the iterator to refer to the first code unit in its | |
137 | * iteration range, and returns that code unit. | |
138 | * This can be used to begin an iteration with next(). | |
139 | * @return the first code unit in its iteration range. | |
140 | * @stable ICU 2.0 | |
141 | */ | |
142 | virtual UChar first(void); | |
143 | ||
144 | /** | |
145 | * Sets the iterator to refer to the first code unit in its | |
146 | * iteration range, returns that code unit, and moves the position | |
147 | * to the second code unit. This is an alternative to setToStart() | |
148 | * for forward iteration with nextPostInc(). | |
149 | * @return the first code unit in its iteration range | |
150 | * @stable ICU 2.0 | |
151 | */ | |
152 | virtual UChar firstPostInc(void); | |
153 | ||
154 | /** | |
155 | * Sets the iterator to refer to the first code point in its | |
156 | * iteration range, and returns that code unit, | |
157 | * This can be used to begin an iteration with next32(). | |
158 | * Note that an iteration with next32PostInc(), beginning with, | |
159 | * e.g., setToStart() or firstPostInc(), is more efficient. | |
160 | * @return the first code point in its iteration range | |
161 | * @stable ICU 2.0 | |
162 | */ | |
163 | virtual UChar32 first32(void); | |
164 | ||
165 | /** | |
166 | * Sets the iterator to refer to the first code point in its | |
167 | * iteration range, returns that code point, and moves the position | |
168 | * to the second code point. This is an alternative to setToStart() | |
169 | * for forward iteration with next32PostInc(). | |
170 | * @return the first code point in its iteration range. | |
171 | * @stable ICU 2.0 | |
172 | */ | |
173 | virtual UChar32 first32PostInc(void); | |
174 | ||
175 | /** | |
176 | * Sets the iterator to refer to the last code unit in its | |
177 | * iteration range, and returns that code unit. | |
178 | * This can be used to begin an iteration with previous(). | |
179 | * @return the last code unit in its iteration range. | |
180 | * @stable ICU 2.0 | |
181 | */ | |
182 | virtual UChar last(void); | |
183 | ||
184 | /** | |
185 | * Sets the iterator to refer to the last code point in its | |
186 | * iteration range, and returns that code unit. | |
187 | * This can be used to begin an iteration with previous32(). | |
188 | * @return the last code point in its iteration range. | |
189 | * @stable ICU 2.0 | |
190 | */ | |
191 | virtual UChar32 last32(void); | |
192 | ||
193 | /** | |
194 | * Sets the iterator to refer to the "position"-th code unit | |
195 | * in the text-storage object the iterator refers to, and | |
374ca955 A |
196 | * returns that code unit. |
197 | * @param position the position within the text-storage object | |
b75a7d8f A |
198 | * @return the code unit |
199 | * @stable ICU 2.0 | |
200 | */ | |
201 | virtual UChar setIndex(int32_t position); | |
202 | ||
203 | /** | |
204 | * Sets the iterator to refer to the beginning of the code point | |
205 | * that contains the "position"-th code unit | |
206 | * in the text-storage object the iterator refers to, and | |
207 | * returns that code point. | |
208 | * The current position is adjusted to the beginning of the code point | |
209 | * (its first code unit). | |
374ca955 | 210 | * @param position the position within the text-storage object |
b75a7d8f A |
211 | * @return the code unit |
212 | * @stable ICU 2.0 | |
213 | */ | |
214 | virtual UChar32 setIndex32(int32_t position); | |
215 | ||
216 | /** | |
374ca955 | 217 | * Returns the code unit the iterator currently refers to. |
b75a7d8f A |
218 | * @return the code unit the iterator currently refers to. |
219 | * @stable ICU 2.0 | |
220 | */ | |
221 | virtual UChar current(void) const; | |
222 | ||
223 | /** | |
374ca955 | 224 | * Returns the code point the iterator currently refers to. |
b75a7d8f A |
225 | * @return the code point the iterator currently refers to. |
226 | * @stable ICU 2.0 | |
227 | */ | |
228 | virtual UChar32 current32(void) const; | |
229 | ||
230 | /** | |
231 | * Advances to the next code unit in the iteration range (toward | |
232 | * endIndex()), and returns that code unit. If there are no more | |
374ca955 A |
233 | * code units to return, returns DONE. |
234 | * @return the next code unit in the iteration range. | |
b75a7d8f A |
235 | * @stable ICU 2.0 |
236 | */ | |
237 | virtual UChar next(void); | |
238 | ||
239 | /** | |
240 | * Gets the current code unit for returning and advances to the next code unit | |
241 | * in the iteration range | |
242 | * (toward endIndex()). If there are | |
243 | * no more code units to return, returns DONE. | |
244 | * @return the current code unit. | |
245 | * @stable ICU 2.0 | |
246 | */ | |
247 | virtual UChar nextPostInc(void); | |
374ca955 | 248 | |
b75a7d8f A |
249 | /** |
250 | * Advances to the next code point in the iteration range (toward | |
251 | * endIndex()), and returns that code point. If there are no more | |
374ca955 | 252 | * code points to return, returns DONE. |
b75a7d8f A |
253 | * Note that iteration with "pre-increment" semantics is less |
254 | * efficient than iteration with "post-increment" semantics | |
255 | * that is provided by next32PostInc(). | |
256 | * @return the next code point in the iteration range. | |
257 | * @stable ICU 2.0 | |
258 | */ | |
259 | virtual UChar32 next32(void); | |
260 | ||
261 | /** | |
262 | * Gets the current code point for returning and advances to the next code point | |
263 | * in the iteration range | |
264 | * (toward endIndex()). If there are | |
265 | * no more code points to return, returns DONE. | |
266 | * @return the current point. | |
267 | * @stable ICU 2.0 | |
268 | */ | |
269 | virtual UChar32 next32PostInc(void); | |
374ca955 | 270 | |
b75a7d8f A |
271 | /** |
272 | * Returns FALSE if there are no more code units or code points | |
273 | * at or after the current position in the iteration range. | |
274 | * This is used with nextPostInc() or next32PostInc() in forward | |
275 | * iteration. | |
276 | * @return FALSE if there are no more code units or code points | |
277 | * at or after the current position in the iteration range. | |
278 | * @stable ICU 2.0 | |
279 | */ | |
280 | virtual UBool hasNext(); | |
281 | ||
282 | /** | |
283 | * Advances to the previous code unit in the iteration range (toward | |
284 | * startIndex()), and returns that code unit. If there are no more | |
374ca955 | 285 | * code units to return, returns DONE. |
b75a7d8f A |
286 | * @return the previous code unit in the iteration range. |
287 | * @stable ICU 2.0 | |
288 | */ | |
289 | virtual UChar previous(void); | |
290 | ||
291 | /** | |
292 | * Advances to the previous code point in the iteration range (toward | |
293 | * startIndex()), and returns that code point. If there are no more | |
294 | * code points to return, returns DONE. | |
374ca955 | 295 | * @return the previous code point in the iteration range. |
b75a7d8f A |
296 | * @stable ICU 2.0 |
297 | */ | |
298 | virtual UChar32 previous32(void); | |
299 | ||
300 | /** | |
301 | * Returns FALSE if there are no more code units or code points | |
302 | * before the current position in the iteration range. | |
303 | * This is used with previous() or previous32() in backward | |
304 | * iteration. | |
305 | * @return FALSE if there are no more code units or code points | |
306 | * before the current position in the iteration range. | |
307 | * @stable ICU 2.0 | |
308 | */ | |
309 | virtual UBool hasPrevious(); | |
310 | ||
311 | /** | |
312 | * Moves the current position relative to the start or end of the | |
313 | * iteration range, or relative to the current position itself. | |
314 | * The movement is expressed in numbers of code units forward | |
315 | * or backward by specifying a positive or negative delta. | |
374ca955 | 316 | * @param delta the position relative to origin. A positive delta means forward; |
b75a7d8f | 317 | * a negative delta means backward. |
374ca955 | 318 | * @param origin Origin enumeration {kStart, kCurrent, kEnd} |
b75a7d8f A |
319 | * @return the new position |
320 | * @stable ICU 2.0 | |
321 | */ | |
322 | virtual int32_t move(int32_t delta, EOrigin origin); | |
323 | ||
324 | /** | |
325 | * Moves the current position relative to the start or end of the | |
326 | * iteration range, or relative to the current position itself. | |
327 | * The movement is expressed in numbers of code points forward | |
328 | * or backward by specifying a positive or negative delta. | |
374ca955 | 329 | * @param delta the position relative to origin. A positive delta means forward; |
b75a7d8f | 330 | * a negative delta means backward. |
374ca955 | 331 | * @param origin Origin enumeration {kStart, kCurrent, kEnd} |
b75a7d8f A |
332 | * @return the new position |
333 | * @stable ICU 2.0 | |
334 | */ | |
335 | virtual int32_t move32(int32_t delta, EOrigin origin); | |
336 | ||
337 | /** | |
338 | * Sets the iterator to iterate over a new range of text | |
339 | * @stable ICU 2.0 | |
340 | */ | |
341 | void setText(const UChar* newText, int32_t newTextLength); | |
374ca955 | 342 | |
b75a7d8f A |
343 | /** |
344 | * Copies the UChar array under iteration into the UnicodeString | |
345 | * referred to by "result". Even if this iterator iterates across | |
346 | * only a part of this string, the whole string is copied. | |
374ca955 | 347 | * @param result Receives a copy of the text under iteration. |
b75a7d8f A |
348 | * @stable ICU 2.0 |
349 | */ | |
350 | virtual void getText(UnicodeString& result); | |
351 | ||
352 | /** | |
374ca955 A |
353 | * Return a class ID for this class (not really public) |
354 | * @return a class ID for this class | |
b75a7d8f A |
355 | * @stable ICU 2.0 |
356 | */ | |
374ca955 | 357 | static UClassID U_EXPORT2 getStaticClassID(void); |
b75a7d8f A |
358 | |
359 | /** | |
374ca955 A |
360 | * Return a class ID for this object (not really public) |
361 | * @return a class ID for this object. | |
b75a7d8f A |
362 | * @stable ICU 2.0 |
363 | */ | |
374ca955 | 364 | virtual UClassID getDynamicClassID(void) const; |
b75a7d8f A |
365 | |
366 | protected: | |
367 | /** | |
368 | * Protected constructor | |
369 | * @stable ICU 2.0 | |
370 | */ | |
371 | UCharCharacterIterator(); | |
372 | /** | |
373 | * Protected member text | |
374 | * @stable ICU 2.0 | |
374ca955 | 375 | */ |
b75a7d8f A |
376 | const UChar* text; |
377 | ||
b75a7d8f A |
378 | }; |
379 | ||
b75a7d8f A |
380 | U_NAMESPACE_END |
381 | #endif |