]>
Commit | Line | Data |
---|---|---|
f3c0d7a5 A |
1 | // © 2016 and later: Unicode, Inc. and others. |
2 | // License & terms of use: http://www.unicode.org/copyright.html | |
b75a7d8f A |
3 | /* |
4 | ********************************************************************** | |
73c04bcf | 5 | * Copyright (C) 1998-2005, International Business Machines |
b75a7d8f A |
6 | * Corporation and others. All Rights Reserved. |
7 | ********************************************************************** | |
8 | */ | |
9 | ||
10 | #ifndef UCHRITER_H | |
11 | #define UCHRITER_H | |
12 | ||
13 | #include "unicode/utypes.h" | |
14 | #include "unicode/chariter.h" | |
15 | ||
73c04bcf A |
16 | /** |
17 | * \file | |
f3c0d7a5 | 18 | * \brief C++ API: char16_t Character Iterator |
73c04bcf A |
19 | */ |
20 | ||
f3c0d7a5 | 21 | #if U_SHOW_CPLUSPLUS_API |
b75a7d8f A |
22 | U_NAMESPACE_BEGIN |
23 | ||
24 | /** | |
25 | * A concrete subclass of CharacterIterator that iterates over the | |
f3c0d7a5 | 26 | * characters (code units or code points) in a char16_t array. |
b75a7d8f | 27 | * It's possible not only to create an |
f3c0d7a5 A |
28 | * iterator that iterates over an entire char16_t array, but also to |
29 | * create one that iterates over only a subrange of a char16_t array | |
30 | * (iterators over different subranges of the same char16_t array don't | |
b75a7d8f A |
31 | * compare equal). |
32 | * @see CharacterIterator | |
33 | * @see ForwardCharacterIterator | |
34 | * @stable ICU 2.0 | |
35 | */ | |
36 | class U_COMMON_API UCharCharacterIterator : public CharacterIterator { | |
37 | public: | |
38 | /** | |
f3c0d7a5 | 39 | * Create an iterator over the char16_t array referred to by "textPtr". |
b75a7d8f A |
40 | * The iteration range is 0 to <code>length-1</code>. |
41 | * text is only aliased, not adopted (the | |
42 | * destructor will not delete it). | |
f3c0d7a5 A |
43 | * @param textPtr The char16_t array to be iterated over |
44 | * @param length The length of the char16_t array | |
b75a7d8f A |
45 | * @stable ICU 2.0 |
46 | */ | |
f3c0d7a5 | 47 | UCharCharacterIterator(ConstChar16Ptr textPtr, int32_t length); |
b75a7d8f A |
48 | |
49 | /** | |
f3c0d7a5 | 50 | * Create an iterator over the char16_t array referred to by "textPtr". |
b75a7d8f A |
51 | * The iteration range is 0 to <code>length-1</code>. |
52 | * text is only aliased, not adopted (the | |
53 | * destructor will not delete it). | |
54 | * The starting | |
55 | * position is specified by "position". If "position" is outside the valid | |
56 | * iteration range, the behavior of this object is undefined. | |
f3c0d7a5 A |
57 | * @param textPtr The char16_t array to be iterated over |
58 | * @param length The length of the char16_t array | |
b75a7d8f A |
59 | * @param position The starting position of the iteration |
60 | * @stable ICU 2.0 | |
61 | */ | |
f3c0d7a5 | 62 | UCharCharacterIterator(ConstChar16Ptr textPtr, int32_t length, |
b75a7d8f A |
63 | int32_t position); |
64 | ||
65 | /** | |
f3c0d7a5 | 66 | * Create an iterator over the char16_t array referred to by "textPtr". |
b75a7d8f A |
67 | * The iteration range is <code>textBegin</code> to <code>textEnd-1</code>. |
68 | * text is only aliased, not adopted (the | |
69 | * destructor will not delete it). | |
70 | * The starting | |
71 | * position is specified by "position". If begin and end do not | |
72 | * form a valid iteration range or "position" is outside the valid | |
73 | * iteration range, the behavior of this object is undefined. | |
f3c0d7a5 A |
74 | * @param textPtr The char16_t array to be iterated over |
75 | * @param length The length of the char16_t array | |
b75a7d8f A |
76 | * @param textBegin The begin position of the iteration range |
77 | * @param textEnd The end position of the iteration range | |
78 | * @param position The starting position of the iteration | |
79 | * @stable ICU 2.0 | |
80 | */ | |
f3c0d7a5 | 81 | UCharCharacterIterator(ConstChar16Ptr textPtr, int32_t length, |
b75a7d8f A |
82 | int32_t textBegin, |
83 | int32_t textEnd, | |
84 | int32_t position); | |
85 | ||
86 | /** | |
87 | * Copy constructor. The new iterator iterates over the same range | |
88 | * of the same string as "that", and its initial position is the | |
374ca955 | 89 | * same as "that"'s current position. |
b75a7d8f A |
90 | * @param that The UCharCharacterIterator to be copied |
91 | * @stable ICU 2.0 | |
92 | */ | |
93 | UCharCharacterIterator(const UCharCharacterIterator& that); | |
94 | ||
95 | /** | |
374ca955 | 96 | * Destructor. |
b75a7d8f A |
97 | * @stable ICU 2.0 |
98 | */ | |
374ca955 | 99 | virtual ~UCharCharacterIterator(); |
b75a7d8f A |
100 | |
101 | /** | |
102 | * Assignment operator. *this is altered to iterate over the same |
103 | * range of the same string as "that", and refers to the same | |
374ca955 | 104 | * character within that string as "that" does. |
b75a7d8f | 105 | * @param that The object to be copied |
374ca955 | 106 | * @return a reference to this iterator (*this) |
b75a7d8f A |
107 | * @stable ICU 2.0 |
108 | */ | |
109 | UCharCharacterIterator& | |
110 | operator=(const UCharCharacterIterator& that); | |
111 | ||
112 | /** | |
113 | * Returns true if the iterators iterate over the same range of the | |
374ca955 | 114 | * same string and are pointing at the same character. |
b75a7d8f A |
115 | * @param that The ForwardCharacterIterator to be compared for equality |
116 | * @return true if the iterators iterate over the same range of the | |
117 | * same string and are pointing at the same character. | |
118 | * @stable ICU 2.0 | |
119 | */ | |
120 | virtual UBool operator==(const ForwardCharacterIterator& that) const; | |
121 | ||
122 | /** | |
374ca955 | 123 | * Generates a hash code for this iterator. |
b75a7d8f A |
124 | * @return the hash code. |
125 | * @stable ICU 2.0 | |
126 | */ | |
127 | virtual int32_t hashCode(void) const; | |
128 | ||
129 | /** | |
130 | * Returns a new UCharCharacterIterator referring to the same | |
131 | * character in the same range of the same string as this one. The | |
374ca955 | 132 | * caller must delete the new iterator. |
b75a7d8f A |
133 | * @return the CharacterIterator newly created |
134 | * @stable ICU 2.0 | |
135 | */ | |
136 | virtual CharacterIterator* clone(void) const; | |
374ca955 | 137 | |
b75a7d8f A |
138 | /** |
139 | * Sets the iterator to refer to the first code unit in its | |
140 | * iteration range, and returns that code unit. | |
141 | * This can be used to begin an iteration with next(). | |
142 | * @return the first code unit in its iteration range. | |
143 | * @stable ICU 2.0 | |
144 | */ | |
f3c0d7a5 | 145 | virtual char16_t first(void); |
b75a7d8f A |
146 | |
147 | /** | |
148 | * Sets the iterator to refer to the first code unit in its | |
149 | * iteration range, returns that code unit, and moves the position | |
150 | * to the second code unit. This is an alternative to setToStart() | |
151 | * for forward iteration with nextPostInc(). | |
152 | * @return the first code unit in its iteration range | |
153 | * @stable ICU 2.0 | |
154 | */ | |
f3c0d7a5 | 155 | virtual char16_t firstPostInc(void); |
b75a7d8f A |
156 | |
157 | /** | |
158 | * Sets the iterator to refer to the first code point in its | |
159 | * iteration range, and returns that code point. |
160 | * This can be used to begin an iteration with next32(). | |
161 | * Note that an iteration with next32PostInc(), beginning with, | |
162 | * e.g., setToStart() or firstPostInc(), is more efficient. | |
163 | * @return the first code point in its iteration range | |
164 | * @stable ICU 2.0 | |
165 | */ | |
166 | virtual UChar32 first32(void); | |
167 | ||
168 | /** | |
169 | * Sets the iterator to refer to the first code point in its | |
170 | * iteration range, returns that code point, and moves the position | |
171 | * to the second code point. This is an alternative to setToStart() | |
172 | * for forward iteration with next32PostInc(). | |
173 | * @return the first code point in its iteration range. | |
174 | * @stable ICU 2.0 | |
175 | */ | |
176 | virtual UChar32 first32PostInc(void); | |
177 | ||
178 | /** | |
179 | * Sets the iterator to refer to the last code unit in its | |
180 | * iteration range, and returns that code unit. | |
181 | * This can be used to begin an iteration with previous(). | |
182 | * @return the last code unit in its iteration range. | |
183 | * @stable ICU 2.0 | |
184 | */ | |
f3c0d7a5 | 185 | virtual char16_t last(void); |
b75a7d8f A |
186 | |
187 | /** | |
188 | * Sets the iterator to refer to the last code point in its | |
189 | * iteration range, and returns that code point. |
190 | * This can be used to begin an iteration with previous32(). | |
191 | * @return the last code point in its iteration range. | |
192 | * @stable ICU 2.0 | |
193 | */ | |
194 | virtual UChar32 last32(void); | |
195 | ||
196 | /** | |
197 | * Sets the iterator to refer to the "position"-th code unit | |
198 | * in the text-storage object the iterator refers to, and | |
374ca955 A |
199 | * returns that code unit. |
200 | * @param position the position within the text-storage object | |
b75a7d8f A |
201 | * @return the code unit |
202 | * @stable ICU 2.0 | |
203 | */ | |
f3c0d7a5 | 204 | virtual char16_t setIndex(int32_t position); |
b75a7d8f A |
205 | |
206 | /** | |
207 | * Sets the iterator to refer to the beginning of the code point | |
208 | * that contains the "position"-th code unit | |
209 | * in the text-storage object the iterator refers to, and | |
210 | * returns that code point. | |
211 | * The current position is adjusted to the beginning of the code point | |
212 | * (its first code unit). | |
374ca955 | 213 | * @param position the position within the text-storage object |
b75a7d8f A |
214 | * @return the code point |
215 | * @stable ICU 2.0 | |
216 | */ | |
217 | virtual UChar32 setIndex32(int32_t position); | |
218 | ||
219 | /** | |
374ca955 | 220 | * Returns the code unit the iterator currently refers to. |
b75a7d8f A |
221 | * @return the code unit the iterator currently refers to. |
222 | * @stable ICU 2.0 | |
223 | */ | |
f3c0d7a5 | 224 | virtual char16_t current(void) const; |
b75a7d8f A |
225 | |
226 | /** | |
374ca955 | 227 | * Returns the code point the iterator currently refers to. |
b75a7d8f A |
228 | * @return the code point the iterator currently refers to. |
229 | * @stable ICU 2.0 | |
230 | */ | |
231 | virtual UChar32 current32(void) const; | |
232 | ||
233 | /** | |
234 | * Advances to the next code unit in the iteration range (toward | |
235 | * endIndex()), and returns that code unit. If there are no more | |
374ca955 A |
236 | * code units to return, returns DONE. |
237 | * @return the next code unit in the iteration range. | |
b75a7d8f A |
238 | * @stable ICU 2.0 |
239 | */ | |
f3c0d7a5 | 240 | virtual char16_t next(void); |
b75a7d8f A |
241 | |
242 | /** | |
243 | * Gets the current code unit for returning and advances to the next code unit | |
244 | * in the iteration range | |
245 | * (toward endIndex()). If there are | |
246 | * no more code units to return, returns DONE. | |
247 | * @return the current code unit. | |
248 | * @stable ICU 2.0 | |
249 | */ | |
f3c0d7a5 | 250 | virtual char16_t nextPostInc(void); |
374ca955 | 251 | |
b75a7d8f A |
252 | /** |
253 | * Advances to the next code point in the iteration range (toward | |
254 | * endIndex()), and returns that code point. If there are no more | |
374ca955 | 255 | * code points to return, returns DONE. |
b75a7d8f A |
256 | * Note that iteration with "pre-increment" semantics is less |
257 | * efficient than iteration with "post-increment" semantics | |
258 | * that is provided by next32PostInc(). | |
259 | * @return the next code point in the iteration range. | |
260 | * @stable ICU 2.0 | |
261 | */ | |
262 | virtual UChar32 next32(void); | |
263 | ||
264 | /** | |
265 | * Gets the current code point for returning and advances to the next code point | |
266 | * in the iteration range | |
267 | * (toward endIndex()). If there are | |
268 | * no more code points to return, returns DONE. | |
269 | * @return the current code point. |
270 | * @stable ICU 2.0 | |
271 | */ | |
272 | virtual UChar32 next32PostInc(void); | |
374ca955 | 273 | |
b75a7d8f A |
274 | /** |
275 | * Returns FALSE if there are no more code units or code points | |
276 | * at or after the current position in the iteration range. | |
277 | * This is used with nextPostInc() or next32PostInc() in forward | |
278 | * iteration. | |
279 | * @return FALSE if there are no more code units or code points | |
280 | * at or after the current position in the iteration range. | |
281 | * @stable ICU 2.0 | |
282 | */ | |
283 | virtual UBool hasNext(); | |
284 | ||
285 | /** | |
286 | * Advances to the previous code unit in the iteration range (toward | |
287 | * startIndex()), and returns that code unit. If there are no more | |
374ca955 | 288 | * code units to return, returns DONE. |
b75a7d8f A |
289 | * @return the previous code unit in the iteration range. |
290 | * @stable ICU 2.0 | |
291 | */ | |
f3c0d7a5 | 292 | virtual char16_t previous(void); |
b75a7d8f A |
293 | |
294 | /** | |
295 | * Advances to the previous code point in the iteration range (toward | |
296 | * startIndex()), and returns that code point. If there are no more | |
297 | * code points to return, returns DONE. | |
374ca955 | 298 | * @return the previous code point in the iteration range. |
b75a7d8f A |
299 | * @stable ICU 2.0 |
300 | */ | |
301 | virtual UChar32 previous32(void); | |
302 | ||
303 | /** | |
304 | * Returns FALSE if there are no more code units or code points | |
305 | * before the current position in the iteration range. | |
306 | * This is used with previous() or previous32() in backward | |
307 | * iteration. | |
308 | * @return FALSE if there are no more code units or code points | |
309 | * before the current position in the iteration range. | |
310 | * @stable ICU 2.0 | |
311 | */ | |
312 | virtual UBool hasPrevious(); | |
313 | ||
314 | /** | |
315 | * Moves the current position relative to the start or end of the | |
316 | * iteration range, or relative to the current position itself. | |
317 | * The movement is expressed in numbers of code units forward | |
318 | * or backward by specifying a positive or negative delta. | |
374ca955 | 319 | * @param delta the position relative to origin. A positive delta means forward; |
b75a7d8f | 320 | * a negative delta means backward. |
374ca955 | 321 | * @param origin Origin enumeration {kStart, kCurrent, kEnd} |
b75a7d8f A |
322 | * @return the new position |
323 | * @stable ICU 2.0 | |
324 | */ | |
325 | virtual int32_t move(int32_t delta, EOrigin origin); | |
326 | ||
327 | /** | |
328 | * Moves the current position relative to the start or end of the | |
329 | * iteration range, or relative to the current position itself. | |
330 | * The movement is expressed in numbers of code points forward | |
331 | * or backward by specifying a positive or negative delta. | |
374ca955 | 332 | * @param delta the position relative to origin. A positive delta means forward; |
b75a7d8f | 333 | * a negative delta means backward. |
374ca955 | 334 | * @param origin Origin enumeration {kStart, kCurrent, kEnd} |
b75a7d8f A |
335 | * @return the new position |
336 | * @stable ICU 2.0 | |
337 | */ | |
f3c0d7a5 A |
338 | #ifdef move32 |
339 | // One of the system headers right now is sometimes defining a conflicting macro we don't use | |
340 | #undef move32 | |
341 | #endif | |
b75a7d8f A |
342 | virtual int32_t move32(int32_t delta, EOrigin origin); |
343 | ||
344 | /** | |
345 | * Sets the iterator to iterate over a new range of text | |
346 | * @stable ICU 2.0 | |
347 | */ | |
f3c0d7a5 | 348 | void setText(ConstChar16Ptr newText, int32_t newTextLength); |
374ca955 | 349 | |
b75a7d8f | 350 | /** |
f3c0d7a5 | 351 | * Copies the char16_t array under iteration into the UnicodeString |
b75a7d8f A |
352 | * referred to by "result". Even if this iterator iterates across |
353 | * only a part of this string, the whole string is copied. | |
374ca955 | 354 | * @param result Receives a copy of the text under iteration. |
b75a7d8f A |
355 | * @stable ICU 2.0 |
356 | */ | |
357 | virtual void getText(UnicodeString& result); | |
358 | ||
359 | /** | |
374ca955 A |
360 | * Return a class ID for this class (not really public) |
361 | * @return a class ID for this class | |
b75a7d8f A |
362 | * @stable ICU 2.0 |
363 | */ | |
374ca955 | 364 | static UClassID U_EXPORT2 getStaticClassID(void); |
b75a7d8f A |
365 | |
366 | /** | |
374ca955 A |
367 | * Return a class ID for this object (not really public) |
368 | * @return a class ID for this object. | |
b75a7d8f A |
369 | * @stable ICU 2.0 |
370 | */ | |
374ca955 | 371 | virtual UClassID getDynamicClassID(void) const; |
b75a7d8f A |
372 | |
373 | protected: | |
374 | /** | |
375 | * Protected constructor | |
376 | * @stable ICU 2.0 | |
377 | */ | |
378 | UCharCharacterIterator(); | |
379 | /** | |
380 | * Protected member text | |
381 | * @stable ICU 2.0 | |
374ca955 | 382 | */ |
f3c0d7a5 | 383 | const char16_t* text; |
b75a7d8f | 384 | |
b75a7d8f A |
385 | }; |
386 | ||
b75a7d8f | 387 | U_NAMESPACE_END |
f3c0d7a5 A |
388 | #endif // U_SHOW_CPLUSPLUS_API |
389 | ||
b75a7d8f | 390 | #endif |