1 // Copyright (C) 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 **********************************************************************
5 *   Copyright (C) 1998-2005, International Business Machines
6 *   Corporation and others.  All Rights Reserved.
7 **********************************************************************
8 */
9 
10 #ifndef UCHRITER_H
11 #define UCHRITER_H
12 
13 #include "unicode/utypes.h"
14 #include "unicode/chariter.h"
15 
16 /**
17  * \file
18  * \brief C++ API: UChar Character Iterator
19  */
20 
21 U_NAMESPACE_BEGIN
22 
23 /**
24  * A concrete subclass of CharacterIterator that iterates over the
25  * characters (code units or code points) in a UChar array.
26  * It's possible not only to create an
27  * iterator that iterates over an entire UChar array, but also to
28  * create one that iterates over only a subrange of a UChar array
29  * (iterators over different subranges of the same UChar array don't
30  * compare equal).
31  * @see CharacterIterator
32  * @see ForwardCharacterIterator
33  * @stable ICU 2.0
34  */
35 class U_COMMON_API UCharCharacterIterator : public CharacterIterator {
36 public:
37   /**
38    * Create an iterator over the UChar array referred to by "textPtr".
39    * The iteration range is 0 to <code>length-1</code>.
40    * text is only aliased, not adopted (the
41    * destructor will not delete it).
42    * @param textPtr The UChar array to be iterated over
43    * @param length The length of the UChar array
44    * @stable ICU 2.0
45    */
46   UCharCharacterIterator(const UChar* textPtr, int32_t length);
47 
48   /**
49    * Create an iterator over the UChar array referred to by "textPtr".
50    * The iteration range is 0 to <code>length-1</code>.
51    * text is only aliased, not adopted (the
52    * destructor will not delete it).
53    * The starting
54    * position is specified by "position". If "position" is outside the valid
55    * iteration range, the behavior of this object is undefined.
56    * @param textPtr The UChar array to be iteratd over
57    * @param length The length of the UChar array
58    * @param position The starting position of the iteration
59    * @stable ICU 2.0
60    */
61   UCharCharacterIterator(const UChar* textPtr, int32_t length,
62                          int32_t position);
63 
64   /**
65    * Create an iterator over the UChar array referred to by "textPtr".
66    * The iteration range is 0 to <code>end-1</code>.
67    * text is only aliased, not adopted (the
68    * destructor will not delete it).
69    * The starting
70    * position is specified by "position". If begin and end do not
71    * form a valid iteration range or "position" is outside the valid
72    * iteration range, the behavior of this object is undefined.
73    * @param textPtr The UChar array to be iterated over
74    * @param length The length of the UChar array
75    * @param textBegin  The begin position of the iteration range
76    * @param textEnd    The end position of the iteration range
77    * @param position    The starting position of the iteration
78    * @stable ICU 2.0
79    */
80   UCharCharacterIterator(const UChar* textPtr, int32_t length,
81                          int32_t textBegin,
82                          int32_t textEnd,
83                          int32_t position);
84 
85   /**
86    * Copy constructor.  The new iterator iterates over the same range
87    * of the same string as "that", and its initial position is the
88    * same as "that"'s current position.
89    * @param that The UCharCharacterIterator to be copied
90    * @stable ICU 2.0
91    */
92   UCharCharacterIterator(const UCharCharacterIterator&  that);
93 
94   /**
95    * Destructor.
96    * @stable ICU 2.0
97    */
98   virtual ~UCharCharacterIterator();
99 
100   /**
101    * Assignment operator.  *this is altered to iterate over the sane
102    * range of the same string as "that", and refers to the same
103    * character within that string as "that" does.
104    * @param that The object to be copied
105    * @return the newly created object
106    * @stable ICU 2.0
107    */
108   UCharCharacterIterator&
109   operator=(const UCharCharacterIterator&    that);
110 
111   /**
112    * Returns true if the iterators iterate over the same range of the
113    * same string and are pointing at the same character.
114    * @param that The ForwardCharacterIterator used to be compared for equality
115    * @return true if the iterators iterate over the same range of the
116    * same string and are pointing at the same character.
117    * @stable ICU 2.0
118    */
119   virtual UBool          operator==(const ForwardCharacterIterator& that) const;
120 
121   /**
122    * Generates a hash code for this iterator.
123    * @return the hash code.
124    * @stable ICU 2.0
125    */
126   virtual int32_t         hashCode(void) const;
127 
128   /**
129    * Returns a new UCharCharacterIterator referring to the same
130    * character in the same range of the same string as this one.  The
131    * caller must delete the new iterator.
132    * @return the CharacterIterator newly created
133    * @stable ICU 2.0
134    */
135   virtual CharacterIterator* clone(void) const;
136 
137   /**
138    * Sets the iterator to refer to the first code unit in its
139    * iteration range, and returns that code unit.
140    * This can be used to begin an iteration with next().
141    * @return the first code unit in its iteration range.
142    * @stable ICU 2.0
143    */
144   virtual UChar         first(void);
145 
146   /**
147    * Sets the iterator to refer to the first code unit in its
148    * iteration range, returns that code unit, and moves the position
149    * to the second code unit. This is an alternative to setToStart()
150    * for forward iteration with nextPostInc().
151    * @return the first code unit in its iteration range
152    * @stable ICU 2.0
153    */
154   virtual UChar         firstPostInc(void);
155 
156   /**
157    * Sets the iterator to refer to the first code point in its
158    * iteration range, and returns that code unit,
159    * This can be used to begin an iteration with next32().
160    * Note that an iteration with next32PostInc(), beginning with,
161    * e.g., setToStart() or firstPostInc(), is more efficient.
162    * @return the first code point in its iteration range
163    * @stable ICU 2.0
164    */
165   virtual UChar32       first32(void);
166 
167   /**
168    * Sets the iterator to refer to the first code point in its
169    * iteration range, returns that code point, and moves the position
170    * to the second code point. This is an alternative to setToStart()
171    * for forward iteration with next32PostInc().
172    * @return the first code point in its iteration range.
173    * @stable ICU 2.0
174    */
175   virtual UChar32       first32PostInc(void);
176 
177   /**
178    * Sets the iterator to refer to the last code unit in its
179    * iteration range, and returns that code unit.
180    * This can be used to begin an iteration with previous().
181    * @return the last code unit in its iteration range.
182    * @stable ICU 2.0
183    */
184   virtual UChar         last(void);
185 
186   /**
187    * Sets the iterator to refer to the last code point in its
188    * iteration range, and returns that code unit.
189    * This can be used to begin an iteration with previous32().
190    * @return the last code point in its iteration range.
191    * @stable ICU 2.0
192    */
193   virtual UChar32       last32(void);
194 
195   /**
196    * Sets the iterator to refer to the "position"-th code unit
197    * in the text-storage object the iterator refers to, and
198    * returns that code unit.
199    * @param position the position within the text-storage object
200    * @return the code unit
201    * @stable ICU 2.0
202    */
203   virtual UChar         setIndex(int32_t position);
204 
205   /**
206    * Sets the iterator to refer to the beginning of the code point
207    * that contains the "position"-th code unit
208    * in the text-storage object the iterator refers to, and
209    * returns that code point.
210    * The current position is adjusted to the beginning of the code point
211    * (its first code unit).
212    * @param position the position within the text-storage object
213    * @return the code unit
214    * @stable ICU 2.0
215    */
216   virtual UChar32       setIndex32(int32_t position);
217 
218   /**
219    * Returns the code unit the iterator currently refers to.
220    * @return the code unit the iterator currently refers to.
221    * @stable ICU 2.0
222    */
223   virtual UChar         current(void) const;
224 
225   /**
226    * Returns the code point the iterator currently refers to.
227    * @return the code point the iterator currently refers to.
228    * @stable ICU 2.0
229    */
230   virtual UChar32       current32(void) const;
231 
232   /**
233    * Advances to the next code unit in the iteration range (toward
234    * endIndex()), and returns that code unit.  If there are no more
235    * code units to return, returns DONE.
236    * @return the next code unit in the iteration range.
237    * @stable ICU 2.0
238    */
239   virtual UChar         next(void);
240 
241   /**
242    * Gets the current code unit for returning and advances to the next code unit
243    * in the iteration range
244    * (toward endIndex()).  If there are
245    * no more code units to return, returns DONE.
246    * @return the current code unit.
247    * @stable ICU 2.0
248    */
249   virtual UChar         nextPostInc(void);
250 
251   /**
252    * Advances to the next code point in the iteration range (toward
253    * endIndex()), and returns that code point.  If there are no more
254    * code points to return, returns DONE.
255    * Note that iteration with "pre-increment" semantics is less
256    * efficient than iteration with "post-increment" semantics
257    * that is provided by next32PostInc().
258    * @return the next code point in the iteration range.
259    * @stable ICU 2.0
260    */
261   virtual UChar32       next32(void);
262 
263   /**
264    * Gets the current code point for returning and advances to the next code point
265    * in the iteration range
266    * (toward endIndex()).  If there are
267    * no more code points to return, returns DONE.
268    * @return the current point.
269    * @stable ICU 2.0
270    */
271   virtual UChar32       next32PostInc(void);
272 
273   /**
274    * Returns FALSE if there are no more code units or code points
275    * at or after the current position in the iteration range.
276    * This is used with nextPostInc() or next32PostInc() in forward
277    * iteration.
278    * @return FALSE if there are no more code units or code points
279    * at or after the current position in the iteration range.
280    * @stable ICU 2.0
281    */
282   virtual UBool        hasNext();
283 
284   /**
285    * Advances to the previous code unit in the iteration range (toward
286    * startIndex()), and returns that code unit.  If there are no more
287    * code units to return, returns DONE.
288    * @return the previous code unit in the iteration range.
289    * @stable ICU 2.0
290    */
291   virtual UChar         previous(void);
292 
293   /**
294    * Advances to the previous code point in the iteration range (toward
295    * startIndex()), and returns that code point.  If there are no more
296    * code points to return, returns DONE.
297    * @return the previous code point in the iteration range.
298    * @stable ICU 2.0
299    */
300   virtual UChar32       previous32(void);
301 
302   /**
303    * Returns FALSE if there are no more code units or code points
304    * before the current position in the iteration range.
305    * This is used with previous() or previous32() in backward
306    * iteration.
307    * @return FALSE if there are no more code units or code points
308    * before the current position in the iteration range.
309    * @stable ICU 2.0
310    */
311   virtual UBool        hasPrevious();
312 
313   /**
314    * Moves the current position relative to the start or end of the
315    * iteration range, or relative to the current position itself.
316    * The movement is expressed in numbers of code units forward
317    * or backward by specifying a positive or negative delta.
318    * @param delta the position relative to origin. A positive delta means forward;
319    * a negative delta means backward.
320    * @param origin Origin enumeration {kStart, kCurrent, kEnd}
321    * @return the new position
322    * @stable ICU 2.0
323    */
324   virtual int32_t      move(int32_t delta, EOrigin origin);
325 
326   /**
327    * Moves the current position relative to the start or end of the
328    * iteration range, or relative to the current position itself.
329    * The movement is expressed in numbers of code points forward
330    * or backward by specifying a positive or negative delta.
331    * @param delta the position relative to origin. A positive delta means forward;
332    * a negative delta means backward.
333    * @param origin Origin enumeration {kStart, kCurrent, kEnd}
334    * @return the new position
335    * @stable ICU 2.0
336    */
337   virtual int32_t      move32(int32_t delta, EOrigin origin);
338 
339   /**
340    * Sets the iterator to iterate over a new range of text
341    * @stable ICU 2.0
342    */
343   void setText(const UChar* newText, int32_t newTextLength);
344 
345   /**
346    * Copies the UChar array under iteration into the UnicodeString
347    * referred to by "result".  Even if this iterator iterates across
348    * only a part of this string, the whole string is copied.
349    * @param result Receives a copy of the text under iteration.
350    * @stable ICU 2.0
351    */
352   virtual void            getText(UnicodeString& result);
353 
354   /**
355    * Return a class ID for this class (not really public)
356    * @return a class ID for this class
357    * @stable ICU 2.0
358    */
359   static UClassID         U_EXPORT2 getStaticClassID(void);
360 
361   /**
362    * Return a class ID for this object (not really public)
363    * @return a class ID for this object.
364    * @stable ICU 2.0
365    */
366   virtual UClassID        getDynamicClassID(void) const;
367 
368 protected:
369   /**
370    * Protected constructor
371    * @stable ICU 2.0
372    */
373   UCharCharacterIterator();
374   /**
375    * Protected member text
376    * @stable ICU 2.0
377    */
378   const UChar*            text;
379 
380 };
381 
382 U_NAMESPACE_END
383 #endif
384