1 // Copyright (C) 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 *******************************************************************************
5 *
6 *   Copyright (C) 2002-2012, International Business Machines
7 *   Corporation and others.  All Rights Reserved.
8 *
9 *******************************************************************************
10 */
11 
12 #ifndef STRENUM_H
13 #define STRENUM_H
14 
15 #include "unicode/uobject.h"
16 #include "unicode/unistr.h"
17 
18 /**
19  * \file
20  * \brief C++ API: String Enumeration
21  */
22 
23 U_NAMESPACE_BEGIN
24 
25 /**
26  * Base class for 'pure' C++ implementations of uenum api.  Adds a
27  * method that returns the next UnicodeString since in C++ this can
28  * be a common storage format for strings.
29  *
30  * <p>The model is that the enumeration is over strings maintained by
31  * a 'service.'  At any point, the service might change, invalidating
32  * the enumerator (though this is expected to be rare).  The iterator
33  * returns an error if this has occurred.  Lack of the error is no
34  * guarantee that the service didn't change immediately after the
35  * call, so the returned string still might not be 'valid' on
36  * subsequent use.</p>
37  *
38  * <p>Strings may take the form of const char*, const UChar*, or const
39  * UnicodeString*.  The type you get is determine by the variant of
40  * 'next' that you call.  In general the StringEnumeration is
41  * optimized for one of these types, but all StringEnumerations can
42  * return all types.  Returned strings are each terminated with a NUL.
43  * Depending on the service data, they might also include embedded NUL
44  * characters, so API is provided to optionally return the true
45  * length, counting the embedded NULs but not counting the terminating
46  * NUL.</p>
47  *
48  * <p>The pointers returned by next, unext, and snext become invalid
49  * upon any subsequent call to the enumeration's destructor, next,
50  * unext, snext, or reset.</p>
51  *
52  * ICU 2.8 adds some default implementations and helper functions
53  * for subclasses.
54  *
55  * @stable ICU 2.4
56  */
57 class U_COMMON_API StringEnumeration : public UObject {
58 public:
59     /**
60      * Destructor.
61      * @stable ICU 2.4
62      */
63     virtual ~StringEnumeration();
64 
65     /**
66      * Clone this object, an instance of a subclass of StringEnumeration.
67      * Clones can be used concurrently in multiple threads.
68      * If a subclass does not implement clone(), or if an error occurs,
69      * then NULL is returned.
70      * The clone functions in all subclasses return a base class pointer
71      * because some compilers do not support covariant (same-as-this)
72      * return types; cast to the appropriate subclass if necessary.
73      * The caller must delete the clone.
74      *
75      * @return a clone of this object
76      *
77      * @see getDynamicClassID
78      * @stable ICU 2.8
79      */
80     virtual StringEnumeration *clone() const;
81 
82     /**
83      * <p>Return the number of elements that the iterator traverses.  If
84      * the iterator is out of sync with its service, status is set to
85      * U_ENUM_OUT_OF_SYNC_ERROR, and the return value is zero.</p>
86      *
87      * <p>The return value will not change except possibly as a result of
88      * a subsequent call to reset, or if the iterator becomes out of sync.</p>
89      *
90      * <p>This is a convenience function. It can end up being very
91      * expensive as all the items might have to be pre-fetched
92      * (depending on the storage format of the data being
93      * traversed).</p>
94      *
95      * @param status the error code.
96      * @return number of elements in the iterator.
97      *
98      * @stable ICU 2.4 */
99     virtual int32_t count(UErrorCode& status) const = 0;
100 
101     /**
102      * <p>Returns the next element as a NUL-terminated char*.  If there
103      * are no more elements, returns NULL.  If the resultLength pointer
104      * is not NULL, the length of the string (not counting the
105      * terminating NUL) is returned at that address.  If an error
106      * status is returned, the value at resultLength is undefined.</p>
107      *
108      * <p>The returned pointer is owned by this iterator and must not be
109      * deleted by the caller.  The pointer is valid until the next call
110      * to next, unext, snext, reset, or the enumerator's destructor.</p>
111      *
112      * <p>If the iterator is out of sync with its service, status is set
113      * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p>
114      *
115      * <p>If the native service string is a UChar* string, it is
116      * converted to char* with the invariant converter.  If the
117      * conversion fails (because a character cannot be converted) then
118      * status is set to U_INVARIANT_CONVERSION_ERROR and the return
119      * value is undefined (though not NULL).</p>
120      *
121      * Starting with ICU 2.8, the default implementation calls snext()
122      * and handles the conversion.
123      * Either next() or snext() must be implemented differently by a subclass.
124      *
125      * @param status the error code.
126      * @param resultLength a pointer to receive the length, can be NULL.
127      * @return a pointer to the string, or NULL.
128      *
129      * @stable ICU 2.4
130      */
131     virtual const char* next(int32_t *resultLength, UErrorCode& status);
132 
133     /**
134      * <p>Returns the next element as a NUL-terminated UChar*.  If there
135      * are no more elements, returns NULL.  If the resultLength pointer
136      * is not NULL, the length of the string (not counting the
137      * terminating NUL) is returned at that address.  If an error
138      * status is returned, the value at resultLength is undefined.</p>
139      *
140      * <p>The returned pointer is owned by this iterator and must not be
141      * deleted by the caller.  The pointer is valid until the next call
142      * to next, unext, snext, reset, or the enumerator's destructor.</p>
143      *
144      * <p>If the iterator is out of sync with its service, status is set
145      * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p>
146      *
147      * Starting with ICU 2.8, the default implementation calls snext()
148      * and handles the conversion.
149      *
150      * @param status the error code.
151      * @param resultLength a ponter to receive the length, can be NULL.
152      * @return a pointer to the string, or NULL.
153      *
154      * @stable ICU 2.4
155      */
156     virtual const UChar* unext(int32_t *resultLength, UErrorCode& status);
157 
158     /**
159      * <p>Returns the next element a UnicodeString*.  If there are no
160      * more elements, returns NULL.</p>
161      *
162      * <p>The returned pointer is owned by this iterator and must not be
163      * deleted by the caller.  The pointer is valid until the next call
164      * to next, unext, snext, reset, or the enumerator's destructor.</p>
165      *
166      * <p>If the iterator is out of sync with its service, status is set
167      * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p>
168      *
169      * Starting with ICU 2.8, the default implementation calls next()
170      * and handles the conversion.
171      * Either next() or snext() must be implemented differently by a subclass.
172      *
173      * @param status the error code.
174      * @return a pointer to the string, or NULL.
175      *
176      * @stable ICU 2.4
177      */
178     virtual const UnicodeString* snext(UErrorCode& status);
179 
180     /**
181      * <p>Resets the iterator.  This re-establishes sync with the
182      * service and rewinds the iterator to start at the first
183      * element.</p>
184      *
185      * <p>Previous pointers returned by next, unext, or snext become
186      * invalid, and the value returned by count might change.</p>
187      *
188      * @param status the error code.
189      *
190      * @stable ICU 2.4
191      */
192     virtual void reset(UErrorCode& status) = 0;
193 
194     /**
195      * Compares this enumeration to other to check if both are equal
196      *
197      * @param that The other string enumeration to compare this object to
198      * @return TRUE if the enumerations are equal. FALSE if not.
199      * @stable ICU 3.6
200      */
201     virtual UBool operator==(const StringEnumeration& that)const;
202     /**
203      * Compares this enumeration to other to check if both are not equal
204      *
205      * @param that The other string enumeration to compare this object to
206      * @return TRUE if the enumerations are equal. FALSE if not.
207      * @stable ICU 3.6
208      */
209     virtual UBool operator!=(const StringEnumeration& that)const;
210 
211 protected:
212     /**
213      * UnicodeString field for use with default implementations and subclasses.
214      * @stable ICU 2.8
215      */
216     UnicodeString unistr;
217     /**
218      * char * default buffer for use with default implementations and subclasses.
219      * @stable ICU 2.8
220      */
221     char charsBuffer[32];
222     /**
223      * char * buffer for use with default implementations and subclasses.
224      * Allocated in constructor and in ensureCharsCapacity().
225      * @stable ICU 2.8
226      */
227     char *chars;
228     /**
229      * Capacity of chars, for use with default implementations and subclasses.
230      * @stable ICU 2.8
231      */
232     int32_t charsCapacity;
233 
234     /**
235      * Default constructor for use with default implementations and subclasses.
236      * @stable ICU 2.8
237      */
238     StringEnumeration();
239 
240     /**
241      * Ensures that chars is at least as large as the requested capacity.
242      * For use with default implementations and subclasses.
243      *
244      * @param capacity Requested capacity.
245      * @param status ICU in/out error code.
246      * @stable ICU 2.8
247      */
248     void ensureCharsCapacity(int32_t capacity, UErrorCode &status);
249 
250     /**
251      * Converts s to Unicode and sets unistr to the result.
252      * For use with default implementations and subclasses,
253      * especially for implementations of snext() in terms of next().
254      * This is provided with a helper function instead of a default implementation
255      * of snext() to avoid potential infinite loops between next() and snext().
256      *
257      * For example:
258      * \code
259      * const UnicodeString* snext(UErrorCode& status) {
260      *   int32_t resultLength=0;
261      *   const char *s=next(&resultLength, status);
262      *   return setChars(s, resultLength, status);
263      * }
264      * \endcode
265      *
266      * @param s String to be converted to Unicode.
267      * @param length Length of the string.
268      * @param status ICU in/out error code.
269      * @return A pointer to unistr.
270      * @stable ICU 2.8
271      */
272     UnicodeString *setChars(const char *s, int32_t length, UErrorCode &status);
273 };
274 
275 U_NAMESPACE_END
276 
277 /* STRENUM_H */
278 #endif
279