• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 *******************************************************************************
5 *
6 *   Copyright (C) 2002-2012, International Business Machines
7 *   Corporation and others.  All Rights Reserved.
8 *
9 *******************************************************************************
10 */
11 
12 #ifndef STRENUM_H
13 #define STRENUM_H
14 
15 #include "unicode/utypes.h"
16 
17 #if U_SHOW_CPLUSPLUS_API
18 
19 #include "unicode/uobject.h"
20 #include "unicode/unistr.h"
21 
22 /**
23  * \file
24  * \brief C++ API: String Enumeration
25  */
26 
27 U_NAMESPACE_BEGIN
28 
29 /**
30  * Base class for 'pure' C++ implementations of uenum api.  Adds a
31  * method that returns the next UnicodeString since in C++ this can
32  * be a common storage format for strings.
33  *
34  * <p>The model is that the enumeration is over strings maintained by
35  * a 'service.'  At any point, the service might change, invalidating
36  * the enumerator (though this is expected to be rare).  The iterator
37  * returns an error if this has occurred.  Lack of the error is no
38  * guarantee that the service didn't change immediately after the
39  * call, so the returned string still might not be 'valid' on
40  * subsequent use.</p>
41  *
42  * <p>Strings may take the form of const char*, const char16_t*, or const
43  * UnicodeString*.  The type you get is determine by the variant of
44  * 'next' that you call.  In general the StringEnumeration is
45  * optimized for one of these types, but all StringEnumerations can
46  * return all types.  Returned strings are each terminated with a NUL.
47  * Depending on the service data, they might also include embedded NUL
48  * characters, so API is provided to optionally return the true
49  * length, counting the embedded NULs but not counting the terminating
50  * NUL.</p>
51  *
52  * <p>The pointers returned by next, unext, and snext become invalid
53  * upon any subsequent call to the enumeration's destructor, next,
54  * unext, snext, or reset.</p>
55  *
56  * ICU 2.8 adds some default implementations and helper functions
57  * for subclasses.
58  *
59  * @stable ICU 2.4
60  */
61 class U_COMMON_API StringEnumeration : public UObject {
62 public:
63     /**
64      * Destructor.
65      * @stable ICU 2.4
66      */
67     virtual ~StringEnumeration();
68 
69     /**
70      * Clone this object, an instance of a subclass of StringEnumeration.
71      * Clones can be used concurrently in multiple threads.
72      * If a subclass does not implement clone(), or if an error occurs,
73      * then NULL is returned.
74      * The caller must delete the clone.
75      *
76      * @return a clone of this object
77      *
78      * @see getDynamicClassID
79      * @stable ICU 2.8
80      */
81     virtual StringEnumeration *clone() const;
82 
83     /**
84      * <p>Return the number of elements that the iterator traverses.  If
85      * the iterator is out of sync with its service, status is set to
86      * U_ENUM_OUT_OF_SYNC_ERROR, and the return value is zero.</p>
87      *
88      * <p>The return value will not change except possibly as a result of
89      * a subsequent call to reset, or if the iterator becomes out of sync.</p>
90      *
91      * <p>This is a convenience function. It can end up being very
92      * expensive as all the items might have to be pre-fetched
93      * (depending on the storage format of the data being
94      * traversed).</p>
95      *
96      * @param status the error code.
97      * @return number of elements in the iterator.
98      *
99      * @stable ICU 2.4 */
100     virtual int32_t count(UErrorCode& status) const = 0;
101 
102     /**
103      * <p>Returns the next element as a NUL-terminated char*.  If there
104      * are no more elements, returns NULL.  If the resultLength pointer
105      * is not NULL, the length of the string (not counting the
106      * terminating NUL) is returned at that address.  If an error
107      * status is returned, the value at resultLength is undefined.</p>
108      *
109      * <p>The returned pointer is owned by this iterator and must not be
110      * deleted by the caller.  The pointer is valid until the next call
111      * to next, unext, snext, reset, or the enumerator's destructor.</p>
112      *
113      * <p>If the iterator is out of sync with its service, status is set
114      * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p>
115      *
116      * <p>If the native service string is a char16_t* string, it is
117      * converted to char* with the invariant converter.  If the
118      * conversion fails (because a character cannot be converted) then
119      * status is set to U_INVARIANT_CONVERSION_ERROR and the return
120      * value is undefined (though not NULL).</p>
121      *
122      * Starting with ICU 2.8, the default implementation calls snext()
123      * and handles the conversion.
124      * Either next() or snext() must be implemented differently by a subclass.
125      *
126      * @param status the error code.
127      * @param resultLength a pointer to receive the length, can be NULL.
128      * @return a pointer to the string, or NULL.
129      *
130      * @stable ICU 2.4
131      */
132     virtual const char* next(int32_t *resultLength, UErrorCode& status);
133 
134     /**
135      * <p>Returns the next element as a NUL-terminated char16_t*.  If there
136      * are no more elements, returns NULL.  If the resultLength pointer
137      * is not NULL, the length of the string (not counting the
138      * terminating NUL) is returned at that address.  If an error
139      * status is returned, the value at resultLength is undefined.</p>
140      *
141      * <p>The returned pointer is owned by this iterator and must not be
142      * deleted by the caller.  The pointer is valid until the next call
143      * to next, unext, snext, reset, or the enumerator's destructor.</p>
144      *
145      * <p>If the iterator is out of sync with its service, status is set
146      * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p>
147      *
148      * Starting with ICU 2.8, the default implementation calls snext()
149      * and handles the conversion.
150      *
151      * @param status the error code.
152      * @param resultLength a ponter to receive the length, can be NULL.
153      * @return a pointer to the string, or NULL.
154      *
155      * @stable ICU 2.4
156      */
157     virtual const char16_t* unext(int32_t *resultLength, UErrorCode& status);
158 
159     /**
160      * <p>Returns the next element a UnicodeString*.  If there are no
161      * more elements, returns NULL.</p>
162      *
163      * <p>The returned pointer is owned by this iterator and must not be
164      * deleted by the caller.  The pointer is valid until the next call
165      * to next, unext, snext, reset, or the enumerator's destructor.</p>
166      *
167      * <p>If the iterator is out of sync with its service, status is set
168      * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p>
169      *
170      * Starting with ICU 2.8, the default implementation calls next()
171      * and handles the conversion.
172      * Either next() or snext() must be implemented differently by a subclass.
173      *
174      * @param status the error code.
175      * @return a pointer to the string, or NULL.
176      *
177      * @stable ICU 2.4
178      */
179     virtual const UnicodeString* snext(UErrorCode& status);
180 
181     /**
182      * <p>Resets the iterator.  This re-establishes sync with the
183      * service and rewinds the iterator to start at the first
184      * element.</p>
185      *
186      * <p>Previous pointers returned by next, unext, or snext become
187      * invalid, and the value returned by count might change.</p>
188      *
189      * @param status the error code.
190      *
191      * @stable ICU 2.4
192      */
193     virtual void reset(UErrorCode& status) = 0;
194 
195     /**
196      * Compares this enumeration to other to check if both are equal
197      *
198      * @param that The other string enumeration to compare this object to
199      * @return TRUE if the enumerations are equal. FALSE if not.
200      * @stable ICU 3.6
201      */
202     virtual UBool operator==(const StringEnumeration& that)const;
203     /**
204      * Compares this enumeration to other to check if both are not equal
205      *
206      * @param that The other string enumeration to compare this object to
207      * @return TRUE if the enumerations are equal. FALSE if not.
208      * @stable ICU 3.6
209      */
210     virtual UBool operator!=(const StringEnumeration& that)const;
211 
212 protected:
213     /**
214      * UnicodeString field for use with default implementations and subclasses.
215      * @stable ICU 2.8
216      */
217     UnicodeString unistr;
218     /**
219      * char * default buffer for use with default implementations and subclasses.
220      * @stable ICU 2.8
221      */
222     char charsBuffer[32];
223     /**
224      * char * buffer for use with default implementations and subclasses.
225      * Allocated in constructor and in ensureCharsCapacity().
226      * @stable ICU 2.8
227      */
228     char *chars;
229     /**
230      * Capacity of chars, for use with default implementations and subclasses.
231      * @stable ICU 2.8
232      */
233     int32_t charsCapacity;
234 
235     /**
236      * Default constructor for use with default implementations and subclasses.
237      * @stable ICU 2.8
238      */
239     StringEnumeration();
240 
241     /**
242      * Ensures that chars is at least as large as the requested capacity.
243      * For use with default implementations and subclasses.
244      *
245      * @param capacity Requested capacity.
246      * @param status ICU in/out error code.
247      * @stable ICU 2.8
248      */
249     void ensureCharsCapacity(int32_t capacity, UErrorCode &status);
250 
251     /**
252      * Converts s to Unicode and sets unistr to the result.
253      * For use with default implementations and subclasses,
254      * especially for implementations of snext() in terms of next().
255      * This is provided with a helper function instead of a default implementation
256      * of snext() to avoid potential infinite loops between next() and snext().
257      *
258      * For example:
259      * \code
260      * const UnicodeString* snext(UErrorCode& status) {
261      *   int32_t resultLength=0;
262      *   const char *s=next(&resultLength, status);
263      *   return setChars(s, resultLength, status);
264      * }
265      * \endcode
266      *
267      * @param s String to be converted to Unicode.
268      * @param length Length of the string.
269      * @param status ICU in/out error code.
270      * @return A pointer to unistr.
271      * @stable ICU 2.8
272      */
273     UnicodeString *setChars(const char *s, int32_t length, UErrorCode &status);
274 };
275 
276 U_NAMESPACE_END
277 
278 #endif /* U_SHOW_CPLUSPLUS_API */
279 
280 /* STRENUM_H */
281 #endif
282