|
1 /* |
|
2 ******************************************************************************* |
|
3 * |
|
4 * Copyright (C) 2002-2012, International Business Machines |
|
5 * Corporation and others. All Rights Reserved. |
|
6 * |
|
7 ******************************************************************************* |
|
8 */ |
|
9 |
|
10 #ifndef STRENUM_H |
|
11 #define STRENUM_H |
|
12 |
|
13 #include "unicode/uobject.h" |
|
14 #include "unicode/unistr.h" |
|
15 |
|
16 /** |
|
17 * \file |
|
18 * \brief C++ API: String Enumeration |
|
19 */ |
|
20 |
|
21 U_NAMESPACE_BEGIN |
|
22 |
|
23 /** |
|
24 * Base class for 'pure' C++ implementations of uenum api. Adds a |
|
25 * method that returns the next UnicodeString since in C++ this can |
|
26 * be a common storage format for strings. |
|
27 * |
|
28 * <p>The model is that the enumeration is over strings maintained by |
|
29 * a 'service.' At any point, the service might change, invalidating |
|
30 * the enumerator (though this is expected to be rare). The iterator |
|
31 * returns an error if this has occurred. Lack of the error is no |
|
32 * guarantee that the service didn't change immediately after the |
|
33 * call, so the returned string still might not be 'valid' on |
|
34 * subsequent use.</p> |
|
35 * |
|
36 * <p>Strings may take the form of const char*, const UChar*, or const |
|
37 * UnicodeString*. The type you get is determine by the variant of |
|
38 * 'next' that you call. In general the StringEnumeration is |
|
39 * optimized for one of these types, but all StringEnumerations can |
|
40 * return all types. Returned strings are each terminated with a NUL. |
|
41 * Depending on the service data, they might also include embedded NUL |
|
42 * characters, so API is provided to optionally return the true |
|
43 * length, counting the embedded NULs but not counting the terminating |
|
44 * NUL.</p> |
|
45 * |
|
46 * <p>The pointers returned by next, unext, and snext become invalid |
|
47 * upon any subsequent call to the enumeration's destructor, next, |
|
48 * unext, snext, or reset.</p> |
|
49 * |
|
50 * ICU 2.8 adds some default implementations and helper functions |
|
51 * for subclasses. |
|
52 * |
|
53 * @stable ICU 2.4 |
|
54 */ |
|
55 class U_COMMON_API StringEnumeration : public UObject { |
|
56 public: |
|
57 /** |
|
58 * Destructor. |
|
59 * @stable ICU 2.4 |
|
60 */ |
|
61 virtual ~StringEnumeration(); |
|
62 |
|
63 /** |
|
64 * Clone this object, an instance of a subclass of StringEnumeration. |
|
65 * Clones can be used concurrently in multiple threads. |
|
66 * If a subclass does not implement clone(), or if an error occurs, |
|
67 * then NULL is returned. |
|
68 * The clone functions in all subclasses return a base class pointer |
|
69 * because some compilers do not support covariant (same-as-this) |
|
70 * return types; cast to the appropriate subclass if necessary. |
|
71 * The caller must delete the clone. |
|
72 * |
|
73 * @return a clone of this object |
|
74 * |
|
75 * @see getDynamicClassID |
|
76 * @stable ICU 2.8 |
|
77 */ |
|
78 virtual StringEnumeration *clone() const; |
|
79 |
|
80 /** |
|
81 * <p>Return the number of elements that the iterator traverses. If |
|
82 * the iterator is out of sync with its service, status is set to |
|
83 * U_ENUM_OUT_OF_SYNC_ERROR, and the return value is zero.</p> |
|
84 * |
|
85 * <p>The return value will not change except possibly as a result of |
|
86 * a subsequent call to reset, or if the iterator becomes out of sync.</p> |
|
87 * |
|
88 * <p>This is a convenience function. It can end up being very |
|
89 * expensive as all the items might have to be pre-fetched |
|
90 * (depending on the storage format of the data being |
|
91 * traversed).</p> |
|
92 * |
|
93 * @param status the error code. |
|
94 * @return number of elements in the iterator. |
|
95 * |
|
96 * @stable ICU 2.4 */ |
|
97 virtual int32_t count(UErrorCode& status) const = 0; |
|
98 |
|
99 /** |
|
100 * <p>Returns the next element as a NUL-terminated char*. If there |
|
101 * are no more elements, returns NULL. If the resultLength pointer |
|
102 * is not NULL, the length of the string (not counting the |
|
103 * terminating NUL) is returned at that address. If an error |
|
104 * status is returned, the value at resultLength is undefined.</p> |
|
105 * |
|
106 * <p>The returned pointer is owned by this iterator and must not be |
|
107 * deleted by the caller. The pointer is valid until the next call |
|
108 * to next, unext, snext, reset, or the enumerator's destructor.</p> |
|
109 * |
|
110 * <p>If the iterator is out of sync with its service, status is set |
|
111 * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p> |
|
112 * |
|
113 * <p>If the native service string is a UChar* string, it is |
|
114 * converted to char* with the invariant converter. If the |
|
115 * conversion fails (because a character cannot be converted) then |
|
116 * status is set to U_INVARIANT_CONVERSION_ERROR and the return |
|
117 * value is undefined (though not NULL).</p> |
|
118 * |
|
119 * Starting with ICU 2.8, the default implementation calls snext() |
|
120 * and handles the conversion. |
|
121 * Either next() or snext() must be implemented differently by a subclass. |
|
122 * |
|
123 * @param status the error code. |
|
124 * @param resultLength a pointer to receive the length, can be NULL. |
|
125 * @return a pointer to the string, or NULL. |
|
126 * |
|
127 * @stable ICU 2.4 |
|
128 */ |
|
129 virtual const char* next(int32_t *resultLength, UErrorCode& status); |
|
130 |
|
131 /** |
|
132 * <p>Returns the next element as a NUL-terminated UChar*. If there |
|
133 * are no more elements, returns NULL. If the resultLength pointer |
|
134 * is not NULL, the length of the string (not counting the |
|
135 * terminating NUL) is returned at that address. If an error |
|
136 * status is returned, the value at resultLength is undefined.</p> |
|
137 * |
|
138 * <p>The returned pointer is owned by this iterator and must not be |
|
139 * deleted by the caller. The pointer is valid until the next call |
|
140 * to next, unext, snext, reset, or the enumerator's destructor.</p> |
|
141 * |
|
142 * <p>If the iterator is out of sync with its service, status is set |
|
143 * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p> |
|
144 * |
|
145 * Starting with ICU 2.8, the default implementation calls snext() |
|
146 * and handles the conversion. |
|
147 * |
|
148 * @param status the error code. |
|
149 * @param resultLength a ponter to receive the length, can be NULL. |
|
150 * @return a pointer to the string, or NULL. |
|
151 * |
|
152 * @stable ICU 2.4 |
|
153 */ |
|
154 virtual const UChar* unext(int32_t *resultLength, UErrorCode& status); |
|
155 |
|
156 /** |
|
157 * <p>Returns the next element a UnicodeString*. If there are no |
|
158 * more elements, returns NULL.</p> |
|
159 * |
|
160 * <p>The returned pointer is owned by this iterator and must not be |
|
161 * deleted by the caller. The pointer is valid until the next call |
|
162 * to next, unext, snext, reset, or the enumerator's destructor.</p> |
|
163 * |
|
164 * <p>If the iterator is out of sync with its service, status is set |
|
165 * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p> |
|
166 * |
|
167 * Starting with ICU 2.8, the default implementation calls next() |
|
168 * and handles the conversion. |
|
169 * Either next() or snext() must be implemented differently by a subclass. |
|
170 * |
|
171 * @param status the error code. |
|
172 * @return a pointer to the string, or NULL. |
|
173 * |
|
174 * @stable ICU 2.4 |
|
175 */ |
|
176 virtual const UnicodeString* snext(UErrorCode& status); |
|
177 |
|
178 /** |
|
179 * <p>Resets the iterator. This re-establishes sync with the |
|
180 * service and rewinds the iterator to start at the first |
|
181 * element.</p> |
|
182 * |
|
183 * <p>Previous pointers returned by next, unext, or snext become |
|
184 * invalid, and the value returned by count might change.</p> |
|
185 * |
|
186 * @param status the error code. |
|
187 * |
|
188 * @stable ICU 2.4 |
|
189 */ |
|
190 virtual void reset(UErrorCode& status) = 0; |
|
191 |
|
192 /** |
|
193 * Compares this enumeration to other to check if both are equal |
|
194 * |
|
195 * @param that The other string enumeration to compare this object to |
|
196 * @return TRUE if the enumerations are equal. FALSE if not. |
|
197 * @stable ICU 3.6 |
|
198 */ |
|
199 virtual UBool operator==(const StringEnumeration& that)const; |
|
200 /** |
|
201 * Compares this enumeration to other to check if both are not equal |
|
202 * |
|
203 * @param that The other string enumeration to compare this object to |
|
204 * @return TRUE if the enumerations are equal. FALSE if not. |
|
205 * @stable ICU 3.6 |
|
206 */ |
|
207 virtual UBool operator!=(const StringEnumeration& that)const; |
|
208 |
|
209 protected: |
|
210 /** |
|
211 * UnicodeString field for use with default implementations and subclasses. |
|
212 * @stable ICU 2.8 |
|
213 */ |
|
214 UnicodeString unistr; |
|
215 /** |
|
216 * char * default buffer for use with default implementations and subclasses. |
|
217 * @stable ICU 2.8 |
|
218 */ |
|
219 char charsBuffer[32]; |
|
220 /** |
|
221 * char * buffer for use with default implementations and subclasses. |
|
222 * Allocated in constructor and in ensureCharsCapacity(). |
|
223 * @stable ICU 2.8 |
|
224 */ |
|
225 char *chars; |
|
226 /** |
|
227 * Capacity of chars, for use with default implementations and subclasses. |
|
228 * @stable ICU 2.8 |
|
229 */ |
|
230 int32_t charsCapacity; |
|
231 |
|
232 /** |
|
233 * Default constructor for use with default implementations and subclasses. |
|
234 * @stable ICU 2.8 |
|
235 */ |
|
236 StringEnumeration(); |
|
237 |
|
238 /** |
|
239 * Ensures that chars is at least as large as the requested capacity. |
|
240 * For use with default implementations and subclasses. |
|
241 * |
|
242 * @param capacity Requested capacity. |
|
243 * @param status ICU in/out error code. |
|
244 * @stable ICU 2.8 |
|
245 */ |
|
246 void ensureCharsCapacity(int32_t capacity, UErrorCode &status); |
|
247 |
|
248 /** |
|
249 * Converts s to Unicode and sets unistr to the result. |
|
250 * For use with default implementations and subclasses, |
|
251 * especially for implementations of snext() in terms of next(). |
|
252 * This is provided with a helper function instead of a default implementation |
|
253 * of snext() to avoid potential infinite loops between next() and snext(). |
|
254 * |
|
255 * For example: |
|
256 * \code |
|
257 * const UnicodeString* snext(UErrorCode& status) { |
|
258 * int32_t resultLength=0; |
|
259 * const char *s=next(&resultLength, status); |
|
260 * return setChars(s, resultLength, status); |
|
261 * } |
|
262 * \endcode |
|
263 * |
|
264 * @param s String to be converted to Unicode. |
|
265 * @param length Length of the string. |
|
266 * @param status ICU in/out error code. |
|
267 * @return A pointer to unistr. |
|
268 * @stable ICU 2.8 |
|
269 */ |
|
270 UnicodeString *setChars(const char *s, int32_t length, UErrorCode &status); |
|
271 }; |
|
272 |
|
273 U_NAMESPACE_END |
|
274 |
|
275 /* STRENUM_H */ |
|
276 #endif |