1 | // © 2016 and later: Unicode, Inc. and others. |
2 | // License & terms of use: http://www.unicode.org/copyright.html |
3 | /* |
4 | ******************************************************************************* |
5 | * |
6 | * Copyright (C) 2002-2012, International Business Machines |
7 | * Corporation and others. All Rights Reserved. |
8 | * |
9 | ******************************************************************************* |
10 | */ |
11 | |
12 | #ifndef STRENUM_H |
13 | #define STRENUM_H |
14 | |
15 | #include "unicode/utypes.h" |
16 | |
17 | #if U_SHOW_CPLUSPLUS_API |
18 | |
19 | #include "unicode/uobject.h" |
20 | #include "unicode/unistr.h" |
21 | |
22 | /** |
23 | * \file |
24 | * \brief C++ API: String Enumeration |
25 | */ |
26 | |
27 | U_NAMESPACE_BEGIN |
28 | |
29 | /** |
30 | * Base class for 'pure' C++ implementations of uenum api. Adds a |
31 | * method that returns the next UnicodeString since in C++ this can |
32 | * be a common storage format for strings. |
33 | * |
34 | * <p>The model is that the enumeration is over strings maintained by |
35 | * a 'service.' At any point, the service might change, invalidating |
36 | * the enumerator (though this is expected to be rare). The iterator |
37 | * returns an error if this has occurred. Lack of the error is no |
38 | * guarantee that the service didn't change immediately after the |
39 | * call, so the returned string still might not be 'valid' on |
40 | * subsequent use.</p> |
41 | * |
42 | * <p>Strings may take the form of const char*, const char16_t*, or const |
43 | * UnicodeString*. The type you get is determine by the variant of |
44 | * 'next' that you call. In general the StringEnumeration is |
45 | * optimized for one of these types, but all StringEnumerations can |
46 | * return all types. Returned strings are each terminated with a NUL. |
47 | * Depending on the service data, they might also include embedded NUL |
48 | * characters, so API is provided to optionally return the true |
49 | * length, counting the embedded NULs but not counting the terminating |
50 | * NUL.</p> |
51 | * |
52 | * <p>The pointers returned by next, unext, and snext become invalid |
53 | * upon any subsequent call to the enumeration's destructor, next, |
54 | * unext, snext, or reset.</p> |
55 | * |
56 | * ICU 2.8 adds some default implementations and helper functions |
57 | * for subclasses. |
58 | * |
59 | * @stable ICU 2.4 |
60 | */ |
61 | class U_COMMON_API StringEnumeration : public UObject { |
62 | public: |
63 | /** |
64 | * Destructor. |
65 | * @stable ICU 2.4 |
66 | */ |
67 | virtual ~StringEnumeration(); |
68 | |
69 | /** |
70 | * Clone this object, an instance of a subclass of StringEnumeration. |
71 | * Clones can be used concurrently in multiple threads. |
72 | * If a subclass does not implement clone(), or if an error occurs, |
73 | * then NULL is returned. |
74 | * The caller must delete the clone. |
75 | * |
76 | * @return a clone of this object |
77 | * |
78 | * @see getDynamicClassID |
79 | * @stable ICU 2.8 |
80 | */ |
81 | virtual StringEnumeration *clone() const; |
82 | |
83 | /** |
84 | * <p>Return the number of elements that the iterator traverses. If |
85 | * the iterator is out of sync with its service, status is set to |
86 | * U_ENUM_OUT_OF_SYNC_ERROR, and the return value is zero.</p> |
87 | * |
88 | * <p>The return value will not change except possibly as a result of |
89 | * a subsequent call to reset, or if the iterator becomes out of sync.</p> |
90 | * |
91 | * <p>This is a convenience function. It can end up being very |
92 | * expensive as all the items might have to be pre-fetched |
93 | * (depending on the storage format of the data being |
94 | * traversed).</p> |
95 | * |
96 | * @param status the error code. |
97 | * @return number of elements in the iterator. |
98 | * |
99 | * @stable ICU 2.4 */ |
100 | virtual int32_t count(UErrorCode& status) const = 0; |
101 | |
102 | /** |
103 | * <p>Returns the next element as a NUL-terminated char*. If there |
104 | * are no more elements, returns NULL. If the resultLength pointer |
105 | * is not NULL, the length of the string (not counting the |
106 | * terminating NUL) is returned at that address. If an error |
107 | * status is returned, the value at resultLength is undefined.</p> |
108 | * |
109 | * <p>The returned pointer is owned by this iterator and must not be |
110 | * deleted by the caller. The pointer is valid until the next call |
111 | * to next, unext, snext, reset, or the enumerator's destructor.</p> |
112 | * |
113 | * <p>If the iterator is out of sync with its service, status is set |
114 | * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p> |
115 | * |
116 | * <p>If the native service string is a char16_t* string, it is |
117 | * converted to char* with the invariant converter. If the |
118 | * conversion fails (because a character cannot be converted) then |
119 | * status is set to U_INVARIANT_CONVERSION_ERROR and the return |
120 | * value is undefined (though not NULL).</p> |
121 | * |
122 | * Starting with ICU 2.8, the default implementation calls snext() |
123 | * and handles the conversion. |
124 | * Either next() or snext() must be implemented differently by a subclass. |
125 | * |
126 | * @param status the error code. |
127 | * @param resultLength a pointer to receive the length, can be NULL. |
128 | * @return a pointer to the string, or NULL. |
129 | * |
130 | * @stable ICU 2.4 |
131 | */ |
132 | virtual const char* next(int32_t *resultLength, UErrorCode& status); |
133 | |
134 | /** |
135 | * <p>Returns the next element as a NUL-terminated char16_t*. If there |
136 | * are no more elements, returns NULL. If the resultLength pointer |
137 | * is not NULL, the length of the string (not counting the |
138 | * terminating NUL) is returned at that address. If an error |
139 | * status is returned, the value at resultLength is undefined.</p> |
140 | * |
141 | * <p>The returned pointer is owned by this iterator and must not be |
142 | * deleted by the caller. The pointer is valid until the next call |
143 | * to next, unext, snext, reset, or the enumerator's destructor.</p> |
144 | * |
145 | * <p>If the iterator is out of sync with its service, status is set |
146 | * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p> |
147 | * |
148 | * Starting with ICU 2.8, the default implementation calls snext() |
149 | * and handles the conversion. |
150 | * |
151 | * @param status the error code. |
152 | * @param resultLength a pointer to receive the length, can be NULL. |
153 | * @return a pointer to the string, or NULL. |
154 | * |
155 | * @stable ICU 2.4 |
156 | */ |
157 | virtual const char16_t* unext(int32_t *resultLength, UErrorCode& status); |
158 | |
159 | /** |
160 | * <p>Returns the next element a UnicodeString*. If there are no |
161 | * more elements, returns NULL.</p> |
162 | * |
163 | * <p>The returned pointer is owned by this iterator and must not be |
164 | * deleted by the caller. The pointer is valid until the next call |
165 | * to next, unext, snext, reset, or the enumerator's destructor.</p> |
166 | * |
167 | * <p>If the iterator is out of sync with its service, status is set |
168 | * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p> |
169 | * |
170 | * Starting with ICU 2.8, the default implementation calls next() |
171 | * and handles the conversion. |
172 | * Either next() or snext() must be implemented differently by a subclass. |
173 | * |
174 | * @param status the error code. |
175 | * @return a pointer to the string, or NULL. |
176 | * |
177 | * @stable ICU 2.4 |
178 | */ |
179 | virtual const UnicodeString* snext(UErrorCode& status); |
180 | |
181 | /** |
182 | * <p>Resets the iterator. This re-establishes sync with the |
183 | * service and rewinds the iterator to start at the first |
184 | * element.</p> |
185 | * |
186 | * <p>Previous pointers returned by next, unext, or snext become |
187 | * invalid, and the value returned by count might change.</p> |
188 | * |
189 | * @param status the error code. |
190 | * |
191 | * @stable ICU 2.4 |
192 | */ |
193 | virtual void reset(UErrorCode& status) = 0; |
194 | |
195 | /** |
196 | * Compares this enumeration to other to check if both are equal |
197 | * |
198 | * @param that The other string enumeration to compare this object to |
199 | * @return true if the enumerations are equal. false if not. |
200 | * @stable ICU 3.6 |
201 | */ |
202 | virtual bool operator==(const StringEnumeration& that)const; |
203 | /** |
204 | * Compares this enumeration to other to check if both are not equal |
205 | * |
206 | * @param that The other string enumeration to compare this object to |
207 | * @return true if the enumerations are equal. false if not. |
208 | * @stable ICU 3.6 |
209 | */ |
210 | virtual bool operator!=(const StringEnumeration& that)const; |
211 | |
212 | protected: |
213 | /** |
214 | * UnicodeString field for use with default implementations and subclasses. |
215 | * @stable ICU 2.8 |
216 | */ |
217 | UnicodeString unistr; |
218 | /** |
219 | * char * default buffer for use with default implementations and subclasses. |
220 | * @stable ICU 2.8 |
221 | */ |
222 | char charsBuffer[32]; |
223 | /** |
224 | * char * buffer for use with default implementations and subclasses. |
225 | * Allocated in constructor and in ensureCharsCapacity(). |
226 | * @stable ICU 2.8 |
227 | */ |
228 | char *chars; |
229 | /** |
230 | * Capacity of chars, for use with default implementations and subclasses. |
231 | * @stable ICU 2.8 |
232 | */ |
233 | int32_t charsCapacity; |
234 | |
235 | /** |
236 | * Default constructor for use with default implementations and subclasses. |
237 | * @stable ICU 2.8 |
238 | */ |
239 | StringEnumeration(); |
240 | |
241 | /** |
242 | * Ensures that chars is at least as large as the requested capacity. |
243 | * For use with default implementations and subclasses. |
244 | * |
245 | * @param capacity Requested capacity. |
246 | * @param status ICU in/out error code. |
247 | * @stable ICU 2.8 |
248 | */ |
249 | void ensureCharsCapacity(int32_t capacity, UErrorCode &status); |
250 | |
251 | /** |
252 | * Converts s to Unicode and sets unistr to the result. |
253 | * For use with default implementations and subclasses, |
254 | * especially for implementations of snext() in terms of next(). |
255 | * This is provided with a helper function instead of a default implementation |
256 | * of snext() to avoid potential infinite loops between next() and snext(). |
257 | * |
258 | * For example: |
259 | * \code |
260 | * const UnicodeString* snext(UErrorCode& status) { |
261 | * int32_t resultLength=0; |
262 | * const char *s=next(&resultLength, status); |
263 | * return setChars(s, resultLength, status); |
264 | * } |
265 | * \endcode |
266 | * |
267 | * @param s String to be converted to Unicode. |
268 | * @param length Length of the string. |
269 | * @param status ICU in/out error code. |
270 | * @return A pointer to unistr. |
271 | * @stable ICU 2.8 |
272 | */ |
273 | UnicodeString *setChars(const char *s, int32_t length, UErrorCode &status); |
274 | }; |
275 | |
276 | U_NAMESPACE_END |
277 | |
278 | #endif /* U_SHOW_CPLUSPLUS_API */ |
279 | |
280 | /* STRENUM_H */ |
281 | #endif |
282 | |