| 1 | /* |
| 2 | ******************************************************************************* |
| 3 | * |
| 4 | * Copyright (C) 2002-2012, International Business Machines |
| 5 | * Corporation and others. All Rights Reserved. |
| 6 | * |
| 7 | ******************************************************************************* |
| 8 | */ |
| 9 | |
| 10 | #ifndef STRENUM_H |
| 11 | #define STRENUM_H |
| 12 | |
| 13 | #include "unicode/uobject.h" |
| 14 | #include "unicode/unistr.h" |
| 15 | |
| 16 | /** |
| 17 | * \file |
| 18 | * \brief C++ API: String Enumeration |
| 19 | */ |
| 20 | |
| 21 | U_NAMESPACE_BEGIN |
| 22 | |
| 23 | /** |
| 24 | * Base class for 'pure' C++ implementations of uenum api. Adds a |
| 25 | * method that returns the next UnicodeString since in C++ this can |
| 26 | * be a common storage format for strings. |
| 27 | * |
| 28 | * <p>The model is that the enumeration is over strings maintained by |
| 29 | * a 'service.' At any point, the service might change, invalidating |
| 30 | * the enumerator (though this is expected to be rare). The iterator |
| 31 | * returns an error if this has occurred. Lack of the error is no |
| 32 | * guarantee that the service didn't change immediately after the |
| 33 | * call, so the returned string still might not be 'valid' on |
| 34 | * subsequent use.</p> |
| 35 | * |
| 36 | * <p>Strings may take the form of const char*, const UChar*, or const |
| 37 | * UnicodeString*. The type you get is determined by the variant of |
| 38 | * 'next' that you call. In general the StringEnumeration is |
| 39 | * optimized for one of these types, but all StringEnumerations can |
| 40 | * return all types. Returned strings are each terminated with a NUL. |
| 41 | * Depending on the service data, they might also include embedded NUL |
| 42 | * characters, so API is provided to optionally return the true |
| 43 | * length, counting the embedded NULs but not counting the terminating |
| 44 | * NUL.</p> |
| 45 | * |
| 46 | * <p>The pointers returned by next, unext, and snext become invalid |
| 47 | * upon any subsequent call to the enumeration's destructor, next, |
| 48 | * unext, snext, or reset.</p> |
| 49 | * |
| 50 | * ICU 2.8 adds some default implementations and helper functions |
| 51 | * for subclasses. |
| 52 | * |
| 53 | * @stable ICU 2.4 |
| 54 | */ |
| 55 | class U_COMMON_API StringEnumeration : public UObject { |
| 56 | public: |
| 57 | /** |
| 58 | * Destructor. |
| 59 | * @stable ICU 2.4 |
| 60 | */ |
| 61 | virtual ~StringEnumeration(); |
| 62 | |
| 63 | /** |
| 64 | * Clone this object, an instance of a subclass of StringEnumeration. |
| 65 | * Clones can be used concurrently in multiple threads. |
| 66 | * If a subclass does not implement clone(), or if an error occurs, |
| 67 | * then NULL is returned. |
| 68 | * The clone functions in all subclasses return a base class pointer |
| 69 | * because some compilers do not support covariant (same-as-this) |
| 70 | * return types; cast to the appropriate subclass if necessary. |
| 71 | * The caller must delete the clone. |
| 72 | * |
| 73 | * @return a clone of this object |
| 74 | * |
| 75 | * @see getDynamicClassID |
| 76 | * @stable ICU 2.8 |
| 77 | */ |
| 78 | virtual StringEnumeration *clone() const; |
| 79 | |
| 80 | /** |
| 81 | * <p>Return the number of elements that the iterator traverses. If |
| 82 | * the iterator is out of sync with its service, status is set to |
| 83 | * U_ENUM_OUT_OF_SYNC_ERROR, and the return value is zero.</p> |
| 84 | * |
| 85 | * <p>The return value will not change except possibly as a result of |
| 86 | * a subsequent call to reset, or if the iterator becomes out of sync.</p> |
| 87 | * |
| 88 | * <p>This is a convenience function. It can end up being very |
| 89 | * expensive as all the items might have to be pre-fetched |
| 90 | * (depending on the storage format of the data being |
| 91 | * traversed).</p> |
| 92 | * |
| 93 | * @param status the error code. |
| 94 | * @return number of elements in the iterator. |
| 95 | * |
| 96 | * @stable ICU 2.4 */ |
| 97 | virtual int32_t count(UErrorCode& status) const = 0; |
| 98 | |
| 99 | /** |
| 100 | * <p>Returns the next element as a NUL-terminated char*. If there |
| 101 | * are no more elements, returns NULL. If the resultLength pointer |
| 102 | * is not NULL, the length of the string (not counting the |
| 103 | * terminating NUL) is returned at that address. If an error |
| 104 | * status is returned, the value at resultLength is undefined.</p> |
| 105 | * |
| 106 | * <p>The returned pointer is owned by this iterator and must not be |
| 107 | * deleted by the caller. The pointer is valid until the next call |
| 108 | * to next, unext, snext, reset, or the enumerator's destructor.</p> |
| 109 | * |
| 110 | * <p>If the iterator is out of sync with its service, status is set |
| 111 | * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p> |
| 112 | * |
| 113 | * <p>If the native service string is a UChar* string, it is |
| 114 | * converted to char* with the invariant converter. If the |
| 115 | * conversion fails (because a character cannot be converted) then |
| 116 | * status is set to U_INVARIANT_CONVERSION_ERROR and the return |
| 117 | * value is undefined (though not NULL).</p> |
| 118 | * |
| 119 | * Starting with ICU 2.8, the default implementation calls snext() |
| 120 | * and handles the conversion. |
| 121 | * Either next() or snext() must be overridden by a subclass (the defaults call each other). |
| 122 | * |
| 123 | * @param resultLength a pointer to receive the length, can be NULL. |
| 124 | * @param status the error code. |
| 125 | * @return a pointer to the string, or NULL. |
| 126 | * |
| 127 | * @stable ICU 2.4 |
| 128 | */ |
| 129 | virtual const char* next(int32_t *resultLength, UErrorCode& status); |
| 130 | |
| 131 | /** |
| 132 | * <p>Returns the next element as a NUL-terminated UChar*. If there |
| 133 | * are no more elements, returns NULL. If the resultLength pointer |
| 134 | * is not NULL, the length of the string (not counting the |
| 135 | * terminating NUL) is returned at that address. If an error |
| 136 | * status is returned, the value at resultLength is undefined.</p> |
| 137 | * |
| 138 | * <p>The returned pointer is owned by this iterator and must not be |
| 139 | * deleted by the caller. The pointer is valid until the next call |
| 140 | * to next, unext, snext, reset, or the enumerator's destructor.</p> |
| 141 | * |
| 142 | * <p>If the iterator is out of sync with its service, status is set |
| 143 | * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p> |
| 144 | * |
| 145 | * Starting with ICU 2.8, the default implementation calls snext() |
| 146 | * and handles the conversion. |
| 147 | * |
| 148 | * @param resultLength a pointer to receive the length, can be NULL. |
| 149 | * @param status the error code. |
| 150 | * @return a pointer to the string, or NULL. |
| 151 | * |
| 152 | * @stable ICU 2.4 |
| 153 | */ |
| 154 | virtual const UChar* unext(int32_t *resultLength, UErrorCode& status); |
| 155 | |
| 156 | /** |
| 157 | * <p>Returns the next element as a UnicodeString*. If there are no |
| 158 | * more elements, returns NULL.</p> |
| 159 | * |
| 160 | * <p>The returned pointer is owned by this iterator and must not be |
| 161 | * deleted by the caller. The pointer is valid until the next call |
| 162 | * to next, unext, snext, reset, or the enumerator's destructor.</p> |
| 163 | * |
| 164 | * <p>If the iterator is out of sync with its service, status is set |
| 165 | * to U_ENUM_OUT_OF_SYNC_ERROR and NULL is returned.</p> |
| 166 | * |
| 167 | * Starting with ICU 2.8, the default implementation calls next() |
| 168 | * and handles the conversion. |
| 169 | * Either next() or snext() must be overridden by a subclass (the defaults call each other). |
| 170 | * |
| 171 | * @param status the error code. |
| 172 | * @return a pointer to the string, or NULL. |
| 173 | * |
| 174 | * @stable ICU 2.4 |
| 175 | */ |
| 176 | virtual const UnicodeString* snext(UErrorCode& status); |
| 177 | |
| 178 | /** |
| 179 | * <p>Resets the iterator. This re-establishes sync with the |
| 180 | * service and rewinds the iterator to start at the first |
| 181 | * element.</p> |
| 182 | * |
| 183 | * <p>Previous pointers returned by next, unext, or snext become |
| 184 | * invalid, and the value returned by count might change.</p> |
| 185 | * |
| 186 | * @param status the error code. |
| 187 | * |
| 188 | * @stable ICU 2.4 |
| 189 | */ |
| 190 | virtual void reset(UErrorCode& status) = 0; |
| 191 | |
| 192 | /** |
| 193 | * Compares this enumeration to other to check if both are equal. |
| 194 | * |
| 195 | * @param that The other string enumeration to compare this object to |
| 196 | * @return TRUE if the enumerations are equal. FALSE if not. |
| 197 | * @stable ICU 3.6 |
| 198 | */ |
| 199 | virtual UBool operator==(const StringEnumeration& that)const; |
| 200 | /** |
| 201 | * Compares this enumeration to other to check if both are not equal. |
| 202 | * |
| 203 | * @param that The other string enumeration to compare this object to |
| 204 | * @return TRUE if the enumerations are not equal. FALSE if they are equal. |
| 205 | * @stable ICU 3.6 |
| 206 | */ |
| 207 | virtual UBool operator!=(const StringEnumeration& that)const; |
| 208 | |
| 209 | protected: |
| 210 | /** |
| 211 | * UnicodeString field for use with default implementations and subclasses. |
| 212 | * @stable ICU 2.8 |
| 213 | */ |
| 214 | UnicodeString unistr; |
| 215 | /** |
| 216 | * char * default buffer for use with default implementations and subclasses. |
| 217 | * @stable ICU 2.8 |
| 218 | */ |
| 219 | char charsBuffer[32]; |
| 220 | /** |
| 221 | * char * buffer for use with default implementations and subclasses. |
| 222 | * Allocated in constructor and in ensureCharsCapacity(). |
| 223 | * @stable ICU 2.8 |
| 224 | */ |
| 225 | char *chars; |
| 226 | /** |
| 227 | * Capacity of chars, for use with default implementations and subclasses. |
| 228 | * @stable ICU 2.8 |
| 229 | */ |
| 230 | int32_t charsCapacity; |
| 231 | |
| 232 | /** |
| 233 | * Default constructor for use with default implementations and subclasses. |
| 234 | * @stable ICU 2.8 |
| 235 | */ |
| 236 | StringEnumeration(); |
| 237 | |
| 238 | /** |
| 239 | * Ensures that chars is at least as large as the requested capacity. |
| 240 | * For use with default implementations and subclasses. |
| 241 | * |
| 242 | * @param capacity Requested capacity. |
| 243 | * @param status ICU in/out error code. |
| 244 | * @stable ICU 2.8 |
| 245 | */ |
| 246 | void ensureCharsCapacity(int32_t capacity, UErrorCode &status); |
| 247 | |
| 248 | /** |
| 249 | * Converts s to Unicode and sets unistr to the result. |
| 250 | * For use with default implementations and subclasses, |
| 251 | * especially for implementations of snext() in terms of next(). |
| 252 | * This is provided with a helper function instead of a default implementation |
| 253 | * of snext() to avoid potential infinite loops between next() and snext(). |
| 254 | * |
| 255 | * For example: |
| 256 | * \code |
| 257 | * const UnicodeString* snext(UErrorCode& status) { |
| 258 | * int32_t resultLength=0; |
| 259 | * const char *s=next(&resultLength, status); |
| 260 | * return setChars(s, resultLength, status); |
| 261 | * } |
| 262 | * \endcode |
| 263 | * |
| 264 | * @param s String to be converted to Unicode. |
| 265 | * @param length Length of the string. |
| 266 | * @param status ICU in/out error code. |
| 267 | * @return A pointer to unistr. |
| 268 | * @stable ICU 2.8 |
| 269 | */ |
| 270 | UnicodeString *setChars(const char *s, int32_t length, UErrorCode &status); |
| 271 | }; |
| 272 | |
| 273 | U_NAMESPACE_END |
| 274 | |
| 275 | /* STRENUM_H */ |
| 276 | #endif |
| 277 | |