| 1 | // © 2016 and later: Unicode, Inc. and others. |
| 2 | // License & terms of use: http://www.unicode.org/copyright.html |
| 3 | /* |
| 4 | ******************************************************************************* |
| 5 | * |
| 6 | * Copyright (C) 2002-2012, International Business Machines |
| 7 | * Corporation and others. All Rights Reserved. |
| 8 | * |
| 9 | ******************************************************************************* |
| 10 | */ |
| 11 | |
| 12 | #ifndef STRENUM_H |
| 13 | #define STRENUM_H |
| 14 | |
| 15 | #include "unicode/utypes.h" |
| 16 | |
| 17 | #if U_SHOW_CPLUSPLUS_API |
| 18 | |
| 19 | #include "unicode/uobject.h" |
| 20 | #include "unicode/unistr.h" |
| 21 | |
| 22 | /** |
| 23 | * \file |
| 24 | * \brief C++ API: String Enumeration |
| 25 | */ |
| 26 | |
| 27 | U_NAMESPACE_BEGIN |
| 28 | |
| 29 | /** |
| 30 | * Base class for 'pure' C++ implementations of uenum api. Adds a |
| 31 | * method that returns the next UnicodeString since in C++ this can |
| 32 | * be a common storage format for strings. |
| 33 | * |
| 34 | * <p>The model is that the enumeration is over strings maintained by |
| 35 | * a 'service.' At any point, the service might change, invalidating |
| 36 | * the enumerator (though this is expected to be rare). The iterator |
| 37 | * returns an error if this has occurred. Lack of the error is no |
| 38 | * guarantee that the service didn't change immediately after the |
| 39 | * call, so the returned string still might not be 'valid' on |
| 40 | * subsequent use.</p> |
| 41 | * |
| 42 | * <p>Strings may take the form of const char*, const char16_t*, or const |
| 43 | * UnicodeString*. The type you get is determined by the variant of |
| 44 | * 'next' that you call. In general the StringEnumeration is |
| 45 | * optimized for one of these types, but all StringEnumerations can |
| 46 | * return all types. Returned strings are each terminated with a NUL. |
| 47 | * Depending on the service data, they might also include embedded NUL |
| 48 | * characters, so API is provided to optionally return the true |
| 49 | * length, counting the embedded NULs but not counting the terminating |
| 50 | * NUL.</p> |
| 51 | * |
| 52 | * <p>The pointers returned by next, unext, and snext become invalid |
| 53 | * upon any subsequent call to the enumeration's destructor, next, |
| 54 | * unext, snext, or reset.</p> |
| 55 | * |
| 56 | * ICU 2.8 adds some default implementations and helper functions |
| 57 | * for subclasses. |
| 58 | * |
| 59 | * @stable ICU 2.4 |
| 60 | */ |
| 61 | class U_COMMON_API StringEnumeration : public UObject { |
| 62 | public: |
| 63 | /** |
| 64 | * Destructor. |
| 65 | * @stable ICU 2.4 |
| 66 | */ |
| 67 | virtual ~StringEnumeration(); |
| 68 | |
| 69 | /** |
| 70 | * Clone this object, an instance of a subclass of StringEnumeration. |
| 71 | * Clones can be used concurrently in multiple threads. |
| 72 | * If a subclass does not implement clone(), or if an error occurs, |
| 73 | * then nullptr is returned. |
| 74 | * The caller must delete the clone. |
| 75 | * |
| 76 | * @return a clone of this object |
| 77 | * |
| 78 | * @see getDynamicClassID |
| 79 | * @stable ICU 2.8 |
| 80 | */ |
| 81 | virtual StringEnumeration *clone() const; |
| 82 | |
| 83 | /** |
| 84 | * <p>Return the number of elements that the iterator traverses. If |
| 85 | * the iterator is out of sync with its service, status is set to |
| 86 | * U_ENUM_OUT_OF_SYNC_ERROR, and the return value is zero.</p> |
| 87 | * |
| 88 | * <p>The return value will not change except possibly as a result of |
| 89 | * a subsequent call to reset, or if the iterator becomes out of sync.</p> |
| 90 | * |
| 91 | * <p>This is a convenience function. It can end up being very |
| 92 | * expensive as all the items might have to be pre-fetched |
| 93 | * (depending on the storage format of the data being |
| 94 | * traversed).</p> |
| 95 | * |
| 96 | * @param status the error code. |
| 97 | * @return number of elements in the iterator. |
| 98 | * |
| 99 | * @stable ICU 2.4 */ |
| 100 | virtual int32_t count(UErrorCode& status) const = 0; |
| 101 | |
| 102 | /** |
| 103 | * <p>Returns the next element as a NUL-terminated char*. If there |
| 104 | * are no more elements, returns nullptr. If the resultLength pointer |
| 105 | * is not nullptr, the length of the string (not counting the |
| 106 | * terminating NUL) is returned at that address. If an error |
| 107 | * status is returned, the value at resultLength is undefined.</p> |
| 108 | * |
| 109 | * <p>The returned pointer is owned by this iterator and must not be |
| 110 | * deleted by the caller. The pointer is valid until the next call |
| 111 | * to next, unext, snext, reset, or the enumerator's destructor.</p> |
| 112 | * |
| 113 | * <p>If the iterator is out of sync with its service, status is set |
| 114 | * to U_ENUM_OUT_OF_SYNC_ERROR and nullptr is returned.</p> |
| 115 | * |
| 116 | * <p>If the native service string is a char16_t* string, it is |
| 117 | * converted to char* with the invariant converter. If the |
| 118 | * conversion fails (because a character cannot be converted) then |
| 119 | * status is set to U_INVARIANT_CONVERSION_ERROR and the return |
| 120 | * value is undefined (though not nullptr).</p> |
| 121 | * |
| 122 | * Starting with ICU 2.8, the default implementation calls snext() |
| 123 | * and handles the conversion. |
| 124 | * Either next() or snext() must be implemented differently by a subclass. |
| 125 | * |
| 126 | * @param resultLength a pointer to receive the length, can be nullptr. |
| 127 | * @param status the error code. |
| 128 | * @return a pointer to the string, or nullptr. |
| 129 | * |
| 130 | * @stable ICU 2.4 |
| 131 | */ |
| 132 | virtual const char* next(int32_t *resultLength, UErrorCode& status); |
| 133 | |
| 134 | /** |
| 135 | * <p>Returns the next element as a NUL-terminated char16_t*. If there |
| 136 | * are no more elements, returns nullptr. If the resultLength pointer |
| 137 | * is not nullptr, the length of the string (not counting the |
| 138 | * terminating NUL) is returned at that address. If an error |
| 139 | * status is returned, the value at resultLength is undefined.</p> |
| 140 | * |
| 141 | * <p>The returned pointer is owned by this iterator and must not be |
| 142 | * deleted by the caller. The pointer is valid until the next call |
| 143 | * to next, unext, snext, reset, or the enumerator's destructor.</p> |
| 144 | * |
| 145 | * <p>If the iterator is out of sync with its service, status is set |
| 146 | * to U_ENUM_OUT_OF_SYNC_ERROR and nullptr is returned.</p> |
| 147 | * |
| 148 | * Starting with ICU 2.8, the default implementation calls snext() |
| 149 | * and handles the conversion. |
| 150 | * |
| 151 | * @param resultLength a pointer to receive the length, can be nullptr. |
| 152 | * @param status the error code. |
| 153 | * @return a pointer to the string, or nullptr. |
| 154 | * |
| 155 | * @stable ICU 2.4 |
| 156 | */ |
| 157 | virtual const char16_t* unext(int32_t *resultLength, UErrorCode& status); |
| 158 | |
| 159 | /** |
| 160 | * <p>Returns the next element as a UnicodeString*. If there are no |
| 161 | * more elements, returns nullptr.</p> |
| 162 | * |
| 163 | * <p>The returned pointer is owned by this iterator and must not be |
| 164 | * deleted by the caller. The pointer is valid until the next call |
| 165 | * to next, unext, snext, reset, or the enumerator's destructor.</p> |
| 166 | * |
| 167 | * <p>If the iterator is out of sync with its service, status is set |
| 168 | * to U_ENUM_OUT_OF_SYNC_ERROR and nullptr is returned.</p> |
| 169 | * |
| 170 | * Starting with ICU 2.8, the default implementation calls next() |
| 171 | * and handles the conversion. |
| 172 | * Either next() or snext() must be implemented differently by a subclass. |
| 173 | * |
| 174 | * @param status the error code. |
| 175 | * @return a pointer to the string, or nullptr. |
| 176 | * |
| 177 | * @stable ICU 2.4 |
| 178 | */ |
| 179 | virtual const UnicodeString* snext(UErrorCode& status); |
| 180 | |
| 181 | /** |
| 182 | * <p>Resets the iterator. This re-establishes sync with the |
| 183 | * service and rewinds the iterator to start at the first |
| 184 | * element.</p> |
| 185 | * |
| 186 | * <p>Previous pointers returned by next, unext, or snext become |
| 187 | * invalid, and the value returned by count might change.</p> |
| 188 | * |
| 189 | * @param status the error code. |
| 190 | * |
| 191 | * @stable ICU 2.4 |
| 192 | */ |
| 193 | virtual void reset(UErrorCode& status) = 0; |
| 194 | |
| 195 | /** |
| 196 | * Compares this enumeration to other to check if both are equal |
| 197 | * |
| 198 | * @param that The other string enumeration to compare this object to |
| 199 | * @return true if the enumerations are equal. false if not. |
| 200 | * @stable ICU 3.6 |
| 201 | */ |
| 202 | virtual bool operator==(const StringEnumeration& that)const; |
| 203 | /** |
| 204 | * Compares this enumeration to other to check if both are not equal |
| 205 | * |
| 206 | * @param that The other string enumeration to compare this object to |
| 207 | * @return true if the enumerations are not equal. false if they are equal. |
| 208 | * @stable ICU 3.6 |
| 209 | */ |
| 210 | virtual bool operator!=(const StringEnumeration& that)const; |
| 211 | |
| 212 | protected: |
| 213 | /** |
| 214 | * UnicodeString field for use with default implementations and subclasses. |
| 215 | * @stable ICU 2.8 |
| 216 | */ |
| 217 | UnicodeString unistr; |
| 218 | /** |
| 219 | * char * default buffer for use with default implementations and subclasses. |
| 220 | * @stable ICU 2.8 |
| 221 | */ |
| 222 | char charsBuffer[32]; |
| 223 | /** |
| 224 | * char * buffer for use with default implementations and subclasses. |
| 225 | * Allocated in constructor and in ensureCharsCapacity(). |
| 226 | * @stable ICU 2.8 |
| 227 | */ |
| 228 | char *chars; |
| 229 | /** |
| 230 | * Capacity of chars, for use with default implementations and subclasses. |
| 231 | * @stable ICU 2.8 |
| 232 | */ |
| 233 | int32_t charsCapacity; |
| 234 | |
| 235 | /** |
| 236 | * Default constructor for use with default implementations and subclasses. |
| 237 | * @stable ICU 2.8 |
| 238 | */ |
| 239 | StringEnumeration(); |
| 240 | |
| 241 | /** |
| 242 | * Ensures that chars is at least as large as the requested capacity. |
| 243 | * For use with default implementations and subclasses. |
| 244 | * |
| 245 | * @param capacity Requested capacity. |
| 246 | * @param status ICU in/out error code. |
| 247 | * @stable ICU 2.8 |
| 248 | */ |
| 249 | void ensureCharsCapacity(int32_t capacity, UErrorCode &status); |
| 250 | |
| 251 | /** |
| 252 | * Converts s to Unicode and sets unistr to the result. |
| 253 | * For use with default implementations and subclasses, |
| 254 | * especially for implementations of snext() in terms of next(). |
| 255 | * This is provided with a helper function instead of a default implementation |
| 256 | * of snext() to avoid potential infinite loops between next() and snext(). |
| 257 | * |
| 258 | * For example: |
| 259 | * \code |
| 260 | * const UnicodeString* snext(UErrorCode& status) { |
| 261 | * int32_t resultLength=0; |
| 262 | * const char *s=next(&resultLength, status); |
| 263 | * return setChars(s, resultLength, status); |
| 264 | * } |
| 265 | * \endcode |
| 266 | * |
| 267 | * @param s String to be converted to Unicode. |
| 268 | * @param length Length of the string. |
| 269 | * @param status ICU in/out error code. |
| 270 | * @return A pointer to unistr. |
| 271 | * @stable ICU 2.8 |
| 272 | */ |
| 273 | UnicodeString *setChars(const char *s, int32_t length, UErrorCode &status); |
| 274 | }; |
| 275 | |
| 276 | U_NAMESPACE_END |
| 277 | |
| 278 | #endif /* U_SHOW_CPLUSPLUS_API */ |
| 279 | |
| 280 | /* STRENUM_H */ |
| 281 | #endif |
| 282 | |