| 1 | // © 2016 and later: Unicode, Inc. and others. | 
|---|
| 2 | // License & terms of use: http://www.unicode.org/copyright.html | 
|---|
| 3 | /* | 
|---|
| 4 | ********************************************************************** | 
|---|
| 5 | * Copyright (c) 2002-2006, International Business Machines | 
|---|
| 6 | * Corporation and others.  All Rights Reserved. | 
|---|
| 7 | ********************************************************************** | 
|---|
| 8 | */ | 
|---|
| 9 | #include "unicode/usetiter.h" | 
|---|
| 10 | #include "unicode/uniset.h" | 
|---|
| 11 | #include "unicode/unistr.h" | 
|---|
| 12 | #include "uvector.h" | 
|---|
| 13 |  | 
|---|
| 14 | U_NAMESPACE_BEGIN | 
|---|
| 15 |  | 
|---|
| 16 | UOBJECT_DEFINE_RTTI_IMPLEMENTATION(UnicodeSetIterator) | 
|---|
| 17 |  | 
|---|
| 18 | /** | 
|---|
| 19 | * Create an iterator | 
|---|
| 20 | * @param set set to iterate over | 
|---|
| 21 | */ | 
|---|
| 22 | UnicodeSetIterator::UnicodeSetIterator(const UnicodeSet& uSet) { | 
|---|
| 23 | cpString  = NULL; | 
|---|
| 24 | reset(uSet); | 
|---|
| 25 | } | 
|---|
| 26 |  | 
|---|
| 27 | /** | 
|---|
| 28 | * Create an iterator. Convenience for when the contents are to be set later. | 
|---|
| 29 | */ | 
|---|
| 30 | UnicodeSetIterator::UnicodeSetIterator() { | 
|---|
| 31 | this->set = NULL; | 
|---|
| 32 | cpString  = NULL; | 
|---|
| 33 | reset(); | 
|---|
| 34 | } | 
|---|
| 35 |  | 
|---|
| 36 | UnicodeSetIterator::~UnicodeSetIterator() { | 
|---|
| 37 | delete cpString; | 
|---|
| 38 | } | 
|---|
| 39 |  | 
|---|
| 40 | /** | 
|---|
| 41 | * Returns the next element in the set. | 
|---|
| 42 | * @return true if there was another element in the set. | 
|---|
| 43 | * if so, if codepoint == IS_STRING, the value is a string in the string field | 
|---|
| 44 | * else the value is a single code point in the codepoint field. | 
|---|
| 45 | * <br>You are guaranteed that the codepoints are in sorted order, and the strings are in sorted order, | 
|---|
| 46 | * and that all code points are returned before any strings are returned. | 
|---|
| 47 | * <br>Note also that the codepointEnd is undefined after calling this method. | 
|---|
| 48 | */ | 
|---|
| 49 | UBool UnicodeSetIterator::next() { | 
|---|
| 50 | if (nextElement <= endElement) { | 
|---|
| 51 | codepoint = codepointEnd = nextElement++; | 
|---|
| 52 | string = NULL; | 
|---|
| 53 | return TRUE; | 
|---|
| 54 | } | 
|---|
| 55 | if (range < endRange) { | 
|---|
| 56 | loadRange(++range); | 
|---|
| 57 | codepoint = codepointEnd = nextElement++; | 
|---|
| 58 | string = NULL; | 
|---|
| 59 | return TRUE; | 
|---|
| 60 | } | 
|---|
| 61 |  | 
|---|
| 62 | if (nextString >= stringCount) return FALSE; | 
|---|
| 63 | codepoint = (UChar32)IS_STRING; // signal that value is actually a string | 
|---|
| 64 | string = (const UnicodeString*) set->strings->elementAt(nextString++); | 
|---|
| 65 | return TRUE; | 
|---|
| 66 | } | 
|---|
| 67 |  | 
|---|
| 68 | /** | 
|---|
| 69 | * @return true if there was another element in the set. | 
|---|
| 70 | * if so, if codepoint == IS_STRING, the value is a string in the string field | 
|---|
| 71 | * else the value is a range of codepoints in the <codepoint, codepointEnd> fields. | 
|---|
| 72 | * <br>Note that the codepoints are in sorted order, and the strings are in sorted order, | 
|---|
| 73 | * and that all code points are returned before any strings are returned. | 
|---|
| 74 | * <br>You are guaranteed that the ranges are in sorted order, and the strings are in sorted order, | 
|---|
| 75 | * and that all ranges are returned before any strings are returned. | 
|---|
| 76 | * <br>You are also guaranteed that ranges are disjoint and non-contiguous. | 
|---|
| 77 | * <br>Note also that the codepointEnd is undefined after calling this method. | 
|---|
| 78 | */ | 
|---|
| 79 | UBool UnicodeSetIterator::() { | 
|---|
| 80 | string = NULL; | 
|---|
| 81 | if (nextElement <= endElement) { | 
|---|
| 82 | codepointEnd = endElement; | 
|---|
| 83 | codepoint = nextElement; | 
|---|
| 84 | nextElement = endElement+1; | 
|---|
| 85 | return TRUE; | 
|---|
| 86 | } | 
|---|
| 87 | if (range < endRange) { | 
|---|
| 88 | loadRange(++range); | 
|---|
| 89 | codepointEnd = endElement; | 
|---|
| 90 | codepoint = nextElement; | 
|---|
| 91 | nextElement = endElement+1; | 
|---|
| 92 | return TRUE; | 
|---|
| 93 | } | 
|---|
| 94 |  | 
|---|
| 95 | if (nextString >= stringCount) return FALSE; | 
|---|
| 96 | codepoint = (UChar32)IS_STRING; // signal that value is actually a string | 
|---|
| 97 | string = (const UnicodeString*) set->strings->elementAt(nextString++); | 
|---|
| 98 | return TRUE; | 
|---|
| 99 | } | 
|---|
| 100 |  | 
|---|
| 101 | /** | 
|---|
| 102 | *@param set the set to iterate over. This allows reuse of the iterator. | 
|---|
| 103 | */ | 
|---|
| 104 | void UnicodeSetIterator::reset(const UnicodeSet& uSet) { | 
|---|
| 105 | this->set = &uSet; | 
|---|
| 106 | reset(); | 
|---|
| 107 | } | 
|---|
| 108 |  | 
|---|
| 109 | /** | 
|---|
| 110 | * Resets to the start, to allow the iteration to start over again. | 
|---|
| 111 | */ | 
|---|
| 112 | void UnicodeSetIterator::reset() { | 
|---|
| 113 | if (set == NULL) { | 
|---|
| 114 | // Set up indices to empty iteration | 
|---|
| 115 | endRange = -1; | 
|---|
| 116 | stringCount = 0; | 
|---|
| 117 | } else { | 
|---|
| 118 | endRange = set->getRangeCount() - 1; | 
|---|
| 119 | stringCount = set->stringsSize(); | 
|---|
| 120 | } | 
|---|
| 121 | range = 0; | 
|---|
| 122 | endElement = -1; | 
|---|
| 123 | nextElement = 0; | 
|---|
| 124 | if (endRange >= 0) { | 
|---|
| 125 | loadRange(range); | 
|---|
| 126 | } | 
|---|
| 127 | nextString = 0; | 
|---|
| 128 | string = NULL; | 
|---|
| 129 | } | 
|---|
| 130 |  | 
|---|
| 131 | void UnicodeSetIterator::loadRange(int32_t iRange) { | 
|---|
| 132 | nextElement = set->getRangeStart(iRange); | 
|---|
| 133 | endElement = set->getRangeEnd(iRange); | 
|---|
| 134 | } | 
|---|
| 135 |  | 
|---|
| 136 |  | 
|---|
| 137 | const UnicodeString& UnicodeSetIterator::getString()  { | 
|---|
| 138 | if (string==NULL && codepoint!=(UChar32)IS_STRING) { | 
|---|
| 139 | if (cpString == NULL) { | 
|---|
| 140 | cpString = new UnicodeString(); | 
|---|
| 141 | } | 
|---|
| 142 | if (cpString != NULL) { | 
|---|
| 143 | cpString->setTo((UChar32)codepoint); | 
|---|
| 144 | } | 
|---|
| 145 | string = cpString; | 
|---|
| 146 | } | 
|---|
| 147 | return *string; | 
|---|
| 148 | } | 
|---|
| 149 |  | 
|---|
| 150 | U_NAMESPACE_END | 
|---|
| 151 |  | 
|---|
| 152 | //eof | 
|---|
| 153 |  | 
|---|