1// © 2016 and later: Unicode, Inc. and others.
2// License & terms of use: http://www.unicode.org/copyright.html
3/*
4**********************************************************************
5* Copyright (c) 2002-2006, International Business Machines
6* Corporation and others. All Rights Reserved.
7**********************************************************************
8*/
9#include "unicode/usetiter.h"
10#include "unicode/uniset.h"
11#include "unicode/unistr.h"
12#include "uvector.h"
13
14U_NAMESPACE_BEGIN
15
16UOBJECT_DEFINE_RTTI_IMPLEMENTATION(UnicodeSetIterator)
17
18/**
19 * Create an iterator
20 * @param set set to iterate over
21 */
22UnicodeSetIterator::UnicodeSetIterator(const UnicodeSet& uSet) {
23 cpString = NULL;
24 reset(uSet);
25}
26
27/**
28 * Create an iterator. Convenience for when the contents are to be set later.
29 */
30UnicodeSetIterator::UnicodeSetIterator() {
31 this->set = NULL;
32 cpString = NULL;
33 reset();
34}
35
36UnicodeSetIterator::~UnicodeSetIterator() {
37 delete cpString;
38}
39
40/**
41 * Returns the next element in the set.
42 * @return true if there was another element in the set.
43 * if so, if codepoint == IS_STRING, the value is a string in the string field
44 * else the value is a single code point in the codepoint field.
45 * <br>You are guaranteed that the codepoints are in sorted order, and the strings are in sorted order,
46 * and that all code points are returned before any strings are returned.
47 * <br>Note also that the codepointEnd is undefined after calling this method.
48 */
49UBool UnicodeSetIterator::next() {
50 if (nextElement <= endElement) {
51 codepoint = codepointEnd = nextElement++;
52 string = NULL;
53 return TRUE;
54 }
55 if (range < endRange) {
56 loadRange(++range);
57 codepoint = codepointEnd = nextElement++;
58 string = NULL;
59 return TRUE;
60 }
61
62 if (nextString >= stringCount) return FALSE;
63 codepoint = (UChar32)IS_STRING; // signal that value is actually a string
64 string = (const UnicodeString*) set->strings->elementAt(nextString++);
65 return TRUE;
66}
67
68/**
69 * @return true if there was another element in the set.
70 * if so, if codepoint == IS_STRING, the value is a string in the string field
71 * else the value is a range of codepoints in the <codepoint, codepointEnd> fields.
72 * <br>Note that the codepoints are in sorted order, and the strings are in sorted order,
73 * and that all code points are returned before any strings are returned.
74 * <br>You are guaranteed that the ranges are in sorted order, and the strings are in sorted order,
75 * and that all ranges are returned before any strings are returned.
76 * <br>You are also guaranteed that ranges are disjoint and non-contiguous.
77 * <br>Note also that the codepointEnd is undefined after calling this method.
78 */
79UBool UnicodeSetIterator::nextRange() {
80 string = NULL;
81 if (nextElement <= endElement) {
82 codepointEnd = endElement;
83 codepoint = nextElement;
84 nextElement = endElement+1;
85 return TRUE;
86 }
87 if (range < endRange) {
88 loadRange(++range);
89 codepointEnd = endElement;
90 codepoint = nextElement;
91 nextElement = endElement+1;
92 return TRUE;
93 }
94
95 if (nextString >= stringCount) return FALSE;
96 codepoint = (UChar32)IS_STRING; // signal that value is actually a string
97 string = (const UnicodeString*) set->strings->elementAt(nextString++);
98 return TRUE;
99}
100
101/**
102 *@param set the set to iterate over. This allows reuse of the iterator.
103 */
104void UnicodeSetIterator::reset(const UnicodeSet& uSet) {
105 this->set = &uSet;
106 reset();
107}
108
109/**
110 * Resets to the start, to allow the iteration to start over again.
111 */
112void UnicodeSetIterator::reset() {
113 if (set == NULL) {
114 // Set up indices to empty iteration
115 endRange = -1;
116 stringCount = 0;
117 } else {
118 endRange = set->getRangeCount() - 1;
119 stringCount = set->stringsSize();
120 }
121 range = 0;
122 endElement = -1;
123 nextElement = 0;
124 if (endRange >= 0) {
125 loadRange(range);
126 }
127 nextString = 0;
128 string = NULL;
129}
130
131void UnicodeSetIterator::loadRange(int32_t iRange) {
132 nextElement = set->getRangeStart(iRange);
133 endElement = set->getRangeEnd(iRange);
134}
135
136
137const UnicodeString& UnicodeSetIterator::getString() {
138 if (string==NULL && codepoint!=(UChar32)IS_STRING) {
139 if (cpString == NULL) {
140 cpString = new UnicodeString();
141 }
142 if (cpString != NULL) {
143 cpString->setTo((UChar32)codepoint);
144 }
145 string = cpString;
146 }
147 return *string;
148}
149
150U_NAMESPACE_END
151
152//eof
153