1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 **********************************************************************
5 * Copyright (c) 2002-2006, International Business Machines
6 * Corporation and others.  All Rights Reserved.
7 **********************************************************************
8 */
9 #include "unicode/usetiter.h"
10 #include "unicode/uniset.h"
11 #include "unicode/unistr.h"
12 #include "uvector.h"
13 
14 U_NAMESPACE_BEGIN
15 
// Emits the ICU run-time type identification support for UnicodeSetIterator
// (presumably the class-ID functions declared in the class header -- confirm
// against unicode/uobject.h).
UOBJECT_DEFINE_RTTI_IMPLEMENTATION(UnicodeSetIterator)
17 
18 /**
19  * Create an iterator
20  * @param set set to iterate over
21  */
22 UnicodeSetIterator::UnicodeSetIterator(const UnicodeSet& uSet) {
23     cpString  = NULL;
24     reset(uSet);
25 }
26 
27 /**
28  * Create an iterator. Convenience for when the contents are to be set later.
29  */
UnicodeSetIterator()30 UnicodeSetIterator::UnicodeSetIterator() {
31     this->set = NULL;
32     cpString  = NULL;
33     reset();
34 }
35 
~UnicodeSetIterator()36 UnicodeSetIterator::~UnicodeSetIterator() {
37     delete cpString;
38 }
39 
40 /**
41  * Returns the next element in the set.
42  * @return true if there was another element in the set.
43  * if so, if codepoint == IS_STRING, the value is a string in the string field
44  * else the value is a single code point in the codepoint field.
45  * <br>You are guaranteed that the codepoints are in sorted order, and the strings are in sorted order,
46  * and that all code points are returned before any strings are returned.
47  * <br>Note also that the codepointEnd is undefined after calling this method.
48  */
next()49 UBool UnicodeSetIterator::next() {
50     if (nextElement <= endElement) {
51         codepoint = codepointEnd = nextElement++;
52         string = NULL;
53         return TRUE;
54     }
55     if (range < endRange) {
56         loadRange(++range);
57         codepoint = codepointEnd = nextElement++;
58         string = NULL;
59         return TRUE;
60     }
61 
62     if (nextString >= stringCount) return FALSE;
63     codepoint = (UChar32)IS_STRING; // signal that value is actually a string
64     string = (const UnicodeString*) set->strings->elementAt(nextString++);
65     return TRUE;
66 }
67 
68 /**
69  * @return true if there was another element in the set.
70  * if so, if codepoint == IS_STRING, the value is a string in the string field
71  * else the value is a range of codepoints in the <codepoint, codepointEnd> fields.
72  * <br>Note that the codepoints are in sorted order, and the strings are in sorted order,
73  * and that all code points are returned before any strings are returned.
74  * <br>You are guaranteed that the ranges are in sorted order, and the strings are in sorted order,
75  * and that all ranges are returned before any strings are returned.
76  * <br>You are also guaranteed that ranges are disjoint and non-contiguous.
77  * <br>Note also that the codepointEnd is undefined after calling this method.
78  */
nextRange()79 UBool UnicodeSetIterator::nextRange() {
80     string = NULL;
81     if (nextElement <= endElement) {
82         codepointEnd = endElement;
83         codepoint = nextElement;
84         nextElement = endElement+1;
85         return TRUE;
86     }
87     if (range < endRange) {
88         loadRange(++range);
89         codepointEnd = endElement;
90         codepoint = nextElement;
91         nextElement = endElement+1;
92         return TRUE;
93     }
94 
95     if (nextString >= stringCount) return FALSE;
96     codepoint = (UChar32)IS_STRING; // signal that value is actually a string
97     string = (const UnicodeString*) set->strings->elementAt(nextString++);
98     return TRUE;
99 }
100 
101 /**
102  *@param set the set to iterate over. This allows reuse of the iterator.
103  */
reset(const UnicodeSet & uSet)104 void UnicodeSetIterator::reset(const UnicodeSet& uSet) {
105     this->set = &uSet;
106     reset();
107 }
108 
109 /**
110  * Resets to the start, to allow the iteration to start over again.
111  */
reset()112 void UnicodeSetIterator::reset() {
113     if (set == NULL) {
114         // Set up indices to empty iteration
115         endRange = -1;
116         stringCount = 0;
117     } else {
118         endRange = set->getRangeCount() - 1;
119         stringCount = set->stringsSize();
120     }
121     range = 0;
122     endElement = -1;
123     nextElement = 0;
124     if (endRange >= 0) {
125         loadRange(range);
126     }
127     nextString = 0;
128     string = NULL;
129 }
130 
loadRange(int32_t iRange)131 void UnicodeSetIterator::loadRange(int32_t iRange) {
132     nextElement = set->getRangeStart(iRange);
133     endElement = set->getRangeEnd(iRange);
134 }
135 
136 
getString()137 const UnicodeString& UnicodeSetIterator::getString()  {
138     if (string==NULL && codepoint!=(UChar32)IS_STRING) {
139        if (cpString == NULL) {
140           cpString = new UnicodeString();
141        }
142        if (cpString != NULL) {
143           cpString->setTo((UChar32)codepoint);
144        }
145        string = cpString;
146     }
147     return *string;
148 }
149 
150 U_NAMESPACE_END
151 
152 //eof
153