1 // Copyright (C) 2016 and later: Unicode, Inc. and others. 2 // License & terms of use: http://www.unicode.org/copyright.html 3 /* 4 ********************************************************************** 5 * Copyright (c) 2002-2006, International Business Machines 6 * Corporation and others. All Rights Reserved. 7 ********************************************************************** 8 */ 9 #include "unicode/usetiter.h" 10 #include "unicode/uniset.h" 11 #include "unicode/unistr.h" 12 #include "uvector.h" 13 14 U_NAMESPACE_BEGIN 15 16 UOBJECT_DEFINE_RTTI_IMPLEMENTATION(UnicodeSetIterator) 17 18 /** 19 * Create an iterator 20 * @param set set to iterate over 21 */ 22 UnicodeSetIterator::UnicodeSetIterator(const UnicodeSet& uSet) { 23 cpString = NULL; 24 reset(uSet); 25 } 26 27 /** 28 * Create an iterator. Convenience for when the contents are to be set later. 29 */ 30 UnicodeSetIterator::UnicodeSetIterator() { 31 this->set = NULL; 32 cpString = NULL; 33 reset(); 34 } 35 36 UnicodeSetIterator::~UnicodeSetIterator() { 37 delete cpString; 38 } 39 40 /** 41 * Returns the next element in the set. 42 * @return true if there was another element in the set. 43 * if so, if codepoint == IS_STRING, the value is a string in the string field 44 * else the value is a single code point in the codepoint field. 45 * <br>You are guaranteed that the codepoints are in sorted order, and the strings are in sorted order, 46 * and that all code points are returned before any strings are returned. 47 * <br>Note also that the codepointEnd is undefined after calling this method. 48 */ 49 UBool UnicodeSetIterator::next() { 50 if (nextElement <= endElement) { 51 codepoint = codepointEnd = nextElement++; 52 string = NULL; 53 return TRUE; 54 } 55 if (range < endRange) { 56 loadRange(++range); 57 codepoint = codepointEnd = nextElement++; 58 string = NULL; 59 return TRUE; 60 } 61 62 if (nextString >= stringCount) return FALSE; 63 codepoint = (UChar32)IS_STRING; // signal that value is actually a string 64 string = (const UnicodeString*) set->strings->elementAt(nextString++); 65 return TRUE; 66 } 67 68 /** 69 * @return true if there was another element in the set. 70 * if so, if codepoint == IS_STRING, the value is a string in the string field 71 * else the value is a range of codepoints in the <codepoint, codepointEnd> fields. 72 * <br>Note that the codepoints are in sorted order, and the strings are in sorted order, 73 * and that all code points are returned before any strings are returned. 74 * <br>You are guaranteed that the ranges are in sorted order, and the strings are in sorted order, 75 * and that all ranges are returned before any strings are returned. 76 * <br>You are also guaranteed that ranges are disjoint and non-contiguous. 77 * <br>Note also that the codepointEnd is undefined after calling this method. 78 */ 79 UBool UnicodeSetIterator::nextRange() { 80 string = NULL; 81 if (nextElement <= endElement) { 82 codepointEnd = endElement; 83 codepoint = nextElement; 84 nextElement = endElement+1; 85 return TRUE; 86 } 87 if (range < endRange) { 88 loadRange(++range); 89 codepointEnd = endElement; 90 codepoint = nextElement; 91 nextElement = endElement+1; 92 return TRUE; 93 } 94 95 if (nextString >= stringCount) return FALSE; 96 codepoint = (UChar32)IS_STRING; // signal that value is actually a string 97 string = (const UnicodeString*) set->strings->elementAt(nextString++); 98 return TRUE; 99 } 100 101 /** 102 *@param set the set to iterate over. This allows reuse of the iterator. 103 */ 104 void UnicodeSetIterator::reset(const UnicodeSet& uSet) { 105 this->set = &uSet; 106 reset(); 107 } 108 109 /** 110 * Resets to the start, to allow the iteration to start over again. 111 */ 112 void UnicodeSetIterator::reset() { 113 if (set == NULL) { 114 // Set up indices to empty iteration 115 endRange = -1; 116 stringCount = 0; 117 } else { 118 endRange = set->getRangeCount() - 1; 119 stringCount = set->strings->size(); 120 } 121 range = 0; 122 endElement = -1; 123 nextElement = 0; 124 if (endRange >= 0) { 125 loadRange(range); 126 } 127 nextString = 0; 128 string = NULL; 129 } 130 131 void UnicodeSetIterator::loadRange(int32_t iRange) { 132 nextElement = set->getRangeStart(iRange); 133 endElement = set->getRangeEnd(iRange); 134 } 135 136 137 const UnicodeString& UnicodeSetIterator::getString() { 138 if (string==NULL && codepoint!=(UChar32)IS_STRING) { 139 if (cpString == NULL) { 140 cpString = new UnicodeString(); 141 } 142 if (cpString != NULL) { 143 cpString->setTo((UChar32)codepoint); 144 } 145 string = cpString; 146 } 147 return *string; 148 } 149 150 U_NAMESPACE_END 151 152 //eof 153