// Copyright (C) 2016 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
/*
**********************************************************************
* Copyright (c) 2002-2006, International Business Machines
* Corporation and others. All Rights Reserved.
**********************************************************************
*/
#include "unicode/usetiter.h"
#include "unicode/uniset.h"
#include "unicode/unistr.h"
#include "uvector.h"
U_NAMESPACE_BEGIN
UOBJECT_DEFINE_RTTI_IMPLEMENTATION(UnicodeSetIterator)
/**
* Create an iterator
* @param set set to iterate over
*/
UnicodeSetIterator::UnicodeSetIterator(const UnicodeSet& uSet) {
cpString = NULL;
reset(uSet);
}
/**
* Create an iterator. Convenience for when the contents are to be set later.
*/
UnicodeSetIterator::UnicodeSetIterator() {
this->set = NULL;
cpString = NULL;
reset();
}
UnicodeSetIterator::~UnicodeSetIterator() {
delete cpString;
}
/**
* Returns the next element in the set.
* @return true if there was another element in the set.
* if so, if codepoint == IS_STRING, the value is a string in the string field
* else the value is a single code point in the codepoint field.
*
You are guaranteed that the codepoints are in sorted order, and the strings are in sorted order,
* and that all code points are returned before any strings are returned.
*
Note also that the codepointEnd is undefined after calling this method.
*/
UBool UnicodeSetIterator::next() {
if (nextElement <= endElement) {
codepoint = codepointEnd = nextElement++;
string = NULL;
return TRUE;
}
if (range < endRange) {
loadRange(++range);
codepoint = codepointEnd = nextElement++;
string = NULL;
return TRUE;
}
if (nextString >= stringCount) return FALSE;
codepoint = (UChar32)IS_STRING; // signal that value is actually a string
string = (const UnicodeString*) set->strings->elementAt(nextString++);
return TRUE;
}
/**
* @return true if there was another element in the set.
* if so, if codepoint == IS_STRING, the value is a string in the string field
* else the value is a range of codepoints in the fields.
*
Note that the codepoints are in sorted order, and the strings are in sorted order,
* and that all code points are returned before any strings are returned.
*
You are guaranteed that the ranges are in sorted order, and the strings are in sorted order,
* and that all ranges are returned before any strings are returned.
*
You are also guaranteed that ranges are disjoint and non-contiguous.
*
Note also that the codepointEnd is undefined after calling this method.
*/
UBool UnicodeSetIterator::nextRange() {
string = NULL;
if (nextElement <= endElement) {
codepointEnd = endElement;
codepoint = nextElement;
nextElement = endElement+1;
return TRUE;
}
if (range < endRange) {
loadRange(++range);
codepointEnd = endElement;
codepoint = nextElement;
nextElement = endElement+1;
return TRUE;
}
if (nextString >= stringCount) return FALSE;
codepoint = (UChar32)IS_STRING; // signal that value is actually a string
string = (const UnicodeString*) set->strings->elementAt(nextString++);
return TRUE;
}
/**
*@param set the set to iterate over. This allows reuse of the iterator.
*/
void UnicodeSetIterator::reset(const UnicodeSet& uSet) {
this->set = &uSet;
reset();
}
/**
* Resets to the start, to allow the iteration to start over again.
*/
void UnicodeSetIterator::reset() {
if (set == NULL) {
// Set up indices to empty iteration
endRange = -1;
stringCount = 0;
} else {
endRange = set->getRangeCount() - 1;
stringCount = set->strings->size();
}
range = 0;
endElement = -1;
nextElement = 0;
if (endRange >= 0) {
loadRange(range);
}
nextString = 0;
string = NULL;
}
void UnicodeSetIterator::loadRange(int32_t iRange) {
nextElement = set->getRangeStart(iRange);
endElement = set->getRangeEnd(iRange);
}
const UnicodeString& UnicodeSetIterator::getString() {
if (string==NULL && codepoint!=(UChar32)IS_STRING) {
if (cpString == NULL) {
cpString = new UnicodeString();
}
if (cpString != NULL) {
cpString->setTo((UChar32)codepoint);
}
string = cpString;
}
return *string;
}
U_NAMESPACE_END
//eof