2020-08-11 09:10:23 +00:00
|
|
|
// © 2016 and later: Unicode, Inc. and others.
|
|
|
|
// License & terms of use: http://www.unicode.org/copyright.html
|
|
|
|
/*
|
|
|
|
**********************************************************************
|
|
|
|
* Copyright (c) 2002-2006, International Business Machines
|
|
|
|
* Corporation and others. All Rights Reserved.
|
|
|
|
**********************************************************************
|
|
|
|
*/
|
|
|
|
#include "unicode/usetiter.h"
|
|
|
|
#include "unicode/uniset.h"
|
|
|
|
#include "unicode/unistr.h"
|
|
|
|
#include "uvector.h"
|
|
|
|
|
|
|
|
U_NAMESPACE_BEGIN
|
|
|
|
|
|
|
|
UOBJECT_DEFINE_RTTI_IMPLEMENTATION(UnicodeSetIterator)
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Create an iterator
|
|
|
|
* @param set set to iterate over
|
|
|
|
*/
|
|
|
|
UnicodeSetIterator::UnicodeSetIterator(const UnicodeSet& uSet) {
|
2023-05-23 00:05:01 +00:00
|
|
|
cpString = nullptr;
|
2020-08-11 09:10:23 +00:00
|
|
|
reset(uSet);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Create an iterator. Convenience for when the contents are to be set later.
|
|
|
|
*/
|
|
|
|
UnicodeSetIterator::UnicodeSetIterator() {
|
2023-05-23 00:05:01 +00:00
|
|
|
this->set = nullptr;
|
|
|
|
cpString = nullptr;
|
2020-08-11 09:10:23 +00:00
|
|
|
reset();
|
|
|
|
}
|
|
|
|
|
|
|
|
UnicodeSetIterator::~UnicodeSetIterator() {
|
|
|
|
delete cpString;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Returns the next element in the set.
|
|
|
|
* @return true if there was another element in the set.
|
|
|
|
* if so, if codepoint == IS_STRING, the value is a string in the string field
|
|
|
|
* else the value is a single code point in the codepoint field.
|
|
|
|
* <br>You are guaranteed that the codepoints are in sorted order, and the strings are in sorted order,
|
|
|
|
* and that all code points are returned before any strings are returned.
|
|
|
|
* <br>Note also that the codepointEnd is undefined after calling this method.
|
|
|
|
*/
|
|
|
|
UBool UnicodeSetIterator::next() {
|
|
|
|
if (nextElement <= endElement) {
|
|
|
|
codepoint = codepointEnd = nextElement++;
|
2023-05-23 00:05:01 +00:00
|
|
|
string = nullptr;
|
2022-10-28 06:11:55 +00:00
|
|
|
return true;
|
2020-08-11 09:10:23 +00:00
|
|
|
}
|
|
|
|
if (range < endRange) {
|
|
|
|
loadRange(++range);
|
|
|
|
codepoint = codepointEnd = nextElement++;
|
2023-05-23 00:05:01 +00:00
|
|
|
string = nullptr;
|
2022-10-28 06:11:55 +00:00
|
|
|
return true;
|
2020-08-11 09:10:23 +00:00
|
|
|
}
|
|
|
|
|
2022-10-28 06:11:55 +00:00
|
|
|
if (nextString >= stringCount) return false;
|
2020-08-11 09:10:23 +00:00
|
|
|
codepoint = (UChar32)IS_STRING; // signal that value is actually a string
|
|
|
|
string = (const UnicodeString*) set->strings->elementAt(nextString++);
|
2022-10-28 06:11:55 +00:00
|
|
|
return true;
|
2020-08-11 09:10:23 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* @return true if there was another element in the set.
|
|
|
|
* if so, if codepoint == IS_STRING, the value is a string in the string field
|
|
|
|
* else the value is a range of codepoints in the <codepoint, codepointEnd> fields.
|
|
|
|
* <br>Note that the codepoints are in sorted order, and the strings are in sorted order,
|
|
|
|
* and that all code points are returned before any strings are returned.
|
|
|
|
* <br>You are guaranteed that the ranges are in sorted order, and the strings are in sorted order,
|
|
|
|
* and that all ranges are returned before any strings are returned.
|
|
|
|
* <br>You are also guaranteed that ranges are disjoint and non-contiguous.
|
|
|
|
* <br>Note also that the codepointEnd is undefined after calling this method.
|
|
|
|
*/
|
|
|
|
UBool UnicodeSetIterator::nextRange() {
|
2023-05-23 00:05:01 +00:00
|
|
|
string = nullptr;
|
2020-08-11 09:10:23 +00:00
|
|
|
if (nextElement <= endElement) {
|
|
|
|
codepointEnd = endElement;
|
|
|
|
codepoint = nextElement;
|
|
|
|
nextElement = endElement+1;
|
2022-10-28 06:11:55 +00:00
|
|
|
return true;
|
2020-08-11 09:10:23 +00:00
|
|
|
}
|
|
|
|
if (range < endRange) {
|
|
|
|
loadRange(++range);
|
|
|
|
codepointEnd = endElement;
|
|
|
|
codepoint = nextElement;
|
|
|
|
nextElement = endElement+1;
|
2022-10-28 06:11:55 +00:00
|
|
|
return true;
|
2020-08-11 09:10:23 +00:00
|
|
|
}
|
|
|
|
|
2022-10-28 06:11:55 +00:00
|
|
|
if (nextString >= stringCount) return false;
|
2020-08-11 09:10:23 +00:00
|
|
|
codepoint = (UChar32)IS_STRING; // signal that value is actually a string
|
|
|
|
string = (const UnicodeString*) set->strings->elementAt(nextString++);
|
2022-10-28 06:11:55 +00:00
|
|
|
return true;
|
2020-08-11 09:10:23 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
*@param set the set to iterate over. This allows reuse of the iterator.
|
|
|
|
*/
|
|
|
|
void UnicodeSetIterator::reset(const UnicodeSet& uSet) {
|
|
|
|
this->set = &uSet;
|
|
|
|
reset();
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Resets to the start, to allow the iteration to start over again.
|
|
|
|
*/
|
|
|
|
void UnicodeSetIterator::reset() {
|
2023-05-23 00:05:01 +00:00
|
|
|
if (set == nullptr) {
|
2020-08-11 09:10:23 +00:00
|
|
|
// Set up indices to empty iteration
|
|
|
|
endRange = -1;
|
|
|
|
stringCount = 0;
|
|
|
|
} else {
|
|
|
|
endRange = set->getRangeCount() - 1;
|
|
|
|
stringCount = set->stringsSize();
|
|
|
|
}
|
|
|
|
range = 0;
|
|
|
|
endElement = -1;
|
|
|
|
nextElement = 0;
|
|
|
|
if (endRange >= 0) {
|
|
|
|
loadRange(range);
|
|
|
|
}
|
|
|
|
nextString = 0;
|
2023-05-23 00:05:01 +00:00
|
|
|
string = nullptr;
|
2020-08-11 09:10:23 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void UnicodeSetIterator::loadRange(int32_t iRange) {
|
|
|
|
nextElement = set->getRangeStart(iRange);
|
|
|
|
endElement = set->getRangeEnd(iRange);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
const UnicodeString& UnicodeSetIterator::getString() {
|
2023-05-23 00:05:01 +00:00
|
|
|
if (string==nullptr && codepoint!=(UChar32)IS_STRING) {
|
|
|
|
if (cpString == nullptr) {
|
2020-08-11 09:10:23 +00:00
|
|
|
cpString = new UnicodeString();
|
|
|
|
}
|
2023-05-23 00:05:01 +00:00
|
|
|
if (cpString != nullptr) {
|
2020-08-11 09:10:23 +00:00
|
|
|
cpString->setTo((UChar32)codepoint);
|
|
|
|
}
|
|
|
|
string = cpString;
|
|
|
|
}
|
|
|
|
return *string;
|
|
|
|
}
|
|
|
|
|
|
|
|
U_NAMESPACE_END
|
|
|
|
|
|
|
|
//eof
|