ICU-23004 CodeUnits.data() -> begin()/end()

This commit is contained in:
Markus Scherer 2025-03-14 15:12:35 -07:00
parent d2d17f2dc9
commit b4df027cef
2 changed files with 112 additions and 134 deletions

View file

@ -124,8 +124,8 @@ class UnsafeCodeUnits {
using Unit = typename std::iterator_traits<UnitIter>::value_type;
public:
// @internal
UnsafeCodeUnits(CP32 codePoint, uint8_t length, UnitIter data) :
c(codePoint), len(length), p(data) {}
UnsafeCodeUnits(CP32 codePoint, uint8_t length, UnitIter start, UnitIter limit) :
c_(codePoint), len_(length), start_(start), limit_(limit) {}
UnsafeCodeUnits(const UnsafeCodeUnits &other) = default;
UnsafeCodeUnits &operator=(const UnsafeCodeUnits &other) = default;
@ -137,20 +137,27 @@ public:
* UTFIllFormedBehavior template parameter.
* @draft ICU 78
*/
UChar32 codePoint() const { return c; }
UChar32 codePoint() const { return c_; }
/**
* @return the start of the minimal Unicode code unit sequence.
* Only enabled if UnitIter is a (multi-pass) forward_iterator or better.
* @draft ICU 78
*/
UnitIter data() const { return p; }
UnitIter begin() const { return start_; }
/**
* @return the limit (exclusive end) of the minimal Unicode code unit sequence.
* Only enabled if UnitIter is a (multi-pass) forward_iterator or better.
* @draft ICU 78
*/
UnitIter end() const { return limit_; }
/**
* @return the length of the minimal Unicode code unit sequence.
* @draft ICU 78
*/
uint8_t length() const { return len; }
uint8_t length() const { return len_; }
/**
* @return a string_view of the minimal Unicode code unit sequence.
@ -162,14 +169,15 @@ public:
std::is_pointer_v<Iter>,
std::basic_string_view<Unit>>
stringView() const {
return std::basic_string_view<Unit>(p, len);
return std::basic_string_view<Unit>(start_, len_);
}
private:
// Order of fields with padding and access frequency in mind.
CP32 c;
uint8_t len;
UnitIter p;
CP32 c_;
uint8_t len_;
UnitIter start_;
UnitIter limit_;
};
#ifndef U_IN_DOXYGEN
@ -185,19 +193,19 @@ class UnsafeCodeUnits<
typename std::iterator_traits<UnitIter>::iterator_category>>> {
public:
// @internal
UnsafeCodeUnits(CP32 codePoint, uint8_t length) : c(codePoint), len(length) {}
UnsafeCodeUnits(CP32 codePoint, uint8_t length) : c_(codePoint), len_(length) {}
UnsafeCodeUnits(const UnsafeCodeUnits &other) = default;
UnsafeCodeUnits &operator=(const UnsafeCodeUnits &other) = default;
UChar32 codePoint() const { return c; }
UChar32 codePoint() const { return c_; }
uint8_t length() const { return len; }
uint8_t length() const { return len_; }
private:
// Order of fields with padding and access frequency in mind.
CP32 c;
uint8_t len;
CP32 c_;
uint8_t len_;
};
#endif // U_IN_DOXYGEN
@ -219,16 +227,16 @@ template<typename CP32, typename UnitIter, typename = void>
class CodeUnits : public UnsafeCodeUnits<CP32, UnitIter> {
public:
// @internal
CodeUnits(CP32 codePoint, uint8_t length, bool wellFormed, UnitIter data) :
UnsafeCodeUnits<CP32, UnitIter>(codePoint, length, data), ok(wellFormed) {}
CodeUnits(CP32 codePoint, uint8_t length, bool wellFormed, UnitIter start, UnitIter limit) :
UnsafeCodeUnits<CP32, UnitIter>(codePoint, length, start, limit), ok_(wellFormed) {}
CodeUnits(const CodeUnits &other) = default;
CodeUnits &operator=(const CodeUnits &other) = default;
bool wellFormed() const { return ok; }
bool wellFormed() const { return ok_; }
private:
bool ok;
bool ok_;
};
#ifndef U_IN_DOXYGEN
@ -246,15 +254,15 @@ class CodeUnits<
public:
// @internal
CodeUnits(CP32 codePoint, uint8_t length, bool wellFormed) :
UnsafeCodeUnits<CP32, UnitIter>(codePoint, length), ok(wellFormed) {}
UnsafeCodeUnits<CP32, UnitIter>(codePoint, length), ok_(wellFormed) {}
CodeUnits(const CodeUnits &other) = default;
CodeUnits &operator=(const CodeUnits &other) = default;
bool wellFormed() const { return ok; }
bool wellFormed() const { return ok_; }
private:
bool ok;
bool ok_;
};
#endif // U_IN_DOXYGEN
@ -349,7 +357,7 @@ public:
CP32 c = uint8_t(*p);
++p;
if (U8_IS_SINGLE(c)) {
return {c, 1, true, p0};
return {c, 1, true, p0, p};
}
uint8_t length = 1;
uint8_t t = 0;
@ -373,9 +381,9 @@ public:
c = (c << 6) | t;
++length;
++p;
return {c, length, true, p0};
return {c, length, true, p0, p};
}
return {sub(), length, false, p0};
return {sub(), length, false, p0, p};
}
static inline CodeUnits<CP32, UnitIter> singlePassReadAndInc(
@ -415,9 +423,10 @@ public:
static inline CodeUnits<CP32, UnitIter> decAndRead(UnitIter start, UnitIter &p) {
// Very similar to U8_PREV_OR_FFFD().
UnitIter p0 = p;
CP32 c = uint8_t(*--p);
if (U8_IS_SINGLE(c)) {
return {c, 1, true, p};
return {c, 1, true, p, p0};
}
if (U8_IS_TRAIL(c) && p != start) {
UnitIter p1 = p;
@ -426,13 +435,13 @@ public:
if (b1 < 0xe0) {
p = p1;
c = ((b1 - 0xc0) << 6) | (c & 0x3f);
return {c, 2, true, p};
return {c, 2, true, p, p0};
} else if (b1 < 0xf0 ?
U8_IS_VALID_LEAD3_AND_T1(b1, c) :
U8_IS_VALID_LEAD4_AND_T1(b1, c)) {
// Truncated 3- or 4-byte sequence.
p = p1;
return {sub(), 2, false, p};
return {sub(), 2, false, p, p0};
}
} else if (U8_IS_TRAIL(b1) && p1 != start) {
// Extract the value bits from the last trail byte.
@ -444,12 +453,12 @@ public:
if (U8_IS_VALID_LEAD3_AND_T1(b2, b1)) {
p = p1;
c = (b2 << 12) | ((b1 & 0x3f) << 6) | c;
return {c, 3, true, p};
return {c, 3, true, p, p0};
}
} else if (U8_IS_VALID_LEAD4_AND_T1(b2, b1)) {
// Truncated 4-byte sequence.
p = p1;
return {sub(), 3, false, p};
return {sub(), 3, false, p, p0};
}
} else if (U8_IS_TRAIL(b2) && p1 != start) {
uint8_t b3 = *--p1;
@ -458,17 +467,13 @@ public:
if (U8_IS_VALID_LEAD4_AND_T1(b3, b2)) {
p = p1;
c = (b3 << 18) | ((b2 & 0x3f) << 12) | ((b1 & 0x3f) << 6) | c;
return {c, 4, true, p};
return {c, 4, true, p, p0};
}
}
}
}
}
return {sub(), 1, false, p};
}
static inline void moveToDecAndReadLimit(UnitIter &p, uint8_t n) {
std::advance(p, n);
return {sub(), 1, false, p, p0};
}
};
@ -513,15 +518,15 @@ public:
CP32 c = *p;
++p;
if (!U16_IS_SURROGATE(c)) {
return {c, 1, true, p0};
return {c, 1, true, p0, p};
} else {
uint16_t c2;
if (U16_IS_SURROGATE_LEAD(c) && p != limit && U16_IS_TRAIL(c2 = *p)) {
++p;
c = U16_GET_SUPPLEMENTARY(c, c2);
return {c, 2, true, p0};
return {c, 2, true, p0, p};
} else {
return {sub(c), 1, false, p0};
return {sub(c), 1, false, p0, p};
}
}
}
@ -547,29 +552,22 @@ public:
static inline CodeUnits<CP32, UnitIter> decAndRead(UnitIter start, UnitIter &p) {
// Very similar to U16_PREV_OR_FFFD().
UnitIter p0 = p;
CP32 c = *--p;
if (!U16_IS_SURROGATE(c)) {
return {c, 1, true, p};
return {c, 1, true, p, p0};
} else {
UnitIter p1;
uint16_t c2;
if (U16_IS_SURROGATE_TRAIL(c) && p != start && (p1 = p, U16_IS_LEAD(c2 = *--p1))) {
p = p1;
c = U16_GET_SUPPLEMENTARY(c2, c);
return {c, 2, true, p};
return {c, 2, true, p, p0};
} else {
return {sub(c), 1, false, p};
return {sub(c), 1, false, p, p0};
}
}
}
static inline void moveToDecAndReadLimit(UnitIter &p, uint8_t n) {
// n = 1 or 2 for UTF-16
++p;
if (n == 2) {
++p;
}
}
};
// UTF-32: trivial, but still validating
@ -604,9 +602,9 @@ public:
CP32 c = uc;
++p;
if (uc < 0xd800 || (0xe000 <= uc && uc <= 0x10ffff)) {
return {c, 1, true, p0};
return {c, 1, true, p0, p};
} else {
return {sub(uc < 0xe000, c), 1, false, p0};
return {sub(uc < 0xe000, c), 1, false, p0, p};
}
}
@ -623,18 +621,15 @@ public:
}
static inline CodeUnits<CP32, UnitIter> decAndRead(UnitIter /*start*/, UnitIter &p) {
UnitIter p0 = p;
uint32_t uc = *--p;
CP32 c = uc;
if (uc < 0xd800 || (0xe000 <= uc && uc <= 0x10ffff)) {
return {c, 1, true, p};
return {c, 1, true, p, p0};
} else {
return {sub(uc < 0xe000, c), 1, false, p};
return {sub(uc < 0xe000, c), 1, false, p, p0};
}
}
static inline void moveToDecAndReadLimit(UnitIter &p, uint8_t /*n*/) {
++p;
}
};
// Non-validating implementations ----------------------------------------- ***
@ -668,11 +663,11 @@ public:
CP32 c = uint8_t(*p);
++p;
if (U8_IS_SINGLE(c)) {
return {c, 1, p0};
return {c, 1, p0, p};
} else if (c < 0xe0) {
c = ((c & 0x1f) << 6) | (*p & 0x3f);
++p;
return {c, 2, p0};
return {c, 2, p0, p};
} else if (c < 0xf0) {
// No need for (c&0xf) because the upper bits are truncated
// after <<12 in the cast to uint16_t.
@ -680,7 +675,7 @@ public:
++p;
c |= *p & 0x3f;
++p;
return {c, 3, p0};
return {c, 3, p0, p};
} else {
c = ((c & 7) << 18) | ((*p & 0x3f) << 12);
++p;
@ -688,7 +683,7 @@ public:
++p;
c |= *p & 0x3f;
++p;
return {c, 4, p0};
return {c, 4, p0, p};
}
}
@ -723,9 +718,10 @@ public:
static inline UnsafeCodeUnits<CP32, UnitIter> decAndRead(UnitIter &p) {
// Very similar to U8_PREV_UNSAFE().
UnitIter p0 = p;
CP32 c = uint8_t(*--p);
if (U8_IS_SINGLE(c)) {
return {c, 1, p};
return {c, 1, p, p0};
}
// U8_IS_TRAIL(c) if well-formed
c &= 0x3f;
@ -743,11 +739,7 @@ public:
}
}
++count;
return {c, count, p};
}
static inline void moveToDecAndReadLimit(UnitIter &p, uint8_t n) {
std::advance(p, n);
return {c, count, p, p0};
}
};
@ -781,12 +773,12 @@ public:
CP32 c = *p;
++p;
if (!U16_IS_LEAD(c)) {
return {c, 1, p0};
return {c, 1, p0, p};
} else {
uint16_t c2 = *p;
++p;
c = U16_GET_SUPPLEMENTARY(c, c2);
return {c, 2, p0};
return {c, 2, p0, p};
}
}
@ -806,21 +798,14 @@ public:
static inline UnsafeCodeUnits<CP32, UnitIter> decAndRead(UnitIter &p) {
// Very similar to U16_PREV_UNSAFE().
UnitIter p0 = p;
CP32 c = *--p;
if (!U16_IS_TRAIL(c)) {
return {c, 1, p};
return {c, 1, p, p0};
} else {
uint16_t c2 = *--p;
c = U16_GET_SUPPLEMENTARY(c2, c);
return {c, 2, p};
}
}
static inline void moveToDecAndReadLimit(UnitIter &p, uint8_t n) {
// n = 1 or 2 for UTF-16
++p;
if (n == 2) {
++p;
return {c, 2, p, p0};
}
}
};
@ -845,7 +830,7 @@ public:
UnitIter p0 = p;
CP32 c = *p;
++p;
return {c, 1, p0};
return {c, 1, p0, p};
}
static inline UnsafeCodeUnits<CP32, UnitIter> singlePassReadAndInc(UnitIter &p) {
@ -855,12 +840,9 @@ public:
}
static inline UnsafeCodeUnits<CP32, UnitIter> decAndRead(UnitIter &p) {
UnitIter p0 = p;
CP32 c = *--p;
return {c, 1, p};
}
static inline void moveToDecAndReadLimit(UnitIter &p, uint8_t /*n*/) {
++p;
return {c, 1, p, p0};
}
};
@ -917,13 +899,13 @@ public:
// Only enabled if UnitIter is a (multi-pass) forward_iterator or better.
// TODO: Should we enable this only for a bidirectional_iterator?
inline UTFIterator(UnitIter start, UnitIter p, UnitIter limit) :
p_(p), start_(start), limit_(limit), units_(0, 0, false, p) {}
p_(p), start_(start), limit_(limit), units_(0, 0, false, p, p) {}
// Constructs an iterator with start=p.
inline UTFIterator(UnitIter p, UnitIter limit) :
p_(p), start_(p), limit_(limit), units_(0, 0, false, p) {}
p_(p), start_(p), limit_(limit), units_(0, 0, false, p, p) {}
// Constructs an iterator start or limit sentinel.
// Requires UnitIter to be copyable.
inline UTFIterator(UnitIter p) : p_(p), start_(p), limit_(p), units_(0, 0, false, p) {}
inline UTFIterator(UnitIter p) : p_(p), start_(p), limit_(p), units_(0, 0, false, p, p) {}
inline UTFIterator(UTFIterator &&src) noexcept = default;
inline UTFIterator &operator=(UTFIterator &&src) noexcept = default;
@ -965,7 +947,7 @@ public:
Impl::inc(p_, limit_);
} else /* state_ < 0 */ {
// operator--() called decAndRead() so we know how far to skip.
Impl::moveToDecAndReadLimit(p_, units_.length());
p_ = units_.end();
state_ = 0;
}
return *this;
@ -992,7 +974,7 @@ public:
} else /* state_ < 0 */ {
UTFIterator result(*this);
// operator--() called decAndRead() so we know how far to skip.
Impl::moveToDecAndReadLimit(p_, units_.length());
p_ = units_.end();
state_ = 0;
return result;
}
@ -1009,7 +991,7 @@ public:
operator--() { // pre-decrement
if (state_ > 0) {
// operator*() called readAndInc() so p_ is ahead of the logical position.
p_ = units_.data();
p_ = units_.begin();
}
units_ = Impl::decAndRead(start_, p_);
state_ = -1;
@ -1034,7 +1016,7 @@ private:
friend class std::reverse_iterator<UTFIterator<CP32, behavior, UnitIter>>;
inline UnitIter getLogicalPosition() const {
return state_ <= 0 ? p_ : units_.data();
return state_ <= 0 ? p_ : units_.begin();
}
// operator*() etc. are logically const.
@ -1188,7 +1170,7 @@ public:
inline reverse_iterator(U_HEADER_ONLY_NAMESPACE::UTFIterator<CP32, behavior, UnitIter> iter) :
p_(iter.getLogicalPosition()), start_(iter.start_), limit_(iter.limit_),
units_(0, 0, false, p_), unitsLimit_(p_) {}
units_(0, 0, false, p_, p_) {}
inline reverse_iterator(reverse_iterator &&src) noexcept = default;
inline reverse_iterator &operator=(reverse_iterator &&src) noexcept = default;
@ -1203,7 +1185,6 @@ public:
inline CodeUnits_ operator*() const {
if (state_ == 0) {
unitsLimit_ = p_;
units_ = Impl::decAndRead(start_, p_);
state_ = -1;
}
@ -1212,7 +1193,6 @@ public:
inline Proxy operator->() const {
if (state_ == 0) {
unitsLimit_ = p_;
units_ = Impl::decAndRead(start_, p_);
state_ = -1;
}
@ -1227,7 +1207,7 @@ public:
Impl::dec(start_, p_);
} else /* state_ > 0 */ {
// operator--() called readAndInc() so we know how far to skip.
p_ = units_.data();
p_ = units_.begin();
state_ = 0;
}
return *this;
@ -1240,7 +1220,6 @@ public:
state_ = 0;
return result;
} else if (state_ == 0) {
unitsLimit_ = p_;
units_ = Impl::decAndRead(start_, p_);
reverse_iterator result(*this);
result.state_ = -1;
@ -1249,7 +1228,7 @@ public:
} else /* state_ > 0 */ {
reverse_iterator result(*this);
// operator--() called readAndInc() so we know how far to skip.
p_ = units_.data();
p_ = units_.begin();
state_ = 0;
return result;
}
@ -1258,7 +1237,7 @@ public:
inline reverse_iterator &operator--() { // pre-decrement
if (state_ < 0) {
// operator*() called decAndRead() so p_ is behind the logical position.
p_ = unitsLimit_;
p_ = units_.end();
}
units_ = Impl::readAndInc(start_, p_);
state_ = 1;
@ -1273,7 +1252,7 @@ public:
private:
inline UnitIter getLogicalPosition() const {
return state_ >= 0 ? p_ : unitsLimit_;
return state_ >= 0 ? p_ : units_.end();
}
// operator*() etc. are logically const.
@ -1285,8 +1264,6 @@ private:
// Keep state so that we call decAndRead() only once for both operator*() and ++
// to make it easy for the compiler to optimize.
mutable CodeUnits_ units_;
// For fast getLogicalPosition() and operator==().
mutable UnitIter unitsLimit_;
// >0: units_ = readAndInc(), p_ = units limit
// 0: initial state
// <0: units_ = decAndRead(), p_ = units start
@ -1485,7 +1462,7 @@ public:
std::bidirectional_iterator_tag,
std::forward_iterator_tag>;
inline UnsafeUTFIterator(UnitIter p) : p_(p), units_(0, 0, p) {}
inline UnsafeUTFIterator(UnitIter p) : p_(p), units_(0, 0, p, p) {}
inline UnsafeUTFIterator(UnsafeUTFIterator &&src) noexcept = default;
inline UnsafeUTFIterator &operator=(UnsafeUTFIterator &&src) noexcept = default;
@ -1527,7 +1504,7 @@ public:
Impl::inc(p_);
} else /* state_ < 0 */ {
// operator--() called decAndRead() so we know how far to skip.
Impl::moveToDecAndReadLimit(p_, units_.length());
p_ = units_.end();
state_ = 0;
}
return *this;
@ -1554,7 +1531,7 @@ public:
} else /* state_ < 0 */ {
UnsafeUTFIterator result(*this);
// operator--() called decAndRead() so we know how far to skip.
Impl::moveToDecAndReadLimit(p_, units_.length());
p_ = units_.end();
state_ = 0;
return result;
}
@ -1571,7 +1548,7 @@ public:
operator--() { // pre-decrement
if (state_ > 0) {
// operator*() called readAndInc() so p_ is ahead of the logical position.
p_ = units_.data();
p_ = units_.begin();
}
units_ = Impl::decAndRead(p_);
state_ = -1;
@ -1596,7 +1573,7 @@ private:
friend class std::reverse_iterator<UnsafeUTFIterator<CP32, UnitIter>>;
inline UnitIter getLogicalPosition() const {
return state_ <= 0 ? p_ : units_.data();
return state_ <= 0 ? p_ : units_.begin();
}
// operator*() etc. are logically const.
@ -1737,7 +1714,7 @@ public:
using iterator_category = std::bidirectional_iterator_tag;
inline reverse_iterator(U_HEADER_ONLY_NAMESPACE::UnsafeUTFIterator<CP32, UnitIter> iter) :
p_(iter.getLogicalPosition()), units_(0, 0, p_), unitsLimit_(p_) {}
p_(iter.getLogicalPosition()), units_(0, 0, p_, p_) {}
inline reverse_iterator(reverse_iterator &&src) noexcept = default;
inline reverse_iterator &operator=(reverse_iterator &&src) noexcept = default;
@ -1752,7 +1729,6 @@ public:
inline UnsafeCodeUnits_ operator*() const {
if (state_ == 0) {
unitsLimit_ = p_;
units_ = Impl::decAndRead(p_);
state_ = -1;
}
@ -1761,7 +1737,6 @@ public:
inline Proxy operator->() const {
if (state_ == 0) {
unitsLimit_ = p_;
units_ = Impl::decAndRead(p_);
state_ = -1;
}
@ -1776,7 +1751,7 @@ public:
Impl::dec(p_);
} else /* state_ > 0 */ {
// operator--() called readAndInc() so we know how far to skip.
p_ = units_.data();
p_ = units_.begin();
state_ = 0;
}
return *this;
@ -1789,7 +1764,6 @@ public:
state_ = 0;
return result;
} else if (state_ == 0) {
unitsLimit_ = p_;
units_ = Impl::decAndRead(p_);
reverse_iterator result(*this);
result.state_ = -1;
@ -1798,7 +1772,7 @@ public:
} else /* state_ > 0 */ {
reverse_iterator result(*this);
// operator--() called readAndInc() so we know how far to skip.
p_ = units_.data();
p_ = units_.begin();
state_ = 0;
return result;
}
@ -1807,7 +1781,7 @@ public:
inline reverse_iterator &operator--() { // pre-decrement
if (state_ < 0) {
// operator*() called decAndRead() so p_ is behind the logical position.
p_ = unitsLimit_;
p_ = units_.end();
}
units_ = Impl::readAndInc(p_);
state_ = 1;
@ -1822,7 +1796,7 @@ public:
private:
inline UnitIter getLogicalPosition() const {
return state_ >= 0 ? p_ : unitsLimit_;
return state_ >= 0 ? p_ : units_.end();
}
// operator*() etc. are logically const.
@ -1830,8 +1804,6 @@ private:
// Keep state so that we call decAndRead() only once for both operator*() and ++
// to make it easy for the compiler to optimize.
mutable UnsafeCodeUnits_ units_;
// For fast getLogicalPosition() and operator==().
mutable UnitIter unitsLimit_;
// >0: units_ = readAndInc(), p_ = units limit
// 0: initial state
// <0: units_ = decAndRead(), p_ = units start

View file

@ -283,7 +283,7 @@ void U16IteratorTest::testNegative() {
auto sv = units.stringView();
assertEquals("iter[1] * stringView().length()", 1, sv.length());
assertEquals("iter[1] * stringView()[0]", 0xd900, sv[0]);
// TODO: test units.data()
// TODO: test units.begin()
++iter;
assertEquals("iter[2] * codePoint", u'b', (*iter++).codePoint()); // post-increment
units = *iter++; // post-increment
@ -359,7 +359,7 @@ void U16IteratorTest::testSinglePassIter() {
assertEquals("iter[1] * length", 1, units.length());
assertTrue("iter[1] * wellFormed", units.wellFormed());
// No units.stringView() when the unit iterator is not a pointer.
// No data() for a single-pass unit iterator.
// No begin() for a single-pass unit iterator.
++iter;
assertEquals("iter[2] * codePoint", u'ç', (*iter++).codePoint()); // post-increment
assertEquals("iter[3] -> codePoint", u'', iter->codePoint());
@ -395,7 +395,8 @@ void U16IteratorTest::testFwdIter() {
assertEquals("iter[1] * length", 1, units.length());
assertTrue("iter[1] * wellFormed", units.wellFormed());
// No units.stringView() when the unit iterator is not a pointer.
assertTrue("iter[1] * data()[0]", *units.data() == u'b');
assertTrue("iter[1] * begin()[0]", *units.begin() == u'b');
assertTrue("iter[1] * end()[0]", *units.end() == u'ç');
++iter;
assertEquals("iter[2] * codePoint", u'ç', (*iter++).codePoint()); // post-increment
assertEquals("iter[3] -> codePoint", u'', iter->codePoint());
@ -406,9 +407,10 @@ void U16IteratorTest::testFwdIter() {
assertEquals("iter[4] * codePoint", U'🚴', units.codePoint());
assertEquals("iter[4] * length", 2, units.length());
assertTrue("iter[4] * wellFormed", units.wellFormed());
FwdIter<char16_t> data = units.data();
assertTrue("iter[4] * data()[0]", *data++ == u"🚴"[0]);
assertTrue("iter[4] * data()[1]", *data == u"🚴"[1]);
FwdIter<char16_t> data = units.begin();
assertTrue("iter[4] * begin()[0]", *data++ == u"🚴"[0]);
assertTrue("iter[4] * begin()[1]", *data == u"🚴"[1]);
assertTrue("iter[4] * end() == endIter", units.end() == goodLimit);
assertTrue("iter == endIter", iter == rangeLimit);
}
@ -496,7 +498,7 @@ void U8IteratorTest::testSinglePassIter() {
assertEquals("iter[1] * length", 1, units.length());
assertTrue("iter[1] * wellFormed", units.wellFormed());
// No units.stringView() when the unit iterator is not a pointer.
// No data() for a single-pass unit iterator.
// No begin() for a single-pass unit iterator.
++iter;
assertEquals("iter[2] * codePoint", u'ç', (*iter++).codePoint()); // post-increment
assertEquals("iter[3] -> codePoint", u'', iter->codePoint());
@ -532,7 +534,8 @@ void U8IteratorTest::testFwdIter() {
assertEquals("iter[1] * length", 1, units.length());
assertTrue("iter[1] * wellFormed", units.wellFormed());
// No units.stringView() when the unit iterator is not a pointer.
assertTrue("iter[1] * data()[0]", *units.data() == u8'b');
assertTrue("iter[1] * begin()[0]", *units.begin() == u8'b');
assertTrue("iter[1] * end()[0]", *units.end() == u8"ç"[0]);
++iter;
assertEquals("iter[2] * codePoint", u'ç', (*iter++).codePoint()); // post-increment
assertEquals("iter[3] -> codePoint", u'', iter->codePoint());
@ -543,11 +546,12 @@ void U8IteratorTest::testFwdIter() {
assertEquals("iter[4] * codePoint", U'🚴', units.codePoint());
assertEquals("iter[4] * length", 4, units.length());
assertTrue("iter[4] * wellFormed", units.wellFormed());
FwdIter<char> data = units.data();
assertTrue("iter[4] * data()[0]", *data++ == u8"🚴"[0]);
assertTrue("iter[4] * data()[1]", *data++ == u8"🚴"[1]);
assertTrue("iter[4] * data()[2]", *data++ == u8"🚴"[2]);
assertTrue("iter[4] * data()[3]", *data == u8"🚴"[3]);
FwdIter<char> data = units.begin();
assertTrue("iter[4] * begin()[0]", *data++ == u8"🚴"[0]);
assertTrue("iter[4] * begin()[1]", *data++ == u8"🚴"[1]);
assertTrue("iter[4] * begin()[2]", *data++ == u8"🚴"[2]);
assertTrue("iter[4] * begin()[3]", *data == u8"🚴"[3]);
assertTrue("iter[4] * end() == endIter", units.end() == goodLimit);
assertTrue("iter == endIter", iter == rangeLimit);
}
@ -631,7 +635,7 @@ void U32IteratorTest::testSinglePassIter() {
assertEquals("iter[1] * length", 1, units.length());
assertTrue("iter[1] * wellFormed", units.wellFormed());
// No units.stringView() when the unit iterator is not a pointer.
// No data() for a single-pass unit iterator.
// No begin() for a single-pass unit iterator.
++iter;
assertEquals("iter[2] * codePoint", u'ç', (*iter++).codePoint()); // post-increment
assertEquals("iter[3] -> codePoint", u'', iter->codePoint());
@ -667,7 +671,8 @@ void U32IteratorTest::testFwdIter() {
assertEquals("iter[1] * length", 1, units.length());
assertTrue("iter[1] * wellFormed", units.wellFormed());
// No units.stringView() when the unit iterator is not a pointer.
assertTrue("iter[1] * data()[0]", *units.data() == u'b');
assertTrue("iter[1] * begin()[0]", *units.begin() == u'b');
assertTrue("iter[1] * end()[0]", *units.end() == u'ç');
++iter;
assertEquals("iter[2] * codePoint", u'ç', (*iter++).codePoint()); // post-increment
assertEquals("iter[3] -> codePoint", u'', iter->codePoint());
@ -678,7 +683,8 @@ void U32IteratorTest::testFwdIter() {
assertEquals("iter[4] * codePoint", U'🚴', units.codePoint());
assertEquals("iter[4] * length", 1, units.length());
assertTrue("iter[4] * wellFormed", units.wellFormed());
FwdIter<char32_t> data = units.data();
assertTrue("iter[4] * data()[0]", *data == U"🚴"[0]);
FwdIter<char32_t> data = units.begin();
assertTrue("iter[4] * begin()[0]", *data == U"🚴"[0]);
assertTrue("iter[4] * end() == endIter", units.end() == goodLimit);
assertTrue("iter == endIter", iter == rangeLimit);
}