4#include "../Foundation/Assert.h"
5#include "../Foundation/Span.h"
6#include "../Foundation/StringSpan.h"
22 return (encoding1 == encoding2) or (encoding2 == StringEncoding::Ascii and encoding1 == StringEncoding::Utf8) or
23 (encoding2 == StringEncoding::Utf8 and encoding1 == StringEncoding::Ascii);
34template <
typename CharIterator>
37 static constexpr StringEncoding getEncoding() {
return CharIterator::getEncoding(); }
39 using CodeUnit = char;
50 [[nodiscard]]
constexpr bool isAtEnd()
const {
return it >= end; }
54 [[nodiscard]]
constexpr bool isAtStart()
const {
return it <= start; }
70 template <
typename OtherIterator>
73 return advanceBeforeOrAfterFinding<OtherIterator, true>(other);
76 [[nodiscard]]
bool advanceAfterFinding(
StringIterator other) {
return advanceAfterFindingSameIterator(other); }
82 template <
typename OtherIterator>
85 return advanceBeforeOrAfterFinding<OtherIterator, false>(other);
88 [[nodiscard]]
bool advanceBeforeFinding(
StringIterator other) {
return advanceBeforeFindingSameIterator(other); }
138 [[nodiscard]]
bool match(CodePoint c) {
return it < end and CharIterator::decode(it, end) == c; }
/// @brief Read code unit at current position.
/// @param c Receives the value that was read (declaration only; the definition is not part of this listing)
/// @return NOTE(review): presumably `false` when nothing can be read at the current position — confirm against the definition
148 [[nodiscard]]
bool read(CodePoint& c);
/// @brief Check if this Iterator at its end matches entirely another Iterator's range.
/// @tparam IteratorType Type of the iterator holding the range to compare with
/// @param other The iterator whose range is compared with the end of this one
206 template <
typename IteratorType>
207 [[nodiscard]]
bool endsWith(IteratorType other)
const;
212 template <
typename IteratorType>
216 template <
typename OtherIterator,
bool after>
/// Implementation that advanceAfterFinding(StringIterator other) forwards to.
/// Declaration only; the definition is not part of this listing.
218 [[nodiscard]]
bool advanceAfterFindingSameIterator(
StringIterator other);
/// Implementation that advanceBeforeFinding(StringIterator other) forwards to.
/// Declaration only; the definition is not part of this listing.
219 [[nodiscard]]
bool advanceBeforeFindingSameIterator(
StringIterator other);
/// NOTE(review): presumably moves the current position by `bytesLength` bytes
/// (signed, so possibly in either direction) — confirm against the definition.
220 [[nodiscard]]
bool advanceOfBytes(
ssize_t bytesLength);
223 static constexpr const CodeUnit* getNextOf(
const CodeUnit* src,
const char* end)
225 return CharIterator::getNextOf(src, end);
227 static constexpr const CodeUnit* getPreviousOf(
const CodeUnit* src,
const char* start)
229 return CharIterator::getPreviousOf(src, start);
231 constexpr StringIterator(
const CodeUnit* it,
const CodeUnit* end) : it(it), start(it), end(end) {}
/// Start of the iterator range; the constructor initializes it from its `it` argument.
233 const CodeUnit* start;
/// @brief Advances position towards end until it matches CodePoint `c` or position == end.
/// @param c The CodePoint to look for
240 [[nodiscard]]
constexpr bool advanceUntilMatches(CodePoint c);
/// Non-constexpr counterpart that the constexpr advanceUntilMatches can fall back to.
/// @param c The CodePoint to look for
243 [[nodiscard]]
bool advanceUntilMatchesNonConstexpr(CodePoint c);
244 using StringIterator::StringIterator;
250 [[nodiscard]]
static constexpr StringEncoding getEncoding() {
return StringEncoding::Ascii; }
/// @brief Pointer to the character following `src`.
/// @param src Pointer to the current character
/// @return `src + 1`. The second (unnamed) parameter is ignored, so no bounds check is
///         done here; staying inside the range is left to the caller.
[[nodiscard]] static constexpr const char* getNextOf(const char* src, const char*) { return src + 1; }
/// @brief Pointer to the character preceding `src`.
/// @param src Pointer to the current character
/// @return `src - 1`. The second (unnamed) parameter is ignored, so no bounds check is
///         done here; staying inside the range is left to the caller.
[[nodiscard]] static constexpr const char* getPreviousOf(const char* src, const char*) { return src - 1; }
254 [[nodiscard]]
static constexpr CodePoint decode(
const char* src,
const char*)
256 return static_cast<CodePoint
>(*src);
264 using StringIterator::StringIterator;
270 [[nodiscard]]
static StringEncoding getEncoding() {
return StringEncoding::Utf16; }
/// UTF16 counterpart of StringIteratorASCII::getNextOf (declaration only; definition not in this listing).
/// NOTE(review): presumably returns the position of the code point following `bytes`, bounded by `end` — confirm.
272 [[nodiscard]]
static const char* getNextOf(
const char* bytes,
const char* end);
/// UTF16 counterpart of StringIteratorASCII::getPreviousOf (declaration only; definition not in this listing).
/// NOTE(review): presumably returns the position of the code point preceding `bytes`, bounded by `start` — confirm.
273 [[nodiscard]]
static const char* getPreviousOf(
const char* bytes,
const char* start);
/// UTF16 counterpart of StringIteratorASCII::decode (declaration only; definition not in this listing).
/// NOTE(review): presumably decodes the code point stored at `bytes`, reading no further than `end` — confirm.
275 [[nodiscard]]
static uint32_t decode(
const char* bytes,
const char* end);
285 using StringIterator::StringIterator;
288 [[nodiscard]]
static StringEncoding getEncoding() {
return StringEncoding::Utf8; }
/// UTF8 counterpart of StringIteratorASCII::getNextOf (declaration only; definition not in this listing).
/// NOTE(review): presumably returns the position of the code point following `src`, bounded by `end` — confirm.
290 [[nodiscard]]
static const char* getNextOf(
const char* src,
const char* end);
/// UTF8 counterpart of StringIteratorASCII::getPreviousOf (declaration only; definition not in this listing).
/// NOTE(review): presumably returns the position of the code point preceding `src`, bounded by `start` — confirm.
291 [[nodiscard]]
static const char* getPreviousOf(
const char* src,
const char* start);
/// UTF8 counterpart of StringIteratorASCII::decode (declaration only; definition not in this listing).
/// NOTE(review): presumably decodes the code point stored at `src`, reading no further than `end` — confirm.
293 [[nodiscard]]
static uint32_t decode(
const char* src,
const char* end);
299 bool matches[256] = {
false};
304 matches[
static_cast<int>(c)] =
true;
313template <
typename CharIterator>
318 if (CharIterator::decode(it, end) == c)
320 it = getNextOf(it, end);
325template <
typename CharIterator>
328 if (it < end and CharIterator::decode(it, end) == c)
330 it = getNextOf(it, end);
336template <
typename CharIterator>
341 c = CharIterator::decode(it, end);
342 it = getNextOf(it, end);
348template <
typename CharIterator>
353 it = getNextOf(it, end);
359template <
typename CharIterator>
364 it = getPreviousOf(it, start);
370template <
typename CharIterator>
373 while (numCodePoints > 0)
380 it = getNextOf(it, end);
385template <
typename CharIterator>
388 return it < end ? CharIterator::decode(getNextOf(it, end), end) == c :
false;
391template <
typename CharIterator>
394 return it > start ? CharIterator::decode(getPreviousOf(it, start), it) == c :
false;
397template <
typename CharIterator>
405template <
typename CharIterator>
408 return (it - other.it) *
static_cast<ssize_t>(
sizeof(CodeUnit));
412[[nodiscard]]
constexpr bool StringIteratorASCII::advanceUntilMatches(CodePoint c)
414#if defined(__clang__)
415#pragma clang diagnostic push
416#pragma clang diagnostic ignored "-Wunreachable-code"
419 : advanceUntilMatchesNonConstexpr(c);
420#if defined(__clang__)
421#pragma clang diagnostic pop
#define SC_ASSERT_RELEASE(e)
Assert expression e to be true.
Definition Assert.h:42
unsigned int uint32_t
Platform independent (4) bytes unsigned int.
Definition PrimitiveTypes.h:38
signed long ssize_t
Platform independent signed size type.
Definition PrimitiveTypes.h:57
constexpr bool StringEncodingAreBinaryCompatible(StringEncoding encoding1, StringEncoding encoding2)
Checks if two encodings have the same utf unit size.
Definition StringIterator.h:20
uint32_t StringCodePoint
UTF code point (32 bit)
Definition StringIterator.h:14
View over a contiguous sequence of items (pointer + size in elements).
Definition Span.h:29
A string iterator for ASCII strings.
Definition StringIterator.h:239
Builds a constexpr bool skip table of 256 entries used in some parsers.
Definition StringIterator.h:298
A string iterator for UTF16 strings.
Definition StringIterator.h:262
A string iterator for UTF8 strings.
Definition StringIterator.h:280
A position inside a fixed range [start, end) of UTF code points.
Definition StringIterator.h:36
constexpr void setToStart()
Rewind current position to start of iterator range.
Definition StringIterator.h:43
constexpr ssize_t bytesDistanceFrom(StringIterator other) const
Get distance in bytes from current position to another StringIterator current position.
Definition StringIterator.h:406
constexpr void setToEnd()
Set current position to end of iterator range.
Definition StringIterator.h:46
bool advanceUntilMatchesAny(Span< const CodePoint > items, CodePoint &matched)
Advances position until any CodePoint in the given Span is found.
bool advanceBackwardIfMatches(CodePoint c)
Move position by one code point towards start if previous code point matches c
constexpr bool advanceIfMatches(CodePoint c)
Advance position only if next code point matches c.
Definition StringIterator.h:326
bool advanceBeforeFinding(StringIterator< OtherIterator > other)
Advances position towards end until a matching range of character equal to other[it,...
Definition StringIterator.h:83
constexpr bool isAtStart() const
Check if current position is at start of iterator range.
Definition StringIterator.h:54
bool reverseAdvanceUntilMatches(CodePoint c)
Moves position towards start until CodePoint c is found or position == start
bool advanceAfterFinding(StringIterator< OtherIterator > other)
Advances position towards end until a matching range of character equal to other[it,...
Definition StringIterator.h:71
bool advanceUntilDifferentFrom(CodePoint c, CodePoint *optionalReadChar=nullptr)
Advances position until a code point different from c is found or end is reached.
bool startsWith(IteratorType other) const
Check if this Iterator at its start matches entirely another Iterator's range.
bool reverseAdvanceCodePoints(size_t numCodePoints)
Move position backwards (towards start) by variable number of code points.
constexpr bool stepBackward()
Move position to previous code point.
Definition StringIterator.h:360
constexpr bool advanceCodePoints(size_t numCodePoints)
Move position forward (towards end) by variable number of code points.
Definition StringIterator.h:371
bool reverseAdvanceUntilMatchesAny(Span< const CodePoint > items, CodePoint &matched)
Moves position towards start until any CodePoint in the given Span is found.
constexpr bool stepForward()
Move position to next code point.
Definition StringIterator.h:349
bool endsWithAnyOf(Span< const CodePoint > codePoints) const
Check if this Iterator ends with any code point in the given span.
bool advanceIfMatchesAny(Span< const CodePoint > items)
Advance position only if any of the code points in given Span is matched.
constexpr bool isFollowedBy(CodePoint c)
Check if next code point is c
Definition StringIterator.h:386
bool advanceBackwardRead(CodePoint &c)
Move to previous position and read code unit.
bool startsWithAnyOf(Span< const CodePoint > codePoints) const
Check if this Iterator starts with any code point in the given span.
constexpr StringIterator sliceFromStartUntil(StringIterator otherPoint) const
Returns another StringIterator range, starting from start to otherPoint position.
Definition StringIterator.h:398
constexpr bool isPrecededBy(CodePoint c)
Check if previous code point is c
Definition StringIterator.h:392
constexpr bool advanceUntilMatches(CodePoint c)
Advances position towards end until it matches CodePoint c or position == end
Definition StringIterator.h:314
bool read(CodePoint &c)
Read code unit at current position.
constexpr bool advanceRead(CodePoint &c)
Decode code unit at current position and advance.
Definition StringIterator.h:337
bool match(CodePoint c)
Check if code unit at current position matches CodePoint c
Definition StringIterator.h:138
constexpr bool isAtEnd() const
Check if current position is at end of iterator range.
Definition StringIterator.h:50
bool advanceIfMatchesRange(CodePoint first, CodePoint last)
Advance position if any code point in the range [first, last] is matched.
bool endsWith(IteratorType other) const
Check if this Iterator at its end matches entirely another Iterator's range.
bool advanceByLengthOf(StringIterator other)
Advances position by the same number of code points as other.
Definition StringIterator.h:93
Non-owning view over a range of characters with UTF Encoding.
Definition StringView.h:46