mirror of
https://github.com/RGBCube/serenity
synced 2025-05-31 12:28:12 +00:00
AK: Add starts_with to Utf8View
Unlike String/StringView::starts_with, this compares UTF-8 code points instead of "characters" (bytes), which is important when handling arbitrary UTF-8 input that could include overlong characters.
This commit is contained in:
parent
3f9ac88c6e
commit
edecf8f6a3
2 changed files with 20 additions and 0 deletions
|
@ -144,6 +144,24 @@ size_t Utf8View::calculate_length() const
|
|||
return length;
|
||||
}
|
||||
|
||||
bool Utf8View::starts_with(const Utf8View& start) const
|
||||
{
|
||||
if (start.is_empty())
|
||||
return true;
|
||||
if (is_empty())
|
||||
return false;
|
||||
if (start.length() > length())
|
||||
return false;
|
||||
if (begin_ptr() == start.begin_ptr())
|
||||
return true;
|
||||
|
||||
for (auto k = begin(), l = start.begin(); l != start.end(); ++k, ++l) {
|
||||
if (*k != *l)
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
Utf8CodepointIterator::Utf8CodepointIterator(const unsigned char* ptr, size_t length)
|
||||
: m_ptr(ptr)
|
||||
, m_length(length)
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue