1
Fork 0
mirror of https://github.com/RGBCube/serenity synced 2025-05-31 16:38:10 +00:00

UTF-8: Add Utf8CodepointIterator::codepoint_length_in_bytes()

This allows you to retrieve the length (in bytes) of the codepoint the
iterator is currently pointing at.
This commit is contained in:
Andreas Kling 2019-10-18 22:49:23 +02:00
parent ab9e6166e8
commit f4e6dae6fe
2 changed files with 12 additions and 0 deletions

View file

@@ -139,6 +139,16 @@ Utf8CodepointIterator& Utf8CodepointIterator::operator++()
return *this;
}
int Utf8CodepointIterator::codepoint_length_in_bytes() const
{
ASSERT(m_length > 0);
int codepoint_length_in_bytes;
u32 value;
bool first_byte_makes_sense = decode_first_byte(*m_ptr, codepoint_length_in_bytes, value);
ASSERT(first_byte_makes_sense);
return codepoint_length_in_bytes;
}
u32 Utf8CodepointIterator::operator*() const
{
ASSERT(m_length > 0);