mirror of https://github.com/bsnes-emu/bsnes.git
33 lines
1.0 KiB
C++
33 lines
1.0 KiB
C++
|
#pragma once
|
||
|
|
||
|
namespace nall {
|
||
|
|
||
|
//note: this function assumes the string contains valid UTF-8 characters
|
||
|
//invalid characters will result in an incorrect result from this function
|
||
|
//invalid case 1: byte 1 == 0b'01xxxxxx
|
||
|
//invalid case 2: bytes 2-4 != 0b'10xxxxxx
|
||
|
//invalid case 3: end of string without bytes 2-4 present
|
||
|
auto characters(string_view self, int offset, int length) -> uint {
|
||
|
uint characters = 0;
|
||
|
if(offset < 0) offset = self.size() - abs(offset);
|
||
|
if(offset >= 0 && offset < self.size()) {
|
||
|
if(length < 0) length = self.size() - offset;
|
||
|
if(length >= 0) {
|
||
|
for(int index = offset; index < offset + length;) {
|
||
|
auto byte = self.data()[index++];
|
||
|
if((byte & 0b111'00000) == 0b110'00000) index += 1;
|
||
|
if((byte & 0b1111'0000) == 0b1110'0000) index += 2;
|
||
|
if((byte & 0b11111'000) == 0b11110'000) index += 3;
|
||
|
characters++;
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
return characters;
|
||
|
}
|
||
|
|
||
|
auto string::characters(int offset, int length) const -> uint {
|
||
|
return nall::characters(*this, offset, length);
|
||
|
}
|
||
|
|
||
|
}
|