// SPDX-FileCopyrightText: 2002-2024 PCSX2 Dev Team // SPDX-License-Identifier: GPL-3.0+ #include "Assertions.h" #include "StringUtil.h" #include #include #include #include #include #include "fmt/core.h" #ifdef _WIN32 #include "RedtapeWindows.h" #endif namespace StringUtil { std::string StdStringFromFormat(const char* format, ...) { std::va_list ap; va_start(ap, format); std::string ret = StdStringFromFormatV(format, ap); va_end(ap); return ret; } std::string StdStringFromFormatV(const char* format, std::va_list ap) { std::va_list ap_copy; va_copy(ap_copy, ap); #ifdef _WIN32 int len = _vscprintf(format, ap_copy); #else int len = std::vsnprintf(nullptr, 0, format, ap_copy); #endif va_end(ap_copy); std::string ret; // If an encoding error occurs, len is -1. Which we definitely don't want to resize to. if (len > 0) { ret.resize(len); std::vsnprintf(ret.data(), ret.size() + 1, format, ap); } return ret; } bool WildcardMatch(const char* subject, const char* mask, bool case_sensitive /*= true*/) { if (case_sensitive) { const char* cp = nullptr; const char* mp = nullptr; while ((*subject) && (*mask != '*')) { if ((*mask != '?') && (std::tolower(*mask) != std::tolower(*subject))) return false; mask++; subject++; } while (*subject) { if (*mask == '*') { if (*++mask == 0) return true; mp = mask; cp = subject + 1; } else { if ((*mask == '?') || (std::tolower(*mask) == std::tolower(*subject))) { mask++; subject++; } else { mask = mp; subject = cp++; } } } while (*mask == '*') { mask++; } return *mask == 0; } else { const char* cp = nullptr; const char* mp = nullptr; while ((*subject) && (*mask != '*')) { if ((*mask != *subject) && (*mask != '?')) return false; mask++; subject++; } while (*subject) { if (*mask == '*') { if (*++mask == 0) return true; mp = mask; cp = subject + 1; } else { if ((*mask == *subject) || (*mask == '?')) { mask++; subject++; } else { mask = mp; subject = cp++; } } } while (*mask == '*') { mask++; } return *mask == 0; } } std::size_t Strlcpy(char* dst, const char* src, std::size_t size) { std::size_t len = std::strlen(src); if (len < size) { std::memcpy(dst, src, len + 1); } else { std::memcpy(dst, src, size - 1); dst[size - 1] = '\0'; } return len; } std::size_t Strlcpy(char* dst, const std::string_view src, std::size_t size) { std::size_t len = src.length(); if (len < size) { std::memcpy(dst, src.data(), len); dst[len] = '\0'; } else { std::memcpy(dst, src.data(), size - 1); dst[size - 1] = '\0'; } return len; } std::optional> DecodeHex(const std::string_view in) { std::vector data; data.reserve(in.size() / 2); for (size_t i = 0; i < in.size() / 2; i++) { std::optional byte = StringUtil::FromChars(in.substr(i * 2, 2), 16); if (byte.has_value()) data.push_back(*byte); else return std::nullopt; } return {data}; } std::string EncodeHex(const u8* data, int length) { std::stringstream ss; for (int i = 0; i < length; i++) ss << std::hex << std::setfill('0') << std::setw(2) << static_cast(data[i]); return ss.str(); } std::string toLower(const std::string_view input) { std::string newStr; std::transform(input.begin(), input.end(), std::back_inserter(newStr), [](unsigned char c) { return std::tolower(c); }); return newStr; } std::string toUpper(const std::string_view input) { std::string newStr; std::transform(input.begin(), input.end(), std::back_inserter(newStr), [](unsigned char c) { return std::toupper(c); }); return newStr; } bool compareNoCase(const std::string_view str1, const std::string_view str2) { if (str1.length() != str2.length()) { return false; } return Strncasecmp(str1.data(), str2.data(), str1.length()) == 0; } std::vector splitOnNewLine(const std::string& str) { std::vector lines; std::istringstream stream(str); std::string line; while (std::getline(stream, line)) { lines.push_back(line); } return lines; } std::string_view StripWhitespace(const std::string_view str) { std::string_view::size_type start = 0; while (start < str.size() && std::isspace(str[start])) start++; if (start == str.size()) return {}; std::string_view::size_type end = str.size() - 1; while (end > start && std::isspace(str[end])) end--; return str.substr(start, end - start + 1); } void StripWhitespace(std::string* str) { { const char* cstr = str->c_str(); std::string_view::size_type start = 0; while (start < str->size() && std::isspace(cstr[start])) start++; if (start != 0) str->erase(0, start); } { const char* cstr = str->c_str(); std::string_view::size_type start = str->size(); while (start > 0 && std::isspace(cstr[start - 1])) start--; if (start != str->size()) str->erase(start); } } std::vector SplitString(const std::string_view str, char delimiter, bool skip_empty /*= true*/) { std::vector res; std::string_view::size_type last_pos = 0; std::string_view::size_type pos; while (last_pos < str.size() && (pos = str.find(delimiter, last_pos)) != std::string_view::npos) { std::string_view part(StripWhitespace(str.substr(last_pos, pos - last_pos))); if (!skip_empty || !part.empty()) res.push_back(std::move(part)); last_pos = pos + 1; } if (last_pos < str.size()) { std::string_view part(StripWhitespace(str.substr(last_pos))); if (!skip_empty || !part.empty()) res.push_back(std::move(part)); } return res; } std::string ReplaceAll(const std::string_view subject, const std::string_view search, const std::string_view replacement) { std::string ret(subject); ReplaceAll(&ret, search, replacement); return ret; } void ReplaceAll(std::string* subject, const std::string_view search, const std::string_view replacement) { if (!subject->empty()) { std::string::size_type start_pos = 0; while ((start_pos = subject->find(search, start_pos)) != std::string::npos) { subject->replace(start_pos, search.length(), replacement); start_pos += replacement.length(); } } } bool ParseAssignmentString(const std::string_view str, std::string_view* key, std::string_view* value) { const std::string_view::size_type pos = str.find('='); if (pos == std::string_view::npos) { *key = std::string_view(); *value = std::string_view(); return false; } *key = StripWhitespace(str.substr(0, pos)); if (pos != (str.size() - 1)) *value = StripWhitespace(str.substr(pos + 1)); else *value = std::string_view(); return true; } void AppendUTF16CharacterToUTF8(std::string& s, u16 ch) { if (ch & 0xf800) { s.push_back(static_cast(static_cast(0xe0 | static_cast(ch >> 12)))); s.push_back(static_cast(static_cast(0x80 | static_cast(((ch >> 6) & 0x3f))))); s.push_back(static_cast(static_cast(0x80 | static_cast((ch & 0x3f))))); } else if (ch & 0xff80) { s.push_back(static_cast(static_cast(0xc0 | static_cast((ch >> 6))))); s.push_back(static_cast(static_cast(0x80 | static_cast((ch & 0x3f))))); } else { s.push_back(static_cast(static_cast(ch))); } } void EncodeAndAppendUTF8(std::string& s, char32_t ch) { if (ch <= 0x7F) { s.push_back(static_cast(static_cast(ch))); } else if (ch <= 0x07FF) { s.push_back(static_cast(static_cast(0xc0 | static_cast((ch >> 6) & 0x1f)))); s.push_back(static_cast(static_cast(0x80 | static_cast((ch & 0x3f))))); } else if (ch <= 0xFFFF) { s.push_back(static_cast(static_cast(0xe0 | static_cast(((ch >> 12) & 0x0f))))); s.push_back(static_cast(static_cast(0x80 | static_cast(((ch >> 6) & 0x3f))))); s.push_back(static_cast(static_cast(0x80 | static_cast((ch & 0x3f))))); } else if (ch <= 0x10FFFF) { s.push_back(static_cast(static_cast(0xf0 | static_cast(((ch >> 18) & 0x07))))); s.push_back(static_cast(static_cast(0x80 | static_cast(((ch >> 12) & 0x3f))))); s.push_back(static_cast(static_cast(0x80 | static_cast(((ch >> 6) & 0x3f))))); s.push_back(static_cast(static_cast(0x80 | static_cast((ch & 0x3f))))); } else { s.push_back(static_cast(0xefu)); s.push_back(static_cast(0xbfu)); s.push_back(static_cast(0xbdu)); } } size_t DecodeUTF8(const void* bytes, size_t length, char32_t* ch) { const u8* s = reinterpret_cast(bytes); if (s[0] < 0x80) { *ch = s[0]; return 1; } else if ((s[0] & 0xe0) == 0xc0) { if (length < 2) goto invalid; *ch = static_cast((static_cast(s[0] & 0x1f) << 6) | (static_cast(s[1] & 0x3f) << 0)); return 2; } else if ((s[0] & 0xf0) == 0xe0) { if (length < 3) goto invalid; *ch = static_cast((static_cast(s[0] & 0x0f) << 12) | (static_cast(s[1] & 0x3f) << 6) | (static_cast(s[2] & 0x3f) << 0)); return 3; } else if ((s[0] & 0xf8) == 0xf0 && (s[0] <= 0xf4)) { if (length < 4) goto invalid; *ch = static_cast((static_cast(s[0] & 0x07) << 18) | (static_cast(s[1] & 0x3f) << 12) | (static_cast(s[2] & 0x3f) << 6) | (static_cast(s[3] & 0x3f) << 0)); return 4; } invalid: *ch = 0xFFFFFFFFu; return 1; } size_t DecodeUTF8(const std::string_view str, size_t offset, char32_t* ch) { return DecodeUTF8(str.data() + offset, str.length() - offset, ch); } size_t DecodeUTF8(const std::string& str, size_t offset, char32_t* ch) { return DecodeUTF8(str.data() + offset, str.length() - offset, ch); } std::string Ellipsise(const std::string_view str, u32 max_length, const char* ellipsis /*= "..."*/) { std::string ret; ret.reserve(max_length); const u32 str_length = static_cast(str.length()); const u32 ellipsis_len = static_cast(std::strlen(ellipsis)); pxAssert(ellipsis_len > 0 && ellipsis_len <= max_length); if (str_length > max_length) { const u32 copy_size = std::min(str_length, max_length - ellipsis_len); if (copy_size > 0) ret.append(str.data(), copy_size); if (copy_size != str_length) ret.append(ellipsis); } else { ret.append(str); } return ret; } void EllipsiseInPlace(std::string& str, u32 max_length, const char* ellipsis /*= "..."*/) { const u32 str_length = static_cast(str.length()); const u32 ellipsis_len = static_cast(std::strlen(ellipsis)); pxAssert(ellipsis_len > 0 && ellipsis_len <= max_length); if (str_length > max_length) { const u32 keep_size = std::min(static_cast(str.length()), max_length - ellipsis_len); if (keep_size != str_length) str.erase(keep_size); str.append(ellipsis); } } #ifdef _WIN32 std::wstring UTF8StringToWideString(const std::string_view str) { std::wstring ret; if (!UTF8StringToWideString(ret, str)) return {}; return ret; } bool UTF8StringToWideString(std::wstring& dest, const std::string_view str) { int wlen = MultiByteToWideChar(CP_UTF8, 0, str.data(), static_cast(str.length()), nullptr, 0); if (wlen < 0) return false; dest.resize(wlen); if (wlen > 0 && MultiByteToWideChar(CP_UTF8, 0, str.data(), static_cast(str.length()), dest.data(), wlen) < 0) return false; return true; } std::string WideStringToUTF8String(const std::wstring_view& str) { std::string ret; if (!WideStringToUTF8String(ret, str)) ret.clear(); return ret; } bool WideStringToUTF8String(std::string& dest, const std::wstring_view& str) { int mblen = WideCharToMultiByte(CP_UTF8, 0, str.data(), static_cast(str.length()), nullptr, 0, nullptr, nullptr); if (mblen < 0) return false; dest.resize(mblen); if (mblen > 0 && WideCharToMultiByte(CP_UTF8, 0, str.data(), static_cast(str.length()), dest.data(), mblen, nullptr, nullptr) < 0) { return false; } return true; } #endif std::string U128ToString(const u128& u) { return fmt::format("0x{:08X}.{:08X}.{:08X}.{:08X}", u._u32[0], u._u32[1], u._u32[2], u._u32[3]); } std::string& AppendU128ToString(const u128& u, std::string& s) { fmt::format_to(std::back_inserter(s), "0x{:08X}.{:08X}.{:08X}.{:08X}", u._u32[0], u._u32[1], u._u32[2], u._u32[3]); return s; } } // namespace StringUtil