2017-10-10 23:32:13 +02:00
|
|
|
#pragma once
|
|
|
|
|
2022-04-18 00:52:22 +01:00
|
|
|
#include <cstring>
|
2017-10-10 23:32:13 +02:00
|
|
|
#include <string>
|
|
|
|
#include <sstream>
|
2019-02-11 21:35:32 +01:00
|
|
|
#include <vector>
|
2018-07-21 12:51:50 +02:00
|
|
|
|
2018-07-21 13:43:33 +03:00
|
|
|
#include "./com/com_include.h"
|
2017-10-10 23:32:13 +02:00
|
|
|
|
2022-07-28 18:40:46 +02:00
|
|
|
#include "util_bit.h"
|
|
|
|
#include "util_likely.h"
|
|
|
|
|
2017-10-10 23:32:13 +02:00
|
|
|
namespace dxvk::str {
|
2022-07-28 18:40:46 +02:00
|
|
|
|
|
|
|
template<size_t S> struct UnicodeChar { };
|
|
|
|
template<> struct UnicodeChar<1> { using type = uint8_t; };
|
|
|
|
template<> struct UnicodeChar<2> { using type = uint16_t; };
|
|
|
|
template<> struct UnicodeChar<4> { using type = uint32_t; };
|
|
|
|
|
|
|
|
template<typename T>
|
|
|
|
using UnicodeCharType = typename UnicodeChar<sizeof(T)>::type;
|
|
|
|
|
|
|
|
const uint8_t* decodeTypedChar(
|
|
|
|
const uint8_t* begin,
|
|
|
|
const uint8_t* end,
|
|
|
|
uint32_t& ch);
|
|
|
|
|
|
|
|
const uint16_t* decodeTypedChar(
|
|
|
|
const uint16_t* begin,
|
|
|
|
const uint16_t* end,
|
|
|
|
uint32_t& ch);
|
|
|
|
|
|
|
|
const uint32_t* decodeTypedChar(
|
|
|
|
const uint32_t* begin,
|
|
|
|
const uint32_t* end,
|
|
|
|
uint32_t& ch);
|
|
|
|
|
|
|
|
size_t encodeTypedChar(
|
|
|
|
uint8_t* begin,
|
|
|
|
uint8_t* end,
|
|
|
|
uint32_t ch);
|
|
|
|
|
|
|
|
size_t encodeTypedChar(
|
|
|
|
uint16_t* begin,
|
|
|
|
uint16_t* end,
|
|
|
|
uint32_t ch);
|
|
|
|
|
|
|
|
size_t encodeTypedChar(
|
|
|
|
uint32_t* begin,
|
|
|
|
uint32_t* end,
|
|
|
|
uint32_t ch);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* \brief Decodes a single character
|
|
|
|
*
|
|
|
|
* Note that \c begin and \c end must not be equal.
|
|
|
|
* \param [in] begin Pointer to current position within the input string
|
|
|
|
* \param [in] end Pointer to the end of the input string
|
|
|
|
* \param [out] ch Pointer to the decoded character code
|
|
|
|
* \returns Pointer to next character in the input string
|
|
|
|
*/
|
|
|
|
template<typename T>
|
|
|
|
const T* decodeChar(
|
|
|
|
const T* begin,
|
|
|
|
const T* end,
|
|
|
|
uint32_t& ch) {
|
|
|
|
using CharType = UnicodeCharType<T>;
|
|
|
|
|
|
|
|
const CharType* result = decodeTypedChar(
|
|
|
|
reinterpret_cast<const CharType*>(begin),
|
|
|
|
reinterpret_cast<const CharType*>(end),
|
|
|
|
ch);
|
|
|
|
|
|
|
|
return reinterpret_cast<const T*>(result);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* \brief Encodes a character
|
|
|
|
*
|
|
|
|
* Note that \c begin and \c end may be both be \c nullptr or equal, in
|
|
|
|
* which case only the length of the encoded character will be returned.
|
|
|
|
* \param [in] begin Pointer to current position within the output string
|
|
|
|
* \param [in] end Pointer to the end of the output string
|
|
|
|
* \param [in] ch Character to encode
|
|
|
|
* \returns If begin is \c nullptr , the number of units required to encode
|
|
|
|
* the character. Otherwise, the number of units written to the output.
|
|
|
|
* This may return \c 0 for characters that cannot be written or encoded.
|
|
|
|
*/
|
|
|
|
template<typename T>
|
|
|
|
size_t encodeChar(
|
|
|
|
T* begin,
|
|
|
|
T* end,
|
|
|
|
uint32_t ch) {
|
|
|
|
using CharType = UnicodeCharType<T>;
|
|
|
|
|
|
|
|
return encodeTypedChar(
|
|
|
|
reinterpret_cast<CharType*>(begin),
|
|
|
|
reinterpret_cast<CharType*>(end),
|
|
|
|
ch);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* \brief Computes length of a null-terminated string
|
|
|
|
*
|
|
|
|
* \param [in] begin Start of input string
|
|
|
|
* \returns Number of characters in input string,
|
|
|
|
* excluding the terminating null character
|
|
|
|
*/
|
|
|
|
template<typename S>
|
|
|
|
size_t length(const S* string) {
|
|
|
|
size_t result = 0;
|
|
|
|
|
|
|
|
while (string[result])
|
|
|
|
result += 1;
|
|
|
|
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* \brief Converts string from one encoding to another
|
|
|
|
*
|
|
|
|
* The output string arguments may be \c nullptr. In that case, the
|
|
|
|
* total length of the transcoded string will be returned, in units
|
|
|
|
* of the output character type. The output string will only be
|
|
|
|
* null-terminated if the input string is also null-terminated.
|
|
|
|
* \tparam D Output character type
|
|
|
|
* \tparam S Input character type
|
|
|
|
* \param [in] dstBegin Start of output string
|
|
|
|
* \param [in] dstLength Length of output string
|
|
|
|
* \param [in] srcBegin Start of input string
|
|
|
|
* \param [in] srcLength Length of input string
|
|
|
|
* \returns If \c dstBegin is \c nullptr , the total number of output
|
|
|
|
* characters required to store the output string. Otherwise, the
|
|
|
|
* total number of characters written to the output string.
|
|
|
|
*/
|
|
|
|
template<typename D, typename S>
|
|
|
|
size_t transcodeString(
|
|
|
|
D* dstBegin,
|
|
|
|
size_t dstLength,
|
|
|
|
const S* srcBegin,
|
|
|
|
size_t srcLength) {
|
|
|
|
size_t totalLength = 0;
|
|
|
|
|
|
|
|
auto dstEnd = dstBegin + dstLength;
|
|
|
|
auto srcEnd = srcBegin + srcLength;
|
|
|
|
|
|
|
|
while (srcBegin < srcEnd) {
|
|
|
|
uint32_t ch;
|
|
|
|
|
|
|
|
srcBegin = decodeChar<S>(srcBegin, srcEnd, ch);
|
|
|
|
|
|
|
|
if (dstBegin)
|
|
|
|
totalLength += encodeChar<D>(dstBegin + totalLength, dstEnd, ch);
|
|
|
|
else
|
|
|
|
totalLength += encodeChar<D>(nullptr, nullptr, ch);
|
|
|
|
|
|
|
|
if (!ch)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return totalLength;
|
|
|
|
}
|
|
|
|
|
2018-08-27 14:15:34 +02:00
|
|
|
std::string fromws(const WCHAR *ws);
|
2019-02-11 21:35:32 +01:00
|
|
|
|
2019-11-16 19:18:21 +00:00
|
|
|
void tows(const char* mbs, WCHAR* wcs, size_t wcsLen);
|
|
|
|
|
|
|
|
template <size_t N>
|
|
|
|
void tows(const char* mbs, WCHAR (&wcs)[N]) {
|
|
|
|
return tows(mbs, wcs, N);
|
|
|
|
}
|
2020-09-10 12:02:53 +09:00
|
|
|
|
|
|
|
std::wstring tows(const char* mbs);
|
2017-10-10 23:32:13 +02:00
|
|
|
|
2018-08-27 14:15:34 +02:00
|
|
|
inline void format1(std::stringstream&) { }
|
|
|
|
|
|
|
|
template<typename... Tx>
|
|
|
|
void format1(std::stringstream& str, const WCHAR *arg, const Tx&... args) {
|
|
|
|
str << fromws(arg);
|
|
|
|
format1(str, args...);
|
|
|
|
}
|
|
|
|
|
2017-10-10 23:32:13 +02:00
|
|
|
template<typename T, typename... Tx>
|
|
|
|
void format1(std::stringstream& str, const T& arg, const Tx&... args) {
|
|
|
|
str << arg;
|
|
|
|
format1(str, args...);
|
|
|
|
}
|
|
|
|
|
|
|
|
template<typename... Args>
|
|
|
|
std::string format(const Args&... args) {
|
|
|
|
std::stringstream stream;
|
|
|
|
format1(stream, args...);
|
|
|
|
return stream.str();
|
|
|
|
}
|
2022-04-18 00:52:22 +01:00
|
|
|
|
|
|
|
inline void strlcpy(char* dst, const char* src, size_t count) {
|
|
|
|
std::strncpy(dst, src, count);
|
|
|
|
if (count > 0)
|
|
|
|
dst[count - 1] = '\0';
|
|
|
|
}
|
2017-10-10 23:32:13 +02:00
|
|
|
|
|
|
|
}
|