50 lines
1.1 KiB
C++
50 lines
1.1 KiB
C++
#include "utf8utf16.h"
|
|
|
|
#include <string>
|
|
#include <locale>
|
|
#include <codecvt>
|
|
|
|
/// Converts a NUL-terminated UTF-16 wide string to a UTF-8 encoded std::string.
///
/// @param in  NUL-terminated wide string, or a null pointer.
/// @return    The UTF-8 bytes for `in`; an empty string when `in` is null.
/// @throws std::range_error  Raised by std::wstring_convert::to_bytes when the
///         input cannot be converted (no fallback error string is configured).
std::string UTF16to8(const wchar_t * in)
{
    // Handing a null pointer to to_bytes() is undefined behaviour; treat
    // "no input" as "empty output", the same way UTF8to16 does.
    if (in == nullptr)
        return std::string();

    // codecvt_utf8_utf16 decodes surrogate pairs into a single code point.
    // Plain codecvt_utf8 interprets every wchar_t as a stand-alone UCS-2/UCS-4
    // value, so characters outside the BMP would not round-trip.
    std::wstring_convert<std::codecvt_utf8_utf16<wchar_t>> conv;
    return conv.to_bytes(in);
}
|
|
|
|
/// Converts a NUL-terminated UTF-8 string to UTF-16 code units held in a
/// std::wstring.
///
/// Code points above U+FFFF are always written as a surrogate pair, whatever
/// the width of wchar_t. Decoded values above U+10FFFF and values inside the
/// surrogate range U+D800..U+DFFF are dropped from the output.
///
/// The decoder does not validate the byte stream: overlong forms, truncated
/// sequences and stray continuation bytes are not rejected.
///
/// @param in  NUL-terminated UTF-8 byte string, or a null pointer.
/// @return    The UTF-16 text; empty when `in` is null or empty.
std::wstring UTF8to16(const char * in)
{
    std::wstring out;
    if (in == nullptr)
        return out;

    // Start from zero so that input beginning with a continuation byte does
    // not read an indeterminate value.
    unsigned int codepoint = 0;
    while (*in != 0)
    {
        const unsigned char ch = static_cast<unsigned char>(*in);
        if (ch <= 0x7f)
            codepoint = ch;                              // single-byte (ASCII)
        else if (ch <= 0xbf)
            codepoint = (codepoint << 6) | (ch & 0x3f);  // continuation byte
        else if (ch <= 0xdf)
            codepoint = ch & 0x1f;                       // lead of 2-byte form
        else if (ch <= 0xef)
            codepoint = ch & 0x0f;                       // lead of 3-byte form
        else
            codepoint = ch & 0x07;                       // lead of 4-byte form
        ++in;

        // The sequence is complete once the next byte is not a continuation
        // byte (the terminating NUL also ends it).
        if (((*in & 0xc0) != 0x80) && (codepoint <= 0x10ffff))
        {
            if (codepoint > 0xffff)
            {
                // UTF-16 encodes (code point - 0x10000) as two 10-bit halves.
                const unsigned int offset = codepoint - 0x10000;
                out.append(1, static_cast<wchar_t>(0xd800 + (offset >> 10)));
                out.append(1, static_cast<wchar_t>(0xdc00 + (offset & 0x03ff)));
            }
            else if (codepoint < 0xd800 || codepoint >= 0xe000)
            {
                out.append(1, static_cast<wchar_t>(codepoint));
            }
        }
    }
    return out;
}
|