方式一:
#include <string>
#include <locale>
#include <codecvt>
//unicode转中文 (\u4f60\u597d\u554a ==》 你好啊)
string unicodeToCHI(string &unicodeStr){
string uStr, value;
int index, len;
wstring_convert<codecvt_utf8<char32_t>, char32_t> converter;
if (unicodeStr.length() <= 0)
{
return "";
}
//unicode转utf8
while (1){
index = unicodeStr.find("\\u");
if (index<0 || index>unicodeStr.length())
break;
//转换需要的地方
uStr = unicodeStr.substr(index + 2, 4);
for (size_t i = 0; i < uStr.length();){
char32_t uhan = strtol(uStr.substr(i, 4).c_str(), nullptr, 16);
value = converter.to_bytes(uhan);
i += 4;
}
//在原字符串中替换掉
unicodeStr.replace(index, 6, value);
}
//utf8转ANSI
len = ::MultiByteToWideChar(CP_UTF8, 0, unicodeStr.c_str(), -1, NULL, 0);
WCHAR* wStr = new WCHAR[len + 1];
memset(wStr, 0, sizeof(wStr));
len = MultiByteToWideChar(CP_UTF8, 0, unicodeStr.c_str(), -1, wStr, len);
len = WideCharToMultiByte(CP_ACP, 0, wStr, -1, NULL, 0, NULL, NULL);
char *szANSI = new char[len + 1];
memset(szANSI, 0, sizeof(szANSI));
WideCharToMultiByte(CP_ACP, 0, wStr, -1, szANSI, len, NULL, NULL);
unicodeStr = szANSI;
delete[]wStr;
wStr = NULL;
return unicodeStr;
}
方式二:
#include <atlstr.h>
string unicodeToCHI2(string &unicodeStr)
{
int index;
CString cstr;
int nValue = 0;
WCHAR * pWchar;
wchar_t* szHex;
char strchar[6] = { '0', 'x', '\0' };
if (unicodeStr.length() <= 0)
{
return "";
}
while (1){
int index = unicodeStr.find("\\u");
if (index <0 || index>unicodeStr.length())
break;
strchar[2] = unicodeStr[index+2];
strchar[3] = unicodeStr[index + 3];
strchar[4] = unicodeStr[index + 4];
strchar[5] = unicodeStr[index + 5];
USES_CONVERSION;
szHex = A2W(strchar);
StrToIntExW(szHex, STIF_SUPPORT_HEX, &nValue);
pWchar = (WCHAR*)& nValue;
cstr = pWchar;
//替换掉unicode字符串
unicodeStr.replace(index, 6, cstr);
}
return unicodeStr;
}
注意:目前好像发现有些字符转换不过来,比如 \u0456
版权声明:本文为bangtanhui原创文章,遵循 CC 4.0 BY-SA 版权协议,转载请附上原文出处链接和本声明。