UTF8 & GBK之间的转换

时间:2022-11-05 14:08:25

使用lua的时候,在lua中给字符串赋值的中文,但是在C中读出来的就是乱码,是因为在lua中使用的是UTF8编码,而在C(windows下面)中使用的是GBK编码,将UTF8转成GBK就可以了,下面的代码就是实现这一转换的

转自:http://www.cppblog.com/zgysx/articles/13085.html

// 1、将GBK转换成UTF8

string GBKToUTF8(const std::string& strGBK)
{
string strOutUTF8 = "";
WCHAR
* str1;
int n = MultiByteToWideChar(CP_ACP, 0, strGBK.c_str(), -1, NULL, 0);
str1
= new WCHAR[n];
MultiByteToWideChar(CP_ACP,
0, strGBK.c_str(), -1, str1, n);
n
= WideCharToMultiByte(CP_UTF8, 0, str1, -1, NULL, 0, NULL, NULL);
char * str2 = new char[n];
WideCharToMultiByte(CP_UTF8,
0, str1, -1, str2, n, NULL, NULL);
strOutUTF8
= str2;
delete[]str1;
str1
= NULL;
delete[]str2;
str2
= NULL;
return strOutUTF8;
}

// 2、将UTF8转换成GBK

string UTF8ToGBK(const std::string& strUTF8)
{
int len = MultiByteToWideChar(CP_UTF8, 0, strUTF8.c_str(), -1, NULL, 0);
unsigned
short * wszGBK = new unsigned short[len + 1];
memset(wszGBK,
0, len * 2 + 2);
MultiByteToWideChar(CP_UTF8,
0, (LPCTSTR)strUTF8.c_str(), -1, wszGBK, len);

len
= WideCharToMultiByte(CP_ACP, 0, wszGBK, -1, NULL, 0, NULL, NULL);
char *szGBK = new char[len + 1];
memset(szGBK,
0, len + 1);
WideCharToMultiByte(CP_ACP,
0, wszGBK, -1, szGBK, len, NULL, NULL);
//strUTF8 = szGBK;
std::string strTemp(szGBK);
delete[]szGBK;
delete[]wszGBK;
return strTemp;
}