#include <cwctype>

#include "boost/locale.hpp"
// Codecvt facet type used for the GBK conversions in this file: a locale-named
// std::codecvt_byname converting between wchar_t (internal) and char (external).
using CODECVR_BYNAME_TYPE = std::codecvt_byname<wchar_t, char, mbstate_t>;
// Locale name passed to the CODECVR_BYNAME_TYPE constructor by GBKToWide / WideToGBK.
// NOTE(review): ".936" looks like the Windows code-page form of a locale name
// (code page 936, i.e. GBK); presumably other platforms will reject it -- confirm.
const char* GBK_LOCALE_NAME = ".936";
// Converts the bytes in `utf8` to a wide string and stores the result in `wstr`,
// using std::wstring_convert::from_bytes.
// NOTE(review): this block is incomplete in this view -- the braces, the bool return
// value and the template arguments of std::wstring_convert are not visible, so the
// success/failure contract cannot be stated from here.
bool UTF8ToWide(std::wstring& wstr, const std::string& utf8)
std::wstring_convertwchar_t>> converter;
// A default-constructed converter has no error string, so from_bytes reports a failed
// conversion by throwing std::range_error. Whether that is caught is not visible here.
wstr = converter.from_bytes(utf8);
// Converts the bytes in `gbk` to a wide string and stores the result in `wstr`, using a
// std::wstring_convert built around a CODECVR_BYNAME_TYPE facet for GBK_LOCALE_NAME.
// NOTE(review): this block is incomplete in this view -- the braces, the bool return
// value and any template arguments of std::wstring_convert are not visible.
bool GBKToWide(std::wstring& wstr, const std::string& gbk)
// The facet is allocated with new and handed to the converter, which takes ownership of it.
// NOTE(review): constructing the facet presumably throws if the locale name is not
// recognised on the running platform -- confirm how callers expect that to surface.
std::wstring_convert convert(new CODECVR_BYNAME_TYPE(GBK_LOCALE_NAME));
wstr = convert.from_bytes(gbk);
// Converts the wide string `wstr` to a byte string and stores the result in `utf8`,
// using std::wstring_convert::to_bytes.
// NOTE(review): this block is incomplete in this view -- the braces, the bool return
// value and the template arguments of std::wstring_convert are not visible, so the
// success/failure contract cannot be stated from here.
bool WideToUTF8(std::string& utf8, const std::wstring& wstr)
std::wstring_convertwchar_t>> converter;
// A default-constructed converter has no error string, so to_bytes reports a failed
// conversion by throwing std::range_error. Whether that is caught is not visible here.
utf8 = converter.to_bytes(wstr);
// Converts the wide string `wstr` to a byte string and stores the result in `gbk`, using a
// std::wstring_convert built around a CODECVR_BYNAME_TYPE facet for GBK_LOCALE_NAME.
// NOTE(review): this block is incomplete in this view -- the braces, the bool return
// value and any template arguments of std::wstring_convert are not visible.
bool WideToGBK(std::string& gbk, const std::wstring& wstr)
// The facet is allocated with new and handed to the converter, which takes ownership of it.
// NOTE(review): constructing the facet presumably throws if the locale name is not
// recognised on the running platform -- confirm how callers expect that to surface.
std::wstring_convert convert(new CODECVR_BYNAME_TYPE(GBK_LOCALE_NAME));
gbk = convert.to_bytes(wstr);
// Takes a byte string `gbk` and writes a byte string to `utf8`; judging by the names,
// it re-encodes GBK text as UTF-8.
// NOTE(review): only the signature is visible in this view; presumably the body goes
// through a wide string (GBKToWide then WideToUTF8) -- confirm.
bool GBKToUTF8(std::string& utf8, const std::string& gbk)
// Takes a byte string `utf8` and writes a byte string to `gbk`; judging by the names,
// it re-encodes UTF-8 text as GBK.
// NOTE(review): only the signature is visible in this view; presumably the body goes
// through a wide string (UTF8ToWide then WideToGBK) -- confirm.
bool UTF8ToGBK(std::string& gbk, const std::string& utf8)
// Walks `str` one byte at a time; judging by the name and the byte tests below, it
// decides whether the bytes form UTF-8 text.
// NOTE(review): most of the body is not visible in this view (braces, the declaration
// of `chr`, the remaining lead-byte ranges and every return statement).
// NOTE(review): `string` is unqualified here while the rest of the file writes
// std::string -- presumably a using-declaration exists elsewhere; confirm.
bool IsStringUTF8(const string& str)
for (size_t i = 0; i < str.size(); ++i)
// 0xFC-0xFD has the bit pattern 1111110x, the lead byte of the obsolete 6-byte UTF-8 form.
// NOTE(review): this can only match if `chr` is unsigned (or wider than char) -- confirm its type.
if (chr >= 0xFC && chr <= 0xFD)
// A UTF-8 continuation byte has the form 10xxxxxx; this test is true for any other byte.
if ((chr & 0xC0) != 0x80)
int UTF8StringSize(const std::string& str)
return MultiByteToWideChar(CP_UTF8, NULL, str.c_str(), str.size(), NULL, NULL);
// Presumably returns the length in bytes of the UTF-8 sequence introduced by the lead
// byte `chr` (inferred from the name; only the first test of the body is visible here).
int GetUTF8Bytes(const char chr)
// 0xFC-0xFD has the bit pattern 1111110x, the lead byte of the obsolete 6-byte UTF-8 form.
// NOTE(review): `chr` is a plain char; where char is signed its value never exceeds 127,
// so this comparison against 0xFC/0xFD can never be true -- compare as unsigned char.
if (chr >= 0xFC && chr <= 0xFD)
// Returns the longest prefix of the UTF-8 string `name` that contains at most
// `need_size` characters, without cutting a multi-byte sequence in half.
//
// A character is counted at every byte that is not a continuation byte (10xxxxxx), so
// the input is expected to be well-formed UTF-8. Continuation bytes at the very start
// of `name` are kept in the result but not counted.
// If `name` holds fewer than `need_size` characters, the whole string is returned.
std::string UTF8StringSafeTruncate(const std::string& name, const size_t need_size)
{
    const auto is_continuation = [](char ch) {
        return (static_cast<unsigned char>(ch) & 0xC0) == 0x80;
    };

    size_t counted = 0;  // characters accepted so far
    size_t pos = 0;      // byte offset one past the accepted prefix
    while (counted < need_size && pos < name.length()) {
        if (!is_continuation(name[pos])) {
            ++counted;
        }
        ++pos;
    }

    // The loop above can stop right after a lead byte; take the continuation bytes
    // that belong to it so the last character is complete.
    while (pos < name.length() && is_continuation(name[pos])) {
        ++pos;
    }
    return name.substr(0, pos);
}
// Returns a copy of `str` in which every byte has been passed through ::tolower.
//
// The mapping is byte-wise, so only single-byte characters known to the current C locale
// are changed; the bytes of multi-byte sequences are mapped individually.
std::string ToLower_transform1(const std::string& str)
{
    std::string str_tmp = str;
    // ::tolower requires a value representable as unsigned char (or EOF). Plain char may
    // be signed, so bytes >= 0x80 must be converted to unsigned char before the call.
    std::transform(str_tmp.begin(), str_tmp.end(), str_tmp.begin(),
                   [](unsigned char ch) { return static_cast<char>(::tolower(ch)); });
    return str_tmp;
}
// Returns a copy of `str` in which every byte has been passed through ::toupper.
//
// The mapping is byte-wise, so only single-byte characters known to the current C locale
// are changed; the bytes of multi-byte sequences are mapped individually.
std::string ToUpper_transform1(const std::string& str)
{
    std::string str_tmp = str;
    // ::toupper requires a value representable as unsigned char (or EOF). Plain char may
    // be signed, so bytes >= 0x80 must be converted to unsigned char before the call.
    std::transform(str_tmp.begin(), str_tmp.end(), str_tmp.begin(),
                   [](unsigned char ch) { return static_cast<char>(::toupper(ch)); });
    return str_tmp;
}
std::string ToLower_transform2(const std::string& str)
UTF8ToWide(wstr_tmp, str);;
std::transform(wstr_tmp.begin(), wstr_tmp.end(), wstr_tmp.begin(), ::tolower);
WideToUTF8(str_tmp, wstr_tmp);;
std::string ToUpper_transform2(const std::string& str)
UTF8ToWide(wstr_tmp, str);;
std::transform(wstr_tmp.begin(), wstr_tmp.end(), wstr_tmp.begin(), ::toupper);
WideToUTF8(str_tmp, wstr_tmp);;
// Lower-cases the UTF-8 string `str` with Boost.Locale and returns the result as UTF-8.
// NOTE(review): the function's braces are not visible in this view; the statements
// below appear to be its whole body.
std::string ToLower_boost(const std::string& str)
// Function-local statics: the generator and the "en_US.UTF-8" locale are created on the
// first call and reused by later calls.
static boost::locale::generator generator;
static std::locale locale = generator("en_US.UTF-8");
// Decode the UTF-8 bytes into a wide string, lower-case it under `locale`, then encode
// the result back to UTF-8.
std::wstring wstr = boost::locale::conv::to_utf<wchar_t>(str, "utf-8");
wstr = boost::locale::to_lower(wstr, locale);
return boost::locale::conv::from_utf(wstr, "utf-8");
// Upper-cases the UTF-8 string `str` with Boost.Locale and returns the result as UTF-8.
// NOTE(review): the function's braces are not visible in this view; the statements
// below appear to be its whole body.
std::string ToUpper_boost(const std::string& str)
// Function-local statics: the generator and the "en_US.UTF-8" locale are created on the
// first call and reused by later calls.
static boost::locale::generator generator;
static std::locale locale = generator("en_US.UTF-8");
// Decode the UTF-8 bytes into a wide string, upper-case it under `locale`, then encode
// the result back to UTF-8.
std::wstring wstr = boost::locale::conv::to_utf<wchar_t>(str, "utf-8");
wstr = boost::locale::to_upper(wstr, locale);
return boost::locale::conv::from_utf(wstr, "utf-8");
// Demo / smoke-test statements exercising the helpers defined in this file.
// NOTE(review): the enclosing function (presumably main) and the declaration of
// `str_utf8` are not visible in this view.

// NOTE(review): the bytes of this literal depend on the encoding the compiler uses for
// narrow string literals; the variable name assumes GB2312/GBK -- confirm the build settings.
std::string str_gb2312 = "中国";
GBKToUTF8(str_utf8, str_gb2312);
// Run the UTF-8 check on both the original bytes and the converted bytes.
bool utf8 = IsStringUTF8(str_gb2312);
bool utf8_2 = IsStringUTF8(str_utf8);
int num = UTF8StringSize(str_utf8);
// Truncate the converted string with a limit of 1, then convert the result back with UTF8ToGBK.
std::string str_utf8_truncate = UTF8StringSafeTruncate(str_utf8, 1);
std::string str_gb2312_truncate;
UTF8ToGBK(str_gb2312_truncate, str_utf8_truncate);
// `str_lower` / `str_upper` are the INPUTS to the lower-/upper-casing calls below, which
// is why `str_lower` holds upper-case text and `str_upper` holds lower-case text.
std::string str_lower = "ABC";
std::string str_upper = "def";
// The same two inputs are run through each of the three implementation pairs.
std::string str_lower1 = ToLower_transform1(str_lower);
std::string str_upper1 = ToUpper_transform1(str_upper);
std::string str_lower2 = ToLower_transform2(str_lower);
std::string str_upper2 = ToUpper_transform2(str_upper);
std::string str_lower3 = ToLower_boost(str_lower);
std::string str_upper3 = ToUpper_boost(str_upper);