C++ std::string 包含中文

环境:VS2015

场景描述:std::string 包含中文时,字符串截取有问题,如下所示:

int main()
{
    std::vector<std::string> spliteList;

    string value = "类型A123";
    for (int i = 0; i < value.size(); ++i)
    {
        spliteList.push_back(value.substr(i, 1));
    }
}

 

 

解决办法:std::string 转为 std::wstring后处理

#include <Windows.h>
#include <tchar.h>
#include <vector>
#include <string>

#pragma warning(disable:4996)
using namespace std;

std::string WStringToString(const std::wstring& ws)
{
    std::string strLocale = setlocale(LC_ALL, "");
    const wchar_t* wchSrc = ws.c_str();
    size_t nDestSize = wcstombs(NULL, wchSrc, 0) + 1;
    char *chDest = new char[nDestSize];
    memset(chDest, 0, nDestSize);
    wcstombs(chDest, wchSrc, nDestSize);
    std::string strResult = chDest;
    delete[]chDest;
    setlocale(LC_ALL, strLocale.c_str());
    return strResult;
}

std::wstring StringToWString(const std::string &str)
{
    std::wstring wContext = L"";
    int len = MultiByteToWideChar(CP_ACP, 0, str.c_str(), str.size(), NULL, 0);
    WCHAR* buffer = new WCHAR[len + 1];
    MultiByteToWideChar(CP_ACP, 0, str.c_str(), str.size(), buffer, len);
    buffer[len] = '\0';
    wContext.append(buffer);
    delete[] buffer;

    return wContext;
}

std::vector<std::string> SpiteStringCharacter(std::string context)
{
    std::vector<std::string> res;

    std::wstring wContext = StringToWString(context);
    for (int i = 0; i < wContext.length(); ++i)
    {
        std::wstring tmp = wContext.substr(i, 1);
        res.push_back(WStringToString(tmp));
    }

    return res;
}

bool IsChineseChar(std::wstring value)
{
    if (value.size() == 1)
    {
        unsigned char* pCh = (unsigned char*)&value[0];
        if (((*pCh >= 0) && (*pCh <= 0xff)) && (*(pCh + 1) >= 0x4e && *(pCh + 1) <= 0x9f))
        {
            return true;
        }
    }

    return false;
}

int GetStringChineseCharCount(std::string context)
{
    std::wstring wContext = StringToWString(context);

    int chineseCharCount = 0;
    for (int i = 0; i < wContext.length(); ++i)
    {
        if (IsChineseChar(wContext.substr(i, 1)))
        {
            ++chineseCharCount;
        }
    }

    return chineseCharCount;
}

int main()
{
    std::string value = "类型A123";
    std::vector<std::string> spliteList = SpiteStringCharacter(value);
    int count = GetStringChineseCharCount(value);

    return 0;
}

结果如下:

评论 4
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值