C++：窄字符串与宽字符串互转（string 与 wstring 的相互转换）

最新推荐文章于 2023-05-18 13:09:30 发布

Ryan_naiquan

最新推荐文章于 2023-05-18 13:09:30 发布

阅读量2.3k

点赞数 3

分类专栏： MFC和win32 文章标签： string C++ 窄字节宽字节 CString

本文链接：https://blog.csdn.net/xiaonaiquan/article/details/76510828

版权

MFC和win32 专栏收录该内容

5 篇文章 0 订阅

订阅专栏

// Converts a wide string to a narrow string in the system ANSI code page (CP_ACP).
//
// wstr    - wide text; conversion stops at the first NUL character.
// returns - the converted text without a terminator, or an empty string when
//           either WideCharToMultiByte call fails.
string CMainDlg::wstringToString(const wstring & wstr)
{
    LPCWSTR pwszSrc = wstr.c_str();

    // With cchWideChar == -1 the reported size includes the terminating NUL.
    const int nLen = WideCharToMultiByte(CP_ACP, 0, pwszSrc, -1, NULL, 0, NULL, NULL);
    if (nLen <= 0)
        return string();

    // Convert straight into a string-owned buffer: nothing to delete[] and
    // nothing to leak if an allocation throws.
    string strDst(static_cast<size_t>(nLen), '\0');
    const int nWritten = WideCharToMultiByte(CP_ACP, 0, pwszSrc, -1, &strDst[0], nLen, NULL, NULL);
    if (nWritten <= 0)
        return string();

    // Drop the terminator that the API wrote into the buffer.
    strDst.resize(static_cast<size_t>(nWritten) - 1);
    return strDst;
}

// Converts a narrow string in the system ANSI code page (CP_ACP) to a wide string.
//
// str     - narrow text; conversion stops at the first NUL byte.
// returns - the converted text without a terminator, or an empty string when
//           either MultiByteToWideChar call fails.
wstring CMainDlg::stringToWstring(const string &str)
{
    LPCSTR pszSrc = str.c_str();

    // With cbMultiByte == -1 the reported size includes the terminating NUL.
    const int nLen = MultiByteToWideChar(CP_ACP, 0, pszSrc, -1, NULL, 0);
    if (nLen <= 0)
        return wstring();

    // Convert straight into a wstring-owned buffer: nothing to delete[] and
    // nothing to leak if an allocation throws.
    wstring wstrDst(static_cast<size_t>(nLen), L'\0');
    const int nWritten = MultiByteToWideChar(CP_ACP, 0, pszSrc, -1, &wstrDst[0], nLen);
    if (nWritten <= 0)
        return wstring();

    // Drop the terminator that the API wrote into the buffer.
    wstrDst.resize(static_cast<size_t>(nWritten) - 1);
    return wstrDst;
}

下面是一组字符串工具函数，其中有些在本文中用到，有些没有用到：
StringTools.h

#pragma once

#include <Windows.h>
#include <string>
#include <vector>

#pragma warning(disable:4190)
using namespace std;

// xstring names the string class matching the build's character set:
// wstring when UNICODE is defined, string otherwise. It is a macro, not a
// typedef, and relies on the `using namespace std;` above.
#ifndef xstring 
#ifdef UNICODE
#define xstring wstring
#else
#define xstring string
#endif
#endif

// Conversions between wide strings, the system ANSI code page (CP_ACP) and UTF-8.
std::string  UnicodeToAnsi(const std::wstring& strSource);
std::wstring AnsiToUnicode(const std::string& strSource);
std::wstring Utf8ToUnicode(const std::string& strSrouce);
std::string UnicodeToUtf8(const std::wstring& strSource);
std::string AnsiToUtf8(const std::string& strSource);
std::string Utf8ToAnsi(const std::string& strSource);
// Byte-wise URL encoders: alphanumerics and punctuation pass through unchanged.
std::string URLEncodeGB2312(const string& strUtf8/*, char* pBuf, int cbBufLen*/);           // whitespace is encoded as '+'
std::string URLEncodeGB2312Forspace(const string& strUtf8/*, char* pBuf, int cbBufLen*/);   // whitespace is encoded as '%20'
// Both return a buffer allocated with new[].
// NOTE(review): the caller presumably has to release it with delete[] - confirm at call sites.
char* Utf8ToGBK(const char* strSource);
char* GBKToUtf8(const char* strSource);
// URL encode/decode into a caller-supplied buffer of cbBufLen bytes.
bool UrlEncode(const char* szSrc, char* pBuf, int cbBufLen, bool bUpperCase);
bool Utf8UrlDecode(const char* szSrc, char* pBuf, int cbBufLen);
bool UrlDecode(const char* szSrc, char* pBuf, int cbBufLen);
// Replaces "\uXXXX" escape sequences with the corresponding ANSI text.
std::string EscapeToAnsi(const std::string& strSource);

// _W(x): converts an ANSI string to wide characters and yields a pointer to the result.
// The pointer refers to the buffer of a temporary std::wstring, so it is only
// valid until the end of the full expression in which _W appears - do not store it.
#ifndef _W
#define _W(x) AnsiToUnicode(x).data()
#endif

// _A(x): converts a wide string to ANSI and yields a pointer to the result.
// The same lifetime restriction applies: the pointer refers to a temporary std::string.
#ifndef _A
#define _A(x) UnicodeToAnsi(x).data()
#endif

// String replacement: every occurrence of strOld in strText is replaced, but the replaced text is not scanned again. For example, replacing "1" with "1234" in "1001" returns "1234001234".
// strText - the full text; strOld - the text to be replaced; strNew - the replacement text
xstring StringReplace(const xstring& strText, const xstring& strOld, const xstring& strNew);

// Returns true when the two bytes at pszIn have a lead byte in 0xB0..0xF7 and a
// trail byte in 0xA0..0xFE. The trail byte is only read when the lead byte matches.
// NOTE(review): GB2312 trail bytes conventionally start at 0xA1, not 0xA0 - confirm
// whether accepting 0xA0 is intentional.
inline bool IsGB2312(const unsigned char *pszIn)
{
    const unsigned char lead = pszIn[0];
    if (lead < 0xB0 || lead > 0xF7)
        return false;

    const unsigned char trail = pszIn[1];
    return trail >= 0xA0 && trail <= 0xFE;
}

// Returns true when the two bytes at pszIn have a lead byte in 0x81..0xFE and a
// trail byte in 0x40..0xFE. The trail byte is only read when the lead byte matches.
inline bool IsGBK(const unsigned char *pszIn)
{
    const unsigned char lead = pszIn[0];
    if (lead < 0x81 || lead > 0xFE)
        return false;

    const unsigned char trail = pszIn[1];
    return trail >= 0x40 && trail <= 0xFE;
}

// Returns true when the two bytes at pszIn have a lead byte in 0x81..0xFE and a
// trail byte in 0x40..0x7E or 0xA1..0xFE. The trail byte is only read when the
// lead byte matches.
inline bool IsBIG5(const unsigned char *pszIn)
{
    const unsigned char lead = pszIn[0];
    if (lead < 0x81 || lead > 0xFE)
        return false;

    const unsigned char trail = pszIn[1];
    const bool inLowTrailRange = trail >= 0x40 && trail <= 0x7E;
    const bool inHighTrailRange = trail >= 0xA1 && trail <= 0xFE;
    return inLowTrailRange || inHighTrailRange;
}

// Returns true when the byte at pszIn is an ASCII digit or an ASCII letter.
// Only the first byte is examined.
inline bool IsValidEnglishChar(const unsigned char *pszIn)
{
    const unsigned char ch = *pszIn;
    const bool isDigit = ch >= '0' && ch <= '9';
    const bool isLower = ch >= 'a' && ch <= 'z';
    const bool isUpper = ch >= 'A' && ch <= 'Z';
    return isDigit || isLower || isUpper;
}

// Returns true when the first nLen bytes of pszIn consist only of ASCII
// letters/digits and two-byte sequences accepted by IsGBK.
// A two-byte sequence is accepted only if both of its bytes lie inside nLen.
// An empty range (nLen <= 0) is reported as valid.
inline bool IsValidName(const unsigned char *pszIn, int nLen)
{
    int pos = 0;
    while (pos < nLen)
    {
        if (IsValidEnglishChar(pszIn + pos))
        {
            pos += 1;               // single-byte character
        }
        else if (pos + 1 < nLen && IsGBK(pszIn + pos))
        {
            pos += 2;               // double-byte character
        }
        else
        {
            return false;           // anything else invalidates the name
        }
    }
    return true;
}

// Returns true when each of the first nLen bytes of pszIn is a decimal digit
// according to isdigit. An empty range (nLen <= 0) is reported as valid.
inline bool IsValidQQ(const unsigned char *pszIn, int nLen)
{
    for (int pos = 0; pos < nLen; ++pos)
    {
        if (!isdigit(pszIn[pos]))
            return false;
    }
    return true;
}

// Truncates pszSrc in place to nNeedLen bytes, overwriting the tail with dots.
//
// Nothing happens when pszSrc is NULL or shorter than nNeedLen. Otherwise the
// last two kept bytes become ".." (fewer when nNeedLen < 2) and the string is
// terminated at nNeedLen. When the two bytes being overwritten are neither an
// ASCII letter/digit nor a valid GBK pair, the byte before them is taken to be
// the first half of a split double-byte character and is replaced by '.' too.
//
// pszSrc   - writable NUL-terminated buffer.
// nNeedLen - maximum length, in bytes, of the resulting string.
inline void CutChineseChar(char *pszSrc,unsigned int nNeedLen)
{
    if (pszSrc == NULL || strlen(pszSrc) < nNeedLen)
        return;

    // Every write below is guarded so that nNeedLen < 3 can no longer wrap
    // around in unsigned arithmetic and write in front of the buffer.
    if (nNeedLen >= 2)
    {
        const unsigned char *pTail = (const unsigned char *)(pszSrc + nNeedLen - 2);
        // If the last two bytes are neither an English character nor a valid
        // Chinese character, the last three bytes are one Chinese character
        // plus a stray byte.
        if (nNeedLen >= 3 && !IsValidEnglishChar(pTail) && !IsGBK(pTail))
        {
            pszSrc[nNeedLen - 3] = '.';
        }
        pszSrc[nNeedLen - 2] = '.';
    }
    if (nNeedLen >= 1)
    {
        pszSrc[nNeedLen - 1] = '.';
    }
    pszSrc[nNeedLen] = '\0';
}

StringTools.cpp

#include "StringTools.h"

// Converts a wide string to the system ANSI code page (CP_ACP).
// The source is treated as NUL-terminated, so conversion stops at the first
// NUL character. Returns an empty string when the size query fails.
std::string UnicodeToAnsi(const std::wstring& strSource)
{
    const wchar_t* pWide = strSource.data();

    // Size query; with -1 as the length the count includes the terminator.
    const int cbNeeded = ::WideCharToMultiByte(CP_ACP, 0, pWide, -1, NULL, 0, NULL, NULL);
    if (cbNeeded < 1)
        return "";

    std::vector<char> ansiBuffer(cbNeeded);
    ::WideCharToMultiByte(CP_ACP, 0, pWide, -1, &ansiBuffer[0], cbNeeded, NULL, NULL);

    // Everything except the trailing terminator.
    return std::string(&ansiBuffer[0], cbNeeded - 1);
}


// Converts a string in the system ANSI code page (CP_ACP) to a wide string.
// The source is treated as NUL-terminated, so conversion stops at the first
// NUL byte. Returns an empty string when either API call fails.
std::wstring AnsiToUnicode(const std::string& strSource)
{
    const char* pszSrc = strSource.c_str();

    // Size query; with -1 as the length the count includes the terminator.
    const int nLength = ::MultiByteToWideChar(CP_ACP, 0, pszSrc, -1, NULL, 0);
    if (nLength < 1)
    {
        return L"";
    }

    // Convert with the same length argument as the size query so the buffer
    // size always matches what is written.
    std::wstring strResult(nLength, L'\0');
    const int nWritten = ::MultiByteToWideChar(CP_ACP, 0, pszSrc, -1, &strResult[0], nLength);
    if (nWritten < 1)
    {
        return L"";
    }

    strResult.resize(nWritten - 1);   // drop the terminator
    return strResult;
}


// Converts a UTF-8 string to a wide string.
// The source is treated as NUL-terminated, so conversion stops at the first
// NUL byte. Returns an empty string when either API call fails.
std::wstring Utf8ToUnicode(const std::string& strSrouce)
{
    const char* pszSrc = strSrouce.c_str();

    // Size query; with -1 as the length the count includes the terminator.
    const int nLength = ::MultiByteToWideChar(CP_UTF8, 0, pszSrc, -1, NULL, 0);
    if (nLength < 1)
    {
        return L"";
    }

    // Convert with the same length argument as the size query so the buffer
    // size always matches what is written.
    std::wstring strResult(nLength, L'\0');
    const int nWritten = ::MultiByteToWideChar(CP_UTF8, 0, pszSrc, -1, &strResult[0], nLength);
    if (nWritten < 1)
    {
        return L"";
    }

    strResult.resize(nWritten - 1);   // drop the terminator
    return strResult;
}

// Converts a wide string to UTF-8.
// The source is treated as NUL-terminated, so conversion stops at the first
// NUL character. Returns an empty string when the size query fails.
std::string UnicodeToUtf8(const std::wstring& strSource)
{
    const wchar_t* pWide = strSource.data();

    // Size query; with -1 as the length the count includes the terminator.
    const int cbNeeded = ::WideCharToMultiByte(CP_UTF8, 0, pWide, -1, NULL, 0, NULL, NULL);
    if (cbNeeded < 1)
        return "";

    std::string utf8(cbNeeded, '\0');
    ::WideCharToMultiByte(CP_UTF8, 0, pWide, -1, &utf8[0], cbNeeded, NULL, NULL);

    // Everything except the trailing terminator.
    utf8.resize(cbNeeded - 1);
    return utf8;
}

// Converts ANSI text to UTF-8 by going through a wide string.
std::string AnsiToUtf8(const std::string& strSource)
{
    return UnicodeToUtf8(AnsiToUnicode(strSource));
}

// Converts UTF-8 text to ANSI by going through a wide string.
std::string Utf8ToAnsi(const std::string& strSource)
{
    return UnicodeToAnsi(Utf8ToUnicode(strSource));
}

//UrlEncode
bool UrlEncode(const char* szSrc, char* pBuf, int cbBufLen, bool bUpperCase)
{
    if(szSrc == NULL || pBuf == NULL || cbBufLen <= 0)
        return false;

    size_t len_ascii = strlen(szSrc);
    if(len_ascii == 0)
    {
        pBuf[0] = 0;
        return true;
    }

    //先转换到UTF-8
    char baseChar = bUpperCase ? 'A' : 'a';
    int cchWideChar = MultiByteToWideChar(CP_ACP, 0, szSrc, len_ascii, NULL, 0);
    LPWSTR pUnicode = (LPWSTR)malloc((cchWideChar + 1) * sizeof(WCHAR));
    if(pUnicode == NULL)
        return false;
    MultiByteToWideChar(CP_ACP, 0, szSrc, len_ascii, pUnicode, cchWideChar + 1);

    int cbUTF8 = WideCharToMultiByte(CP_UTF8, 0, pUnicode, cchWideChar, NULL, 0, NULL, NULL);
    LPSTR pUTF8 = (LPSTR)malloc((cbUTF8 + 1) * sizeof(CHAR));
    if(pUTF8 == NULL)
    {
        free(pUnicode);
        return false;
    }
    WideCharToMultiByte(CP_UTF8, 0, pUnicode, cchWideChar, pUTF8, cbUTF8 + 1, NULL, NULL);
    pUTF8[cbUTF8] = '\0';

    unsigned char c;
    int cbDest = 0; //累加
    unsigned char *pSrc = (unsigned char*)pUTF8;
    unsigned char *pDest = (unsigned char*)pBuf;
    while(*pSrc && cbDest < cbBufLen - 1)
    {
        c = *pSrc;
        if(isalpha(c) || isdigit(c) || c == '-' || c == '.' || c == '~')
        {
            *pDest = c;
            ++pDest;
            ++cbDest;
        }
        else if(c == ' ')
        {
            *pDest = '+';
            ++pDest;
            ++cbDest;
        }
        else
        {
            //检查缓冲区大小是否够用？
            if(cbDest + 3 > cbBufLen - 1)
                break;
            pDest[0] = '%';
            pDest[1] = (c >= 0xA0) ? ((c >> 4) - 10 + baseChar) : ((c >> 4) + '0');
            pDest[2] = ((c & 0xF) >= 0xA)? ((c & 0xF) - 10 + baseChar) : ((c & 0xF) + '0');
            pDest += 3;
            cbDest += 3;
        }
        ++pSrc;
    }
    //null-terminator
    *pDest = '\0';
    free(pUnicode);
    free(pUTF8);
    return true;
}

// Returns the value (0-15) of a hexadecimal digit, or -1 when ch is not one.
static int UrlHexDigitValue(unsigned char ch)
{
    if(ch >= '0' && ch <= '9')
        return ch - '0';
    if(ch >= 'A' && ch <= 'F')
        return ch - 'A' + 10;
    if(ch >= 'a' && ch <= 'f')
        return ch - 'a' + 10;
    return -1;
}

// Decodes a URL-encoded string without changing its character encoding.
//
// "%XX" becomes the byte 0xXX, '+' becomes a space and everything else is
// copied unchanged. A '%' that is not followed by two hexadecimal digits is
// copied literally.
//
// szSrc    - NUL-terminated encoded input.
// pBuf     - receives the NUL-terminated decoded bytes.
// cbBufLen - size of pBuf in bytes.
// returns  - false for invalid arguments or when pBuf is too small (pBuf is
//            then left untouched); true otherwise.
bool Utf8UrlDecode(const char* szSrc, char* pBuf, int cbBufLen)
{
    if(szSrc == NULL || pBuf == NULL || cbBufLen <= 0)
        return false;

    const size_t cbSrc = strlen(szSrc);
    if(cbSrc == 0)
    {
        pBuf[0] = 0;
        return true;
    }

    // Decoding never grows the text, so the source length is an upper bound.
    // std::string owns the scratch buffer, so every return path releases it.
    std::string decoded;
    decoded.reserve(cbSrc);

    size_t i = 0;
    while(i < cbSrc)
    {
        const unsigned char c = static_cast<unsigned char>(szSrc[i]);

        // Only look at the two digits when both of them exist, so a trailing
        // '%' can never make the scan run past the terminator.
        if(c == '%' && i + 2 < cbSrc)
        {
            const int hi = UrlHexDigitValue(static_cast<unsigned char>(szSrc[i + 1]));
            const int lo = UrlHexDigitValue(static_cast<unsigned char>(szSrc[i + 2]));
            if(hi >= 0 && lo >= 0)
            {
                decoded += static_cast<char>((hi << 4) | lo);
                i += 3;
                continue;
            }
        }

        decoded += (c == '+') ? ' ' : static_cast<char>(c);
        ++i;
    }

    // As before, the decoded text plus its terminator must be strictly smaller
    // than the buffer.
    if(decoded.size() + 1 < static_cast<size_t>(cbBufLen))
    {
        memcpy(pBuf, decoded.c_str(), decoded.size() + 1);
        return true;
    }
    return false;
}

//解码后是utf-8编码
bool UrlDecode(const char* szSrc, char* pBuf, int cbBufLen)
{
    if(Utf8UrlDecode(szSrc, pBuf, cbBufLen))
    {
        string strTemp = Utf8ToAnsi(pBuf);
        if(strTemp.size() > 0)
        {
            strncpy_s(pBuf, cbBufLen, strTemp.c_str(), strTemp.size());
            return true;
        }
    }
    return false;


 //   if(szSrc == NULL || pBuf == NULL || cbBufLen <= 0)
 //       return false;

 //   size_t len_ascii = strlen(szSrc);
 //   if(len_ascii == 0)
 //   {
 //       pBuf[0] = 0;
 //       return true;
 //   }

 //   char *pUTF8 = (char*)malloc(len_ascii + 1);
 //   if(pUTF8 == NULL)
 //       return false;

 //   int cbDest = 0; //累加
 //   unsigned char *pSrc = (unsigned char*)szSrc;
 //   unsigned char *pDest = (unsigned char*)pUTF8;
 //   while(*pSrc)
 //   {
 //       if(*pSrc == '%')
 //       {
 //           *pDest = 0;
 //           //高位
 //           if(pSrc[1] >= 'A' && pSrc[1] <= 'F')
 //               *pDest += (pSrc[1] - 'A' + 10) * 0x10;
 //           else if(pSrc[1] >= 'a' && pSrc[1] <= 'f')
 //               *pDest += (pSrc[1] - 'a' + 10) * 0x10;
 //           else
 //               *pDest += (pSrc[1] - '0') * 0x10;

 //           //低位
 //           if(pSrc[2] >= 'A' && pSrc[2] <= 'F')
 //               *pDest += (pSrc[2] - 'A' + 10);
 //           else if(pSrc[2] >= 'a' && pSrc[2] <= 'f')
 //               *pDest += (pSrc[2] - 'a' + 10);
 //           else
 //               *pDest += (pSrc[2] - '0');

 //           pSrc += 3;
 //       }
 //       else if(*pSrc == '+')
 //       {
 //           *pDest = ' ';
 //           ++pSrc;
 //       }
 //       else
 //       {
 //           *pDest = *pSrc;
 //           ++pSrc;
 //       }
 //       ++pDest;
 //       ++cbDest;
 //   }
 //   //null-terminator
 //   *pDest = '\0';
 //   ++cbDest;

 //   int cchWideChar = MultiByteToWideChar(CP_UTF8, 0, (LPCSTR)pUTF8, cbDest, NULL, 0);
 //   LPWSTR pUnicode = (LPWSTR)malloc(cchWideChar * sizeof(WCHAR));
 //   if(pUnicode == NULL)
 //   {
 //       free(pUTF8);
 //       return false;
 //   }
 //   MultiByteToWideChar(CP_UTF8, 0, (LPCSTR)pUTF8, cbDest, pUnicode, cchWideChar);
 //   WideCharToMultiByte(CP_ACP, 0, pUnicode, cchWideChar, pBuf, cbBufLen, NULL, NULL);
 //   free(pUTF8);
 //   free(pUnicode);
 //   return true;
}

typedef unsigned char BYTE;

// Maps a nibble value to its upper-case hexadecimal digit:
// 0..9 -> '0'..'9', 10..15 -> 'A'..'F'. Larger values are not range-checked.
inline BYTE toHex(const BYTE &x)
{
    if (x > 9)
        return x + ('A' - 10);
    return x + '0';
}

std::string URLEncodeGB2312(const string& strUtf8/*, char* pBuf, int cbBufLen*/)
{
    std::string sOut;
    for( size_t ix = 0; ix < strUtf8.length(); ix++ )
    {       
        BYTE buf[4]; 
        memset( buf, 0, 4 ); 
        if( isalnum( (BYTE)strUtf8[ix] ) || ispunct((BYTE)strUtf8[ix]))
        {       
            buf[0] = strUtf8[ix];
        }
        else if ( isspace( (BYTE)strUtf8[ix] ) )
        {
            buf[0] = '+';
        }
        else
        {
            buf[0] = '%';
            buf[1] = toHex( (BYTE)strUtf8[ix] >> 4 );
            buf[2] = toHex( (BYTE)strUtf8[ix] % 16);
        }
        sOut += (char *)buf;
    }
    //strncpy(pBuf,sOut.data(),cbBufLen);
    return sOut;
};

std::string URLEncodeGB2312Forspace(const string& strUtf8/*, char* pBuf, int cbBufLen*/)
{
    std::string sOut;
    for( size_t ix = 0; ix < strUtf8.length(); ix++ )
    {       
        BYTE buf[4]; 
        memset( buf, 0, 4 ); 
        if( isalnum( (BYTE)strUtf8[ix] ) || ispunct((BYTE)strUtf8[ix]))
        {       
            buf[0] = strUtf8[ix];
        }
        else if ( isspace( (BYTE)strUtf8[ix] ) )
        {
            //buf[0] = '+';
            buf[0] = '%';
            buf[1] = '2';
            buf[2] = '0';
        }
        else
        {
            buf[0] = '%';
            buf[1] = toHex( (BYTE)strUtf8[ix] >> 4 );
            buf[2] = toHex( (BYTE)strUtf8[ix] % 16);
        }
        sOut += (char *)buf;
    }
    //strncpy(pBuf,sOut.data(),cbBufLen);
    return sOut;
};

// Converts a NUL-terminated UTF-8 string to the system ANSI code page (CP_ACP).
// The result is GBK only when GBK is the system's ANSI code page.
//
// returns - a NUL-terminated buffer allocated with new[], which the caller
//           must release with delete[]. If a conversion fails the buffer
//           holds an empty string.
char* Utf8ToGBK(const char* strUtf8)
{
    // The intermediate UTF-16 text lives in a vector so it is always released.
    std::vector<wchar_t> wide(1, L'\0');
    const int cchWide = MultiByteToWideChar(CP_UTF8, 0, strUtf8, -1, NULL, 0);
    if (cchWide > 0)
    {
        wide.assign(cchWide + 1, L'\0');
        MultiByteToWideChar(CP_UTF8, 0, strUtf8, -1, &wide[0], cchWide);
    }

    int cbAnsi = WideCharToMultiByte(CP_ACP, 0, &wide[0], -1, NULL, 0, NULL, NULL);
    if (cbAnsi < 0)
        cbAnsi = 0;

    char *szGBK = new char[cbAnsi + 1];
    memset(szGBK, 0, cbAnsi + 1);
    if (cbAnsi > 0)
        WideCharToMultiByte(CP_ACP, 0, &wide[0], -1, szGBK, cbAnsi, NULL, NULL);
    return szGBK;
}

// Converts a NUL-terminated string in the system ANSI code page (CP_ACP) to UTF-8.
// The input is interpreted as GBK only when GBK is the system's ANSI code page.
//
// returns - a NUL-terminated buffer allocated with new[], which the caller
//           must release with delete[]. If a conversion fails the buffer
//           holds an empty string.
char* GBKToUtf8(const char* strGBK)
{
    // The intermediate UTF-16 text lives in a vector so it is always released.
    std::vector<wchar_t> wide(1, L'\0');
    const int cchWide = MultiByteToWideChar(CP_ACP, 0, strGBK, -1, NULL, 0);
    if (cchWide > 0)
    {
        wide.assign(cchWide + 1, L'\0');
        MultiByteToWideChar(CP_ACP, 0, strGBK, -1, &wide[0], cchWide);
    }

    int cbUtf8 = WideCharToMultiByte(CP_UTF8, 0, &wide[0], -1, NULL, 0, NULL, NULL);
    if (cbUtf8 < 0)
        cbUtf8 = 0;

    char *szUtf8 = new char[cbUtf8 + 1];
    memset(szUtf8, 0, cbUtf8 + 1);
    if (cbUtf8 > 0)
        WideCharToMultiByte(CP_UTF8, 0, &wide[0], -1, szUtf8, cbUtf8, NULL, NULL);
    return szUtf8;
}

std::string EscapeToAnsi(const std::string& strSource)
{
    try
    {
        string strAnsi = strSource;                 //"\u50ab",另外一种"%u50ab"暂时没有做处理
        string strValue,strvalue1;
        wchar_t wch;

        unsigned int npos = strAnsi.find("\\u",0);
        while (npos != string::npos)
        {
            strvalue1 = strAnsi.substr(npos,6);     //"\u50ab"
            strValue = strAnsi.substr(npos+2,4);    //"50ab"
            if (strValue.length() == 4)
            {
                if ( (strValue.at(0)>='0'&& strValue.at(0)<='9') || (strValue.at(0)>='a'&& strValue.at(0)<='f') || (strValue.at(0)>='A'&& strValue.at(0)<='F') )
                {
                    if ( (strValue.at(1)>='0'&&strValue.at(1)<='9') || (strValue.at(1)>='a'&&strValue.at(1)<='f') || (strValue.at(1)>='A'&&strValue.at(1)<='F') )
                    {
                        if ( (strValue.at(2)>='0'&& strValue.at(2)<='9') || ((strValue.at(2)>='a'&& strValue.at(2)<='f')) || (strValue.at(2)>='A'&& strValue.at(2)<='F') )
                        {
                            if ( (strValue.at(3)>='0'&& strValue.at(3)<='9') || ((strValue.at(3)>='a'&& strValue.at(3)<='f')) || (strValue.at(3)>='A'&& strValue.at(3)<='F') )
                            {
                                sscanf(strValue.c_str(),"%4x",&wch);
                                strAnsi.replace(strAnsi.begin()+npos,strAnsi.begin()+npos+6,_A(&wch));

                                npos = strAnsi.find("\\u",0);
                            }
                            else
                                npos = strAnsi.find("\\u",npos+2);
                        }
                        else
                            npos = strAnsi.find("\\u",npos+2);
                    }
                    else
                        npos = strAnsi.find("\\u",npos+2);
                }
                else
                    npos = strAnsi.find("\\u",npos+2);
            }
            else
                break;          
        }
        return strAnsi;
    }
    catch (...)
    {
        return "";
    }
}

// Returns true when code lies within the inclusive range [start, end].
bool  InPYRange(wchar_t start, wchar_t end, wchar_t code)
{
    return start <= code && code <= end;
}


// Returns the lower-case first pinyin letter for a double-byte character code
// (lead byte in the high 8 bits, trail byte in the low 8 bits, e.g. 0xCED2).
// Returns '\0' when the code is outside every range in the table.
//
// The ranges are contiguous: each one starts right after the previous one
// ends, so no code between 0xB0A1 and 0xD7F9 is left unmapped.
char  GetChineseFirstPY(wchar_t n)
{
    struct PinyinRange
    {
        unsigned int first;     // first code of the range (inclusive)
        unsigned int last;      // last code of the range (inclusive)
        char         initial;   // pinyin initial for the range
    };

    static const PinyinRange kRanges[] =
    {
        { 0xB0A1, 0xB0C4, 'a' },
        { 0xB0C5, 0xB2C0, 'b' },
        { 0xB2C1, 0xB4ED, 'c' },
        { 0xB4EE, 0xB6E9, 'd' },
        { 0xB6EA, 0xB7A1, 'e' },
        { 0xB7A2, 0xB8C0, 'f' },
        { 0xB8C1, 0xB9FD, 'g' },
        { 0xB9FE, 0xBBF6, 'h' },
        { 0xBBF7, 0xBFA5, 'j' },
        { 0xBFA6, 0xC0AB, 'k' },
        { 0xC0AC, 0xC2E7, 'l' },
        { 0xC2E8, 0xC4C2, 'm' },
        { 0xC4C3, 0xC5B5, 'n' },
        { 0xC5B6, 0xC5BD, 'o' },
        { 0xC5BE, 0xC6D9, 'p' },
        { 0xC6DA, 0xC8BA, 'q' },
        { 0xC8BB, 0xC8F5, 'r' },
        { 0xC8F6, 0xCBF9, 's' },    // was 0xCBF0, leaving 0xCBF1-0xCBF9 unmapped
        { 0xCBFA, 0xCDD9, 't' },
        { 0xCDDA, 0xCEF3, 'w' },
        { 0xCEF4, 0xD1B8, 'x' },    // was 0xD188, leaving 0xD189-0xD1B8 unmapped
        { 0xD1B9, 0xD4D0, 'y' },
        { 0xD4D1, 0xD7F9, 'z' }
    };

    const unsigned int code = static_cast<unsigned int>(n);
    for (size_t i = 0; i < sizeof(kRanges) / sizeof(kRanges[0]); ++i)
    {
        if (code >= kRanges[i].first && code <= kRanges[i].last)
            return kRanges[i].initial;
    }
    return '\0';
}


//***************************************************
// Name:    GetFirstChinesePYCharOfText
// Purpose: get the first pinyin letter of the double-byte character that
//          starts the text
// Parameters:
//      szText    - text that is expected to start with a Chinese character
//      firstChar - receives the pinyin initial; when no initial is found it
//                  receives the first byte of szText instead
// Returns:
//      true if the first two bytes map to a pinyin initial, otherwise false.
//      When szText is NULL or shorter than two bytes, false is returned and
//      firstChar is left unchanged.
//***************************************************
bool GetFirstChinesePYCharOfText(char* szText, char &firstChar)
{
    if (!szText || strlen(szText) <= 1)
    {
        return false;
    }

    // Combine the two bytes into one character code, e.g. 0xCE 0xD2 -> 0xCED2.
    const wchar_t wchr =
        static_cast<wchar_t>(((szText[0] & 0xff) << 8) | (szText[1] & 0xff));

    firstChar = GetChineseFirstPY(wchr);
    if (firstChar == '\0')
    {
        // Not a mapped character: hand back the raw first byte.
        firstChar = szText[0];
        return false;
    }
    return true;
}

// Replaces every occurrence of strOld in strText with strNew and returns the result.
// Text inserted by a replacement is not scanned again, so replacing "1" with
// "1234" in "1001" yields "1234001234".
//
// strText - the full text (left unmodified).
// strOld  - the text to search for; when it is empty, strText is returned
//           unchanged (an empty pattern would otherwise match forever).
// strNew  - the replacement text.
xstring StringReplace(const xstring& strText, const xstring& strOld, const xstring& strNew)
{
    if (strOld.empty() || strOld == strNew)
        return strText;

    xstring strValue = strText;
    xstring::size_type nPos = strValue.find(strOld);
    while (nPos != xstring::npos)
    {
        strValue.replace(nPos, strOld.length(), strNew);
        // Resume behind the inserted text so it is never matched again.
        nPos = strValue.find(strOld, nPos + strNew.length());
    }
    return strValue;
}