UTF8编码转Unicode编码(C语言)

/**
 * 功能:UTF8编码转Unicode编码
 * 参数:dst 目标字符串,src 源字符串
 */
WORD UTF8_to_Unicode(BYTE *dst, BYTE *src)
{
    WORD i = 0, unicode = 0, ii, iii;
    int codeLen = 0;
    
    while ( *src )
    {
        //1. UTF-8 ---> Unicode
        if(0 == (src[0] & 0x80))
        {
            // 单字节
            codeLen = 1;
            unicode = src[0];
        }
        else if(0xC0 == (src[0] & 0xE0) && 0x80 == (src[1] & 0xC0))
        {// 双字节
            codeLen = 2;
            unicode = (WORD)((((WORD)src[0] & 0x001F) << 6) | ((WORD)src[1] & 0x003F));
        }
        else if(0xE0 == (src[0] & 0xF0) && 0x80 == (src[1] & 0xC0) && 0x80 == (src[2] & 0xC0))
        {// 三字节
            codeLen = 3;
            ii = (((WORD)src[0] & 0x000F) << 12);
            iii = (((WORD)src[1] & 0x003F) << 6);
            unicode = ii|iii|((WORD)src[2] & 0x003F);
            unicode = (WORD)((((WORD)src[0] & 0x000F) << 12) | (((WORD)src[1] & 0x003F) << 6) | ((WORD)src[2] & 0x003F));
        }
        else if(0xF0 == (src[0] & 0xF0) && 0x80 == (src[1] & 0xC0) && 0x80 == (src[2] & 0xC0) && 0x80 == (src[3] & 0xC0))
        {// 四字节
            codeLen = 4;
            unicode = (((int)(src[0] & 0x07)) << 18) | (((int)(src[1] & 0x3F)) << 12) | (((int)(src[2] & 0x3F)) << 6) | (src[3] & 0x3F);
        }
        else
        {
            INFOBOX_Show("超出4字节的Unicode码", 100);
            break;
        }
        src += codeLen;
        if (unicode < 0x80)
        {
            if (i == 0 && unicode == 0x20)
            {
                continue;
            }
        }
        i += 2;
        *dst++ = (BYTE)(unicode&0xff);
        *dst++ = (BYTE)((unicode>>8)&0xff);
    } // end while
    *dst = 0;
    
    return i;
}


  • 0
    点赞
  • 1
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值