判断字符串是否是中文

本文介绍了几种编程方法,如通过Unicode编码、逐字符检查、正则表达式等,来判断给定字符串中是否仅包含汉字(4e00-9fff范围内的字符),适用于C#编程语言。
摘要由CSDN通过智能技术生成

方法一:

在 Unicode 字符集中,中文(CJK Unified Ideographs,中日韩统一表意文字)基本区的范围是 U+4E00..U+9FFF。

通过对字符的unicode编码进行判断来确定字符是否为中文。

/// <summary>
/// Determines whether the UTF-16 character at <paramref name="index"/> in
/// <paramref name="input"/> lies in the range U+4E00..U+9FFF
/// (the CJK Unified Ideographs block).
/// </summary>
/// <param name="input">The string to inspect. <c>null</c> or an empty string yields <c>false</c>.</param>
/// <param name="index">Zero-based position of the character to test.</param>
/// <returns>
/// <c>true</c> when the character is within U+4E00..U+9FFF; otherwise <c>false</c>.
/// </returns>
/// <exception cref="ArgumentOutOfRangeException">
/// <paramref name="index"/> is not a valid position inside a non-empty <paramref name="input"/>.
/// </exception>
protected bool IsChineseLetter(string input, int index)
{
    const char RangeStart = '\u4e00';
    const char RangeEnd = '\u9fff';

    // Treat null like the empty string instead of failing inside the lookup.
    if (string.IsNullOrEmpty(input))
    {
        return false;
    }

    if (index < 0 || index >= input.Length)
    {
        throw new ArgumentOutOfRangeException("index");
    }

    // The whole range sits in the Basic Multilingual Plane, so comparing the
    // single UTF-16 code unit is sufficient. Surrogate halves can never fall
    // inside the range, so they simply produce false rather than an exception.
    char candidate = input[index];
    return candidate >= RangeStart && candidate <= RangeEnd;
}

方法二:

/// <summary>
/// Reports whether <paramref name="CString"/> contains at least one character
/// whose UTF-16 code is 128 or above, i.e. outside the 7-bit ASCII range.
/// </summary>
/// <remarks>
/// Any character at or above 128 counts; the check is not limited to Chinese characters.
/// </remarks>
/// <param name="CString">The text to scan.</param>
/// <returns>
/// <c>true</c> as soon as a character with code 128 or above is found;
/// <c>false</c> when every character is below 128 or the string is empty.
/// </returns>
public bool IsChina(string CString)
{
    const int FirstNonAsciiCode = 128;

    foreach (char current in CString)
    {
        if (current >= FirstNonAsciiCode)
        {
            return true;
        }
    }

    return false;
}

方法三:

/// <summary>
/// Determines whether <paramref name="words"/> contains at least one character
/// that the "gb2312" encoding represents with exactly two bytes.
/// </summary>
/// <remarks>
/// NOTE(review): any double-byte character matches, so this presumably also accepts
/// non-Han double-byte symbols (e.g. full-width punctuation) - confirm against callers.
/// </remarks>
/// <param name="words">The text to scan. <c>null</c> or an empty string yields <c>false</c>.</param>
/// <returns>
/// <c>true</c> on the first character encoded as two bytes; otherwise <c>false</c>.
/// </returns>
public bool WordsIScn(string words)
{
    // Checked before the encoding is resolved so that empty input never
    // touches the encoding at all.
    if (string.IsNullOrEmpty(words))
    {
        return false;
    }

    // Resolve the encoding once instead of on every loop iteration.
    System.Text.Encoding gb2312 = System.Text.Encoding.GetEncoding("gb2312");

    // Reused one-element buffer: avoids allocating a substring per character.
    char[] single = new char[1];

    for (int i = 0; i < words.Length; i++)
    {
        single[0] = words[i];
        if (gb2312.GetByteCount(single) == 2)
        {
            return true;
        }
    }

    return false;
}

方法四:

// Matches a string consisting of exactly one character in U+4E00..U+9FA5.
// Built once, outside the loop, so the pattern is not re-parsed per character.
Regex rx = new Regex("^[\u4e00-\u9fa5]$");

for (int i = 0; i < s.Length; i++)
{
    // Regex.IsMatch takes a string, so the single char is converted first.
    if (rx.IsMatch(s[i].ToString()))
    {
        // Yes: s[i] is inside the range.
    }
    else
    {
        // No: s[i] is outside the range.
    }
}

正解!

\u4e00-\u9fa5 是常用的汉字范围(CJK 统一表意文字基本区最初收录的 20902 个字;整个基本区到 \u9fff 为止)。

^[\u4e00-\u9fa5]$ 是匹配单个该范围内汉字的正则表达式。

方法五:

// Encode the text as UTF-16. UnicodeEncoding's parameterless constructor uses
// little-endian byte order, so the high byte of each code unit is at the odd index.
UnicodeEncoding unicodeEncoding = new UnicodeEncoding();
byte[] unicodeByteArray = unicodeEncoding.GetBytes(inputstring);

// Visit only the odd indices (1, 3, 5, ...): the second byte of every pair.
for (int i = 1; i < unicodeByteArray.Length; i += 2)
{
    // A Chinese character has a non-zero high byte. Note that a non-zero high
    // byte only proves the code unit is above U+00FF, not that it is Chinese.
    if (unicodeByteArray[i] != 0)
    {
    }

    // …… (the original snippet elides the rest of the loop body here)
}

方法六:

 /**//**//** <summary>

        /// 给定一个字符串,判断其是否只包含有汉字

        /// </summary>

        /// <param name="testStr"></param>

        /// <returns></returns>

        public bool IsOnlyContainsChinese(string testStr)

        {

            char[] words = testStr.ToCharArray();

            foreach (char word in words)

            {

                if ( IsGBCode(word.ToString()) || IsGBKCode(word.ToString()) )  // it is a GB2312 or GBK chinese word

                {

                    continue;

                }

                else

                {

                    return false;

                }

            }

            return true;

        }

        /**//**//** <summary>

        /// 判断一个word是否为GB2312编码的汉字

        /// </summary>

        /// <param name="word"></param>

        /// <returns></returns>

        private bool IsGBCode(string word)

        {

            byte[] bytes = Encoding.GetEncoding("GB2312").GetBytes(word);

            if (bytes.Length <= 1)  // if there is only one byte, it is ASCII code or other code

            {

                return false;

            }

            else

            {

                byte byte1 = bytes[0];

                byte byte2 = bytes[1];

                if (byte1 >= 176 && byte1 <= 247 && byte2 >= 160 && byte2 <= 254)    //判断是否是GB2312

                {

                    return true;

                }

                else

                {

                    return false;

                }

            }

        }

        /**//**//** <summary>

        /// 判断一个word是否为GBK编码的汉字

        /// </summary>

        /// <param name="word"></param>

        /// <returns></returns>

        private bool IsGBKCode(string word)

        {

            byte[] bytes = Encoding.GetEncoding("GBK").GetBytes(word.ToString());

            if (bytes.Length <= 1)  // if there is only one byte, it is ASCII code

            {

                return false;

            }

            else

            {

                byte byte1 = bytes[0];

                byte byte2 = bytes[1];

                if ( byte1 >= 129 && byte1 <= 254 && byte2 >= 64 && byte2 <= 254)     //判断是否是GBK编码

                {

                    return true;

                }

                else

                {

                    return false;

                }

            }

        }

        /**//**//** <summary>

        /// 判断一个word是否为Big5编码的汉字

        /// </summary>

        /// <param name="word"></param>

        /// <returns></returns>

        private bool IsBig5Code(string word)

        {

            byte[] bytes = Encoding.GetEncoding("Big5").GetBytes(word.ToString());

            if (bytes.Length <= 1)  // if there is only one byte, it is ASCII code

            {

                return false;

            }

            else

            {

                byte byte1 = bytes[0];

                byte byte2 = bytes[1];

                if ( (byte1 >= 129 && byte1 <= 254) && ((byte2 >= 64 && byte2 <= 126) || (byte2 >= 161 && byte2 <= 254)) )  //判断是否是Big5编码

                {

                    return true;

                }

                else

                {

                    return false;

                }

            }

        }

  • 24
    点赞
  • 22
    收藏
    觉得还不错? 一键收藏
  • 打赏
    打赏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包

打赏作者

等天晴i

你的鼓励将是我创作的最大动力

¥1 ¥2 ¥4 ¥6 ¥10 ¥20
扫码支付:¥1
获取中
扫码支付

您的余额不足,请更换扫码支付或充值

打赏作者

实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值