java获取文章的字数或者字符数

 package util;
/**
 * 获取文章的字数或者字符数
 *
 * @author ffshi
 */
public class StatWordCount {

 private final char[] CHS = { ',', ';', '.', '!', '?', ';', '+', '。', '?',
   '!' }; // 符号数组

 private final char[] CHN = { '/n', '/r' }; // 转义符数组

 private final char[] SPACE = { ' ', ' ' }; // 空格的数组(前半角,后全角)

 /**
  * 根据指定条件来筛选文章的字数
  *
  * @param wordContent
  *            文章内容
  * @param compriseInterpunction
  *            是否包含指定字符
  * @param compriseSpace
  *            是否包含空格
  * @return 返回文章经过指定筛选后的长度
  */
 public int getWordCount(String wordContent, boolean compriseInterpunction,
   boolean compriseSpace) {
  if (wordContent == null) {
   return 0;
  } else if (wordContent.length() == 0) {
   return 0;
  } else {
   // 既要包含符号又要包含空格
   if (compriseInterpunction && compriseSpace) {
    // 清除转义符
    String regex = "[" + new String(CHN) + "]";
    wordContent = wordContent.replaceAll(regex, " ");
    return this.getWordCount(wordContent);
   }
   // 不包含符号包含空格
   else if (!compriseInterpunction && compriseSpace) {
    // 使用正则表达式去掉指定的符号和转义符
    String regex1 = "[" + new String(CHN) + "]";
    String regex2 = "[" + new String(CHS) + "]";
    wordContent = wordContent.replaceAll(regex1, " ");
    wordContent = wordContent.replaceAll(regex2, " ");
    return this.getWordCount(wordContent);
   }
   // 包含指定符号不包含空格
   else if (compriseInterpunction && !compriseSpace) {
    // 使用正则表达式去掉空格和转义符
    String regex1 = "[" + new String(CHN) + "]";
    String regex2 = "[" + new String(SPACE) + "]";
    wordContent = wordContent.replaceAll(regex1, " ");
    wordContent = wordContent.replaceAll(regex2, " ");
    return this.getWordCount(wordContent);
   }
   // 空格和指定符号都不包含
   else {
    // 使用正则表达式去掉空格,指定符号和转义符
    String regex1 = "[" + new String(CHN) + "]";
    String regex3 = "[" + new String(CHS) + "]";
    String regex2 = "[" + new String(SPACE) + "]";
    wordContent = wordContent.replaceAll(regex1, " ");
    wordContent = wordContent.replaceAll(regex2, " ");
    wordContent = wordContent.replaceAll(regex3, " ");
    return this.getWordCount(wordContent);
   }
  }
 }

 /**
  * 返回文章中的字数
  *
  * @param wordCount
  *            文章内容
  * @return
  */
 @SuppressWarnings("unused")
 private int getWordCount(String wordContent) {
  int count = 0;
  if (wordContent == null) { // 判断是否为null,如果为null直接返回0
   count = 0;
  } else if (wordContent.length() == 0) { // 判断是否为空,如果为空直接返回0
   count = 0;
  } else { // 判断获取字数
   wordContent = wordContent.trim(); // 清空空格
   // 临时变量
   String s4 = "";
   String s3 = "";
   String s1 = "";
   boolean bb = false;
   if (wordContent.length() > 0) {
    s4 = String.valueOf(wordContent
      .charAt(wordContent.length() - 1));
   }
   for (int i = 0; i < wordContent.length(); i++) {
    s3 = String.valueOf(wordContent.charAt(i));
    int num = s3.getBytes().length;
    if (s3.hashCode() == 32 || s3.getBytes().length == 2) {
     bb = true;
    }
    if (num == 2) {
     count++;
    } else {
     if (i + 1 < wordContent.length() && (i > 1)) {
      s1 = String.valueOf(wordContent.charAt(i + 1));
      if ((s1.hashCode() == 32 || s1.getBytes().length == 2)
        && (s3.hashCode() != 32)) {
       count++;
      }
     }
    }
   }
   if (!bb) {
    count++;
   } else {
    if (s4.getBytes().length == 1) {
     count++;
    }
   }
  }
  return count;
 }

 /**
  * 根据条件来获取文章的字符数
  *
  * @param wordContent
  *            文章内容
  * @param compriseInterpunction
  *            是否包含指定符号
  * @param compriseSpace
  *            是否包含空格
  * @return 返回字符长度
  */
 public int getWordCharacter(String wordContent,
   boolean compriseInterpunction, boolean compriseSpace) {
  // 既要包含符号又要包含空格
  if (compriseInterpunction && compriseSpace) {
   // 清除转义符
   String regex = "[" + new String(CHN) + "]";
   wordContent = wordContent.replaceAll(regex, " ");
   // 首部的空格不算
   wordContent = wordContent.replaceAll("^//s+", "");
   return wordContent.length();
  }// 不包含符号包含空格
  else if (!compriseInterpunction && compriseSpace) {
   // 首部的空格不算
   wordContent = wordContent.replaceAll("^//s+", "");
   // 使用正则表达式去掉指定的符号和转义符
   String regex1 = "[" + new String(CHN) + "]";
   String regex2 = "[" + new String(CHS) + "]";
   wordContent = wordContent.replaceAll(regex1, " ");
   wordContent = wordContent.replaceAll(regex2, " ");
   return wordContent.length();
  }// 包含指定符号不包含空格
  else if (compriseInterpunction && !compriseSpace) {
   // 使用正则表达式去掉空格和转义符
   return this.getNoSpaceCount(wordContent);
  }// 空格和指定符号都不包含
  else {
   // 使用正则表达式去掉指定符号
   String regex1 = "[" + new String(CHS) + "]";
   wordContent = wordContent.replaceAll(regex1, " ");
   return this.getNoSpaceCount(wordContent);
  }
 }

 /**
  * 获取文章中非空格的字符总数
  *
  * @param wordContent
  *            文章内容
  * @return
  */
 private int getNoSpaceCount(String wordContent) {
  int spaceCount = 0;
  if (wordContent == null) {
   spaceCount = 0;
  } else if (wordContent.length() == 0) {
   spaceCount = 0;
  } else {
   // 替换首部的
   wordContent = wordContent.replaceAll("^//s+", "");
   wordContent = wordContent.replaceAll(" ", "");
   // 使用正则替换转义符
   String regex = "[" + new String(CHN) + "]";
   wordContent = wordContent.replaceAll(regex, "");
   spaceCount = wordContent.length();
  }
  return spaceCount;
 }
}

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值