工具类记录于此,以供参考。
package com.gccp.translate.biz.util;
import org.apache.commons.lang3.StringUtils;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
/**
* @author hilbert.xu
* @date 2019/5/20
*/
public class HtmlUtil {
/**
 * Regular expression matching any HTML tag: a {@code <}, followed by any run of
 * characters other than {@code >}, followed by the closing {@code >}.
 */
private static final String REG_HTML = "<([^>]*)>";
/**
 * Regular expression matching an {@code <img ...>} tag, from {@code <img} up to
 * the first following {@code >} or {@code />}.
 */
private static final String REG_IMG = "(<img\\b.*?(?:\\>|\\/>))";
/**
 * Pre-compiled form of {@link #REG_HTML}. {@link Pattern} instances are immutable
 * and safe to share, so the expression is compiled once instead of on every call.
 */
private static final Pattern HTML_TAG_PATTERN = Pattern.compile(REG_HTML, Pattern.CASE_INSENSITIVE);
/**
 * Removes every HTML tag from the given text.
 *
 * @param htmlStr text that may contain HTML tags; may be {@code null}
 * @return {@code htmlStr} with every match of {@link #REG_HTML} replaced by the
 *         empty string; a {@code null} or empty input is returned unchanged
 */
public static String delHTMLTag(String htmlStr) {
    // Nothing to strip; also avoids the NullPointerException Pattern.matcher(null) would throw.
    if (htmlStr == null || htmlStr.isEmpty()) {
        return htmlStr;
    }
    return HTML_TAG_PATTERN.matcher(htmlStr).replaceAll("");
}
/**
* 获取完整img标签
*
* @param html
* @return
*/
public stat