public static void main(String[] args)
{
InputStream is = CommonUtil.getStream("http://wz.csdn.net/");
String regex = "(?<=href=/")[^/"]*";//查找网页中所有连接字符串
// String regex2 = "[A-Za-z]*([/u4e00-/u9fa5]*)(?=//d*(//.//d*)*)";
String test="<td><a rel=/"mz/" href=/"http://bbs.csdn.net//">论坛</a></td>";
Pattern pattern = Pattern.compile(regex);
Matcher matcher = pattern.matcher(test);
//显示匹配上的字符串。一次只找匹配的一个,必须循环找出所有
while(matcher.find())
{
System.out.println(matcher.group());
}
System.out.println(CommonUtil.patternText(test,regex));
System.out.println(CommonUtil.replaceRegex(test,regex,""));
}
/**
 * Reports whether the given regular expression matches anywhere in the text.
 * This is a "find" (substring) check, not a whole-string match.
 *
 * @param text  the text to search
 * @param regex the regular expression to look for
 * @return {@code true} if at least one match of {@code regex} occurs in {@code text}
 */
public static boolean patternText(String text,String regex)
{
    final Matcher scanner = Pattern.compile(regex).matcher(text);
    return scanner.find();
}
/**
 * Replaces every substring of the text that matches the regular expression
 * with the given replacement string.
 *
 * @param text       the text to process
 * @param regex      the regular expression selecting the substrings to replace
 * @param replaceStr the replacement; {@code $n} group references and backslash
 *                   escapes are interpreted as in {@link Matcher#replaceAll(String)}
 * @return the text with all matches replaced
 */
public static String replaceRegex(String text,String regex,String replaceStr)
{
    return Pattern.compile(regex)
            .matcher(text)
            .replaceAll(replaceStr);
}