使用正则表达式查询一段Html中的Title标签,包括内容!!
结果:
import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
public class Test {
public static void main(String args[]) {
String html = "<title fdsafdsa>ABCD<hrf></title>gsdggas<title>ggds</title>jkll<title fdfdsa>005</title>";
List resultList = getContextByTag(html,"title");
for (Iterator iterator = resultList.iterator(); iterator.hasNext();) {
String context = (String) iterator.next();
System.out.println(context);
}
}
public static List getContextByTag(String html,String tag) {
String reg="<"+tag+"(([^<|^>|.]*>)|( >)).*?</"+tag+">";
List resultList = new ArrayList();
Pattern p = Pattern.compile(reg);
Matcher m = p.matcher(html );
while (m.find()) {
resultList.add(m.group());
}
return resultList;
}
}
结果:
<title fdsafdsa>ABCD<hrf></title>
<title>ggds</title>
<title fdfdsa>005</title>