引用 http://www.javaresearch.org/article/82778.htm
- import java.io.BufferedReader;
- import java.io.FileNotFoundException;
- import java.io.FileReader;
- import java.io.IOException;
- import java.util.regex.Matcher;
- import java.util.regex.Pattern;
/**
 * Prints every opening {@code <a href=...>} tag found in an HTML file.
 *
 * <p>The file is read fully into memory and scanned with a case-insensitive regular
 * expression. Each matching tag is written to standard output, one match per
 * {@code println} call.
 */
public class LinkerFinder {

    /** File scanned when no path is supplied on the command line. */
    private static final String DEFAULT_FILE = "111.htm";

    /**
     * Matches an opening anchor tag whose first attribute is {@code href}, optionally
     * followed by a {@code target} attribute.
     *
     * <p>Attribute values may be double-quoted, single-quoted or unquoted. Unquoted values
     * stop at whitespace or {@code >} so a match can never run past the end of the tag.
     */
    private static final Pattern LINK_PATTERN = Pattern.compile(
            "<a\\s+href\\s*=\\s*"                                        // <a href=
            + "(\"[^\"]*\"|'[^']*'|[^\\s>]*)\\s*"                        // URL part
            + "(target\\s*=\\s*(\"[^\"]*\"|'[^']*'|[^\\s>]*)\\s*)?>",    // optional target part
            Pattern.CASE_INSENSITIVE);

    /**
     * Scans an HTML file and prints each anchor tag that {@link #LINK_PATTERN} matches.
     *
     * @param args optional; {@code args[0]} is the path of the file to scan. When absent,
     *             {@value #DEFAULT_FILE} in the working directory is used.
     */
    public static void main(String[] args) {
        String path = (args != null && args.length > 0) ? args[0] : DEFAULT_FILE;
        try {
            printLinks(readFile(path));
        } catch (IOException e) {
            // Covers FileNotFoundException as well (it is a subclass of IOException).
            System.err.println("Cannot read " + path + ": " + e);
        }
    }

    /**
     * Reads the whole file into memory using {@link FileReader}'s default charset.
     *
     * @param path path of the file to read
     * @return the file content, each line terminated by {@code '\n'}
     * @throws IOException if the file cannot be opened or read
     */
    private static CharSequence readFile(String path) throws IOException {
        StringBuilder text = new StringBuilder();
        // try-with-resources closes the reader (and the wrapped FileReader) even on failure.
        try (BufferedReader reader = new BufferedReader(new FileReader(path))) {
            String line;
            while ((line = reader.readLine()) != null) {
                // readLine() strips the terminator; restore one so tokens on adjacent
                // lines are not fused together (e.g. "href=foo" + "target=x").
                text.append(line).append('\n');
            }
        }
        return text;
    }

    /**
     * Prints every substring of {@code html} matched by {@link #LINK_PATTERN}.
     *
     * @param html the document text to scan
     */
    private static void printLinks(CharSequence html) {
        Matcher matcher = LINK_PATTERN.matcher(html);
        while (matcher.find()) {
            System.out.println(matcher.group());
        }
    }
}
以上只是个例子，希望能给大家带来些启发。