java提供图片链接,提取网页图片链接的JAVA程序

最新推荐文章于 2024-05-14 04:23:04 发布

weixin_40004502

最新推荐文章于 2024-05-14 04:23:04 发布

阅读量370

点赞数

文章标签： java提供图片链接

输入网页文件名，和资源列表文件名

输出资源列表文件供迅雷下载。

适用于批量下载图片。

由两个文件组成。

// AnalizeIMG.java

// 主程序

5 import java.io.BufferedReader;

6import java.io.File;

7 import java.io.FileReader;

8 import java.io.FileWriter;

9 import java.io.IOException;

12 public class AnalizeIMG {

14 public void p(String s)

15 {

16 System.out.println(s);

17 }

19 public void analizeFile(String infile,String outfile) throws Exception

20 {

21 File file = new File(infile);

22 if (file == null || ! file.exists()) {

23 p( "File" + infile + "not exits !" );

24 }

26 if ( ! file.canRead()) {

27 p( "File" + infile +" can't read !" );

29 }

31 String strLine = null ;

32 FileReader frd = new FileReader(infile);

33 BufferedReader bufferedReader = new BufferedReader(frd);

34 try {

35 AnalizeWebParse parse = new AnalizeWebParse();

36 String s = parse.parse(bufferedReader);

38 createFile(outfile,s);

40 } catch (Exception ex) {

41 throw ex;

42 } finally {

43 frd.close();

44 bufferedReader.close();

45 }

46 }

48 private void createFile(String filename, String content) {

49 FileWriter f = null ;

50 try {

51 f = new FileWriter(filename);

52 if (f == null || content == null ) {

53 return ;

54 }

56 f.write(content);

57 f.flush();

58 f.close();

60 } catch (Exception e) {

62 } finally {

63 if (f!= null ) {

64 try {

65 f.close();

66 } catch (Exception e) {

68 }

69 }

70 }

71 }

73public static void main(String arg[])

74 {

75 AnalizeIMG ana = new AnalizeIMG();

76 try {

77 ana.analizeFile("E:\\1.txt" , "E:\\out.lst");

78 } catch (Exception ex) {

79 ex.printStackTrace();

80 }

81 }

82 }

第二个文件是解析文件

// AnalizeWebParse.java

// 网页分析代码，需要用户根据自己需要做适当修改

5 import java.io.BufferedReader;

6 import java.io.StringReader;

7 import java.util.regex.Pattern;

9 import javax.swing.text.MutableAttributeSet;

10 import javax.swing.text.html.HTML;

11 import javax.swing.text.html.HTMLEditorKit.ParserCallback;

12 import javax.swing.text.html.parser.ParserDelegator;

/**
 * HTML parser callback that collects the absolute {@code src} URLs of
 * {@code <img>} tags, one URL per line.
 *
 * <p>The callback also tracks whether a {@code <div>} whose {@code class}
 * attribute contains {@code "body"} has been opened ({@link #start}) and
 * whether a {@code <div>} has been closed since then ({@link #finished}).
 * These flags do not restrict which images are collected; they are kept so
 * the class can be adapted to a particular page layout.
 */
public class AnalizeWebParse extends ParserCallback {

    /**
     * Accepts absolute http and https URLs. Compiled once rather than on
     * every tag.
     */
    private static final Pattern ABSOLUTE_URL = Pattern.compile("^(https?://.+)");

    /** Collected image URLs, each followed by a newline. */
    StringBuffer sb = new StringBuffer();

    /** Set once a div whose class contains "body" has been opened. */
    boolean start = false;

    /** Set when the first div end tag is seen after {@link #start} was set. */
    boolean finished = false;

    /**
     * Prints a line to standard output.
     *
     * @param s the text to print
     */
    public void p(String s) {
        System.out.println(s);
    }

    /**
     * Sets {@link #start} on the first {@code <div>} whose class attribute
     * contains {@code "body"}; ignored once {@link #start} or
     * {@link #finished} is set.
     */
    public void handleStartTag(HTML.Tag tag, MutableAttributeSet attribs,
            int pos) {
        if (finished || start || tag != HTML.Tag.DIV) {
            return;
        }

        // instanceof guards against both a missing attribute and a
        // non-String attribute value.
        Object cla = attribs.getAttribute(HTML.Attribute.CLASS);
        if (cla instanceof String && ((String) cla).indexOf("body") != -1) {
            start = true;
        }
    }

    /**
     * Sets {@link #finished} on the first {@code </div>} seen after
     * {@link #start} was set.
     */
    public void handleEndTag(HTML.Tag tag, int pos) {
        if (tag == HTML.Tag.DIV && start && !finished) {
            finished = true;
        }
    }

    /** Text content is not used; intentionally empty. */
    public void handleText(char[] text, int pos) {
    }

    /**
     * Records the {@code src} of every {@code <img>} tag whose value is an
     * absolute http or https URL.
     */
    public void handleSimpleTag(HTML.Tag t, MutableAttributeSet a, int pos) {
        if (t != HTML.Tag.IMG) {
            return;
        }

        Object src = a.getAttribute(HTML.Attribute.SRC);
        if (!(src instanceof String)) {
            return;
        }

        String url = (String) src;
        if (ABSOLUTE_URL.matcher(url).matches()) {
            sb.append(url).append("\n");
        }
    }

    /**
     * Parses the HTML supplied by {@code file} and returns the image URLs
     * found in it.
     *
     * <p>State left over from a previous call is discarded first, so one
     * instance can be used for several documents.
     *
     * @param file reader positioned at the start of the HTML document
     * @return the collected URLs, each terminated by {@code "\n"}; an empty
     *         string when none were found; {@code null} when {@code file}
     *         is {@code null}
     * @throws Exception if reading or parsing the document fails
     */
    public String parse(BufferedReader file) throws Exception {
        if (file == null) {
            return null;
        }

        // Reset per-document state so results do not accumulate across calls.
        sb.setLength(0);
        start = false;
        finished = false;

        ParserDelegator pd = new ParserDelegator();
        pd.parse(file, this, true);

        return sb.toString();
    }
}

weixin_40004502

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
0
评论
java提供图片链接,提取网页图片链接的JAVA程序

输入网页文件名，和资源列表文件名输出资源列表文件供迅雷下载。适用于批量下载图片。由两个文件组成。1// AnalizeIMG.java23 // 主程序45 import java.io.BufferedReader;6import java.io.File;7 import java.io.FileReader;8 import java.io.FileWriter;9 import java....
复制链接

扫一扫