Java爬虫实例
直接上代码
/**
 * Downloads every lazy-loaded image ({@code img.lazy}) found on the configured page
 * into a local directory.
 *
 * <p>For each matching element the image address is read from the
 * {@code data-original} attribute and the base file name from the {@code alt}
 * attribute. A timestamp is appended to the file name so that images sharing the
 * same {@code alt} text do not overwrite each other.
 *
 * @param args unused
 * @throws IOException if the page cannot be fetched, the target directory cannot be
 *                     created, or an image cannot be downloaded or written
 */
public static void main(String[] args) throws IOException {
    String url = "需要下载图片的地址,具体看源码";
    String filePath = "C:\\Users\\Administrator\\Desktop\\temp\\";
    // Formatter is immutable and loop-invariant, so build it once.
    DateTimeFormatter timestampFormat = DateTimeFormatter.ofPattern("yyyy-MM-dd-HH-mm-ss-SSS");

    Document document = Jsoup.connect(url).get();
    Elements elements = document.select("img.lazy");

    // FileOutputStream does not create missing parent directories.
    File targetDir = new File(filePath);
    if (!targetDir.isDirectory() && !targetDir.mkdirs()) {
        throw new IOException("Cannot create download directory: " + filePath);
    }

    int downloaded = 0;
    for (org.jsoup.nodes.Element element : elements) {
        String imgUrl = element.attr("data-original");
        if (imgUrl.isEmpty()) {
            // No lazy-load source on this element; nothing to download.
            continue;
        }
        if (imgUrl.startsWith("//")) {
            // Protocol-relative address: supply the scheme ourselves.
            imgUrl = "http:" + imgUrl;
        } else {
            // Already absolute, or relative to the page: let jsoup resolve it.
            imgUrl = element.absUrl("data-original");
            if (imgUrl.isEmpty()) {
                continue;
            }
        }

        // The alt text is page-controlled; strip characters that are illegal in
        // Windows file names or that could act as path separators.
        String pictureName = element.attr("alt").replaceAll("[\\\\/:*?\"<>|]", "_");
        String fileName = pictureName + LocalDateTime.now().format(timestampFormat) + ".jpg";

        URLConnection urlConnection = new URL(imgUrl).openConnection();
        // try-with-resources closes both streams even if the copy fails midway.
        try (InputStream inputStream = urlConnection.getInputStream();
             OutputStream outputStream = new FileOutputStream(new File(targetDir, fileName))) {
            byte[] buffer = new byte[8192];
            int count;
            while ((count = inputStream.read(buffer)) != -1) {
                outputStream.write(buffer, 0, count);
            }
        }
        downloaded++;
        System.out.println(fileName + " 下载完成。");
    }
    // Report the number of files actually written, not the number of matched tags.
    System.out.println(downloaded + "张图下载完成。");
}
源码地址
Java爬虫