Python 爬取指定图片并将图片下载到指定文件夹

最新推荐文章于 2024-08-29 04:16:38 发布

YiFoEr_Liu

最新推荐文章于 2024-08-29 04:16:38 发布

阅读量5.8k

点赞数 2

分类专栏：个人学习 python 文章标签：爬取图片

本文链接：https://blog.csdn.net/liiukangkang/article/details/83180579

版权

个人学习同时被 2 个专栏收录

28 篇文章 1 订阅

订阅专栏

python

9 篇文章 0 订阅

订阅专栏

"""
Version 1.1.0
Author lkk
Email lkk199404@163.com
date 2018-10-19 11:34
DESC 下载指定网页的图片到指定文件夹
"""
import requests
import os
from urllib import request
import re
# Download every image referenced on the listing page into a local folder.
#
# Steps: fetch the page, keep a raw copy in picture.html, extract
# (alt text, image URL) pairs with a regex, then save each image as
# "<alt text>.jpg" under `root`. A failure on one image is reported and the
# loop moves on to the next one.

# Fetch the listing page; the context manager closes the HTTP response.
with request.urlopen("http://www.27270.com/beautiful/") as res:
    html = res.read()

# Keep a raw copy of the page on disk.
with open("picture.html", 'wb') as f:
    f.write(html)

# Group 1 is the alt text (used as the file name), group 2 is the src URL.
msg = r'alt="(.*?)".*?src="(.*?)"'
# The bytes are decoded as GBK before matching.
result = re.findall(msg, html.decode('gbk'))

# Raw string: the backslashes are literal path separators, not escapes.
root = r"E:\my_test\day10_18\image/"

for i in result:
    url = i[1]
    # Replace characters that are not allowed in Windows file names so that
    # an unusual alt text cannot make open() fail or escape the target folder.
    name = re.sub(r'[\\/:*?"<>|]', "_", i[0])
    path = os.path.join(root, name + '.jpg')
    try:
        # Idempotent and creates missing parents. Kept inside the try so an
        # unusable target directory is reported like any other failure.
        os.makedirs(root, exist_ok=True)
        # The timeout keeps one stalled server from hanging the whole run.
        r = requests.get(url, timeout=30)
        # Raise for 4XX client errors and 5XX server errors instead of
        # saving an error page as an image.
        r.raise_for_status()
        # "wb": the image payload is written as raw bytes.
        with open(path, "wb") as out:
            out.write(r.content)
        print("爬取完成")
    except Exception as err:
        # Deliberately broad: the URLs are scraped from the page, and the
        # script is best-effort per image, so any failure is only reported.
        print("爬取失败:" + str(err))