import os.path
import re
import time
from urllib.parse import urljoin, urlsplit

import requests
# Browser-like User-Agent sent with every request made by this script.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/79.0.3945.88 Safari/537.36'
}

# Gallery page whose linked images are downloaded.
PAGE_URL = 'https://www.vmgirls.com/12985.html'
# Seconds to wait for the server before a request is abandoned.
REQUEST_TIMEOUT = 10
# Seconds to pause before each image request.
DOWNLOAD_DELAY = 1
# Directory name used when the page has no usable <h1> title.
DEFAULT_DIR_NAME = 'images'

_IMAGE_LINK_RE = re.compile(r'<a href="(.*?)" alt=".*?" title=".*?">')
_TITLE_RE = re.compile(r'<h1 class=".*?">(.*?)</h1>')
# Characters that are path separators or are rejected in Windows file names.
_UNSAFE_NAME_CHARS_RE = re.compile(r'[\\/:*?"<>|]')


def extract_image_urls(html):
    """Return the href of every ``<a href alt title>`` tag in *html*, in order."""
    return _IMAGE_LINK_RE.findall(html)


def extract_dir_name(html, default=DEFAULT_DIR_NAME):
    """Return a directory name derived from the last ``<h1 class=...>`` in *html*.

    Unsafe file-name characters are replaced with ``_`` and surrounding
    spaces/dots are stripped, so the title cannot introduce extra path
    components. *default* is returned when no title is found or nothing
    usable remains after cleaning.
    """
    titles = _TITLE_RE.findall(html)
    if not titles:
        return default
    cleaned = _UNSAFE_NAME_CHARS_RE.sub('_', titles[-1]).strip(' .')
    return cleaned or default


def image_filename(url):
    """Return the last path segment of *url*, without query string or fragment.

    Returns an empty string when the URL path ends in ``/``.
    """
    return os.path.basename(urlsplit(url).path)


def download_images(urls, dir_name, base_url=PAGE_URL):
    """Download each URL in *urls* into the directory *dir_name*.

    The directory is created if it does not exist. Relative URLs are
    resolved against *base_url*. A URL with no file name, or whose request
    fails, is reported and skipped so one bad link does not abort the run.
    """
    os.makedirs(dir_name, exist_ok=True)
    for url in urls:
        file_name = image_filename(url)
        if not file_name:
            print('skipped (no file name in URL):', url)
            continue
        time.sleep(DOWNLOAD_DELAY)
        try:
            response = requests.get(
                urljoin(base_url, url), headers=headers, timeout=REQUEST_TIMEOUT
            )
            # Do not save an HTTP error page as if it were an image.
            response.raise_for_status()
        except requests.RequestException as exc:
            print('skipped (request failed):', url, exc)
            continue
        with open(os.path.join(dir_name, file_name), 'wb') as f:
            f.write(response.content)


def main():
    """Fetch PAGE_URL, print the image URLs found on it and save the images."""
    response = requests.get(PAGE_URL, headers=headers, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    html = response.text
    urls = extract_image_urls(html)
    dir_name = extract_dir_name(html)
    print(urls)
    download_images(urls, dir_name)


if __name__ == '__main__':
    main()
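# python爬取网页图片 (Crawling web page images with Python)
# 最新推荐文章于 2024-05-13 13:56:11 发布 (Latest recommended article published on 2024-05-13 13:56:11)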