# Scrape product images from a JD.com (Jingdong) listing page.
import os
import re

import requests
# Listing page to scrape; the `cat` query parameter selects the category.
url = 'https://list.jd.com/list.html?cat=9987,653,655'
# Directory the downloaded images are written to (created if missing).
image_dir = '../data/jd_image/'
# Seconds to wait for each HTTP request; without a timeout `requests` can
# block forever on an unresponsive server.
timeout = 10

res = requests.get(url, timeout=timeout)
# Fail loudly on an HTTP error instead of silently parsing an error page.
res.raise_for_status()
res.encoding = 'utf-8'

# --- Extract the image addresses ---
# Match the 220x220 product thumbnails and capture the protocol-relative
# address (the part after "//") of the attribute that closes the tag.
# `[^>]*?` and `[^"]+` keep the match inside a single tag and a single
# attribute value; the previous greedy `.*` could run across several
# attributes or tags on the same line and capture garbage.
image_pat = r'<img width="220" height="220" data-img="1" [^>]*?="//([^"]+)">'
imagelist = re.findall(image_pat, res.text)

# --- Save the images locally ---
# Make sure the target directory exists, otherwise open() below raises
# FileNotFoundError on a fresh checkout.
os.makedirs(image_dir, exist_ok=True)

# Files are named 1.jpg, 2.jpg, ... after the image's position in the page.
for x, image_url in enumerate(imagelist, start=1):
    image_url = 'http://' + image_url
    image_name = image_dir + str(x) + '.jpg'
    res2 = requests.get(image_url, timeout=timeout)
    if not res2.ok:
        # Do not write an HTTP error body to disk as if it were a picture;
        # report it and continue with the remaining images.
        print('skipped %s (HTTP %s)' % (image_url, res2.status_code))
        continue
    # Binary mode: the payload is raw image bytes, so use `.content`
    # rather than the decoded `.text`.
    with open(image_name, 'wb') as pic_object:
        pic_object.write(res2.content)