import xlrd,os,re,time
from xlrd import xldate_as_tuple
import requests
from urllib import request
from io import BytesIO
from PIL import Image
# Open the workbook (path is relative to the current working directory) and
# take its first worksheet.
# NOTE(review): xlrd 2.0+ reads only legacy .xls files, so this call presumably
# relies on an older xlrd release -- confirm the pinned version.
data = xlrd.open_workbook(r'.\郑州洪水暴雨.xlsx')
table = data.sheets()[0]

# Build one dict per worksheet row (every row, including the first one):
# column 0 is stored under '序号' and column 2 under '图片url'.
tables = [
    {
        '序号': table.cell_value(row_idx, 0),
        '图片url': table.cell_value(row_idx, 2),
    }
    for row_idx in range(table.nrows)
]
# Download every image referenced by the spreadsheet rows into one folder per
# row: <OUTPUT_ROOT>/<序号>/<image file name>.
OUTPUT_ROOT = r'E:\a'
REQUEST_TIMEOUT = 30  # seconds; without a timeout requests.get() can block forever
DOWNLOAD_DELAY = 1  # seconds between requests, to avoid overloading the image host


def _split_image_urls(cell):
    """Return the non-empty URLs contained in a ';'-separated cell value.

    Empty fragments are dropped, so the cell may or may not end with a
    trailing ';' -- no real URL is lost either way.
    """
    return [url.strip() for url in cell.split(';') if url.strip()]


def _image_filename(img_url):
    """Return the local file name to use for *img_url*.

    The name is the last path segment of the URL with any query string or
    fragment removed, e.g.
    'https://wx4.sinaimg.cn/orj360/006iqas9ly1gu9fgwf4uqj60u014g7i102.jpg'
    gives '006iqas9ly1gu9fgwf4uqj60u014g7i102.jpg'. Taking the last segment
    (instead of a fixed character offset) keeps working when the host or the
    size segment of the URL has a different length. '.jpg' is appended only
    when the segment carries no extension of its own.
    """
    path_part = img_url.split('?', 1)[0].split('#', 1)[0]
    name = path_part.rstrip('/').rsplit('/', 1)[-1]
    if not os.path.splitext(name)[1]:
        name += '.jpg'
    return name


# tables[0] is skipped (presumably the header row of the sheet).
for row in tables[1:]:
    try:
        # Excel returns numeric cells as floats, hence the int() round-trip.
        dirname = str(int(row['序号']))
    except (TypeError, ValueError):
        print('skipping row with non-numeric 序号: %r' % (row['序号'],))
        continue
    print(dirname)

    target_dir = os.path.join(OUTPUT_ROOT, dirname)
    print(target_dir)
    # exist_ok lets the script be re-run without failing on existing folders;
    # all paths are absolute, so the working directory is left untouched.
    os.makedirs(target_dir, exist_ok=True)

    for img_url in _split_image_urls(row['图片url']):
        time.sleep(DOWNLOAD_DELAY)
        try:
            response = requests.get(img_url, timeout=REQUEST_TIMEOUT)
            # Do not save an HTTP error page under an image file name.
            response.raise_for_status()
        except requests.RequestException as exc:
            # One broken link must not abort the remaining downloads.
            print('download failed: %s (%s)' % (img_url, exc))
            continue
        with open(os.path.join(target_dir, _image_filename(img_url)), 'wb') as f:
            f.write(response.content)