import os
import re
from urllib.parse import quote, urlsplit

import requests
# 1. Configuration
MAX_IMAGES = 10  # stop once this many images have been saved
REQUEST_TIMEOUT = 10  # seconds; keeps a stalled server from hanging the run
DEFAULT_EXTENSION = "jpg"  # used when the image URL carries no usable suffix
SEARCH_URL = r'http://image.baidu.com/search/flip?tn=baiduimage&ipn=r&ct=201326592&cl=2&lm=-1&st=-1&fm=result&fr=&sf=1&fmq=1497491098685_R&pv=&ic=0&nc=1&z=&se=1&showtab=0&fb=0&width=&height=&face=0&istype=2&ie=utf-8&ctd=1497491098685%5E00_1519X735&word='
# The pattern does not require a space after the comma, so an "objURL" entry
# matches whether the next JSON key follows immediately or after whitespace.
OBJ_URL_RE = re.compile(r'"objURL":"(.*?)",')
# Characters that are path separators or are rejected in file names on
# common platforms; they are replaced before the keyword is used as a name.
UNSAFE_NAME_CHARS_RE = re.compile(r'[\\/:*?"<>|]')
# A plausible file extension: short and purely alphanumeric.
EXTENSION_RE = re.compile(r'[A-Za-z0-9]{1,5}')


def build_search_url(keyword):
    """Return the image-search URL for *keyword*.

    The keyword is percent-encoded so that characters such as ``&``, ``#``
    or spaces cannot break the query string.
    """
    return SEARCH_URL + quote(keyword, safe="")


def extract_image_urls(page_text):
    """Return every ``objURL`` value found in *page_text*, in page order."""
    return OBJ_URL_RE.findall(page_text)


def guess_extension(image_url, default=DEFAULT_EXTENSION):
    """Return the file extension (without the dot) for *image_url*.

    Only the path component of the URL is inspected, so query strings and
    host names never leak into the result. *default* is returned when the
    URL cannot be parsed or its path has no short alphanumeric suffix.
    """
    try:
        url_path = urlsplit(image_url).path
    except ValueError:
        # urlsplit rejects some malformed URLs (e.g. bad IPv6 brackets).
        return default
    suffix = os.path.splitext(url_path)[1].lstrip(".")
    return suffix if EXTENSION_RE.fullmatch(suffix) else default


def safe_name(keyword):
    """Return *keyword* made usable as a single directory/file name.

    Path separators and other unsafe characters become ``_``; surrounding
    spaces and dots are stripped so names like ``..`` collapse to ``""``.
    """
    return UNSAFE_NAME_CHARS_RE.sub("_", keyword).strip(" .")


def download_images(keyword, limit=MAX_IMAGES):
    """Download up to *limit* search results for *keyword*.

    Images are written to a directory named after the (sanitised) keyword
    as ``<name>_<n>.<ext>``. A failed image download is reported and
    skipped instead of aborting the run.

    Returns the number of images saved.
    Raises ``requests.RequestException`` if the search page itself cannot
    be fetched.
    """
    folder = safe_name(keyword)
    if not folder:
        print("关键词不能为空")
        return 0
    # exist_ok avoids the check-then-create race of exists() + mkdir().
    os.makedirs(folder, exist_ok=True)

    # 2. Fetch the search result page
    response = requests.get(build_search_url(keyword), timeout=REQUEST_TIMEOUT)
    response.raise_for_status()

    # 2.1 Extract every image link with a regular expression
    image_urls = extract_image_urls(response.text)
    print(image_urls)

    saved = 0
    for image_url in image_urls:
        if saved >= limit:
            break
        index = saved + 1
        print("正在下载第%d张图片" % index)
        try:
            image = requests.get(image_url, timeout=REQUEST_TIMEOUT)
            image.raise_for_status()
        except requests.RequestException as err:
            # One dead link must not abort the remaining downloads.
            print("第%d张图片下载失败,已跳过: %s" % (index, err))
            continue
        file_name = "%s_%d.%s" % (folder, index, guess_extension(image_url))
        # 'wb': image payloads are binary; `with` closes the file on error too.
        with open(os.path.join(folder, file_name), "wb") as image_file:
            image_file.write(image.content)
        saved = index

    if saved:
        print("已经全部下载完成")
    else:
        print("没有下载到任何图片")
    return saved


def main():
    """Ask the user for a keyword and download matching images."""
    keyword = input("你想下载什么图片")
    download_images(keyword)


if __name__ == "__main__":
    main()
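# Alex - 用爬虫学习下载图片 (Alex - learning to download images with a web crawler)
# 最新推荐文章于 2023-06-21 13:17:18 发布 (blog footer: latest recommended article published 2023-06-21 13:17:18)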