使用 Python 爬取斗图图片(示例页面:糗事百科 qiushibaike.com 的 imgrank 页面),并保存到本地的 doutu 目录。
以下是代码部分:
# -*- coding: utf-8 -*-
"""
Created on Wed Apr 14 14:41:42 2021
@author: www99
"""
import os
import requests as req
from pyquery import PyQuery
from urllib import request
# Download every thumbnail image found on the listing page into ./doutu.
#
# Flow: make sure the target directory exists, fetch the listing page,
# select the <img> elements under ".thumb", then download each image and
# store it under its URL's last path segment.

save_dir = './doutu'
# exist_ok avoids both the check-then-create race and the original bug of
# testing the absolute path "/doutu" while creating the relative "./doutu".
os.makedirs(save_dir, exist_ok=True)

headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/89.0.4389.114 Safari/537.36'}
url = 'https://www.qiushibaike.com/imgrank/'
# Without a timeout a stalled connection would block the script forever.
request_timeout = 10

resp = req.get(url, headers=headers, timeout=request_timeout)
# Fail loudly on an HTTP error instead of parsing an error page.
resp.raise_for_status()
page = resp.text
pq = PyQuery(page)
imgs = pq('.thumb img')
print(imgs)
print("=============================")

for img in imgs.items():
    link_base = img.attr['src']
    print(link_base)
    if not link_base:
        # An <img> without a src attribute has nothing to download.
        continue

    # Only protocol-relative links ("//host/path") need a scheme prepended;
    # anything else is used as given.
    if link_base.startswith('//'):
        img_url = 'https:' + link_base
    else:
        img_url = link_base

    # File name is the last path segment, minus any query string (a "?" is
    # not a legal file-name character on Windows).
    img_name = img_url.split('/')[-1].split('?')[0]
    print(img_name)
    if not img_name:
        continue
    img_path = os.path.join(save_dir, img_name)

    try:
        img_resp = req.get(img_url, headers=headers, timeout=request_timeout)
        img_resp.raise_for_status()
    except req.RequestException as exc:
        # One broken image should not abort the remaining downloads.
        print("失败:", img_url, exc)
        continue

    with open(img_path, 'wb') as f:
        f.write(img_resp.content)
    print("成功")