"""Download every post image from one Baidu Tieba thread, page by page.

Each thread page gets its own randomly numbered sub-directory under
``SAVE_ROOT``; every ``img.BDE_Image`` element found on the page is saved
there as a ``.jpg`` file.
"""
import os
import random
import re

import requests
from bs4 import BeautifulSoup

url = 'https://tieba.baidu.com/p/4814458788?pn='
headers = {'User-Agent': "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/22.0.1207.1 Safari/537.1"}

# Raw string: "\p" is not a valid escape sequence, so the non-raw spelling
# only worked by accident and triggers a warning on newer Python versions.
SAVE_ROOT = r"D:\patuw"
FIRST_PAGE = 1
LAST_PAGE = 52
# Seconds. Without a timeout a single stalled connection hangs the whole run.
REQUEST_TIMEOUT = 10
# Upper bound on random directory names tried before giving up.
MAX_DIR_ATTEMPTS = 100


def _fetch(target):
    """Return the response for a GET of ``target``, or ``None`` on failure.

    Failures (network errors, timeouts, non-2xx/3xx status codes) are
    reported on stdout and signalled with ``None`` so that one bad page or
    image does not abort the whole download.
    """
    try:
        response = requests.get(target, headers=headers, timeout=REQUEST_TIMEOUT)
    except requests.RequestException as err:
        print("skip {}: {}".format(target, err))
        return None
    if not response.ok:
        # Do not save an HTML error page under an image file name.
        print("skip {}: HTTP {}".format(target, response.status_code))
        return None
    return response


def _make_page_dir(root):
    """Create and return a new randomly numbered sub-directory of ``root``.

    Raises:
        FileExistsError: if no unused name was found within
            ``MAX_DIR_ATTEMPTS`` tries.
    """
    for _ in range(MAX_DIR_ATTEMPTS):
        candidate = os.path.join(root, str(random.randint(1, 10000)))
        try:
            os.makedirs(candidate)
        except FileExistsError:
            # The random number was already used by an earlier page or run.
            continue
        return candidate
    raise FileExistsError(
        "no free directory name found under {}".format(root))


def _image_filename(img_url, index):
    """Build a ``.jpg`` file name from the image's position and URL.

    The 1-based ``index`` prefix guarantees a distinct name for every image
    on a page; the sanitised last URL path segment is appended for
    readability when one is available.
    """
    last_segment = img_url.split('?', 1)[0].rsplit('/', 1)[-1]
    stem = os.path.splitext(last_segment)[0]
    # The URL is remote input: keep only characters safe in a file name.
    stem = re.sub(r'[^A-Za-z0-9_-]', '_', stem)
    name = '{:03d}'.format(index)
    if stem:
        name += '_' + stem
    return name + '.jpg'


def main():
    """Fetch each thread page and save its images into a fresh directory."""
    for page in range(FIRST_PAGE, LAST_PAGE + 1):
        page_response = _fetch(url + str(page))
        if page_response is None:
            continue

        soup = BeautifulSoup(page_response.text, 'lxml')
        images = soup.select('img.BDE_Image')
        page_dir = _make_page_dir(SAVE_ROOT)

        for index, img in enumerate(images, start=1):
            img_url = img.get('src')
            if not img_url:
                # <img> without a src attribute: nothing to download.
                continue
            img_response = _fetch(img_url)
            if img_response is None:
                continue
            target = os.path.join(page_dir, _image_filename(img_url, index))
            # 'wb', not 'ab': appending to an existing file would glue two
            # images together and corrupt both.
            with open(target, 'wb') as out:
                out.write(img_response.content)


if __name__ == "__main__":
    main()
太菜了，写了好久，代码也很烂，我是新手。