代码可以运行,能够爬取小说并保存到本地,但还有不足。请教各位大侠:怎样按章节分开保存,
即把每一章单独保存为一个文件?
from bs4 import BeautifulSoup
import requests
import codecs
import re
def getHtml(url):
htm2 = requests.get(url,headers)
soup = BeautifulSoup(htm2.content,'lxml')
books_dir = []
name = soup.find('div',class_='listmain')
#父div,子dl,孙dt(总标题)和dd(每一章)
if name:
dd_items = name.find('dl')
dt_num = 0
for n in dd_items.children:
ename = str(n.name).strip()
if ename == 'dt':
dt_num += 1
if ename != 'dd':
continue
books_info = {}
if dt_num == 2:
durls = n.find_all('a')