import requests
from bs4 import BeautifulSoup
# 页面源代码中有链接,找到这些链接
def save_book(chapters, name):
    """Write every chapter to the file ``a/<name>``, one piece per line.

    Each chapter string is split on single spaces. A piece that starts with
    ``<div`` is replaced by an empty string (dropping the leading
    ``<div ...></div>`` of a chapter), every ``<p></p>`` occurrence is removed
    from the piece, and the result is written followed by a newline. After
    all chapters are written, ``name + '搞定'`` is printed.

    Args:
        chapters: Iterable of chapter strings (each must support ``str.split``).
        name: File name to create inside the ``a/`` directory. The directory
            itself is not created here.
    """
    # The context manager guarantees the file is flushed and closed even when
    # a write raises; previously the handle was opened and never closed.
    with open(f'a/{name}', 'w+', encoding='utf-8') as file:
        for chapter in chapters:
            # NOTE(review): the original indentation was lost; the newline is
            # assumed to follow every piece, as the original comment
            # ("newline after each sentence") suggests - confirm.
            # NOTE(review): the original comment mentions splitting on several
            # whitespace characters; the separator may have been a longer run
            # of spaces before whitespace was collapsed - confirm.
            for piece in chapter.split(' '):
                if piece.startswith('<div'):
                    # Drop the redundant <div ...></div> at the chapter start.
                    piece = ""
                # Drop the redundant <p></p> at the chapter end.
                piece = piece.replace("<p></p>", "")
                file.write(piece)
                file.write('\n')  # one piece per line keeps the text readable
    print(name + '搞定')
def downliad(url, name):
tk = []
resp = requests.get(url)
newr = resp.text.replace('<br />', '')
page = BeautifulSoup(newr, 'html.parser')
content = page.find('div', attrs={'id&
python异步爬取乐文小说
最新推荐文章于 2024-07-12 19:06:42 发布