# Python 爬虫(一):爬取网页小说 + AI 智能读取文本
# (Python crawler, part 1: scrape a web novel chapter and read the text aloud)
import requests
import re
# Scrape one novel chapter, save its text to demo.txt, then read it aloud.

# Chapter page to download.
url = 'https://www.ibswtan.com/70/70672/19808959.html'

# A timeout keeps the script from hanging forever on an unresponsive server,
# and raise_for_status() stops early instead of saving an HTTP error page.
res = requests.get(url, timeout=10)
res.raise_for_status()
# Decode the response body as UTF-8 when res.text is accessed below.
res.encoding = 'utf-8'

# Capture the inner HTML of the content <div>. re.S lets '.' match newlines,
# so the chapter is still found when the markup spans several lines.
contents = re.findall(r'<div id="content">(.*?)</div>', res.text, re.S)
print(contents)

# Use an explicit encoding for both the write and the read below: the
# platform default is locale-dependent and may be unable to encode the
# scraped Chinese text.
with open('demo.txt', 'w', encoding='utf-8') as f:
    for content in contents:
        # Drop spaces and the paired <br/> tags so only the prose remains.
        # NOTE(review): the page may encode its indentation as &nbsp; entities
        # or U+00A0 rather than plain spaces, so those are stripped as well --
        # confirm against the live markup.
        f.write(
            content.replace(' ', '')
            .replace('\xa0', '')
            .replace('&nbsp;', '')
            .replace('<br/><br/>', '')
        )

import pyttsx3

# Despite its name, `line` holds the entire saved chapter, not a single line.
with open('demo.txt', 'r', encoding='utf-8') as f:
    line = f.read()

# Queue the whole text and block until the speech engine has finished.
engine = pyttsx3.init()
engine.say(line)
engine.runAndWait()