1、目标
①爬取所有章节名称
②爬取所有章节的具体内容
2、目标 URL:https://www.shicimingju.com/book/sanguoyanyi.html
import requests
from bs4 import BeautifulSoup
# BeautifulSoup is a class in the bs4 module; it must be imported before it can be instantiated.
import lxml
# Request headers for the page fetch.
# The header name must be the hyphenated "User-Agent": a "user_agent" key is
# sent as an unrelated custom header, so the server would still see the default
# python-requests agent. The value must be a browser identification string,
# not a URL.
headers = {
    'User-Agent': (
        'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 '
        '(KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36'
    ),
}
# Page the scraper starts from (the shicimingju.com book page for sanguoyanyi).
url = 'https://www.shicimingju.com/book/sanguoyanyi.html'
page_text=requests<