import requests
import time
from lxml import etree
import os
# Module-level state shared by the scraper functions via ``global``.

# URLs of the search results.
url_list = []
# Class (category) names.
class_name_list = []
# Author names.
author_name_list = []
# Book titles.
book_name_list = []
# Information about each work.
data_list = []
# NOTE(review): no comment in the original; presumably detailed content
# entries -- confirm against the code that fills it.
content_list_Detail = []
# Book IDs obtained from the search results.
nums_list = []
# IDs taken from the chapter listing.
list_zhang_list = []
# Chapter URLs.
zhangjie_url_content = []
# Chapter IDs.
z_id_list = []

# NOTE(review): purpose not visible in this part of the file; presumably the
# currently selected ID / index -- confirm against its users.
num_id = 0
# NOTE(review): presumably the title of the selected book -- confirm.
nameBook = ""
# Send the search request
def get_info():
    """Prompt for a novel title, search for it and hand the result to the parser.

    Reads the title from standard input, POSTs it to the search endpoint
    and passes the response object to ``get_book_list``.

    Raises:
        requests.exceptions.RequestException: if the request fails or does
            not complete within the timeout.
    """
    url = "http://www.shuquge.com/search.php"
    name = input("请输入小说名字:")
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64)'
                      ' AppleWebKit/537.36 (KHTML, like Gecko) '
                      'Chrome/70.0.3538.25 Safari/537.36 Core/1.70.3722.400'
                      ' QQBrowser/10.5.3751.400',
    }
    form_data = {
        # Fixed 's' value sent with every search; its meaning is not visible
        # in this file -- presumably a site search identifier (TODO confirm).
        's': '6445266503022880974',
        'searchkey': name,
    }
    # requests has no default timeout: without one an unresponsive server
    # would block the script forever. (connect, read) timeouts in seconds.
    r = requests.post(url=url, headers=headers, data=form_data, timeout=(5, 30))
    # Use the encoding detected from the body so the text is not garbled.
    r.encoding = r.apparent_encoding
    get_book_list(r)
# 分析书的列表的方法
def get_book_list(r):
global url_list, class_name_list, author_name_list, book_name_list
tree = etree.HTML(r.text)
a_num = tree.xpath('//div[@class="bookinfo"]/h4/a/@href')
# print(a_num)
class_name = tree.xpath('//div[@class="bookinfo"]/div[@class="cat"]/text()')
# print(class_name)
author_name = tree.xpath('//div[@class="bookinfo"]/div[@class="author"]/text()')
book_name = tree.xpath('//div[@class="bookinfo"]/h4/a/text()')
# print(book_name)
num = len(a_num)
if num ==
python获取网络小说的代码,复制粘贴即可用
最新推荐文章于 2023-05-21 21:01:00 发布