import requests
import os  # folder (directory) operations module, standard library
from lxml import etree
for page in range(1,48+1):
if page == 1:
url = 'https://www.jdlingyu.com/collection/acg'
else:
url = 'https://www.jdlingyu.com/collection/acg/page/' + str(page)
page += 1
page_index = page - 1
html_str = requests.get(url).text
xpath_str = etree.HTML(html_str)
name_list =xpath_str.xpath('//h2/a/text()')
href_list =xpath_str.xpath('//h2/a/@href')
index_num = 0
for name,href in zip(name_list,href_list):
# print(img_url)
res = requests.get(href).text
html = etree.HTML(res)
img_url_list =html.xpath(