from lxml import etree
# Placeholder input: replace this string with the HTML text of the page to parse.
html = "需要解析的网页"
# Parse the text with lxml's HTML parser; `html` is rebound from the raw
# string to the value returned by etree.HTML().
html = etree.HTML(html)
# Select the value of every href attribute on any element in the document.
url_list = html.xpath("//*/@href")
# Print each extracted href value on its own line.
for url in url_list:
    print(url)
使用 XPath 提取网页中所有的 href 属性
最新推荐文章于 2021-06-07 18:01:00 发布
from lxml import etree
# Placeholder input: replace this string with the HTML text of the page to parse.
html = "需要解析的网页"
# Parse the text with lxml's HTML parser; `html` is rebound from the raw
# string to the value returned by etree.HTML().
html = etree.HTML(html)
# Select the value of every href attribute on any element in the document.
url_list = html.xpath("//*/@href")
# Print each extracted href value on its own line.
for url in url_list:
    print(url)