import parsel
# Sample HTML fragment used as the XPath practice input: a <div> wrapping a
# <ul> of five <li class="item-N"> entries, each holding a single <a> link.
# The list is closed with a proper </ul>; it was previously mistyped as
# "</u1>" (digit one), which is not a valid end tag.
# NOTE(review): the href values end in ".htm1" (digit one), which looks like a
# typo for ".html" -- left untouched because queries outside this excerpt may
# match on the exact value; confirm before changing.
html_str = '''
<div>
<ul>
<li class = "item-1">
<a href = "link1.htm1">第一个</a>
</li>
<li class = "item-2">
<a href = "link2.htm1">第二个</a>
</li>
<li class = "item-3">
<a href = "link3.htm1">第三个</a>
</li>
<li class = "item-4">
<a href = "link4.htm1">第四个</a>
</li>
<li class = "item-5">
<a href = "link5.htm1">第五个</a>
</li>
</ul>
</div>
'''
# Step 1: convert the data type -- wrap the raw HTML string in a parsel
# Selector. (Author's note: the Selector can fill in missing tags.)
data = parsel.Selector(text=html_str)
# Step 2: parse the data.
# Starting from the root node, get all <a ... (original comment is cut off here)
# python中的xpath语法
# 最新推荐文章于 2024-06-24 19:59:02 发布