"""Fetch the Baidu home page and print the label of its search button.

The script downloads ``http://www.baidu.com/``, parses the HTML with lxml,
and prints the ``value`` attribute of the ``<input id="su">`` element.
"""
import urllib.request

from lxml import etree

url = 'http://www.baidu.com/'

# Send a browser-like User-Agent instead of urllib's default one
# (presumably so the site serves its regular page -- confirm if it matters).
headers = {
    'User-Agent': (
        'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/113.0.0.0 Safari/537.36 Edg/113.0.1774.42'
    )
}

request = urllib.request.Request(url=url, headers=headers)

# Use the response as a context manager so the underlying connection is
# closed even if reading or decoding fails.
with urllib.request.urlopen(request) as response:
    content = response.read().decode('utf-8')

# Parse the document returned by the server.
tree = etree.HTML(content)

# XPath: the ``value`` attribute of every <input> whose id is "su".
matches = tree.xpath('//input[@id="su"]/@value')
if not matches:
    # Same exception type as indexing an empty list, but with a message
    # that says what was actually missing from the page.
    raise IndexError(
        'no <input id="su"> element with a value attribute was found '
        'in the response from ' + url
    )

result = matches[0]
print(result)
打印结果为:“百度一下”。