from urllib import request,parse
# Script: prompt for a keyword, issue a Baidu search request for it, and
# print the HTTP status code of the response.

# Base address of the site; the search endpoint is the "/s" path under it.
BASE_URL = "http://www.baidu.com"

# Browser-like User-Agent header sent along with the request.
headers = {
    'User-Agent': (
        "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 "
        "(KHTML, like Gecko) Chrome/85.0.4183.83 Safari/537.36 Edg/85.0.564.41"
    ),
}

# Ask the user for the search keyword.
kw = input('请输入要查找的内容')
params = {
    'ie': 'utf-8',
    'wd': kw,
}

# Percent-encode the dict into a URL query string, e.g.
# "ie=utf-8&wd=<percent-encoded keyword>".
query_string = parse.urlencode(params)
url = BASE_URL + "/s?" + query_string

# Build the request object carrying the custom headers.
req = request.Request(url=url, headers=headers)

# Send the request. The context manager guarantees the connection is closed
# even if printing fails; the timeout keeps the script from hanging forever
# on a stalled connection.
with request.urlopen(req, timeout=10) as response:
    # response.read().decode('utf-8') would return the page source here.
    print(response.status)  # HTTP status code
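# 爬虫模拟百度搜索 (Crawler that simulates a Baidu search)
# 最新推荐文章于 2024-04-23 18:06:15 发布 (Latest recommended article published 2024-04-23 18:06:15)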