"""Simple web-page collector: save the Sogou result page for a keyword.

The script prompts for a search keyword, requests the Sogou web-search
page for it, and writes the returned HTML to ``<keyword>.html`` in the
current working directory.
"""
import requests

# UA spoofing: send a browser User-Agent to get past anti-crawling checks.
HEADERS = {'user-agent':'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.9 Safari/537.36'}
SEARCH_URL = 'https://www.sogou.com/web'

# Seconds to wait for the server; without a timeout requests can block forever.
REQUEST_TIMEOUT = 10

# Characters that are path separators or are rejected in file names on
# common platforms; they are replaced before the keyword becomes a file name.
_INVALID_FILE_NAME_CHARS = '\\/:*?"<>|'


def _safe_file_name(keyword):
    """Return *keyword* with separators and control characters replaced by '_'."""
    return ''.join(
        '_' if ch in _INVALID_FILE_NAME_CHARS or ch < ' ' else ch
        for ch in keyword
    )


def main():
    """Prompt for a keyword, download its Sogou result page, and save it.

    Raises:
        requests.RequestException: if the request fails, times out, or the
            server answers with an HTTP error status.
        OSError: if the output file cannot be written.
    """
    kw = input('输入词:')

    # The URL parameters are passed as a dict; requests encodes them into
    # the query string when it sends the request.
    param = {'query': kw}
    resp = requests.get(
        url=SEARCH_URL,
        params=param,
        headers=HEADERS,
        timeout=REQUEST_TIMEOUT,
    )
    # Fail loudly instead of saving an error page as if it were a result.
    resp.raise_for_status()

    page_text = resp.text

    # Persist the page next to the script, named after the (sanitized) keyword.
    file_name = _safe_file_name(kw) + '.html'
    with open(file_name, 'w', encoding='utf-8') as fp:
        fp.write(page_text)
    print(file_name,'保存成功!!!!')


if __name__ == '__main__':
    main()
02request_(简易网站采集器)实战
最新推荐文章于 2024-09-05 15:44:26 发布