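"""A simple web-crawler example.

Four steps:
1. Specify the URL.
2. Send the request.
3. Get the response data.
4. Store the data persistently.
"""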
import requests
# Step 1: specify the target URL.
url = 'https://www.sogou.com/'

# Step 2: send the GET request; `response` is the object returned by
# requests.get. The timeout keeps the script from hanging forever when the
# server never answers.
response = requests.get(url=url, timeout=10)
# Fail loudly on a 4xx/5xx status instead of saving an error page as if it
# were the real result (raises requests.HTTPError).
response.raise_for_status()

# Step 3: read the response body as text.
page_text = response.text
print(page_text)

# Step 4: persist the page to disk; the write must happen inside the `with`
# body so the file is still open and is closed right afterwards.
with open('./sogou.html', 'w', encoding='utf-8') as fp:
    fp.write(page_text)
print("爬取数据结束!!!!")