# Starting point for a web crawler: fetching a page's source.
#!/usr/bin/env python3
# -*- encoding:utf-8 -*-
# Fetch the page source using only the standard library.
import urllib.request
req = urllib.request.Request('http://www.weather.com.cn/adat/sk/101280101.html')
# Use the response as a context manager so the underlying connection is
# closed deterministically; the timeout (seconds) keeps an unresponsive
# server from hanging the script forever.
with urllib.request.urlopen(req, timeout=10) as r:
    # The body arrives as bytes; decode it to text as UTF-8.
    result = r.read().decode('utf-8')
print(result, type(result))
#############################
# requests is a third-party package that achieves the same result as
# urllib.request above, with a more convenient and concise API.
import requests
# Without an explicit timeout, requests waits indefinitely on a server
# that never answers; 10 seconds bounds the wait.
res = requests.get("http://www.weather.com.cn/adat/sk/101280101.html", timeout=10)
# Force UTF-8 when decoding the response body into text.
res.encoding = 'utf-8'
r = res.text
print(type(r), r)
# Sample output:
#<class 'str'> {"weatherinfo":{"city":"广州","cityid":"101280101","temp":"24","WD":"东南风","WS":"3级","SD":"80%","WSE":"3","time":"10:25","isRadar":"1","Radar":"JC_RADAR_AZ9200_JB","njd":"暂无实况","qy":"1001"}}