利用 Python + requests + bs4 爬取 7 天的天气预报信息
为了熟练掌握静态页面信息的爬取，下面列出几种实现方法，希望大神指点。
import requests
import re
from bs4 import BeautifulSoup
# Page to scrape (the accompanying article describes it as a 7-day forecast).
url = 'http://www.weather.com.cn/weather/101221001.shtml'
# Send a browser-like User-Agent header with the request.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64; rv:62.0) Gecko/20100101 Firefox/62.0',
}
# Always pass a timeout: without one, requests waits indefinitely if the
# server stops responding and the script hangs.
html = requests.get(url, headers=headers, timeout=10)
# Decode the body as UTF-8 explicitly instead of relying on the encoding
# requests guesses from the response headers.
html.encoding = 'utf-8'
htmlText = html.text
# Parse the decoded text once with the stdlib-backed parser.
soup = BeautifulSoup(htmlText, 'html.parser')
# Result accumulators; presumably filled by the loop that follows.
date = []
weather = []
templerature = []  # (sic) spelling kept: later code may reference this name
# All <li> elements whose CSS classes include "sky"
# (presumably one per forecast day -- confirm against the page markup).
lis = soup.find_all('li', class_='sky')
for li in lis:
h1_dates = li.find_all('h1')
p_weas = li