以下是来自学习网站的参考代码(所爬取的网站现已无法访问):
import requests
from bs4 import BeautifulSoup
def get_city_aqi(city_pinyin):
"""
获取城市的AQI
"""
url = 'http://pm25.in/' + city_pinyin
r = requests.get(url, timeout=30)
soup = BeautifulSoup(r.text, 'lxml')
div_list = soup.find_all('div', {
'class': 'span1'})
city_aqi = []
for i in range(8):
div_content = div_list[i]
caption = div_content.find('div', {
'class': 'caption'}).text.strip()
value = div_content.find('div', {
'class':