# Scrape historical weather data
import requests
from requests.exceptions import RequestException
from bs4 import BeautifulSoup
import os
import csv
import time
def get_one_page(url, timeout=10):
    """Fetch a web page and return its raw body.

    Args:
        url: Address of the page to download.
        timeout: Seconds to wait for the server before giving up; passed
            straight through to ``requests.get``.

    Returns:
        The response body as ``bytes`` when the server answers with HTTP
        200. ``None`` for any other status code, or when the request fails
        with a ``RequestException`` (connection error, timeout, ...).
    """
    print('正在加载' + url)
    # Send only the agent string as the value; the header name belongs in
    # the dictionary key, not inside the value.
    headers = {'User-Agent': 'Mozilla/5.0'}
    try:
        # requests never times out unless told to, so a stalled server
        # would otherwise hang the whole scrape.
        response = requests.get(url, headers=headers, timeout=timeout)
    except RequestException:
        return None
    if response.status_code == 200:
        return response.content
    return None
def parse_one_page(html):
'''
对网页内容进行解析
'''
soup = BeautifulSoup(html, "lxml")
info = soup.find('div', class_='wdetail')
rows=[]
tr_list = info.find_all('tr')[1:] # 使用从第二个tr开始取
for index, tr in enumerate(tr_list): # enumerate可以返回元素的位置及内容
td_list = tr.find_all(