# pandas.read_html 读取表格 (reading HTML tables with pandas.read_html)
import io

import pandas
import requests
from my_fake_useragent import UserAgent
# History endpoint requested by extract_data(); its JSON response carries an
# HTML fragment under the "data" key.
url = "http://tianqi.2345.com/Pc/GetHistory"
def extract_data(year, month):
    """Fetch one month of history from ``url`` and return it as a DataFrame.

    Sends a GET request carrying the fixed area parameters plus the requested
    year and month, then parses the HTML fragment found under the ``"data"``
    key of the JSON response.

    Args:
        year: Year to request; sent as the ``date[year]`` query parameter.
        month: Month to request; sent as the ``date[month]`` query parameter.

    Returns:
        The first table that ``pandas.read_html`` finds in the returned HTML.

    Raises:
        requests.HTTPError: If the server answers with a 4xx/5xx status.
        requests.Timeout: If the server does not respond within the timeout.
    """
    # NOTE(review): areaId 71833 / areaType 2 presumably select the city whose
    # data is wanted -- confirm against the site before changing them.
    params = {
        "areaInfo[areaId]": 71833,
        "areaInfo[areaType]": 2,
        "date[year]": year,
        "date[month]": month,
    }
    # A fresh random User-Agent is generated for every request.
    headers = {"User-Agent": UserAgent().random()}
    # Without a timeout, requests waits indefinitely on a stalled connection.
    resp = requests.get(url, headers=headers, params=params, timeout=30)
    print(resp)
    # Fail here on an HTTP error rather than on a confusing JSON/KeyError below.
    resp.raise_for_status()
    data = resp.json()["data"]
    # Passing literal HTML straight to read_html is deprecated (pandas >= 2.1)
    # and a bare string may be interpreted as a path/URL; wrap it in a
    # file-like object instead.
    df = pandas.read_html(io.StringIO(data))[0]
    print("extracting data:", year, month)
    return df
# Download every month from January 2018 through December 2020 in
# chronological order, then merge the monthly tables into a single workbook.
weather_list = [
    extract_data(year, month)
    for year in range(2018, 2021)
    for month in range(1, 13)
]
merged = pandas.concat(weather_list)
merged.to_excel("weatherOfWuHan.xlsx", index=False)