# First attempt at scraping data from a weather website, using previously learned techniques.
import requests
from bs4 import BeautifulSoup
import bs4
def getHTMLText(url, timeout=30):
    """Fetch *url* and return the response body as text.

    This is a best-effort helper: request-level failures (connection
    errors, timeouts, malformed URLs, 4xx/5xx responses) produce an empty
    string instead of propagating an exception.

    Args:
        url: Address of the page to download.
        timeout: Seconds to wait for the server before giving up. Without
            a timeout, ``requests.get`` may block indefinitely.

    Returns:
        The decoded page text, or ``""`` if the request failed.
    """
    try:
        r = requests.get(url, timeout=timeout)
        r.raise_for_status()
    except requests.RequestException:
        # Only swallow errors raised by requests itself; a bare ``except``
        # would also hide KeyboardInterrupt and genuine programming errors.
        return ""
    # Prefer the encoding detected from the body over the one declared in
    # the HTTP headers before decoding the text.
    r.encoding = r.apparent_encoding
    return r.text
def fillWList(ist, html):
    """Extract table rows from *html* and append them to *ist* in place.

    Looks for the ``<div>`` with class ``tqtongji2`` and, for every
    ``<ul>`` inside it except the first, appends a list holding the
    ``.string`` of its first six ``<li>`` cells.

    Args:
        ist: List that receives one six-element list per parsed row.
        html: HTML document text; may be empty.

    Returns:
        None. Results are appended to *ist*.
    """
    soup = BeautifulSoup(html, 'html.parser')
    container = soup.find('div', 'tqtongji2')
    if container is None:
        # Nothing to parse, e.g. html is "" after a failed download.
        return
    # Original code iterated over soup.find('div', 'tqtongji2').children;
    # slicing off the first <ul> removes the header row of each month.
    for ul in container.find_all('ul')[1:]:
        cells = ul.find_all('li')
        if len(cells) < 6:
            # Skip malformed rows rather than failing with IndexError.
            continue
        # .string is None for a cell that has more than one child node.
        ist.append([cell.string for cell in cells[:6]])
def printWList(ist)</