import json
import re

import requests
from lxml import etree
# Monthly weather-history page scraped by this script (Kunming, 2021-04,
# judging by the URL path).
WEATHER_URL = 'http://www.tianqihoubao.com/lishi/kunming/month/202104.html'

# Third cell of every row of the first table in the page body. The first
# match is skipped by the caller (presumably the table's header row).
TEMPERATURE_XPATH = "/html/body/form/div[2]/div[6]/div[1]/div[1]/table[1]/tr/td[3]"

# A signed integer reading such as "22" or "-3".
_TEMPERATURE_RE = re.compile(r"-?\d+")


def parse_temperature_pair(text):
    """Return ``(high, low)`` as ints parsed from one temperature cell.

    The cell text is expected to hold two readings separated by ``/`` and
    padded with whitespace and line breaks. Only the signed integers are
    extracted, so the result is the same whether the degree sign arrives as
    the real character or mis-decoded (the earlier version of this script
    had to strip the mojibake sequence "¡æ" by hand).

    Args:
        text: Raw text of the cell; ``None`` is treated as empty.

    Raises:
        ValueError: If the text does not contain exactly two integers.
    """
    readings = _TEMPERATURE_RE.findall(text or "")
    if len(readings) != 2:
        raise ValueError(
            "expected 'high / low' temperatures, got {!r}".format(text)
        )
    high, low = readings
    return int(high), int(low)


def parse_temperature_cells(cell_texts):
    """Split an iterable of cell texts into parallel high/low lists.

    Returns:
        A ``(highs, lows)`` tuple of lists of ints, in input order. Both
        lists are empty when ``cell_texts`` is empty.

    Raises:
        ValueError: If any cell cannot be parsed (see
            ``parse_temperature_pair``).
    """
    highs = []
    lows = []
    for text in cell_texts:
        high, low = parse_temperature_pair(text)
        highs.append(high)
        lows.append(low)
    return highs, lows


def fetch_temperature_cells(url=WEATHER_URL, timeout=10):
    """Download the page and return the raw text of each temperature cell.

    Args:
        url: Page to fetch.
        timeout: Seconds to wait for the server before giving up, so a
            stalled connection cannot hang the script forever.

    Raises:
        requests.RequestException: On connection problems, timeouts or an
            HTTP error status.
    """
    response = requests.get(url, timeout=timeout)
    # Fail loudly on 4xx/5xx instead of trying to parse an error page.
    response.raise_for_status()
    dom_tree = etree.HTML(response.content)
    cells = dom_tree.xpath(TEMPERATURE_XPATH)
    # Drop the first matched cell; only the remaining rows are parsed.
    return [cell.text for cell in cells[1:]]


def main():
    """Fetch the page and print the daily high and low temperature lists."""
    highs, lows = parse_temperature_cells(fetch_temperature_cells())
    print("昆明最高气温:")
    print(highs)
    print("昆明最低气温:")
    print(lows)


if __name__ == "__main__":
    main()