# coding:utf-8
# Created: 04-07-2018 at home
# by Python 3.6.5 Sublime text 3
# author :wangjianxin
import urllib.request ,sys
import re
# Enter the province and city as pinyin, for example: shanxi JinCheng

# Patterns used to scrape the forecast page. Raw strings keep "\d" from being
# treated as an (invalid) string escape; the regex text itself is unchanged.
TITLE_RE = re.compile(r'Title.+<b>(.+)</b>')
DATE_RE = re.compile(r'>(\d*-\d*-\d*?)<')
WEATHER_RE = re.compile(r'/><br/>(.+?)</td>')


def build_url(province, city):
    """Return the 7-day forecast URL for the given pinyin province and city.

    Surrounding whitespace is stripped and each name is percent-encoded so
    that stray characters in the user's input cannot alter the URL structure.
    """
    from urllib.parse import quote

    return ("http://qq.ip138.com/weather/" + quote(province.strip(), safe='')
            + '/' + quote(city.strip(), safe='') + '_7tian.htm')


def fetch_page(url):
    """Download *url* and return the raw response body as bytes."""
    # The context manager closes the connection even if read() fails.
    with urllib.request.urlopen(url) as response:
        return response.read()


def parse_forecast(html):
    """Extract ``(title, dates, weather)`` from the forecast page text.

    ``dates`` and ``weather`` are lists of strings in page order.

    Raises:
        ValueError: if the page contains no recognizable title.
    """
    title_match = TITLE_RE.search(html)
    if title_match is None:
        raise ValueError('no forecast title found in the page')
    return title_match.group(1), DATE_RE.findall(html), WEATHER_RE.findall(html)


def format_report(title, dates, weather):
    """Return the report as a list of lines: the title, then one per day."""
    lines = ["%35.30s" % title]
    # zip() stops at the shorter list, so a page that yields more dates than
    # weather entries (or the reverse) no longer raises IndexError.
    for day, conditions in zip(dates, weather):
        lines.append('%33.20s \t%s' % (day, conditions))
    return lines


def main():
    """Prompt for a location, fetch its forecast and print it.

    Returns 0 on success and 1 when the page cannot be fetched or parsed.
    """
    provice = input('provice:')
    city = input('city:')

    try:
        raw = fetch_page(build_url(provice, city))
    except OSError as err:
        # urllib.error.URLError and HTTPError are subclasses of OSError.
        print('failed to fetch the forecast: %s' % err, file=sys.stderr)
        return 1

    # Keep a local copy of the page to make inspecting the markup easier.
    # Writing the raw bytes gives the same file the decode/encode round trip did.
    with open('wea.txt', 'wb') as f:
        f.write(raw)

    # errors='replace' keeps a single stray byte from aborting the whole run.
    res = raw.decode('GB2312', errors='replace')

    try:
        title, dates, weather = parse_forecast(res)
    except ValueError as err:
        print('failed to parse the forecast: %s' % err, file=sys.stderr)
        return 1

    for line in format_report(title, dates, weather):
        print(line)
    return 0


if __name__ == '__main__':
    sys.exit(main())
# 特别强调文章中一些正则表达式的构建
# 标题:pattern = 'Title.+<b>(.+)</b>'
# 日期:pattern = '>(\d*-\d*-\d*?)<'
# 天气:pattern = '/><br/>(.+?)</td>'
# --------风吹浪打 岿然不动 怡然自得 继续前行