#coding:utf-8
import urllib2
import string
def baidu_url(url, page, endpage):
    """Download pages ``page`` through ``endpage`` (inclusive) of a thread.

    Each page is requested from ``url + '?pn=' + str(i)`` and its body is
    saved as ``<i>.html`` in the current working directory.

    Args:
        url: Base address of the thread; ``?pn=<i>`` is appended per page.
        page: First page number to download.
        endpage: Last page number to download (inclusive). If it is smaller
            than ``page`` nothing is downloaded.

    Returns:
        None.
    """
    # range() walks every page in the interval; iterating over the bare
    # tuple (page, endpage + 1) would only visit those two values.
    for i in range(page, endpage + 1):
        print(u'正在下载第' + str(i) + u'个页面')
        # Fetch before creating the file so a failed request does not leave
        # an empty <i>.html behind.
        response = urllib2.urlopen(url + '?pn=' + str(i))
        try:
            content = response.read()
        finally:
            response.close()
        # Binary mode stores the bytes exactly as received (no newline
        # translation); the with-block closes the file even on error.
        with open(str(i) + '.html', 'wb') as f:
            f.write(content)
# Ask for the thread URL and the inclusive page interval, then start the
# download. Every prompt is decoded from UTF-8 and re-encoded as GBK before
# it is handed to raw_input.
url_prompt = unicode('请输入帖子的第一页,例如http://tieba.baidu.com/p/2925873031', 'utf-8')
url = raw_input(url_prompt.encode('gbk'))

start_prompt = unicode('从哪一页开始下载', 'utf-8')
page = int(raw_input(start_prompt.encode('gbk')))

end_prompt = unicode('哪一页截止下载', 'utf-8')
endpage = int(raw_input(end_prompt.encode('gbk')))

baidu_url(url, page, endpage)
# Reference article:
# http://blog.csdn.net/pleasecallmewhy/article/details/8927832