# 简单的需求：访问某个百度贴吧，并且把信息保存下来。
from urllib import request,parse
import random
def tieba(kw="魔方", pages=10):
    """Download listing pages of a Baidu Tieba forum and save each as an HTML file.

    One URL is built per page by URL-encoding the query parameters ``kw``,
    ``ie`` (always ``"utf-8"``) and ``pn``, where ``pn`` advances by 50 for
    each successive page.  The list of URLs is printed, then every URL is
    fetched and its raw response bytes are written to ``<number>.html`` in
    the current working directory.

    Args:
        kw: Forum keyword sent as the ``kw`` query parameter.
        pages: Number of consecutive pages to fetch, starting at ``pn=0``.
            Zero or a negative value fetches nothing.

    Returns:
        None.

    Raises:
        urllib.error.URLError: If a page cannot be fetched.
        OSError: If an output file cannot be written.
    """
    base_url = 'http://tieba.baidu.com/f?'
    urls = [
        base_url + parse.urlencode({"kw": kw, "ie": "utf-8", "pn": str(page * 50)})
        for page in range(pages)
    ]
    print(urls)

    # Draw all file numbers up front without replacement.  Independent
    # randint() calls could repeat a number, so a later page would silently
    # overwrite an earlier one.  The pool is 0..99 as before and only grows
    # when more than 100 pages are requested.
    file_numbers = random.sample(range(max(100, len(urls))), len(urls))

    for url, number in zip(urls, file_numbers):
        # Context managers close the HTTP response and the file even on error.
        with request.urlopen(url) as rsp:
            body = rsp.read()
        # Binary mode: the raw bytes are stored without decoding.
        with open(str(number) + ".html", "wb") as fp:
            fp.write(body)
# Script entry point: run the download only when this file is executed
# directly, not when it is imported as a module.
if __name__ == "__main__":
    tieba()