qiushibaike:如何抓取翻页后的内容?这里只写好了抓取当前页内容的代码。
#coding=utf-8
import urllib2
import urllib
import re
# Request header mapping carrying an explicit User-Agent string.
user_agent = 'Mozilla/4.0 (compatible; MSIE 5.5; Windows NT)'
headers = {'User-Agent': user_agent}

# Number of the listing page to fetch; it forms the last segment of the URL.
page = 1
url = ''.join(('http://www.qiushibaike.com/hot/page/', str(page)))
try:
request = urllib2.Request(url,headers=headers)
response = urllib2.urlopen(request)
content = response.read()
pattern = re.compile('