# Using requests and post
import requests
# Example URLs:
#   url = 'https://tieba.baidu.com/f?kw=python&ie=utf-8&pn=0'
#   https://tieba.baidu.com/f?kw=python&ie=utf-8&pn=50
class Tiebaspider(object):  # create the spider class
def init(self, tieba_name):
    """Store the forum name and build the paginated URL template.

    Args:
        tieba_name: Forum name; inserted as the ``kw`` query value.

    NOTE(review): Python only calls a method named ``__init__``
    automatically on instantiation; this method is named ``init`` and must
    be called explicitly. Confirm whether ``__init__`` was intended.
    """
    self.tieba_name = tieba_name
    # The trailing "{}" is a str.format placeholder for the ``pn`` value.
    self.url = "https://tieba.baidu.com/f?kw=" + tieba_name + "&ie=utf-8&pn={}"
def get_url_list(self, page_count=10):
    """Build the list of page URLs from the ``self.url`` template.

    Args:
        page_count: Number of page URLs to generate (defaults to 10).

    Returns:
        A list of ``page_count`` URLs, where the template placeholder is
        filled with 0, 50, 100, ... (the offset advances by 50 per page).
    """
    return [self.url.format(page * 50) for page in range(page_count)]
def parse_url(self, url, timeout=10):
    """Send a GET request to *url* and return the response body as text.

    Args:
        url: Address to fetch.
        timeout: Seconds to wait for the server before giving up. Without
            a timeout, ``requests.get`` can block indefinitely on an
            unresponsive server.

    Returns:
        The decoded response body (``response.text``).
    """
    response = requests.get(url, timeout=timeout)
    return response.text
def save_html(self,page_num,tb_html):
''