# Download consecutive pages of Douban's movie "explore" listing and save the
# raw response text of each page to ``douban<page>.json`` in the current
# working directory.
import urllib.parse
import urllib.request

# NOTE(review): everything after '#' in this URL is a fragment. Fragments are
# normally not transmitted in HTTP requests, so the start/limit parameters
# appended below may never reach the server -- confirm the intended endpoint.
_EXPLORE_URL = (
    'https://movie.douban.com/explore'
    '#!type=movie&tag=%E7%83%AD%E9%97%A8&sort=recommend&'
)

# Number of entries requested per page; also used to derive the start offset.
_PAGE_SIZE = 20

_USER_AGENT = (
    'Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) '
    'AppleWebKit/537.36 (KHTML, like Gecko) '
    'Chrome/94.0.4606.81 Mobile Safari/537.36 Edg/94.0.992.50'
)


def a(page):
    """Build the request object for one page of the listing.

    Args:
        page: 1-based page number. Page ``n`` is encoded as
            ``start=(n - 1) * 20`` and ``limit=20``.

    Returns:
        A ``urllib.request.Request`` for the explore URL with the encoded
        paging parameters appended and a browser-like ``User-Agent`` header.
    """
    query = urllib.parse.urlencode({
        'start': (page - 1) * _PAGE_SIZE,
        'limit': _PAGE_SIZE,
    })
    headers = {'User-Agent': _USER_AGENT}
    return urllib.request.Request(url=_EXPLORE_URL + query, headers=headers)


def get_count(request):
    """Send *request* and return the response body decoded as UTF-8 text.

    Args:
        request: A URL string or ``urllib.request.Request`` accepted by
            ``urllib.request.urlopen``.

    Returns:
        The full response body as ``str``.

    Raises:
        urllib.error.URLError: If the request cannot be completed.
        UnicodeDecodeError: If the body is not valid UTF-8.
    """
    # The context manager closes the response even when read/decode fails.
    with urllib.request.urlopen(request) as response:
        return response.read().decode('utf-8')


def doem_lode(page, content):
    """Write *content* to ``douban<page>.json`` in the working directory.

    Args:
        page: Page number used to build the file name.
        content: Text to store; it is written unchanged, UTF-8 encoded.
    """
    with open(f'douban{page}.json', 'w', encoding='utf-8') as fp:
        fp.write(content)


def main():
    """Prompt for an inclusive page range, then fetch and save each page."""
    start_page = int(input('请输入起始页码:'))
    end_page = int(input('请输入结束页码:'))
    for page in range(start_page, end_page + 1):
        request = a(page)
        # Fetch the response data for this page.
        content = get_count(request)
        doem_lode(page, content)


if __name__ == '__main__':
    main()
# PyCharm请求网站特征,修改后缀
# 最新推荐文章于 2024-09-15 22:31:42 发布