# 对于豆瓣这种登录时必须通过验证的网站:
# POST 和 GET 请求之间没有关联,应按照不同的需求选择不同的请求方式。可以先自己手动登录豆瓣,然后把登录后的 cookie 拷贝到代码里,这样爬虫程序就会以已登录的状态抓取数据了。
import requests
from user_agent import headers
def douban_login():
login_url = 'https://accounts.douban.com/j/mobile/login/basic'
url = 'https://www.douban.com/people/221725636/'
# headers = {
# 'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/70.0.3538.25 Safari/537.36 Core/1.70.3875.400 QQBrowser/10.8.4492.400'
# }
# 发送请求
# 在发送的时候以传参的方式发送cookie
# cookies = 'bid=CoFnyYaHvxQ; douban-fav-remind=1; __yadk_uid=MGLPA6D5bDkj8JypPNYfwDtVVqUUC1nu; ll="118281"; push_doumail_num=0; __utmv=30149280.22172; gr_user_id=59b923b6-172f-4e68-a7f1-4a2facfb25c7; _ga=GA1.1.843993488.1628860359; _ga_RXNMP372GL=GS1.1.1628860359.1.0.1628860362.0; push_noty_num=0; __g