爬取微博的某些内容需要登录,这里整理了两种方法(不确定是否正确):
1. 设置 Cookie
def getHTMLText(url):
cookie='XXXXXXXX'
headers = {
'User-Agent':'Mozilla/5.0 (Windows NT 6.2; WOW64; rv:21.0) Gecko/20100101 Firefox/21.0',
'Cookie': cookie
}
try:
r = requests.get(url, headers=headers,timeout=30,proxies={
'http':