# QQ group: 33314708
from selenium import webdriver
from selenium.webdriver.common.desired_capabilities import DesiredCapabilities#配合加载模式
import time
from selenium.webdriver.support.wait import WebDriverWait #显式等待
from selenium.webdriver.support import expected_conditions as EC #显式等待提供的方法
from selenium.webdriver.common.by import By #By选择器
def gogogo(url):
    """Open *url* in Chrome and return the browser's cookies as one string.

    A Chrome session is started through ``chromedriver.exe``, the page is
    requested, and the function waits until an element with the CSS class
    ``user-name`` is present before reading the cookies.

    Args:
        url: Address of the page to load.

    Returns:
        The cookies joined as ``name=value;name=value`` (no trailing
        semicolon), suitable for a ``Cookie`` request header. An empty
        string if the browser holds no cookies.

    Raises:
        selenium.common.exceptions.TimeoutException: If the ``user-name``
            element does not appear within 20 seconds.
    """
    chromedriver_path = "chromedriver.exe"

    options = webdriver.ChromeOptions()
    # Drop the "enable-automation" switch so that sites are less likely to
    # detect that the browser is driven by Selenium.
    options.add_experimental_option('excludeSwitches', ['enable-automation'])
    # Headless mode (disabled):
    # options.add_argument('--headless')

    # Copy the capabilities: DesiredCapabilities.CHROME is a shared
    # module-level dict and must not be mutated in place.
    desired_capabilities = DesiredCapabilities.CHROME.copy()
    # Do not block on page load; this must be paired with the explicit
    # wait below before touching the page.
    desired_capabilities["pageLoadStrategy"] = "none"

    driver = webdriver.Chrome(
        executable_path=chromedriver_path,
        options=options,
        desired_capabilities=desired_capabilities,
    )
    try:
        driver.get(url)
        # Wait for the element (i.e. for the JavaScript rendering) so the
        # cookies are read only once the page has been populated.
        locator = (By.CLASS_NAME, "user-name")
        WebDriverWait(driver, 20).until(EC.presence_of_element_located(locator))
        cookies = driver.get_cookies()
    finally:
        # Always shut the browser down, even when loading or waiting fails,
        # so no Chrome/chromedriver process is left behind.
        driver.quit()

    # Join the cookies into a single "name=value;name=value" string.
    return ";".join(item['name'] + "=" + item['value'] for item in cookies)
if __name__ == "__main__":
    # Page to open in the browser; its cookies are collected by gogogo().
    url = "https://www.xiaohongshu.com/user/profile/53154482b4c4d64f5296aecd"
    # Alternative target (disabled):
    # url = "https://www.baidu.com"
    cookie = gogogo(url)

    # Disabled example: replay the collected cookie in a plain HTTP request.
    # headers = {
    #     'cookie': cookie,
    #     'user-agent': 'Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.100 Mobile Safari/537.36'
    # }
    # import requests
    # res = requests.get(url, headers=headers, verify=False)
    # print(res.text)