from json import dumps
from selenium.webdriver import Chrome
# Capture the cookies of a logged-in Taobao session and save them as JSON so
# that a later run can restore the session without logging in again.

# Step 1: open the site that needs an automated login (the site whose
# cookies we want to capture).
b = Chrome()
try:
    b.get('https://www.taobao.com/')

    # Step 2: block until the operator has logged in by hand AND refreshed
    # this first tab so that it shows the logged-in page. Without this pause
    # the cookies would be read before the login has happened.
    input('已经完成登录:')

    # Step 3: read the cookies of the logged-in session.
    cookies = b.get_cookies()
    print(cookies)
finally:
    # Close the browser window even if one of the steps above failed.
    b.close()

# Persist the cookies as JSON text in a local file.
with open('files/taobao.txt', 'w', encoding='utf-8') as f:
    f.write(dumps(cookies))
selenium使用cookie
from json import loads
from selenium.webdriver import Chrome
# Restore a previously saved login session by injecting stored cookies.

# Step 1: open the site first; the cookies are added to the browser session
# only after this page has been loaded.
b = Chrome()
b.get('https://www.taobao.com/')

# Step 2: load the cookies saved as JSON text and add them one by one.
with open('files/taobao.txt', encoding='utf-8') as f:
    content = f.read()
cookies = loads(content)
for i in cookies:
    b.add_cookie(i)
# Page source before reloading, printed for comparison with the one below.
print(b.page_source)

# Step 3: open the site again so the request is sent with the added cookies.
b.get('https://www.taobao.com/')
print(b.page_source)

# Keep the script (and therefore the browser) alive until Enter is pressed.
input(":")
requests 使用代理
import requests
# Fetch the Douban Top 250 page through a fixed proxy (119.7.145.65:4531).
res = requests.get(
    url='https://movie.douban.com/top250',
    headers={
        'User-Agent': (
            'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
            'AppleWebKit/537.36 (KHTML, like Gecko) '
            'Chrome/101.0.0.0 Safari/537.36'
        ),
    },
    # Proxy URLs carry an explicit scheme; the same HTTP proxy endpoint is
    # used for both http:// and https:// target URLs.
    proxies={
        'http': 'http://119.7.145.65:4531',
        'https': 'http://119.7.145.65:4531',
    },
    # Fail instead of hanging forever when the proxy is dead or slow.
    timeout=10,
)
print(res.text)
requests使用代理实际用法
from time import sleep
import requests
def get_ip():
    """Fetch one proxy address from the provider API, retrying until it works.

    A response body that is empty or starts with ``{`` is treated as a failed
    extraction; the function then waits one second and asks again.

    Returns:
        str: The response body with surrounding whitespace removed. The
        caller uses it as a proxy address (presumably ``ip:port`` -- confirm
        against the provider's response format).

    Raises:
        requests.RequestException: If the HTTP request itself fails or times
            out; only "extraction failed" responses are retried.
    """
    url = (
        'http://d.jghttp.alicloudecs.com/getip'
        '?num=1&type=1&pro=510000&city=510600&yys=0&port=11&time=2'
        '&ts=0&ys=0&cs=0&lb=4&sb=0&pb=4&mr=1&regions='
    )
    while True:
        response = requests.get(url, timeout=10)
        # Strip line endings so the value can be used directly in a URL.
        text = response.text.strip()
        # startswith() is safe on an empty body, unlike indexing text[0].
        if not text or text.startswith('{'):
            print('提取失败,重试!')
            sleep(1)
            continue
        return text
def get_douban_film():
    """Fetch the Douban Top 250 page through a freshly obtained proxy.

    Obtains a proxy address from ``get_ip()``, sends the request through it
    for both http and https targets, then prints the response object and the
    response body.

    Raises:
        requests.RequestException: If the request fails or times out.
    """
    ip = get_ip().strip()
    # Proxy URLs need an explicit scheme; add one unless already present.
    proxy = ip if '://' in ip else f'http://{ip}'
    res = requests.get(
        url='https://movie.douban.com/top250',
        headers={
            'User-Agent': (
                'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
                'AppleWebKit/537.36 (KHTML, like Gecko) '
                'Chrome/101.0.0.0 Safari/537.36'
            ),
        },
        proxies={'http': proxy, 'https': proxy},
        # Fail instead of hanging forever when the proxy is dead or slow.
        timeout=10,
    )
    print(res)
    print(res.text)


if __name__ == '__main__':
    get_douban_film()