# -*- coding: utf-8 -*-
import re
import urllib.parse
import urllib.request
from http.cookiejar import CookieJar
#豆瓣的登录url
loginurl = "https://www.douban.com/accounts/login"
cookie = CookieJar()
opener = urllib.request.build_opener(urllib.request.HTTPCookieProcessor)
data={}
data["form_email"]="chaowang.hn@gmail.com"
data["form_password"]="wanghejin18592"
data["source"]= "index_nav"
# 从首页提交登录
response = opener.open(loginurl,urllib.parse.urlencode(data).encode("utf-8"))
# 验证成功跳转至登录页
if response.geturl() == "https://www.douban.com/accounts/login":
html = response.read().decode()
# 验证码图片地址
imgurl = re.search('<img id="captcha_image" src="(.+?)" alt="captcha" class="captcha_image"/>', html)
if imgurl:
url = imgurl.group(1)
# 将图片保存至同目录下
res = urllib.request.urlretrieve(url, "v.jpg")
# 获取captcha-id参数
captcha = re.search('<input type="hidden" name="captcha-id" value="(.+?)"/>', html)
if captcha:
vcode = input("请输入图片上的验证码:")
data["captcha-solution"] = vcode
data["captcha-id"] = captcha.group(1)
data["user_login"] = "登录"
# 提交验证码验证
response = opener.open(loginurl, urllib.parse.urlencode(data).encode("utf-8"))
#登录成功跳转至首页
if response.geturl() == "http://www.douban.com/":
print ("登录成功")
使用http.cookiejar生产Cookie模拟用户登陆
最新推荐文章于 2024-08-13 08:07:15 发布