这里我们需要正定义一个自己的opener. 默认是opener是遇到30x,
会出继续往下请求.
# -*- coding=utf-8 -*-
from urllib.request import urlopen
from urllib.request import Request
import urllib.request
# 定义一个自己的头类, 继承HTTPRedirectHandler
# 重写 http_error_302, 直接返回 fp(reponse);
class MyRedirectHandler(urllib.request.HTTPRedirectHandler):
def http_error_302(self, req, fp, code, msg, hdrs):
return fp
myHandler = MyRedirectHandler()
opener = urllib.request.build_opener(myHandler)
req = Request('http://www.baidu.com/')
# 模拟一个浏览器访问百度, 不然不会重写到 https.
req.add_header('User-Agent','Mozilla/5.0 (X11; Linux x86_64; rv:47.0) Gecko/20100101 Firefox/47.0')
res = opener.open(req)
print(res.getcode())
print(res.getheaders())