# This code fetches the source of simple web pages, including simple login, proxy, and cookie usage.
import urllib
import socket
from urllib import request, parse
from urllib.request import HTTPPasswordMgrWithDefaultRealm, HTTPBasicAuthHandler, build_opener, ProxyHandler
from urllib.error import URLError
import http.cookiejar
def get_simple_url(url, method='POST', timeout=2): # 获取简单的网页源代码
headers = {
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/75.0.3770.100 Safari/537.36'
}
dict = {
'word': 'hello'
}
try:
data = bytes(parse.urlencode(dict), encoding='utf8')
res = request.Request(url, data=data, headers=headers, method=method)
response = request.urlopen(res, timeout=timeout)
# print(response.read().decode('utf-8')) # 输出网页源代码
# print(type(response))