# 2020/09/23
# Notes for the record.
# -*- coding: utf-8 -*-
# @Time : 2020/9/23 9:51
# @Author : KYY
# @File : test.py
# @Software : PyCharm
import urllib.request
# response = urllib.request.urlopen("http://www.baidu.com/")
# print(response.read().decode('utf-8'))  # decode the fetched page source as UTF-8
# Send a POST request
import urllib.parse
# data = bytes(urllib.parse.urlencode({"hello" : "world"}), encoding="utf-8")  # URL-encode a dict as form data, then convert it to UTF-8 bytes
# response = urllib.request.urlopen("http://httpbin.org/post", data=data)
# print(response.read().decode("utf-8"))
# Timeout handling
# try:
#     response = urllib.request.urlopen("http://httpbin.org/get", timeout=0.01)
#     print(response.read().decode("utf-8"))
# except urllib.error.URLError as e:
#     print("time out!")
# response = urllib.request.urlopen("http://www.baidu.com")
# print(response.status)
# print(response.getheader("Server"))  # use getheaders() to get all of the headers
# url = "https://www.douban.com"
# url = "http://httpbin.org/post"
# headers = {
# "User-Agent" : "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/85.0.4183.102 Safari/537.36"
# }
# data = bytes(urllib.parse.urlencode({"name" : "aaa"}), encoding="utf-8")
# req = urllib.request.Request(url=url,data=data,headers=headers,method="POST")  # a fully built Request object
# response = urllib.request.urlopen(req)
# print(response.read().decode("utf-8"))
# Fetch the Douban home page and print its HTML.
# The request carries a desktop-Chrome User-Agent header instead of
# urllib's default one.
url = "https://www.douban.com"
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/85.0.4183.102 Safari/537.36",
}
req = urllib.request.Request(url=url, headers=headers)
# The context manager closes the HTTP response (and its socket) even if
# read() or decode() raises; the timeout (in seconds) keeps the script
# from blocking forever on an unresponsive server.
with urllib.request.urlopen(req, timeout=10) as response:
    # The body is decoded as UTF-8, matching the original script.
    print(response.read().decode("utf-8"))