# Fetch the Baidu home page and print its HTML to stdout as UTF-8 text.
import io
import sys

import requests
import urllib3

url = 'https://www.baidu.com/'
headers = {
    'User-Agent': 'Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.0; Trident/4.0)',
    "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9",
    # "br" is deliberately not advertised: Brotli responses are only decoded
    # when an optional brotli package is installed, and an undecoded body
    # would show up as garbled text in html.text.
    "Accept-Encoding": "gzip, deflate",
    "Accept-Language": "zh-CN,zh;q=0.9",
    "Connection": "keep-alive",
}

# Silence the InsecureRequestWarning that urllib3 would otherwise emit
# because the request below is made with verify=False.
urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)

# Re-wrap stdout as UTF-8 so the printed HTML is not garbled on consoles
# whose default encoding is something else.
sys.stdout = io.TextIOWrapper(sys.stdout.buffer, encoding='utf-8')

# NOTE(review): verify=False disables TLS certificate verification; kept to
# preserve the original behavior, but confirm it is really needed.
# The (connect, read) timeout keeps the script from hanging forever when the
# server stops responding; requests applies no timeout by default.
html = requests.get(url=url, headers=headers, verify=False, timeout=(5, 15))

# Decode the body with the encoding detected from its content rather than the
# one guessed from the response headers.
html.encoding = html.apparent_encoding
print(html.text)
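# Set the IDE's "project encoding" option to UTF-8.
# If Chinese text in this .py file still causes an encoding error, the
# following declaration can be used instead (note: a coding declaration only
# takes effect when it is placed on the first or second line of the file):
# -*- coding: gbk -*-
# With that in place, the final output is displayed correctly.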