一、TXT 文本存储
from pyquery import PyQuery as pq
import requests
# Scrape the link titles from a Zhihu roundtable page and append them,
# one per line, to a local UTF-8 text file.
url = 'https://www.zhihu.com/roundtable/lol2020'
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64)'
    + ' AppleWebKit/537.36 (KHTML, like Gecko) Chrome/70.0.3538.25'
    + ' Safari/537.36 Core/1.70.3742.400 QQBrowser/10.5.3864.400'
}

# A timeout keeps the script from hanging forever on a stalled connection;
# raise_for_status() surfaces HTTP errors instead of silently parsing an
# error page that contains no matching elements.
response = requests.get(url, headers=headers, timeout=10)
response.raise_for_status()
# Note: `text` is an attribute of the response, not a method.
html = response.text
doc = pq(html)

# items() yields one PyQuery object per matched element; text() converts
# each of them to a plain string. Evaluate text() once per element.
titles = [item.text() for item in doc('.item-title a').items()]
for title in titles:
    print(title)

# Open the output file once (mode 'a' creates it if it does not exist and
# appends otherwise) rather than re-opening it for every title. The guard
# keeps the original behaviour of not touching the file when nothing matched.
if titles:
    with open('zhihu_lol.txt', 'a', encoding='utf-8') as f:
        f.writelines(title + '\n' for title in titles)
关于open函数的第二个参数:
r:只读