# Import bs4
import requests
from bs4 import BeautifulSoup
# Find the article list and its links
# NOTE(review): `soup` is not defined anywhere in the visible source;
# presumably it is a BeautifulSoup document built from a `requests`
# response -- confirm before running.

# Container <div class="article-list"> holding every article entry.
article_list = soup.find('div', class_='article-list')
# One <div class="article-item-box"> per article inside that container.
article_item = article_list.find_all('div', class_='article-item-box')
# Write to file
def write_to_file(content: str) -> None:
    """Append ``content`` to ``article.txt`` in the current working directory.

    The file is opened in append mode with UTF-8 encoding, so it is created
    on first use and any earlier contents are kept.

    Args:
        content: Text to append; it is written exactly as given.
    """
    with open('article.txt', 'a', encoding='utf-8') as f:
        f.write(content)


# The helper is defined before the loop on purpose: at module level the loop
# body runs immediately, so calling write_to_file ahead of its ``def`` would
# raise NameError.
for ai in article_item:
    anchor = ai.a
    # Skip entries without an <a> tag instead of failing on None.
    if anchor is None:
        continue
    link = anchor.get('href')
    # Skip anchors that carry no href attribute instead of raising KeyError.
    if link is None:
        continue
    title = anchor.text
    print(title)
    print(link)
    # One "title<TAB>link" line per article, written with a single open().
    write_to_file(title + '\t' + link + '\n')