#问题需求就是把豆瓣TOP250里面的 序号/电影名/评分/推荐语/链接 都爬取下来,结果就是全部展示打印出来
import csv
import requests
from bs4 import BeautifulSoup
# Scrape the Douban Top 250 movie list and store, for every movie, its
# rank / title / score / one-line quote / link in a CSV file, echoing each
# row to stdout as it is written.

BASE_URL = 'https://movie.douban.com/top250'
PAGE_SIZE = 25    # movies per listing page (the original offset was x*25)
PAGE_COUNT = 10   # 10 pages * 25 movies = 250 entries
OUTPUT_FILE = '电影列表.csv'
REQUEST_TIMEOUT = 10  # seconds; avoids hanging forever on a stalled connection
# NOTE(review): Douban reportedly rejects the default python-requests
# User-Agent (HTTP 418), so a browser-like one is sent — confirm against the
# live site.
REQUEST_HEADERS = {'User-Agent': 'Mozilla/5.0'}


def build_page_url(page_index):
    """Return the listing URL for the zero-based page *page_index*.

    The original script held a URL-encoded copy of the expression
    ``'...start=' + str(x*25) + '&filter='``; this rebuilds the real URL.
    """
    return BASE_URL + '?start=' + str(page_index * PAGE_SIZE) + '&filter='


def tag_text(tag):
    """Return the text of a parsed tag, or '' when the lookup found nothing."""
    return tag.text if tag is not None else ''


def extract_row(item):
    """Return [rank, title, score, quote, link] for one ``<li>`` element.

    Returns None when the ``<li>`` has no rank ``<em>``, i.e. it is not a
    movie entry (navigation items and similar are skipped this way).
    """
    number = item.find('em', class_='')
    if number is None:
        return None
    link = item.find('a')
    return [
        number.text,
        tag_text(item.find('span', class_='title')),
        tag_text(item.find('span', class_='rating_num')),
        # Not every movie carries a quote; fall back to an empty string
        # instead of crashing on None.text.
        tag_text(item.find('span', class_='inq')),
        link.attrs.get('href', '') if link is not None else '',
    ]


def fetch_page(page_index):
    """Download one listing page and return it parsed as BeautifulSoup.

    Raises requests.HTTPError on a non-2xx response so that an error page is
    never silently parsed into an empty result.
    """
    response = requests.get(
        build_page_url(page_index),
        headers=REQUEST_HEADERS,
        timeout=REQUEST_TIMEOUT,
    )
    response.raise_for_status()
    return BeautifulSoup(response.text, 'html.parser')


def main():
    """Scrape every listing page, print each movie and write it to the CSV."""
    # errors='replace' keeps the GBK output file but substitutes '?' for any
    # character GBK cannot encode, rather than aborting mid-run.
    with open(OUTPUT_FILE, 'w', newline='', encoding='gbk',
              errors='replace') as file:
        book = csv.writer(file)
        book.writerow(['序号', '名称', '评分', '评价', '链接'])
        for page_index in range(PAGE_COUNT):
            soup = fetch_page(page_index)
            for item in soup.find_all('li'):
                row = extract_row(item)
                if row is None:
                    continue
                # Same console output as before: fields concatenated as-is.
                print(''.join(row))
                book.writerow(row)


if __name__ == '__main__':
    main()
# python+豆瓣电影top排名查询
# 最新推荐文章于 2021-07-30 17:15:13 发布