# 导入工具包
import requests
from bs4 import BeautifulSoup
import time
import pandas as pd
import numpy as np
# Request headers: send a desktop Chrome User-Agent string with each request.
# The value is assembled from its product tokens, separated by single spaces.
headers = {
    'User-Agent': ' '.join((
        'Mozilla/5.0 (Windows NT 10.0; Win64; x64)',
        'AppleWebKit/537.36 (KHTML, like Gecko)',
        'Chrome/88.0.4324.190',
        'Safari/537.36',
    )),
}
# =============================================================================
# Scrape a single page
# =============================================================================
# URL to scrape; the query string asks for limit=20, status=P, sort=new_score.
url = 'https://movie.douban.com/subject/34841067/comments?limit=20&status=P&sort=new_score'
# Fetch the page. Without a timeout, requests waits indefinitely on a stalled
# connection, so bound the wait explicitly.
html = requests.get(url, headers=headers, timeout=10)
# Fail loudly on a 4xx/5xx response instead of parsing an error page as if it
# were the comments page (raises requests.HTTPError).
html.raise_for_status()
# Decoded response body
data = html.text
# Parse the markup with the lxml parser
soup = BeautifulSoup(data, 'lxml')
# 信息
# 用户
names = soup.select('#comments > div > div.comment > h3 > span.comm
Python 爬取《你好，李焕英》豆瓣评论数据
最新推荐文章于 2022-09-01 16:44:47 发布