# Scrape: movie title + lead actors + release time + reviews, and save images to a specified path
from urllib import request
import re
import random
from day01_爬虫.useragents import ua_list
import os
class MaoyanSpider(object):
def __init__(self):
self.url="https://maoyan.com/board/4?offset={}"
#获取响应内容
def get_html(self, url: str) -> bytes:
    """Request ``url`` and return the raw response body.

    A ``User-Agent`` header chosen at random from ``ua_list`` is sent
    with the request.

    Args:
        url: Address to fetch.

    Returns:
        The response body exactly as read from the connection
        (undecoded ``bytes``).

    Raises:
        Any exception raised by ``urllib.request.urlopen`` (for example
        ``urllib.error.URLError``) propagates to the caller unchanged.
    """
    # Pick a different User-Agent per request.
    headers = {"User-Agent": random.choice(ua_list)}
    req = request.Request(url=url, headers=headers)
    # The response object is a context manager; using ``with`` closes the
    # underlying connection as soon as the body has been read instead of
    # leaving it open until garbage collection.
    with request.urlopen(req) as res:
        return res.read()
#解析提取数据
def re_func(self,re_bds,