# 目标url:https://52online.vip/list/?1.html
import requests
from bs4 import BeautifulSoup
import time
import csv
# 请求访问
def request_url(ye, *, delay=3, timeout=10, max_retries=None):
    """Fetch one page of the movie listing and return its HTML text.

    The listing URL is built from ``ye`` and requested repeatedly, sleeping
    ``delay`` seconds before every attempt (including the first), until the
    server answers with HTTP status 200.

    :param ye: page number; converted with ``str()`` and inserted into the URL.
    :param delay: seconds to sleep before each attempt (default 3).
    :param timeout: seconds to wait for the server on each attempt, so a
        stalled connection cannot block the scraper forever (default 10).
    :param max_retries: maximum number of attempts; ``None`` (the default)
        keeps retrying indefinitely.
    :return: the response body (``r.text``) of the first 200 response.
    :raises RuntimeError: if ``max_retries`` is set and every attempt failed.
    """
    headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/76.0.3809.100 Safari/537.36'}
    url = 'https://52online.vip/list/?1-' + str(ye) + '.html'
    attempts = 0
    while max_retries is None or attempts < max_retries:
        attempts += 1
        # Pause before every request so the site is not hit in a tight loop.
        time.sleep(delay)
        try:
            # NOTE(review): verify=False disables TLS certificate validation;
            # kept as in the original call -- confirm it is still required.
            r = requests.get(url, headers=headers, verify=False, timeout=timeout)
        except requests.RequestException as exc:
            # A network error is treated like a non-200 answer: report it and retry.
            print('访问失败,重试:', url, exc)
            continue
        if r.status_code == 200:
            print('访问成功:', url)
            return r.text
    raise RuntimeError('request_url: no HTTP 200 response from {} after {} attempts'.format(url, attempts))
# 抓取网页数据
def url_texts(url_text):
'''
:param url_text: 响应的url.text
:return: urls=电影对应的网址
dates=上映日期和类型
hds=清晰度
names=电影名
'''
url_text = url_text
urs = 'https://52online.vip'
urls = [] # 电影url
dates = [] # 上映日期
guojia
使用python3爬取电影储存到本地
最新推荐文章于 2024-07-24 17:05:28 发布