# coding=utf-8
import requests
from lxml import etree
import os
import time
# Import the process-pool executor
from concurrent.futures import ProcessPoolExecutor
import random
"""
这里我们直接爬取P站图片内容。
排行榜原始地址
https://i.pximg.net/ c/240x480 /img-master/img/2021/04/14/00/00/04/89135748_p0_master1200.jpg
高清图原始地址
https://i.pximg.net/ img-master/img/2021/04/14/00/00/04/89135748_p0_master1200.jpg
页码XHR
https://www.pixiv.net/ranking.php?p=2&format=json
"""
def get_content(url=None, s_type=None, name=None, timeout=10):
    """Send an HTTP GET for ``url`` through a new ``requests`` session.

    The request carries a desktop-browser ``User-Agent`` and a Pixiv
    ranking-page ``referer`` header.

    Args:
        url: Address to request.
        s_type: Not used in the visible part of this function.
        name: Not used in the visible part of this function.
        timeout: Timeout in seconds handed to ``requests``; without it a
            stalled connection would block the calling worker forever.

    NOTE(review): the source appears to be cut off right after the GET
    call -- the response is neither returned nor processed here. Confirm
    against the complete file before relying on this function.
    """
    headers = {
        "User-Agent":
            "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/89.0.4389.128 Safari/537.36 Edg/89.0.774.77",
        # Presumably the image host rejects requests without a Pixiv
        # referer -- TODO confirm.
        "referer":
            "https://www.pixiv.net/ranking.php?mode=daily&content=illust"
    }
    session = requests.Session()
    response = session.get(url=url, headers=headers, timeout=timeout)
# Article title: Multi-process crawling of Pixiv images
# Page note: latest recommended article published at 2024-05-14 11:00:23