# 1. Import libraries
import logging
import os
import re
import time

import chardet
import requests
from fake_useragent import UserAgent
from lxml import etree
from tqdm import tqdm

# 2. Logging configuration and random request headers
# Basic configuration of the log output.
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s: %(message)s')

# Source of randomly chosen User-Agent strings, configured with the local
# 'fake_useragent.json' path.
ua = UserAgent(verify_ssl=False, path='fake_useragent.json')


def random_ua() -> dict:
    """Return request headers carrying a freshly randomized User-Agent.

    Returns:
        A dict with an ``accept-encoding`` entry fixed to ``gzip`` and a
        ``user-agent`` entry read from ``ua.random`` on every call.
    """
    return {
        "accept-encoding": "gzip",  # gzip compression speeds up file transfers
        "user-agent": ua.random,
    }


# 3. Helper that creates the folder downloaded files are stored in
def make_path(name: str, root: str = 'D:/PPT模板_1/') -> str:
    """Create the download folder for *name* (if needed) and return its path.

    Args:
        name: Sub-folder name; it is appended to *root* verbatim.
        root: Base folder prefix. It is concatenated as-is, so it should end
            with a path separator. Defaults to the original hard-coded
            location.

    Returns:
        The folder path, ``root + name``.

    Raises:
        FileExistsError: If the path already exists but is not a directory.
        OSError: If the folder cannot be created for any other reason.
    """
    path = root + name
    # makedirs also creates a missing base folder (os.mkdir failed in that
    # case), and exist_ok avoids the check-then-create race.
    os.makedirs(path, exist_ok=True)
    return path


# 4. Fetch the template categories of the site
# The integers 2..23 inclusive; presumably the site's category ids - TODO confirm.
kinds = list(range(2, 24))
d