import argparse
import os
import urllib
import urllib.request

import requests
from bs4 import BeautifulSoup
from pptx import Presentation
from pptx.util import Inches
from tqdm import tqdm
# Output file that is recreated on every run.
PPT_PATH = 'demo.pptx'
# Separator line printed between the stages of the script.
BANNER = "==================================="
# Seconds to wait for the page request before giving up.
REQUEST_TIMEOUT = 30
# Slide size used for both the presentation and every picture (16:9).
SLIDE_WIDTH_IN = 16
SLIDE_HEIGHT_IN = 9


def parse_args(argv=None):
    """Parse the command-line options of the script.

    Args:
        argv: Argument list to parse; ``None`` means ``sys.argv[1:]``.

    Returns:
        The parsed namespace with ``url`` and ``img_save_path`` attributes.
    """
    parser = argparse.ArgumentParser(description='Input The URL')
    # Without a URL there is nothing to fetch, so fail early with a usage
    # message instead of passing None to requests.get().
    parser.add_argument('--url', type=str, required=True, help='URL')
    parser.add_argument('--img_save_path', type=str, default='./img')
    return parser.parse_args(argv)


def image_path(save_dir, index):
    """Return the file path used for the ``index``-th downloaded image."""
    return '{}/{}.jpg'.format(save_dir, index)


def collect_image_urls(html):
    """Return the ``data-src`` value of every ``<img>`` tag in ``html``.

    Tags without a ``data-src`` attribute, or with an empty one, are skipped.
    """
    soup = BeautifulSoup(html, 'html.parser')
    return [img['data-src'] for img in soup.select('img')
            if img.get('data-src')]


def download_images(urls, save_dir):
    """Download every URL into ``save_dir`` and return the saved paths.

    Files are named ``0.jpg``, ``1.jpg``, ... in the order of ``urls``.
    The directory is created when it does not exist yet.
    """
    os.makedirs(save_dir, exist_ok=True)
    saved_paths = []
    for index, url in enumerate(tqdm(urls)):
        target = image_path(save_dir, index)
        urllib.request.urlretrieve(url, target)
        saved_paths.append(target)
    return saved_paths


def build_presentation(image_paths, output_path=PPT_PATH):
    """Create a presentation with one full-slide picture per image path.

    The slides are built from the paths that were actually downloaded rather
    than from a directory listing, so stray or stale files in the image
    directory cannot change the slide count and no downloaded image is
    dropped.
    """
    prs = Presentation()
    prs.slide_width = Inches(SLIDE_WIDTH_IN)
    prs.slide_height = Inches(SLIDE_HEIGHT_IN)
    # Index 6 is the layout the original script used for every slide
    # (the blank layout in python-pptx's default template).
    layout = prs.slide_layouts[6]
    for path in tqdm(image_paths):
        slide = prs.slides.add_slide(layout)
        slide.shapes.add_picture(path,
                                 left=Inches(0),
                                 top=Inches(0),
                                 width=Inches(SLIDE_WIDTH_IN),
                                 height=Inches(SLIDE_HEIGHT_IN))
    prs.save(output_path)


def main(argv=None):
    """Fetch the page, download its images and write them into ``demo.pptx``."""
    # Parse first so that ``--help`` or a bad command line does not delete an
    # existing presentation.
    opt = parse_args(argv)

    print(BANNER)
    print("删除原有ppt,并重新创建")
    if os.path.exists(PPT_PATH):
        os.remove(PPT_PATH)
    print(BANNER)

    resp = requests.get(opt.url, timeout=REQUEST_TIMEOUT)
    # Do not go on to parse an HTTP error page as if it were the article.
    resp.raise_for_status()
    img_list = collect_image_urls(resp.text)
    saved_paths = download_images(img_list, opt.img_save_path)

    print(BANNER)
    print("图片下载完成,开始制作PPT")
    print(BANNER)

    build_presentation(saved_paths)
    print("==============制作完成=============")


if __name__ == "__main__":
    main()
# 爬取公众号图片并自动导入到ppt
# 最新推荐文章于 2024-07-21 22:27:18 发布