import fitz
import pdfkit
import requests
from selenium import webdriver
import time
import glob
import os
import warnings
# Suppress ResourceWarning messages for the whole process.
warnings.simplefilter("ignore", ResourceWarning) # ignore ResourceWarning
# Commented-out example of building a headless Chrome driver, loading the
# target page and maximizing the window before taking screenshots.
# chrome_options =webdriver.ChromeOptions()
# chrome_options.add_argument('--start-maximized ')
# chrome_options.add_argument('--headless')
# chrome_options.add_argument('--disable-gpu')
# chrome_options.add_argument("window-size=1920,1080")
# driver = webdriver.Chrome(executable_path=r".\chromedriver.exe",options=chrome_options)
# driver.get('target URL')
# driver.maximize_window()
# driver.fullscreen_window()
def get_img_pdf_return_url(
    driver,
    *,
    output_dir=r"C:\Users\Administrator\Desktop\img_pdf",
    scroll_step=936,
    max_scroll=7198,
    pause=0.2,
):
    """Screenshot a page while scrolling down and merge the shots into a PDF.

    The current viewport is captured, the page is scrolled down by
    ``scroll_step`` pixels, and this repeats until the requested scroll
    offset exceeds ``max_scroll``. The screenshots are then combined, in
    capture order, into ``aa.pdf`` inside ``output_dir``.

    Args:
        driver: Browser driver exposing ``save_screenshot(path)`` and
            ``execute_script(js)`` (e.g. a Selenium WebDriver) with the
            target page already loaded.
        output_dir: Folder that receives ``img<N>.png`` and ``aa.pdf``.
            It is created when missing.
        scroll_step: Pixels added to ``scrollTop`` after each screenshot.
        max_scroll: Capturing stops once the requested offset exceeds
            this value.
        pause: Seconds to wait after each scroll before continuing.

    Returns:
        The filesystem path of the merged PDF (despite the ``url`` in the
        function name).

    Raises:
        ValueError: If ``scroll_step`` is not positive (the loop could
            never terminate).
        OSError: If the driver reports that a screenshot was not written.
    """
    if scroll_step <= 0:
        raise ValueError("scroll_step must be a positive number of pixels")

    os.makedirs(output_dir, exist_ok=True)
    image_paths = _capture_scrolled_screenshots(
        driver, output_dir, scroll_step, max_scroll, pause
    )
    # Raw-string default + os.path.join: the original non-raw
    # "C:\Users\..." literal is a SyntaxError in Python 3 ("\U" escape).
    pdf_path = os.path.join(output_dir, "aa.pdf")
    _merge_images_into_pdf(image_paths, pdf_path)
    return pdf_path


def _capture_scrolled_screenshots(driver, output_dir, scroll_step, max_scroll, pause):
    """Screenshot, scroll one step, repeat; return image paths in capture order."""
    image_paths = []
    offset = scroll_step
    while True:
        image_path = os.path.join(
            output_dir, "img{}.png".format(len(image_paths))
        )
        # Selenium's save_screenshot returns False when the file could not
        # be written; fail loudly instead of producing a PDF with gaps.
        if driver.save_screenshot(image_path) is False:
            raise OSError("could not write screenshot to {}".format(image_path))
        image_paths.append(image_path)

        driver.execute_script(
            "var q=document.documentElement.scrollTop={}".format(offset)
        )
        time.sleep(pause)  # give the page time to settle after scrolling
        print("截图:", offset, "成功")

        # The limit is checked after scrolling, so the final scroll position
        # itself is not captured (same as the original loop).
        if offset > max_scroll:
            return image_paths
        offset += scroll_step


def _merge_images_into_pdf(image_paths, pdf_path):
    """Convert each image to a one-page PDF and append it to ``pdf_path``."""
    merged = fitz.open()
    try:
        # Iterate the paths captured by this run rather than globbing the
        # folder: no stale/unrelated PNGs, and no "img10" < "img2" ordering.
        for image_path in image_paths:
            print(image_path)
            image_doc = fitz.open(image_path)
            try:
                # Newer PyMuPDF uses snake_case names; fall back to the
                # legacy camelCase ones on old installations.
                to_pdf = (
                    getattr(image_doc, "convert_to_pdf", None)
                    or image_doc.convertToPDF
                )
                page_pdf = fitz.open("pdf", to_pdf())
            finally:
                image_doc.close()
            try:
                insert = getattr(merged, "insert_pdf", None) or merged.insertPDF
                insert(page_pdf)
            finally:
                page_pdf.close()

        # Remove a previous result at the path actually written to (the
        # original checked a different, relative path).
        if os.path.exists(pdf_path):
            os.remove(pdf_path)
        merged.save(pdf_path)
    finally:
        merged.close()
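# Take screenshots of the visualization page, then merge them into a PDF.
# (Blog page footer: latest recommended article published on 2024-08-12 07:30:00.)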