安装第三方库(pdfminer3k、requests)
pip install pdfminer3k requests
配置:注册百度翻译开放平台账号,并获取 appid 及 key(密钥)
详细代码
import hashlib
import random
import urllib.parse
import requests
from concurrent import futures
from io import StringIO
from pdfminer.pdfinterp import PDFResourceManager
from pdfminer.pdfinterp import process_pdf
from pdfminer.converter import TextConverter
from pdfminer.layout import LAParams
def read_from_pdf(file_path):
'''
解析pdf文件
'''
with open(file_path, 'rb') as file:
resource_manager = PDFResourceManager()
return_str = StringIO()
lap_params = LAParams()
device = TextConverter(
resource_manager, return_str, laparams=lap_params)
process_pdf(resource_manager, device, file)
device.close()
content =