安装 PDF 相关库:
pip install pdfplumber
pip install typing-extensions
编写代码:
import pdfplumber
import pandas as pd
# Dump every table found on a range of pages of a PDF, both as the raw
# nested list returned by pdfplumber and as a pandas DataFrame.

# Location of the PDF to scan (raw string so the backslash is kept literally).
pdf_file = r'G:\Core_v5.3.pdf'

# NOTE(review): nothing in the visible script ever fills this frame; it is
# kept so that any later code relying on the name still finds it.
result_df = pd.DataFrame()

# Open through a context manager so the underlying file handle is released
# even if extraction raises part-way through. `pdf` stays bound afterwards
# but refers to a closed document.
with pdfplumber.open(pdf_file) as pdf:
    # Zero-based slice: indices 100..199. A document with fewer pages simply
    # yields a shorter (possibly empty) slice instead of raising.
    for page in pdf.pages[100:200]:
        # Iterating directly makes a separate "any tables?" check unnecessary:
        # a page without tables contributes zero iterations.
        for table in page.extract_tables():
            print('============================================================')
            print(table)
            if not table:
                # No rows at all means there is no header row to take the
                # column names from; skip instead of failing on table[0].
                continue
            # The first row supplies the column labels, the rest are data.
            df_detail = pd.DataFrame(table[1:], columns=table[0])
            print(df_detail)