import pdfplumber as pr
import pandas as pd
# Merge the first table found on each of the leading pages of a PDF into a
# single sheet and save it as an Excel workbook.
PDF_PATH = '21.PDF'    # input PDF, read from the current working directory
XLSX_PATH = '1.xlsx'   # output workbook
MAX_PAGES = 9          # only the first MAX_PAGES pages are scanned

# Rows are accumulated in a list that grows on demand. A fixed-size 200x20
# zero-filled buffer would raise IndexError on larger tables and would pad the
# output with rows/columns of zeros on smaller ones.
merged_rows = []

# The context manager closes the underlying PDF file even if extraction fails.
with pr.open(PDF_PATH) as pdf:
    # Slicing (rather than indexing range(MAX_PAGES)) tolerates PDFs that have
    # fewer pages than MAX_PAGES.
    for page in pdf.pages[:MAX_PAGES]:
        tables = page.extract_tables()
        if not tables:
            # No table detected on this page: skip it instead of failing on
            # tables[0].
            continue
        table = tables[0]
        print(table)
        # Copy each row so the padding step below never mutates the lists
        # returned by pdfplumber.
        merged_rows.extend(list(row) for row in table)

# Pad ragged rows with None up to the widest row; pandas rejects data rows
# that are wider than the header row.
width = max((len(row) for row in merged_rows), default=0)
for row in merged_rows:
    row.extend([None] * (width - len(row)))

# The very first collected row is used as the header; every following row
# (including any first rows of later pages) is kept as data.
if merged_rows:
    merged_df = pd.DataFrame(merged_rows[1:], columns=merged_rows[0])
else:
    # Nothing was extracted: still produce a (blank) workbook.
    merged_df = pd.DataFrame()
merged_df.to_excel(XLSX_PATH)
# python pdfplumber: convert multi-page PDF tables to Excel
# First published 2022-02-23 18:33:10