# 1. 切分 PDF 文件，提取任意页面
from PyPDF2 import PdfFileReader, PdfFileWriter
def split_pdf(fileName, result, start=0, end=None):
    """Copy a range of pages from one PDF file into a new PDF file.

    Args:
        fileName: Source PDF; passed unchanged to ``PdfFileReader``.
        result: Path of the PDF to create. It is opened in ``'wb'`` mode, so
            an existing file at that path is overwritten.
        start: Index of the first page to copy (PyPDF2 numbers pages from 0).
        end: Index one past the last page to copy. ``None`` (the default)
            means "up to and including the last page".

    Any exception raised while reading the source or fetching a page
    propagates to the caller *before* the output path is opened, so a failed
    call never leaves an empty or half-written file at ``result``.
    """
    # Open the original PDF.
    pdf_src = PdfFileReader(fileName)
    if end is None:
        # Default to the page count so the copy runs through the last page.
        end = pdf_src.getNumPages()

    # Collect every requested page first. Doing this before open(result, 'wb')
    # means a bad page index fails here instead of after the output file has
    # already been created/truncated.
    pdf = PdfFileWriter()
    for num in range(start, end):
        pdf.addPage(pdf_src.getPage(num))

    # Write the assembled pages to the result PDF.
    with open(result, 'wb') as fp:
        pdf.write(fp)
# Example run: copy the pages with indices 0 through 6 of ./123.pdf into ./1.pdf.
path = './123.pdf'
split_pdf(path, './1.pdf', start=0, end=7)
# 2. 读取 CSV 文件
import csv
# Read data.csv with the standard csv module and print each parsed row.
# The file is opened in a with-block so the handle is closed once the loop
# finishes, and with newline="" as the csv module documentation requires so
# that newlines embedded in quoted fields are parsed correctly.
with open("data.csv", newline="") as csv_file:
    csv_reader = csv.reader(csv_file)
    for row in csv_reader:
        print(row)
import pandas as pd
# Alternative: let pandas parse data.csv in one call and print the result.
csv_reader = pd.read_csv(filepath_or_buffer="data.csv")
print(csv_reader)
#csv_reader = pd.read_table("data.csv", sep=",")
#print(csv