1、使用到的库:python-docx(导入名为 docx)、lxml、xlwt、numpy
pip install python-docx
pip install lxml
pip install xlwt
pip install numpy
2、python代码
import xlwt # 负责写excel
import numpy as np
from docx import Document
# Save tabular data to a spreadsheet file.
def generateExcel(matrix, output_path='test.xlsx'):
    """Write a 2-D collection of values to 'sheet1' of a new xlwt workbook.

    Every value is converted with ``str()`` and written to the cell whose
    row/column position matches its position in ``matrix``.

    Args:
        matrix: An iterable of rows, each row an iterable of cell values.
            Rows may have different lengths, and ``matrix`` may be empty
            (an empty sheet is saved in that case).
        output_path: Destination file. A relative path is resolved against
            the current working directory. Defaults to ``'test.xlsx'``,
            the name the original script used.

    NOTE(review): xlwt is documented as a writer for the legacy ``.xls``
    format, so a file saved with an ``.xlsx`` extension may be rejected by
    spreadsheet applications. The default is kept for backward
    compatibility; consider passing a ``.xls`` path.
    """
    workbook = xlwt.Workbook()  # create the workbook
    # cell_overwrite_ok=True lets the same cell be written more than once.
    sheet = workbook.add_sheet(u'sheet1', cell_overwrite_ok=True)
    # Iterate the rows directly instead of going through a numpy array, so
    # that empty input and rows of unequal length do not raise when the
    # shape is unpacked.
    for row_index, row in enumerate(matrix):
        for col_index, value in enumerate(row):
            sheet.write(row_index, col_index, str(value))
    workbook.save(output_path)
# Path of the Word document to read.
filename = "test.docx"
doc = Document(filename)
tables = doc.tables
table_num = 1  # zero-based index: selects the second table in the document
tb = tables[table_num]
# Rows of the selected table.
tb_rows = tb.rows
# Collect the text of every cell, producing one inner list per table row.
row_data1 = [[cell.text for cell in row.cells] for row in tb_rows]
print("row_data1", row_data1)
# Export the extracted table contents to a spreadsheet.
generateExcel(row_data1)
3、test.docx和test.xlsx内容
word文档
xlsx表格