import docx
import codecs
from difflib import HtmlDiff
# Compare the text of two Word documents and write the result as an HTML diff.
#
# Inputs : '文档1.docx' and '文档2.docx', resolved against the working directory.
# Output : 'diff.html', UTF-8 encoded; the extracted text of each document is
#          also printed to stdout.

# Load both documents with python-docx.
file1 = docx.Document('文档1.docx')
file2 = docx.Document('文档2.docx')

# Flatten each document into a single string, one newline after every
# paragraph. str.join replaces repeated `+` concatenation inside a loop.
para1 = ''.join(para.text + '\n' for para in file1.paragraphs)
print(para1)

para2 = ''.join(para.text + '\n' for para in file2.paragraphs)
print(para2)

# HtmlDiff.make_file expects two lists of lines. Splitting the joined text
# (rather than using one entry per paragraph) also breaks up paragraphs whose
# text itself contains line breaks.
delta_html = HtmlDiff().make_file(para1.splitlines(), para2.splitlines())

# Write the report explicitly as UTF-8 so non-ASCII text is stored correctly
# regardless of the platform's default encoding.
with codecs.open('diff.html', 'w', encoding='utf-8') as f:
    f.write(delta_html)
difflib模块的使用可参考:
http://blog.csdn.net/lockey23/article/details/77913855
Python-比较两份Word文档
最新推荐文章于 2024-12-23 21:10:59 发布