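# Python: tidy up the formatting of a txt file - split the text into sentences at each full stop ('。') and write the result to a new txt file.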
# -*- coding:utf-8 -*-
def split_sentences(lines):
    """Return the text of *lines* with one sentence per line.

    ASCII spaces are removed from every line, the lines are concatenated
    with no separator (so a sentence wrapped across several input lines is
    rejoined), and a line break is inserted after every Chinese full stop
    ('。').

    Args:
        lines: Iterable of strings without their line terminators.

    Returns:
        A single string; every '。' in it is followed by a newline.
        Returns an empty string when *lines* is empty.
    """
    # Joining first and replacing once yields the same text as replacing
    # per line, because '。' is a single character and cannot straddle
    # a line boundary.
    joined = "".join(line.replace(" ", "") for line in lines)
    return joined.replace("。", "。\n")


def reformat_file(src_path, dst_path):
    """Read *src_path*, split it into sentences, and write *dst_path*.

    Both files are handled as UTF-8 text. The destination file is
    created or overwritten.

    Args:
        src_path: Path of the txt file whose formatting should be fixed.
        dst_path: Path of the txt file to write the result to.
    """
    # Read the txt file that needs reformatting; splitlines() drops the
    # original line breaks so that they do not survive into the output.
    with open(src_path, "r", encoding="utf-8") as src:
        lines = src.read().splitlines()

    # Write the reformatted text to a new txt file in a single call.
    with open(dst_path, "w", encoding="utf-8") as dst:
        dst.write(split_sentences(lines))


if __name__ == '__main__':
    reformat_file("input/pre_data/one.txt", "input/pre_data/testz.txt")