python逐个读取文件并处理_python 读取文件夹下的所有文件并处理重新分类写入...

import os

import sys

import io

import time

# sys.stdout = io.TextIOWrapper(sys.stdout.buffer,encoding='gb18030') #改变标准输出的默认编码

def read(path=r"C:\Users\mzj\Desktop\高精准", download_file_path=r'C:\Users\mzj\Desktop'):
    """Re-file every 'ztb' record found under *path* into dated folders.

    *path* is expected to contain sub-folders, each holding text files whose
    names consist of at least five '_'-separated parts, the first part
    starting with a YYYYMMDD date. Every line of such a file is a
    '|'-separated record; records whose ninth field equals 'ztb' are appended
    to::

        <download_file_path>/ztb/<YYYY-MM-DD>/<p0>_<p1>_ztb_<p3>_<p4>

    where p0..p4 are the parts of the source file name.

    Args:
        path: Root folder whose sub-folders are scanned.
        download_file_path: Folder under which the 'ztb' tree is created.

    Raises:
        OSError: If *path* itself cannot be listed. Problems with a single
            sub-folder or file are printed and skipped instead, so one bad
            input no longer stops the remaining files from being processed.
    """
    for folder_name in os.listdir(path):
        folder = os.path.join(path, folder_name)
        try:
            file_names = os.listdir(folder)
        except OSError as e:
            # Not a directory, or unreadable: report and move on.
            print(e)
            continue
        for file_name in file_names:
            try:
                _refile_records(os.path.join(folder, file_name), download_file_path)
            except (OSError, UnicodeError, ValueError) as e:
                # Failure is scoped to this one file only.
                print(e)


# Zero-based position of the category field inside a '|'-separated record.
_CATEGORY_INDEX = 8
# Category value that selects a record for re-filing.
_CATEGORY = 'ztb'


def _is_selected(record):
    """Return True when *record* carries the wanted category in its ninth field."""
    fields = record.split("|")
    # Blank or short lines simply do not match instead of raising IndexError.
    return len(fields) > _CATEGORY_INDEX and fields[_CATEGORY_INDEX] == _CATEGORY


def _refile_records(file_path, dest_root):
    """Append the selected records of one source file to its dated output file."""
    with open(file_path, "r", encoding="UTF-8") as src:
        records = [line.strip() for line in src]

    if len(records) < 2:
        # Too few lines: the file is not processed at all.
        print('行数太短了。。。。。。')
        return

    selected = [record for record in records if _is_selected(record)]
    if not selected:
        return

    file_name = os.path.basename(file_path)
    parts = file_name.split('_')
    if len(parts) < 5:
        raise ValueError('unexpected file name: {}'.format(file_name))

    # The leading YYYYMMDD of the file name becomes the YYYY-MM-DD folder.
    stamp = parts[0]
    date_dir = os.path.join(
        dest_root, _CATEGORY, stamp[:4] + '-' + stamp[4:6] + '-' + stamp[6:8])
    os.makedirs(date_dir, exist_ok=True)

    # Same name as the source, with the third part replaced by the category.
    out_name = '_'.join([parts[0], parts[1], _CATEGORY, parts[3], parts[4]])
    with open(os.path.join(date_dir, out_name), 'a', encoding='utf-8') as out:
        out.writelines(record + '\n' for record in selected)


if __name__ == '__main__':
    read()

import os

# Merge every file in the "out" folder into a single two.out file, deleting
# each source file once its content has been appended.
path = r'C:\Users\mzj\Desktop\city\city\out'
merged_file = r'C:\Users\mzj\Desktop\city\city\two.out'

for i in os.listdir(path):
    source_file = os.path.join(path, i)
    if not os.path.isfile(source_file):
        # Sub-directories cannot be opened as text; leave them alone.
        continue
    # Open the target once per source file and stream the lines across,
    # rather than reopening it for every single line.
    with open(source_file, 'r', encoding='utf-8') as r, \
            open(merged_file, 'a', encoding='utf-8') as f:
        f.writelines(r)
    # Delete only after both handles are closed.
    os.remove(source_file)
    print('写入成功{},删除成功{}'.format(source_file, source_file))

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值