日常一些常用模块汇集【读取文件名】【json读取与保存】

Jennie_J

于 2021-09-29 15:03:27 发布

阅读量281

点赞数

分类专栏： python数据处理文章标签： json python

本文链接：https://blog.csdn.net/weixin_43685844/article/details/120548703

版权

python数据处理专栏收录该内容

31 篇文章 6 订阅

订阅专栏

def get_files(dir):
    """
    获取所有文件名
    :param dir: 目录
    :return: 目录下所有去重文件名的列表
    """
    file_list=[]
    for roots, dirs, files in os.walk(dir):
        for file in files:
            file_list.append(file.split('.')[0])
    return list(set(file_list))

def read_json(file_path):
    """
    json文件中存储多行内容
    读取json文件的每一行的内容 
    """
    with open(file_path,'r',encoding='utf-8') as f:
        for line in f.readlines():
            line_dict = json.loads(line)            
            print(line_dict)
            print('++++++++++++')

def save_json_result(dir_path,person_feat,person_index):
    """
    json文件中存储多行内容,每行一个dict
    """
    with open(dir_path+'text_person.json','w',encoding='utf-8') as f:
        out = {'data_id':None,'feat_value':None,'text_LabelIndex':None}
        for pid in person_feat.keys():
            out['data_id'] = pid
            out['feat_value'] = person_feat[pid]
            out['text_LabelIndex'] = person_index[pid]
            json.dump(out,f,ensure_ascii=False)
            f.write('\n')

def make_path(params):
    """
    Make folders for training and evaluation
    """
    if not os.path.isdir(params.result_path):
        os.makedirs(params.result_path)
    if not os.path.isdir(params.ckpt_path):
        os.makedirs(params.ckpt_path)
    if not os.path.isdir("log"):
        os.makedirs("log")

def writefile(filename,list,save_dir,sep=' '):
    """
    该函数负责将处理好的标注数据文件保存
    :param filename: 保存的文件名
    :param list: 要保存的列表
    :param sep: 字符和标注之间的分隔符
    :return:
    """
    save_file = os.path.join(save_dir,filename)
    with open(save_file,'w',encoding='utf-8') as f:
        for item in list:
            if item=='\n':
                f.write( '\n')
            else:
                f.write(sep.join(item) + '\n')

# 读取00和81组成train.txt，82作为test.txt
def concate_file(dir,files,filename,save_path,sep=' '):
    sentences=[]
    for name in files:
        t_file=os.path.join(dir,name+'.txt')
        for line in codecs.open(t_file, 'r', 'utf8'):
            line = line.replace('\r\n','').split(' ')
            sentences.append(line)
            if line[0] =='。' and line[1]=='O':
                sentences.append('\n')
    writefile(filename,sentences,save_path)

Jennie_J

关注

0
点赞
踩
1

收藏

觉得还不错? 一键收藏
0
评论
日常一些常用模块汇集【读取文件名】【json读取与保存】

def get_files(dir): """ 获取所有文件名 :param dir: 目录 :return: 目录下所有去重文件名的列表 """ file_list=[] for roots, dirs, files in os.walk(dir): for file in files: file_list.append(file.split('.')[0]) return list(set(file_
复制链接

扫一扫

专栏目录