批量读取文件

kitanoli

于 2022-06-20 17:32:54 发布

阅读量302

点赞数

文章标签： python 开发语言

本文链接：https://blog.csdn.net/neoistheone/article/details/125296602

版权

import pandas as pd
import numpy as np
import scipy.io
import tensorflow as tf

import os

# 获取文件路径
# def get_file_path():

#     read_path = r"C:\Users\电力系统人工智能\Documents\pycharm\宽频\1"
#     output_path = r"C:\Users\电力系统人工智能\Documents\pycharm\宽频\test1"
#     return read_path,output_path
#
# # 处理单个文件程序 /针对不同批量处理文件进行修改对文件的处理代码,返回值：finish_dfdata/
# def get_deal_file(dfdata):
#     pass


# 读取文件名称和内容
def deal_files(
    read_path=r"C:\Users\电力系统人工智能\Documents\pycharm\宽频\1",
    group_starts=(0, 624, 1248, 1872, 2496),
    files_per_group=100,
    row_slice=(4800, 6000),
    variable="Sample_i",
) -> pd.DataFrame:
    """Load a selection of .mat files and return min-max normalised samples.

    The directory listing is sorted, then for every offset in
    ``group_starts`` the next ``files_per_group`` file names are loaded with
    ``scipy.io.loadmat``.  From each file the array stored under
    ``variable`` is taken, rows ``row_slice[0]:row_slice[1]`` are kept, and
    all resulting columns are placed side by side.  Each column is then
    scaled to ``[0, 1]`` with ``(x - min) / (max - min)`` and the table is
    transposed, so every row of the result is one original column.

    Called without arguments the function uses the same directory, offsets,
    block size, row window and variable name that were previously
    hard-coded.

    Args:
        read_path: Directory containing the .mat files.
        group_starts: Indices into the sorted file list where each group of
            files begins.
        files_per_group: Number of consecutive files taken from each start.
        row_slice: ``(start, stop)`` row window kept from every file.
        variable: Key of the array inside each .mat file.

    Returns:
        A DataFrame with one row per loaded column and one column per kept
        row index.  Columns from later files come first, matching the
        original prepend-style accumulation.  A column whose values are all
        equal has ``max == min`` and therefore normalises to NaN.

    Raises:
        ValueError: If the selection does not contain any file.
    """
    # os.listdir returns names in arbitrary order; sort so that the
    # index-based group selection is reproducible.
    file_names = sorted(os.listdir(read_path))
    row_start, row_stop = row_slice

    pieces = []
    for start in group_starts:
        for file_name in file_names[start:start + files_per_group]:
            mat = scipy.io.loadmat(os.path.join(read_path, file_name))
            frame = pd.DataFrame(mat[variable])
            pieces.append(frame.iloc[row_start:row_stop, :])

    if not pieces:
        raise ValueError(
            "no files selected from %r with group_starts=%r"
            % (read_path, tuple(group_starts))
        )

    # The original code prepended every new file to the accumulated frame,
    # so the newest file ends up leftmost.  Reversing once and concatenating
    # a single time keeps that order without re-copying data per file.
    combined = pd.concat(pieces[::-1], axis=1, ignore_index=True)

    # Column-wise min-max scaling; the Series align on the column labels.
    col_min = combined.min()
    col_max = combined.max()
    normalised = (combined - col_min) / (col_max - col_min)
    return normalised.T

# 主函数
def onehot():
    # 获取文件输入和输出路径
    read_path,output_path = get_file_path()
    # 开始处理文件，并输出处理文件结果