import pandas as pd
import numpy as np
import scipy.io
import tensorflow as tf
import os
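# Get the input and output file paths
# NOTE(review): get_file_path() is commented out here, but onehot() below still
# calls it; restore it or update onehot() unless it is defined elsewhere.
# def get_file_path():
# read_path = r"C:\Users\电力系统人工智能\Documents\pycharm\宽频\1"
# output_path = r"C:\Users\电力系统人工智能\Documents\pycharm\宽频\test1"
# return read_path,output_path
#
# # Process a single file (adapt this per-file processing code to each batch job); returns: finish_dfdata
# def get_deal_file(dfdata):
# pass
# Read the file names and their contents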
def deal_files(read_path=r"C:\Users\电力系统人工智能\Documents\pycharm\宽频\1",
               group_offsets=(0, 624, 1248, 1872, 2496),
               files_per_group=100,
               row_window=(4800, 6000),
               variable_name='Sample_i'):
    """Load a window of samples from .mat files and min-max normalise it.

    The file names in ``read_path`` are sorted, and for every offset in
    ``group_offsets`` the next ``files_per_group`` files are loaded. From each
    file the rows ``row_window[0]:row_window[1]`` of the ``variable_name``
    array are kept. Every resulting column is scaled independently to the
    range [0, 1], and the table is transposed before it is returned.

    Args:
        read_path: Directory containing the .mat files.
        group_offsets: Start positions (into the sorted file list) of each
            run of files to load.
        files_per_group: Maximum number of files taken from each offset.
        row_window: ``(start, stop)`` row slice kept from every file.
        variable_name: Key of the array to read from each .mat file.

    Returns:
        pandas.DataFrame with one row per loaded signal column and one
        column per row of the window. Rows appear in reverse loading order
        (the last file loaded comes first), matching the layout this
        function has always produced.

    Raises:
        ValueError: If no file is selected (for example, an empty directory).
        KeyError: If a file does not contain ``variable_name``.
    """
    # os.listdir() makes no ordering guarantee; sort so that the positional
    # slices below always select the same files.
    files = sorted(os.listdir(read_path))
    row_start, row_stop = row_window

    windows = []
    for offset in group_offsets:
        for file_name in files[offset:offset + files_per_group]:
            mat = scipy.io.loadmat(os.path.join(read_path, file_name))
            samples = pd.DataFrame(mat[variable_name])
            windows.append(samples.iloc[row_start:row_stop, :])

    if not windows:
        raise ValueError(
            "no sample files selected from {!r}".format(read_path))

    # Concatenate once instead of once per file (which re-copies everything
    # on every iteration). The list is reversed because the previous
    # implementation prepended each new file, so the newest file came first.
    merged = pd.concat(windows[::-1], axis=1, ignore_index=True)

    # Per-column min-max scaling.
    col_min = merged.min()
    col_span = merged.max() - col_min
    # A constant column has zero span; divide by 1 so it maps to 0, not NaN.
    col_span = col_span.where(col_span != 0, 1)

    return ((merged - col_min) / col_span).T
# 主函数
def onehot():
# 获取文件输入和输出路径
read_path,output_path = get_file_path()
# 开始处理文件,并输出处理文件结果