# Read data and group by label
def read_and_group_data(data_folder):
    """Load the CSV files in *data_folder* and merge their rows by label.

    A file's label is derived from its name: the text between the first and
    second underscore, cut at the first ".", with every non-alphabetic
    character removed (for example ``s1_walk2.csv`` -> ``"walk"``).

    Directory entries that are not regular files, or whose name yields no
    label (no underscore, or no letters in the label segment), are skipped
    instead of aborting the whole load.

    Args:
        data_folder: Path of the directory that holds the CSV files.

    Returns:
        A dict mapping each label to a ``pandas.DataFrame`` holding the rows
        of every file with that label, concatenated in sorted file-name
        order. Each file's original row index is kept. The dict is empty
        when no file matches.
    """
    frames_by_label = {}
    # os.listdir() returns entries in arbitrary order; sorting makes the row
    # order inside each label reproducible across runs and platforms.
    for file_name in sorted(os.listdir(data_folder)):
        path = os.path.join(data_folder, file_name)
        if not os.path.isfile(path):
            continue

        name_parts = file_name.split("_")
        if len(name_parts) < 2:
            # No underscore, so there is no label segment to read.
            continue

        segment = name_parts[1].split(".")[0]
        label = "".join(c for c in segment if c.isalpha())
        if not label:
            continue
        # A few Unicode characters are both alphabetic and numeric (e.g. CJK
        # numerals), so a trailing one can survive the filter above.
        if label[-1].isnumeric():
            label = label[:-1]

        df = pd.read_csv(path, encoding="ISO-8859-1")
        frames_by_label.setdefault(label, []).append(df)

    # Concatenate once per label rather than once per file, so earlier rows
    # are not copied again for every additional file.
    return {
        label: pd.concat(frames)
        for label, frames in frames_by_label.items()
    }
输入:数据文件夹的路径。每个文件的标签取自其文件名中第一个下划线之后的第一个英文单词(仅保留字母,去掉数字等其他字符)。输出:按标签归类数据的字典,键为标签,值为该标签下所有文件合并后的 DataFrame。