【导入数据集】
# 导入数据 数据集的h5文件
import h5py
# Training set.
# Raw string literals keep the Windows backslashes literal: in a normal
# string '\p' and '\d' are invalid escape sequences, which newer Python
# versions warn about. The resulting path value is unchanged.
train_data = h5py.File(r'E:\pycharmTest\datasets/train_catvnoncat.h5', 'r')
# Test set (opened read-only, same as the training set).
test_data = h5py.File(r'E:\pycharmTest\datasets/test_catvnoncat.h5', 'r')
【查看数据格式】
# Inspect the data: list every top-level key stored in the training file.
for key in train_data.keys():  # iterate over the keys
    print(key)  # loop body must be indented, otherwise Python raises IndentationError
# Author's notes on the keys printed above:
#   classes      1/0
#   train_set_x  key
#   train_set_y  value, the 1/0 labels
print(train_data['train_set_x'].shape)  # shape of the data stored under this key
# Recorded output: [(209, 64, 64, 3)] -> 209 images, 64 x 64, 3 channels (RGB)
print(train_data['train_set_x'][:1])  # first entry only, as a length-1 slice
print(train_data['train_set_y'].shape)
【取出训练集、测试集】
# Read the full contents of every dataset with a whole-range slice.
# "org" marks the original (unprocessed) data; the author notes the training
# images as [209, 64, 64, 3].
train_data_org, train_labels_org = (
    train_data[name][:] for name in ('train_set_x', 'train_set_y')
)
test_data_org, test_labels_org = (
    test_data[name][:] for name in ('test_set_x', 'test_set_y')
)
# Added: optional preview of the data.
# View an image (uncomment the two plt lines below to display it).
import matplotlib.pyplot as plt
#plt.imshow(train_data_org[148])  # the image at index 148
#plt.show()
【数据处理】
# 数据维度的处理
import numpy as np
# Sample counts: the length of the first axis of each label array.
m_train, m_test = train_labels_org.shape[0], test_labels_org.shape[0]
# Debug output, left disabled:
#print(m_test)
#print(m_train)
train_da