【Pytorch实战系列】VGG11训练FashionMNIST数据集

目录

模型

代码

训练结果

总结


模型

代码

import torch
from torch import nn
from torchvision import datasets, transforms
from torch.utils.data import DataLoader
from tqdm import tqdm

# Load the data: both FashionMNIST splits share one preprocessing pipeline
# (convert to tensor, then Resize(224)) and one dataset root directory.
image_transform = transforms.Compose([transforms.ToTensor(), transforms.Resize(224)])
dataset_options = {"root": "../datasets/", "transform": image_transform, "download": True}
train_dataset = datasets.FashionMNIST(train=True, **dataset_options)
test_dataset = datasets.FashionMNIST(train=False, **dataset_options)
# Only the training split is shuffled; evaluation order stays fixed.
train_dataloader = DataLoader(train_dataset, batch_size=128, shuffle=True)
test_dataloader = DataLoader(test_dataset, batch_size=128, shuffle=False)

# Define the VGG network structure
class VGG11(nn.Module):
    """VGG-style CNN: a stack of conv blocks followed by a three-layer MLP head.

    Args:
        conv_arch: Iterable of ``(num_convs, out_channels)`` pairs, one per
            conv block. Must describe at least one block.
        in_channels: Number of channels of the input images (default 1).
        num_classes: Size of the output layer (default 10).

    Raises:
        ValueError: If ``conv_arch`` yields no blocks.

    Note:
        Every 3x3 convolution uses ``padding=1`` (spatial size preserved) and
        every block ends in a 2x2/stride-2 max-pool (spatial size halved).
        The classifier head expects the conv stack to output a 7x7 feature
        map, e.g. a 224x224 input through five blocks or a 28x28 input
        through two blocks.
    """

    def __init__(self, conv_arch, in_channels=1, num_classes=10):
        super().__init__()
        self.conv_blks = []
        self.conv_arch = conv_arch
        self.in_channels = in_channels
        self.conv_blocks()
        if not self.conv_blks:
            raise ValueError(
                "conv_arch must contain at least one (num_convs, out_channels) pair"
            )
        self.convs = nn.Sequential(*self.conv_blks)
        # Size the first linear layer from the channel count actually produced
        # by the conv stack instead of a hard-coded 128, so any conv_arch works.
        flat_features = self.feature_channels * 7 * 7
        self.linears = nn.Sequential(nn.Flatten(),
                                     nn.Linear(flat_features, 4096), nn.ReLU(), nn.Dropout(0.5),
                                     nn.Linear(4096, 4096), nn.ReLU(), nn.Dropout(0.5),
                                     nn.Linear(4096, num_classes))

    # Build a single VGG conv block
    def vgg_block(self, num_convs, in_channels, out_channels):
        """Return ``num_convs`` (3x3 conv + ReLU) pairs followed by a 2x2 max-pool."""
        layers = []
        for _ in range(num_convs):
            layers.append(nn.Conv2d(in_channels, out_channels, kernel_size=3, padding=1))
            layers.append(nn.ReLU())
            # Convolutions after the first one in a block keep the channel count.
            in_channels = out_channels
        layers.append(nn.MaxPool2d(kernel_size=2, stride=2))
        return nn.Sequential(*layers)

    def conv_blocks(self):
        """Append one block per ``conv_arch`` entry to ``self.conv_blks``.

        Also records the channel count leaving the last block in
        ``self.feature_channels`` so the classifier head can be sized from it.
        """
        # getattr keeps this method usable on instances that never set in_channels.
        in_channels = getattr(self, "in_channels", 1)
        for num_convs, out_channels in self.conv_arch:
            self.conv_blks.append(self.vgg_block(num_convs, in_channels, out_channels))
            in_channels = out_channels
        self.feature_channels = in_channels

    def forward(self, x):
        """Run the conv stack and then the classifier head; return the logits."""
        x = self.convs(x)
        x = self.linears(x)
        return x


# Per-block (num_convs, out_channels) configuration passed to VGG11.
conv_arch = ((1, 16), (1, 32), (2, 64), (2, 128), (2, 128))
device = "cuda:0" if torch.cuda.is_available() else "cpu"
vgg11 = VGG11(conv_arch).to(device)
# Hyperparameters
epochs = 10
lr = 1e-4
# Optimizer
optimizer = torch.optim.Adam(vgg11.parameters(), lr=lr)
# Loss function
loss_fn = nn.CrossEntropyLoss()
# Training: one pass over the training set, then one evaluation pass, per epoch
for epoch in range(epochs):
    # Enable dropout for the training pass (evaluation below switches it off).
    vgg11.train()
    train_loss_epoch = []
    for train_data, labels in tqdm(train_dataloader):
        train_data = train_data.to(device)
        labels = labels.to(device)
        y_hat = vgg11(train_data)
        loss = loss_fn(y_hat, labels)
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        # .item() stores a plain Python float rather than a tensor/array.
        train_loss_epoch.append(loss.item())

    print(f'epoch:{epoch}, train_loss:{sum(train_loss_epoch) / len(train_loss_epoch)}')

    # Disable dropout so the test metrics come from the deterministic network.
    vgg11.eval()
    with torch.no_grad():
        test_loss_epoch = []
        right = 0
        for test_data, labels in tqdm(test_dataloader):
            test_data = test_data.to(device)
            labels = labels.to(device)
            y_hat = vgg11(test_data)
            loss = loss_fn(y_hat, labels)
            test_loss_epoch.append(loss.item())
            # Count correct predictions as a Python int so acc prints as a number.
            right += (torch.argmax(y_hat, 1) == labels).sum().item()
        acc = right / len(test_dataset)
        print(f'test_loss:{sum(test_loss_epoch) / len(test_loss_epoch)}, acc:{acc}')

训练结果

总结

原始 VGG11 的卷积通道数较大,训练耗时过长,因此这里把每个卷积块的输出通道数都缩小为原来的 1/4(64/128/256/512/512 → 16/32/64/128/128),其余结构保持不变。

  • 13
    点赞
  • 10
    收藏
    觉得还不错? 一键收藏
  • 1
    评论
好的,关于softmax回归在PyTorch中的实现,针对FashionMNIST数据集的话,可以按照以下步骤进行。

首先,需要引入相应的包:

```
import torch
import torchvision
from torch.utils.data import DataLoader
import torch.nn.functional as F
```

然后,准备数据集:

```
# 准备训练集和测试集
train_dataset = torchvision.datasets.FashionMNIST(root='./data/FashionMNIST', train=True, transform=torchvision.transforms.ToTensor(), download=True)
test_dataset = torchvision.datasets.FashionMNIST(root='./data/FashionMNIST', train=False, transform=torchvision.transforms.ToTensor(), download=True)

# 定义数据加载器
train_loader = DataLoader(dataset=train_dataset, batch_size=64, shuffle=True)
test_loader = DataLoader(dataset=test_dataset, batch_size=64, shuffle=False)
```

接下来,定义模型:

```
# 定义模型
class SoftmaxRegression(torch.nn.Module):
    def __init__(self):
        super(SoftmaxRegression, self).__init__()
        self.linear = torch.nn.Linear(784, 10)

    def forward(self, x):
        x = x.reshape(x.shape[0], -1)
        logits = self.linear(x)
        return logits
```

然后,定义优化器和损失函数:

```
# 定义优化器和损失函数
model = SoftmaxRegression()
optimizer = torch.optim.SGD(model.parameters(), lr=0.1)
criterion = torch.nn.CrossEntropyLoss()
```

接着,进行模型训练:

```
# 模型训练
num_epochs = 10
for epoch in range(num_epochs):
    for i, (images, labels) in enumerate(train_loader):
        # 前向传播及计算损失
        outputs = model(images)
        loss = criterion(outputs, labels)

        # 反向传播及优化
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        if (i+1) % 100 == 0:
            print("Epoch [{}/{}], Step [{}/{}], Loss: {:.4f}".format(epoch+1, num_epochs, i+1, len(train_loader), loss.item()))
```

最后,进行模型测试:

```
# 模型测试
with torch.no_grad():
    correct = 0
    total = 0
    for images, labels in test_loader:
        outputs = model(images)
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
    print('Accuracy of the model on the 10000 test images: {} %'.format(100 * correct / total))
```

这样,就可以在PyTorch中实现softmax回归,利用FashionMNIST数据集进行模型训练和测试了。

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论 1
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值