17.1 Using an Optimizer, with SGD as the Example
Reference: official documentation link
Code implementation (adding an optimizer to the code from Note 16)
import torch
import torchvision
from torch import nn
from torch.nn import Conv2d, MaxPool2d, Flatten, Linear, Sequential
from torch.utils.data import DataLoader

dataset = torchvision.datasets.CIFAR10("../data", train=False, transform=torchvision.transforms.ToTensor(),
                                       download=True)
dataloader = DataLoader(dataset, batch_size=1)


class Avlon(nn.Module):
    def __init__(self):
        super().__init__()
        self.model1 = Sequential(
            Conv2d(3, 32, 5, padding=2),
            MaxPool2d(2),
            Conv2d(32, 32, 5, padding=2),
            MaxPool2d(2),
            Conv2d(32, 64, 5, padding=2),
            MaxPool2d(2),
            Flatten(),
            Linear(1024, 64),
            Linear(64, 10)
        )

    def forward(self, x):
        x = self.model1(x)
        return x


loss = nn.CrossEntropyLoss()
avlon = Avlon()
optim = torch.optim.SGD(avlon.parameters(), lr=0.01)  # stochastic gradient descent: network parameters, learning rate

for epoch in range(20):
    running_loss = 0.0  # reset the accumulated loss at the start of each epoch
    for data in dataloader:
        imgs, targets = data
        outputs = avlon(imgs)
        result_loss = loss(outputs, targets)
        optim.zero_grad()  # zero the gradient of every tunable parameter in the model
        result_loss.backward()  # compute the gradient of every tunable parameter
        optim.step()  # update every parameter using its gradient
        running_loss = running_loss + result_loss.item()  # .item() extracts the scalar so the graph isn't kept alive
    print(running_loss)
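The optim.zero_grad() call matters because PyTorch accumulates gradients across backward() calls rather than overwriting them. Below is a minimal sketch demonstrating the accumulation; the tensor w is purely illustrative:

import torch

w = torch.tensor(1.0, requires_grad=True)
(w * 2).backward()
print(w.grad)  # tensor(2.) -- d(2w)/dw = 2
(w * 2).backward()
print(w.grad)  # tensor(4.) -- the second gradient was added to the first, not overwritten

Without zero_grad() before each backward(), optim.step() would update the parameters with the sum of all past gradients instead of the current one.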
After running it, the accumulated loss printed each epoch does indeed decrease gradually.
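The same three-step pattern (zero_grad, backward, step) works for any model. As a quick sanity check that does not require downloading CIFAR10, here is a toy linear-regression sketch; the data and hyperparameters are made up for illustration:

import torch
from torch import nn

x = torch.randn(64, 3)                                  # 64 samples, 3 features
y = x @ torch.tensor([[1.0], [2.0], [3.0]]) + 0.5       # ground-truth linear target

model = nn.Linear(3, 1)
loss_fn = nn.MSELoss()
optim = torch.optim.SGD(model.parameters(), lr=0.05)

for step in range(200):
    pred = model(x)
    l = loss_fn(pred, y)
    optim.zero_grad()   # clear gradients from the previous step
    l.backward()        # compute gradients for every parameter
    optim.step()        # update parameters using the gradients
print(l.item())         # the loss shrinks toward zero as the fit improves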
# For more on backpropagation and gradient descent, see Andrew Ng's machine learning video course
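SGD is just one of the optimizers in torch.optim. Switching to a different one, such as Adam, only changes the line that constructs the optimizer; the training loop stays identical. A sketch, with learning rates that are illustrative rather than tuned:

# Either line can replace the SGD construction above; the loop is unchanged.
optim = torch.optim.SGD(avlon.parameters(), lr=0.01, momentum=0.9)  # SGD with momentum
optim = torch.optim.Adam(avlon.parameters(), lr=1e-3)               # Adam, an adaptive-learning-rate optimizer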