PyTorch 官网文档(torch.optim)中给出了优化器 optim 的使用方法及示例。
下面是官方文档 "Taking an optimization step" 一节中的示例:
# One optimization step per sample: clear old gradients, run the forward
# pass, compute the loss, backpropagate, then let the optimizer update the
# parameters.
for inputs, targets in dataset:
    optimizer.zero_grad()
    prediction = model(inputs)
    loss = loss_fn(prediction, targets)
    loss.backward()
    optimizer.step()
构造优化器时,首先要传入参数 params(例如 model.parameters()),因为优化器需要知道哪些参数是可更新的。
每一步中,优化器根据各参数的梯度(grad)对参数进行更新,使 loss 逐渐减小。
import torch
import torchvision.datasets
from torch import nn
from torch.nn import Conv2d, MaxPool2d, Linear, Flatten, Sequential
from torch.utils.data import DataLoader
from torch.utils.tensorboard import SummaryWriter
# CIFAR-10 with train=False, stored under ./dataset (downloaded on demand);
# every image is converted to a tensor by ToTensor.
dataset = torchvision.datasets.CIFAR10(
    root="./dataset",
    train=False,
    transform=torchvision.transforms.ToTensor(),
    download=True,
)
# Feed the model one sample per batch.
dataloader = DataLoader(dataset=dataset, batch_size=1)
class Lixinyu(nn.Module):
    """Small convolutional classifier producing 10 scores per input image.

    The network is three ``Conv2d`` + ``MaxPool2d`` stages followed by
    ``Flatten`` and two ``Linear`` layers. The first ``Linear`` layer expects
    1024 features, which is what 3-channel 32x32 inputs produce
    (64 channels * 4 * 4 after three 2x poolings).
    """

    def __init__(self) -> None:
        super().__init__()
        # Kept under the attribute name ``model1`` so state_dict keys
        # ("model1.0.weight", ...) stay the same.
        self.model1 = Sequential(
            Conv2d(3, 32, 5, stride=1, padding=2),
            MaxPool2d(2),
            Conv2d(32, 32, 5, padding=2),
            MaxPool2d(2),
            Conv2d(32, 64, 5, padding=2),
            MaxPool2d(2),
            Flatten(),
            Linear(1024, 64),
            Linear(64, 10),
        )

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Run ``x`` through the sequential stack and return its output."""
        return self.model1(x)
# Loss function, model instance, and an SGD optimizer over the model's
# parameters.
loss = nn.CrossEntropyLoss()
lixinyu = Lixinyu()
optim = torch.optim.SGD(params=lixinyu.parameters(), lr=0.01)

# A single pass over the dataloader, one optimizer step per batch.
for imgs, targets in dataloader:
    # Clear gradients from the previous batch before computing new ones.
    optim.zero_grad()
    outputs = lixinyu(imgs)
    result_loss = loss(outputs, targets)
    result_loss.backward()
    optim.step()
    print(result_loss)
tensor(1.8779, grad_fn=<NllLossBackward0>)
tensor(1.7652, grad_fn=<NllLossBackward0>)
tensor(1.2320, grad_fn=<NllLossBackward0>)
tensor(0.9124, grad_fn=<NllLossBackward0>)
tensor(3.4349, grad_fn=<NllLossBackward0>)
tensor(0.6194, grad_fn=<NllLossBackward0>)
上面只对数据集训练了一轮(一个 epoch),可以在外面再套一层循环进行多轮训练。
对每一轮中所有 batch 的 loss 求和,观察每轮总 loss 的变化:
import torch
import torchvision.datasets
from torch import nn
from torch.nn import Conv2d, MaxPool2d, Linear, Flatten, Sequential
from torch.utils.data import DataLoader
from torch.utils.tensorboard import SummaryWriter
# CIFAR-10 with train=False, stored under ./dataset (downloaded on demand);
# every image is converted to a tensor by ToTensor.
dataset = torchvision.datasets.CIFAR10(
    root="./dataset",
    train=False,
    transform=torchvision.transforms.ToTensor(),
    download=True,
)
# Feed the model one sample per batch.
dataloader = DataLoader(dataset=dataset, batch_size=1)
class Lixinyu(nn.Module):
    """Small convolutional classifier producing 10 scores per input image.

    The network is three ``Conv2d`` + ``MaxPool2d`` stages followed by
    ``Flatten`` and two ``Linear`` layers. The first ``Linear`` layer expects
    1024 features, which is what 3-channel 32x32 inputs produce
    (64 channels * 4 * 4 after three 2x poolings).
    """

    def __init__(self) -> None:
        super().__init__()
        # Kept under the attribute name ``model1`` so state_dict keys
        # ("model1.0.weight", ...) stay the same.
        self.model1 = Sequential(
            Conv2d(3, 32, 5, stride=1, padding=2),
            MaxPool2d(2),
            Conv2d(32, 32, 5, padding=2),
            MaxPool2d(2),
            Conv2d(32, 64, 5, padding=2),
            MaxPool2d(2),
            Flatten(),
            Linear(1024, 64),
            Linear(64, 10),
        )

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Run ``x`` through the sequential stack and return its output."""
        return self.model1(x)
# Loss function, model instance, and an SGD optimizer over the model's
# parameters.
loss = nn.CrossEntropyLoss()
lixinyu = Lixinyu()
optim = torch.optim.SGD(lixinyu.parameters(), lr=0.01)

# Train for 20 epochs and report the summed loss of each epoch.
for epoch in range(20):
    running_loss = 0.0
    for data in dataloader:
        imgs, targets = data
        outputs = lixinyu(imgs)
        result_loss = loss(outputs, targets)
        optim.zero_grad()
        result_loss.backward()
        optim.step()
        # Accumulate a plain Python float. Adding the loss tensor itself
        # would keep every batch's autograd history reachable through
        # running_loss for the whole epoch.
        running_loss += result_loss.item()
    print(f"{epoch}:{running_loss}")