介绍:
训练神经网络时,我们通常会加载预训练模型的参数。但有时需要对网络的某些层进行调整(例如修改输入通道数或分类类别数),这会导致预训练模型的参数与当前模型的参数不完全一致,此时只能加载预训练模型中与当前模型相匹配的那部分参数。
操作:
做法很简单:先从预训练参数中筛选出当前模型也包含的键,再用它们更新当前模型的 state_dict,最后把更新后的 state_dict 加载回模型。代码如下:
def change_key_names(old_params, in_channels):
    """Adapt a pretrained parameter mapping to a network with ``in_channels`` inputs.

    The first entry of ``old_params`` is averaged over dim 1 and the mean is
    tiled ``in_channels`` times along that dimension. The last two entries
    are dropped (the original code labels them as the fc layer). Every entry
    in between is passed through unchanged, as the same object.

    Args:
        old_params: Ordered mapping of parameter name to tensor. The first
            value is assumed to be a 4-D convolution weight laid out as
            (out_channels, in_channels, kH, kW) -- TODO confirm for
            checkpoints other than the ResNet ones used by the caller.
        in_channels: Number of input channels of the target first layer.

    Returns:
        collections.OrderedDict: The adapted parameters in their original
        order, without the last two entries of ``old_params``.
    """
    keys = list(old_params)
    # The trailing two entries are skipped. Clamp the slice bound so that a
    # mapping with fewer than two entries yields an empty result.
    kept_keys = keys[:max(len(keys) - 2, 0)]

    new_params = collections.OrderedDict()
    for index, key in enumerate(kept_keys):
        if index == 0:
            # Collapse the input-channel axis to its mean, then replicate
            # that single channel to the requested channel count.
            first_weight = old_params[key].detach()
            channel_mean = first_weight.mean(dim=1, keepdim=True)
            new_params[key] = channel_mean.repeat(1, in_channels, 1, 1)
        else:
            new_params[key] = old_params[key]
    return new_params
def flow_resnet34(pretrained=False, channels=20, num_classes=61):
    """Construct a ResNet-34 model whose input has ``channels`` channels.

    Args:
        pretrained (bool): If True, initialise the model from the
            ``resnet34`` checkpoint referenced by ``model_urls`` (described
            by the original docstring as pre-trained on ImageNet), after
            adapting it with ``change_key_names``.
        channels (int): Number of input channels, forwarded to ``ResNet``.
        num_classes (int): Number of output classes, forwarded to ``ResNet``.

    Returns:
        The constructed ``ResNet`` instance.
    """
    model = ResNet(BasicBlock, [3, 4, 6, 3], channels=channels, num_classes=num_classes)
    if not pretrained:
        return model

    # Use the pretrained checkpoint, adapted to this model's input channels.
    pretrained_dict = model_zoo.load_url(model_urls['resnet34'])
    model_dict = model.state_dict()
    adapted_dict = change_key_names(pretrained_dict, channels)

    # 1. Keep only entries this model also has. The shape check matters
    #    because a same-named parameter with a different shape would make
    #    load_state_dict raise; such entries keep their fresh initialisation.
    compatible_dict = {
        key: value
        for key, value in adapted_dict.items()
        if key in model_dict and value.shape == model_dict[key].shape
    }
    # 2. Overwrite the matching entries in the model's own state dict.
    model_dict.update(compatible_dict)
    # 3. Load the merged state dict; it is complete, so strict loading works.
    model.load_state_dict(model_dict)
    return model