SOLO experiment log
6.12
Run evaluation on the test set
python tools/test_ins.py configs/solo/solo_r50_fpn_8gpu_1x.py download --show --out results_solo.pkl --eval segm
Model under test: SOLO_R50_1x
Training: 6.12-6.18
Command used:
python tools/train.py configs/solo/solo_r50_fpn_8gpu_1x.py
Training results:
6.16 Swap the backbone for MobileNetV2
Code changes
Remember to change the 4 on line 108 of /home/flora/SOLO/mmdet/models/anchor_heads/solo_head.py to 8 (MobileNetV2's output feature maps are downsampled by twice ResNet's factor, so the multiplier has to double to recover the original image size):
upsampled_size = (featmap_sizes[0][0] * 8, featmap_sizes[0][1] * 8)
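A minimal sketch (a hypothetical helper, not part of the SOLO code) of why the multiplier doubles: upsampled_size maps the first feature level back to a fixed reference resolution, so the factor equals that level's downsampling stride relative to that resolution, and a backbone whose feature maps are downsampled twice as much needs twice the factor.

def upsampled_size_for(featmap_size, stride_factor):
    # featmap_size: (H, W) of the first feature level;
    # stride_factor: how many times smaller that level is than the reference size
    return (featmap_size[0] * stride_factor, featmap_size[1] * stride_factor)

# ResNet-FPN first level -> factor 4; MobileNetV2 here is downsampled twice as much -> factor 8
print(upsampled_size_for((100, 152), 4))  # (400, 608)
print(upsampled_size_for((50, 76), 8))    # (400, 608), same reference resolution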
Experiment results
With the batch size set to 4, training started successfully, as shown below.
Loss up to epoch 12:
CUDA_VISIBLE_DEVICES=3 python tools/test_ins.py configs/solo/solo_mobilenetv2_fpn_8gpu_1x.py work_dirs/solo_release_mv2_fpn_8gpu_1x/epoch_10.pth --show --out results_solo.pkl --eval segm
MobileNet + pretrained weights
Training: 6.29 02:14 to 7.1 17:40
Results after loading the MobileNet pretrained weights
CUDA_VISIBLE_DEVICES=0,3 python tools/train.py configs/solo/solo_mobilenetv2_fpn_8gpu_1x.py --gpus 2
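For reference, a hypothetical sketch of where the pretrained weights plug into configs/solo/solo_mobilenetv2_fpn_8gpu_1x.py (mmdetection 1.x config style; the checkpoint path and backbone fields below are placeholders, not the actual values used in this run):

model = dict(
    type='SOLO',
    # ImageNet-pretrained MobileNetV2 weights (placeholder path);
    # omitting this field trains the backbone from scratch
    pretrained='/path/to/mobilenet_v2_imagenet.pth',
    # MobileNetV2 backbone registered in this fork of mmdet (assumed name)
    backbone=dict(type='MobileNetV2'))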
Model path
/home/flora/SOLO/work_dirs/solo_release_mv2_fpn_8gpu_1x_pretrained/epoch_12.pth
Test results
solo_head.py code
Teacher Zhang's inner-product modification
import mmcv
import torch
import torch.nn as nn
import torch.nn.functional as F
from mmcv.cnn import normal_init
from mmdet.ops import DeformConv, roi_align
from mmdet.core import multi_apply, bbox2roi, matrix_nms
from ..builder import build_loss
from ..registry import HEADS
from ..utils import bias_init_with_prob, ConvModule
import pdb  # zsc
from scipy import ndimage

INF = 1e8
def points_nms(heat, kernel=2):
    # kernel must be 2
    # keep a category score only where it equals the local 2x2 maximum
    # (a cheap NMS over the category heat map)
    hmax = nn.functional.max_pool2d(
        heat, (kernel, kernel), stride=1, padding=1)
    keep = (hmax[:, :, :-1, :-1] == heat).float()
    return heat * keep
def dice_loss(input, target):
    # Dice loss over flattened per-instance masks; the 0.001 terms avoid
    # division by zero for empty masks
    input = input.contiguous().view(input.size()[0], -1)
    target = target.contiguous().view(target.size()[0], -1).float()

    a = torch.sum(input * target, 1)
    b = torch.sum(input * input, 1) + 0.001
    c = torch.sum(target * target, 1) + 0.001
    d = (2 * a) / (b + c)
    return 1 - d
@HEADS.register_module
class SOLOHead(nn.Module):

    def __init__(self,
                 num_classes,
                 in_channels,
                 seg_feat_channels=256,
                 stacked_convs=4,
                 strides=(4, 8, 16, 32, 64),
                 base_edge_list=(16, 32, 64, 128, 256),
                 scale_ranges=((8, 32), (16, 64), (32, 128), (64, 256), (128, 512)),
                 sigma=0.4,
                 num_grids=None,
                 cate_down_pos=0,
                 with_deform=False,
                 loss_ins=None,
                 loss_cate=None,
                 conv_cfg=None,
                 norm_cfg=None):
        super(SOLOHead, self).__init__()
        self.num_classes = num_classes
        self.seg_num_grids = num_grids
        # the category branch does not predict the background class
        self.cate_out_channels = self.num_classes - 1
        self.in_channels = in_channels
        self.seg_feat_channels = seg_feat_channels
        self.stacked_convs = stacked_convs
        self.strides = strides
        self.sigma = sigma
        self.cate_down_pos = cate_down_pos
        self.base_edge_list = base_edge_list
        self.scale_ranges = scale_ranges
        self.with_deform = with_deform
        self.loss_cate = build_loss(loss_cate)
        self.ins_loss_weight = loss_ins['loss_weight']
        self.conv_cfg = conv_cfg
        self.norm_cfg = norm_cfg
        self._init_layers()
    def _init_layers(self):
        norm_cfg = dict(type='GN', num_groups=32, requires_grad=True)
        self.ins_convs = nn.ModuleList()
        self.cate_convs = nn.ModuleList()
        for i in range(self.stacked_convs):
            # +2 input channels on the first conv for the CoordConv x/y maps
            # concatenated in forward_single
            chn = self.in_channels + 2 if i == 0 else self.seg_feat_channels
            self.ins_convs.append(
                ConvModule(
                    chn,
                    self.seg_feat_channels,
                    3,
                    stride=1,
                    padding=1,
                    norm_cfg=norm_cfg,
                    bias=norm_cfg is None))

            chn = self.in_channels if i == 0 else self.seg_feat_channels
            self.cate_convs.append(
                ConvModule(
                    chn,
                    self.seg_feat_channels,
                    3,
                    stride=1,
                    padding=1,
                    norm_cfg=norm_cfg,
                    bias=norm_cfg is None))

        # one 1x1 conv per FPN level, acting on the S**2 instance channels
        self.solo_ins_list = nn.ModuleList()
        for seg_num_grid in self.seg_num_grids:
            self.solo_ins_list.append(
                nn.Conv2d(
                    seg_num_grid**2, seg_num_grid**2, 1))

        self.solo_cate = nn.Conv2d(
            self.seg_feat_channels, self.cate_out_channels, 3, padding=1)
    def init_weights(self):
        for m in self.ins_convs:
            normal_init(m.conv, std=0.01)
        for m in self.cate_convs:
            normal_init(m.conv, std=0.01)
        bias_ins = bias_init_with_prob(0.01)
        for m in self.solo_ins_list:
            normal_init(m, std=0.01, bias=bias_ins)
        bias_cate = bias_init_with_prob(0.01)
        normal_init(self.solo_cate, std=0.01, bias=bias_cate)
    def forward(self, feats, eval=False):
        new_feats = self.split_feats(feats)
        featmap_sizes = [featmap.size()[-2:] for featmap in new_feats]
        # reference size that the mask predictions are up-sampled to during inference
        upsampled_size = (featmap_sizes[0][0] * 2, featmap_sizes[0][1] * 2)
        ins_pred, cate_pred = multi_apply(self.forward_single, new_feats,
                                          list(range(len(self.seg_num_grids))),
                                          eval=eval, upsampled_size=upsampled_size)
        return ins_pred, cate_pred

    def split_feats(self, feats):
        # align the FPN levels used by SOLO: halve the finest level and resize
        # the coarsest one to the size of the fourth level
        return (F.interpolate(feats[0], scale_factor=0.5, mode='bilinear'),
                feats[1],
                feats[2],
                feats[3],
                F.interpolate(feats[4], size=feats[3].shape[-2:], mode='bilinear'))
    def forward_single(self, x, idx, eval=False, upsampled_size=None):
        ins_feat = x
        cate_feat = x
        # ins branch
        # concat coord: append normalized x/y coordinate maps (CoordConv) so the
        # instance branch is position-aware
        x_range = torch.linspace(-1, 1, ins_feat.shape[-1], device=ins_feat.device)
        y_range = torch.linspace(-1, 1, ins_feat.shape[-2], device=ins_feat.device)
        y, x = torch.meshgrid(y_range, x_range)
        y =