plots = not evolve # create plots
cuda = device.type != 'cpu'
init_seeds(1 + RANK)
with torch_distributed_zero_first(LOCAL_RANK):
    data_dict = data_dict or check_dataset(data)  # check if None
Here check_dataset resolves the train and val entries of the dataset YAML into full paths (path + train and path + val).
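For intuition, a hypothetical data_dict after check_dataset might look like this (the root directory, file names and class names below are invented, not taken from train.py):
data_dict = {
    'path': '../datasets/mydata',                # dataset root (invented example)
    'train': '../datasets/mydata/images/train',  # resolved as path + train
    'val': '../datasets/mydata/images/val',      # resolved as path + val
    'nc': 3,                                     # number of classes
    'names': ['cat', 'dog', 'bird'],             # class names, len(names) == nc
}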
train_path, val_path = data_dict['train'], data_dict['val']
nc = 1 if single_cls else int(data_dict['nc']) # number of classes
names = ['item'] if single_cls and len(data_dict['names']) != 1 else data_dict['names'] # class names
assert len(names) == nc, f'{len(names)} names found for nc={nc} dataset in {data}' # check
is_coco = isinstance(val_path, str) and val_path.endswith('coco/val2017.txt') # COCO dataset
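To see what the single_cls branch does, here is a toy run of the two lines above (values invented, not part of train.py):
single_cls = True
data_dict = {'nc': 3, 'names': ['cat', 'dog', 'bird']}  # invented toy dataset
nc = 1 if single_cls else int(data_dict['nc'])  # -> 1: everything is treated as one class
names = ['item'] if single_cls and len(data_dict['names']) != 1 else data_dict['names']  # -> ['item']
assert len(names) == nc  # 1 name for 1 class, so the check passes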
# Model
check_suffix(weights, '.pt') # check weights
pretrained = weights.endswith('.pt')
if pretrained:
    with torch_distributed_zero_first(LOCAL_RANK):
        weights = attempt_download(weights)  # download if not found locally
    ckpt = torch.load(weights, map_location=device)  # load checkpoint
    model = Model(cfg or ckpt['model'].yaml, ch=3, nc=nc, anchors=hyp.get('anchors')).to(device)  # create
    exclude = ['anchor'] if (cfg or hyp.get('anchors')) and not resume else []  # exclude keys
exclude lists the keys of parameters that should not be copied from the pretrained checkpoint into the current model.
    csd = ckpt['model'].float().state_dict()  # checkpoint state_dict as FP32
csd holds the pretrained model's parameters.
    csd = intersect_dicts(csd, model.state_dict(), exclude=exclude)  # intersect
intersect_dicts drops the excluded keys as well as any parameters that exist in the pretrained checkpoint but not in the current model (or whose shapes do not match).
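Conceptually, intersect_dicts keeps only checkpoint entries whose key also exists in the current model, is not excluded, and whose tensor shape matches. A simplified sketch of that behaviour (for illustration only, not the actual utils/torch_utils.py code):
def intersect_dicts_sketch(da, db, exclude=()):  # da: checkpoint state_dict, db: model state_dict
    return {k: v for k, v in da.items()
            if k in db and not any(x in k for x in exclude) and v.shape == db[k].shape}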
    model.load_state_dict(csd, strict=False)  # load
    LOGGER.info(f'Transferred {len(csd)}/{len(model.state_dict())} items from {weights}')  # report
else:
    model = Model(cfg, ch=3, nc=nc, anchors=hyp.get('anchors')).to(device)  # create
# Freeze
freeze = [f'model.{x}.' for x in (freeze if len(freeze) > 1 else range(freeze[0]))] # layers to freeze
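The freeze argument is either an explicit list of layer indices or a single count; a quick illustration of how it expands (value invented):
freeze = [10]  # invented example: freeze the first 10 layers (the backbone in standard YOLOv5 models)
freeze = [f'model.{x}.' for x in (freeze if len(freeze) > 1 else range(freeze[0]))]
# -> ['model.0.', 'model.1.', ..., 'model.9.']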
for k, v in model.named_parameters():
k is the parameter name (key) and v is the parameter tensor (value).
    v.requires_grad = True  # train all layers
    if any(x in k for x in freeze):
        LOGGER.info(f'freezing {k}')
        v.requires_grad = False  # layers listed in freeze are excluded from training
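After the loop, a quick sanity check of how many parameter tensors were frozen could look like this (illustrative snippet, not part of train.py; model and LOGGER come from the surrounding context):
n_frozen = sum(not v.requires_grad for v in model.parameters())  # frozen parameter tensors
n_total = len(list(model.parameters()))                          # all parameter tensors
LOGGER.info(f'{n_frozen}/{n_total} parameter tensors frozen')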