根据yolo目标检测的检测框裁剪检测目标

万事云

已于 2023-07-26 14:19:22 修改

阅读量789

点赞数

分类专栏：目标检测　文章标签：计算机视觉、python、深度学习

于 2023-07-26 14:10:42 首次发布

本文链接：https://blog.csdn.net/CloudVans/article/details/131937862

版权

目标检测专栏收录该内容

1 篇文章 1 订阅

订阅专栏

根据已经训练好的模型在yolov5中检测抠图

首先，在detect代码中找到

parser.add_argument('--save-txt',  action='store_true', help='save results to *.txt')

添加 default=True（也可以不改代码，在运行 detect 时直接加上 --save-txt 参数），这一步是为了让检测时同时输出每张图片检测框的 txt 文件

parser.add_argument('--save-txt', default=True, action='store_true', help='save results to *.txt')

import os
import cv2
 
# Crop every detection described by a YOLO label file out of its image, and
# save a second copy of the image with all detected regions painted white.
#
# Each label line is read as "<class> <x_center> <y_center> <width> <height>",
# with the four box values multiplied by the image width/height below (i.e.
# they are treated as fractions of the image size). Extra trailing fields on a
# line are ignored.

path = 'runs/detect/exp4/exp4'        # folder holding each .jpg image next to its .txt label file
path3 = 'runs/cut_picture'    # output folder for the cropped detections
path2 = 'runs/crop_picture'   # output folder for the images with detections painted white

# Make sure both output folders exist before anything is written to them.
os.makedirs(path3, exist_ok=True)
os.makedirs(path2, exist_ok=True)

file = os.listdir(path)

# Split the folder listing into image stems and label stems. Only ".txt"
# files count as labels; anything else in the folder is ignored.
img_total = []
txt_total = []
for filename in file:
    first, last = os.path.splitext(filename)
    if last == ".jpg":
        img_total.append(first)
    elif last == ".txt":
        txt_total.append(first)

label_stems = set(txt_total)

for img_name in img_total:
    if img_name not in label_stems:
        continue

    filename_img = img_name + ".jpg"
    img = cv2.imread(os.path.join(path, filename_img))
    if img is None:
        # Unreadable or corrupt image: skip it instead of crashing on .shape.
        print("skip unreadable image: " + filename_img)
        continue

    h, w = img.shape[0], img.shape[1]
    # Crops are taken from the untouched `img`; the white boxes are painted on
    # a separate copy so overlapping detections do not end up with white
    # patches inside their crops.
    masked = img.copy()

    n = 1  # 1-based index of the crop within this image
    with open(os.path.join(path, img_name + ".txt"), "r", encoding="utf-8", errors="ignore") as f:
        for line in f:
            coordinate = line.split()
            if len(coordinate) < 5:
                continue  # blank or truncated line
            try:
                x_center = w * float(coordinate[1])       # box centre x, in pixels
                y_center = h * float(coordinate[2])       # box centre y, in pixels
                width = int(w * float(coordinate[3]))     # box width, in pixels
                height = int(h * float(coordinate[4]))    # box height, in pixels
            except ValueError:
                continue  # non-numeric field

            lefttopx = int(x_center - width / 2.0)
            lefttopy = int(y_center - height / 2.0)

            # NOTE(review): the +1 / +3 offsets are kept exactly as in the
            # original script; the asymmetric +3 on the bottom edge looks like
            # a typo -- confirm the intended margin.
            # The bounds are clamped to the image so that a box touching the
            # top/left edge cannot produce a negative (wrap-around) index.
            top = max(lefttopy + 1, 0)
            bottom = min(lefttopy + height + 3, h)
            left = max(lefttopx + 1, 0)
            right = min(lefttopx + width + 1, w)
            if bottom <= top or right <= left:
                continue  # degenerate box, nothing to crop

            filename_last = img_name + "_" + str(n) + ".jpg"    # file name of this crop
            cv2.imwrite(os.path.join(path3, filename_last), img[top:bottom, left:right])
            masked[top:bottom, left:right] = (255, 255, 255)
            n = n + 1

    # Save the masked image under the source image's own name rather than the
    # name of the last crop, so the name is always defined and never stale.
    cv2.imwrite(os.path.join(path2, filename_img), masked)