VOC转yolov5格式

最新推荐文章于 2024-08-05 11:19:50 发布

One橙序猿

最新推荐文章于 2024-08-05 11:19:50 发布

阅读量1.5k

点赞数 6

分类专栏：数据集

本文链接：https://blog.csdn.net/rush9838465/article/details/120559802

版权

VOC数据集 YOLOv5 XML转换边界框图像标注

关键词由CSDN通过智能技术生成

数据集专栏收录该内容

1 篇文章 0 订阅

订阅专栏

import os
import shutil
import cv2
from lxml import etree


def VOC2Yolov5(class_num, voc_img_path, voc_xml_path, yolo_txt_save_path, yolo_img_save_path=None):
    """Convert Pascal VOC XML annotations into YOLOv5 label text files.

    Every ``*.xml`` file in ``voc_xml_path`` is parsed and, when all of its
    objects carry a label known to ``class_num``, a ``.txt`` file with the
    same stem is written to ``yolo_txt_save_path``. Each line has the form
    ``<class_id> <cx> <cy> <w> <h>``, where the box centre and size are
    divided by the image width/height.

    Args:
        class_num: Mapping from VOC label name to the numeric class id to
            write. An XML file containing a label missing from this mapping
            is skipped entirely (no txt is written, no image is copied).
        voc_img_path: Directory holding the ``.jpg`` images. Used to read the
            image size when the XML does not provide a non-zero one, and as
            the copy source when ``yolo_img_save_path`` is given.
        voc_xml_path: Directory holding the VOC ``.xml`` annotation files.
        yolo_txt_save_path: Output directory for the label files; created
            (including parents) if it does not exist.
        yolo_img_save_path: Optional output directory. When not ``None``, the
            image of every successfully converted XML is copied there.

    Returns:
        None. Progress and skipped files are reported with ``print``.
    """
    xmls = [x for x in os.listdir(voc_xml_path) if x.endswith('.xml')]
    # makedirs (not mkdir) so nested output paths such as
    # ".../yolov5/labels/train2017" work when the parents do not exist yet.
    if yolo_img_save_path is not None:
        os.makedirs(yolo_img_save_path, exist_ok=True)
    os.makedirs(yolo_txt_save_path, exist_ok=True)

    all_xmls = len(xmls)
    for idx, one_xml in enumerate(xmls, start=1):
        # splitext only strips the final extension; str.replace would also
        # rewrite a ".xml" occurring in the middle of the file name.
        stem = os.path.splitext(one_xml)[0]
        img_file = os.path.join(voc_img_path, stem + '.jpg')

        root = etree.parse(os.path.join(voc_xml_path, one_xml)).getroot()

        img_w = 0
        img_h = 0
        img_size = root.find('size')
        # Compare against None: an Element's truth value reflects its number
        # of children, not whether find() located it.
        if img_size is not None:
            img_width = img_size.find('width')
            if img_width is not None:
                img_w = int(img_width.text)
            img_height = img_size.find('height')
            if img_height is not None:
                img_h = int(img_height.text)

        label_lines = []
        for ob in root.findall('object'):
            label = ob.find('name').text
            bbox = ob.find('bndbox')
            # float() accepts both "12" and "12.5"; for integer coordinates
            # the resulting ratios are identical to integer parsing.
            xmin = float(bbox.find('xmin').text)
            ymin = float(bbox.find('ymin').text)
            xmax = float(bbox.find('xmax').text)
            ymax = float(bbox.find('ymax').text)

            if img_w == 0 or img_h == 0:
                # The XML has no usable size: fall back to the image itself.
                img = cv2.imread(img_file)
                if img is None:
                    # imread signals a missing/unreadable file with None.
                    print("cannot read image to get its size ", img_file, one_xml)
                    label_lines = []
                    break
                img_h, img_w = img.shape[:2]

            try:
                bbox_label = class_num[label]
            except KeyError as e:
                # One unknown label invalidates the whole annotation file.
                print("not find number label in class_num ", e, one_xml)
                label_lines = []
                break

            bbox_w = (xmax - xmin) / img_w
            bbox_h = (ymax - ymin) / img_h
            bbox_cx = (xmin + xmax) / 2 / img_w
            bbox_cy = (ymin + ymax) / 2 / img_h
            label_lines.append(f'{bbox_label} {bbox_cx} {bbox_cy} {bbox_w} {bbox_h}' + '\n')

        if label_lines:
            with open(os.path.join(yolo_txt_save_path, stem + '.txt'), 'w') as fp:
                fp.writelines(label_lines)
            if yolo_img_save_path is not None:
                shutil.copy(img_file, yolo_img_save_path)
        print(f"processing: {idx}/{all_xmls}")


if __name__ == '__main__':
    # Example run: convert a VOC-style dataset that has two classes.
    # Add a 'yolo_img_save_path' entry to also copy the converted images.
    conversion_args = {
        'class_num': {'person': 0, 'hat': 1},
        'voc_img_path': r'\VOC2028\JPEGImages',
        'voc_xml_path': r'\VOC2028\Annotations',
        'yolo_txt_save_path': r'\VOC2028\yolov5\labels\train2017',
    }
    VOC2Yolov5(**conversion_args)

输入参数：

class_num：label名到目标类别id的映射字典；如果某个xml中出现了该字典里没有的label名，这个xml会被整体跳过，不会生成对应的yolov5 txt

voc_img_path：voc图片文件夹

voc_xml_path：voc xml文件夹

yolo_txt_save_path： yolov5保存txt文件夹

yolo_img_save_path：（可选），如果不为 None，会将成功转换的xml所对应的图片从voc中拷贝到这个目录下

One橙序猿

关注

6
点赞
踩
11

收藏

觉得还不错? 一键收藏
1
评论
复制链接

分享到 QQ

分享到新浪微博

扫一扫

专栏目录