将YOLO数据集的txt标签转为VOC数据集的xml标签

import os
import xml.etree.ElementTree as ET
from xml.dom.minidom import parseString

# Define paths
images_path = "/mnt/data/fall_person/images/val/"  # 图片路径
labels_path = "/mnt/data/fall_person/labels/val/"  # TXT标注文件路径
output_path = "/mnt/data/fall_person/anchor/"  # 生成的XML文件存储路径

# 创建output目录(如果不存在)
if not os.path.exists(output_path):
    os.makedirs(output_path)

# 获取图片文件列表
image_files = [f for f in os.listdir(images_path) if f.endswith('.jpg') or f.endswith('.png')]

def create_xml(filename, img_width, img_height, objects):
    annotation = ET.Element("annotation")

    folder = ET.SubElement(annotation, "folder").text = "images"
    filename_tag = ET.SubElement(annotation, "filename").text = filename

    size = ET.SubElement(annotation, "size")
    ET.SubElement(size, "width").text = str(img_width)
    ET.SubElement(size, "height").text = str(img_height)
    ET.SubElement(size, "depth").text = "3"  # Assuming RGB images

    for obj in objects:
        obj_tag = ET.SubElement(annotation, "object")
        ET.SubElement(obj_tag, "name").text = obj['name']
        ET.SubElement(obj_tag, "pose").text = "Unspecified"
        ET.SubElement(obj_tag, "truncated").text = "0"
        ET.SubElement(obj_tag, "difficult").text = "0"

        bndbox = ET.SubElement(obj_tag, "bndbox")
        ET.SubElement(bndbox, "xmin").text = str(obj['xmin'])
        ET.SubElement(bndbox, "ymin").text = str(obj['ymin'])
        ET.SubElement(bndbox, "xmax").text = str(obj['xmax'])
        ET.SubElement(bndbox, "ymax").text = str(obj['ymax'])

    return annotation

def txt_to_xml(image_file):
    filename = os.path.splitext(image_file)[0]
    label_file = os.path.join(labels_path, filename + ".txt")
    image_file_path = os.path.join(images_path, image_file)
    
    if not os.path.exists(label_file):
      return
    # 读取图片的宽高(可以使用PIL或OpenCV读取图片尺寸)
    from PIL import Image
    img = Image.open(image_file_path)
    img_width, img_height = img.size

    objects = []
    with open(label_file, 'r') as file:
        for line in file.readlines():
            parts = line.strip().split()
            class_name = parts[0]
            # YOLO标注格式:class_id, center_x, center_y, width, height
            center_x = float(parts[1]) * img_width
            center_y = float(parts[2]) * img_height
            width = float(parts[3]) * img_width
            height = float(parts[4]) * img_height

            xmin = int(center_x - width / 2)
            ymin = int(center_y - height / 2)
            xmax = int(center_x + width / 2)
            ymax = int(center_y + height / 2)

            obj = {
                'name': class_name,
                'xmin': xmin,
                'ymin': ymin,
                'xmax': xmax,
                'ymax': ymax
            }
            objects.append(obj)

    annotation = create_xml(filename, img_width, img_height, objects)
    dom = parseString(ET.tostring(annotation))
    with open(os.path.join(output_path, filename + ".xml"), "w") as f:
        f.write(dom.toprettyxml(indent="\t"))

# 处理所有图片
for image_file in image_files:
    txt_to_xml(image_file)

print("转换完成!")

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包

打赏作者

lucky169

你的鼓励将是我创作的最大动力

¥1 ¥2 ¥4 ¥6 ¥10 ¥20
扫码支付:¥1
获取中
扫码支付

您的余额不足,请更换扫码支付或充值

打赏作者

实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值