VOC数据集转YOLO数据集

1.xml转txt

import os.path
import xml.etree.ElementTree as ET

class_names = ['palm','stone','scissor','awesome','heartB','OK','ROCK','one','swear','thanks','heartA','heartC','good','bad','pray','call','take_picture','salute']

xmlpath='/data/tts/yohji.qian/dataset/hand18_1201/labels_voc/' #原xml路径
txtpath='/data/tts/yohji.qian/dataset/hand18_1201/labels/'     #转换后txt文件存放路径 
files = []

for root, dirs, files in os.walk(xmlpath):
    None

number = len(files)
print(number)
i = 0
while i < number:

    name = files[i][0:-4]
    xml_name = name + ".xml"
    txt_name = name + ".txt"
    xml_file_name = xmlpath + xml_name
    txt_file_name = txtpath + txt_name

    xml_file = open(xml_file_name)
    tree = ET.parse(xml_file)
    root = tree.getroot()
    filename = root.find('filename').text

    image_name = root.find('filename').text
    w = int(root.find('size').find('width').text)
    h = int(root.find('size').find('height').text)

    f_txt = open(txt_file_name, 'w+')
    content = ""

    first = True

    for obj in root.iter('object'):

        name = obj.find('name').text
        class_num = class_names.index(name)

        xmlbox = obj.find('bndbox')

        x1 = int(xmlbox.find('xmin').text)
        x2 = int(xmlbox.find('xmax').text)
        y1 = int(xmlbox.find('ymin').text)
        y2 = int(xmlbox.find('ymax').text)

        if first:
            content += str(class_num) + " " + \
                       str((x1 + x2) / 2 / w) + " " + str((y1 + y2) / 2 / h) + " " + \
                       str((x2 - x1) / w) + " " + str((y2 - y1) / h)
            first = False
        else:
            content += "\n" + \
                       str(class_num) + " " + \
                       str((x1 + x2) / 2 / w) + " " + str((y1 + y2) / 2 / h) + " " + \
                       str((x2 - x1) / w) + " " + str((y2 - y1) / h)

    # print(str(i / (number - 1) * 100) + "%\n")
    print(content)
    f_txt.write(content)
    f_txt.close()
    xml_file.close()
    i += 1

print("done!")

2.划分数据集为train、val、test,在ImageSets/Main文件夹下得到train.txt\val.txt\trainval.txt\test.txt,每行为对应图片文件名

import os
import random
import cv2

trainval_percent = 0.9  
train_percent = 0.9  

data_root = "/data/tts/yohji.qian/dataset/hand18_1201/"

fdir = data_root + 'ImageSets/Main/'
if not os.path.exists(fdir):
    os.makedirs(fdir)
xmlfilepath = data_root + 'txts/'
txtsavepath = fdir
total_xml = os.listdir(xmlfilepath)
random.shuffle(total_xml)

num = len(total_xml)
num_list = range(num)
tv = int(num * trainval_percent)
tr = int(tv * train_percent)
trainval = random.sample(num_list, tv)
trainval.sort(key=int)
train = random.sample(trainval, tr)
train.sort(key=int)

val = list(set(trainval) - set(train))
test = list(set(num_list) - set(trainval))

ftrainval = open(fdir + 'trainval.txt', 'w')
ftest = open(fdir + 'test.txt', 'w')
ftrain = open(fdir + 'train.txt', 'w')
fval = open(fdir + 'val.txt', 'w')

start = cv2.getTickCount()
for i in trainval:
    name = total_xml[i][:-4] + '\n'
    ftrainval.write(name)

for i in train:
    name = total_xml[i][:-4] + '\n'
    ftrain.write(name)

for i in val:
    name = total_xml[i][:-4] + '\n'
    fval.write(name)

for i in test:
    name = total_xml[i][:-4] + '\n'
    ftest.write(name)

end = cv2.getTickCount()
during = (end - start) / cv2.getTickFrequency()
print("time: {}".format(during))

ftrainval.close()
ftrain.close()
fval.close()
ftest.close()

3.根据Imagests/Main里分好的train、val、test需要的文件名,复制到images目录下,标注txt复制到labels目录下

import os
import shutil
from tqdm import tqdm

SPLIT_PATH = "/data/tts/yohji.qian/dataset/hand18_1201/ImageSets/Main"
IMGS_PATH = "/data/tts/yohji.qian/dataset/hand18_1201/JPEGImages"
TXTS_PATH = "/data/tts/yohji.qian/dataset/hand18_1201/txts"

TO_IMGS_PATH = '/data/tts/yohji.qian/dataset/hand18_1201/images'
TO_TXTS_PATH = '/data/tts/yohji.qian/dataset/hand18_1201/labels'


data_split = ['trainval.txt', 'test.txt']
to_split = ['train', 'val']

for index, split in enumerate(data_split):
    split_path = os.path.join(SPLIT_PATH, split)

    to_imgs_path = os.path.join(TO_IMGS_PATH, to_split[index])
    if not os.path.exists(to_imgs_path):
        os.makedirs(to_imgs_path)

    to_txts_path = os.path.join(TO_TXTS_PATH, to_split[index])
    if not os.path.exists(to_txts_path):
        os.makedirs(to_txts_path)

    f = open(split_path, 'r')
    count = 1

    for line in tqdm(f.readlines(), desc="{} is copying".format(to_split[index])):
        # 复制图片
        src_img_path = os.path.join(IMGS_PATH, line.strip() + '.jpg')
        dst_img_path = os.path.join(to_imgs_path, line.strip() + '.jpg')
        if os.path.exists(src_img_path):
            shutil.copyfile(src_img_path, dst_img_path)
        else:
            print("error file: {}".format(src_img_path))

        # 复制txt标注文件
        src_txt_path = os.path.join(TXTS_PATH, line.strip() + '.txt')
        dst_txt_path = os.path.join(to_txts_path, line.strip() + '.txt')
        if os.path.exists(src_txt_path):
            shutil.copyfile(src_txt_path, dst_txt_path)
        else:
            print("error file: {}".format(src_txt_path))

 

  • 3
    点赞
  • 41
    收藏
    觉得还不错? 一键收藏
  • 3
    评论
VOC数据换为YOLO格式的具体步骤如下: 1. 首先,确保你已经下载了VOC格式的数据集,并且了解VOC格式的数据集结构和标注方式。 2. 创建一个新的文件夹,用于存放换后的YOLO格式的数据集。 3. 遍历VOC数据集中的每个图像文件和相应的标注文件。 4. 对于每个图像文件,读取图像的宽度和高度。 5. 根据YOLO格式的要求,将图像的宽度和高度写入到YOLO格式的标注文件的第一行。 6. 对于每个标注文件,读取其中的每个标注框的类别和边界框的坐标。 7. 将每个边界框的坐标换为相对于图像宽度和高度的比例。 8. 将每个标注框的类别和换后的边界框坐标按照YOLO格式的要求写入到YOLO格式的标注文件。 9. 将换后的YOLO格式的标注文件保存到之前创建的文件夹中。 10. 重复上述步骤,直到遍历完所有的图像文件和标注文件。 请注意,以上步骤中的具体代码实现可以参考引用和引用中提供的代码示例,它们都是用来将VOC数据换为YOLO格式的工具。同时,关于文件之间的关系以及存放位置的问题,可以参考引用中的相关讲解。<span class="em">1</span><span class="em">2</span><span class="em">3</span> #### 引用[.reference_title] - *1* *3* [VOC格式数据yolo格式数据集的方法](https://blog.csdn.net/qq_40280673/article/details/125179556)[target="_blank" data-report-click={"spm":"1018.2226.3001.9630","extra":{"utm_source":"vip_chatgpt_common_search_pc_result","utm_medium":"distribute.pc_search_result.none-task-cask-2~all~insert_cask~default-1-null.142^v93^chatsearchT3_2"}}] [.reference_item style="max-width: 50%"] - *2* [voc数据yolo格式](https://download.csdn.net/download/qq_45389690/13712004)[target="_blank" data-report-click={"spm":"1018.2226.3001.9630","extra":{"utm_source":"vip_chatgpt_common_search_pc_result","utm_medium":"distribute.pc_search_result.none-task-cask-2~all~insert_cask~default-1-null.142^v93^chatsearchT3_2"}}] [.reference_item style="max-width: 50%"] [ .reference_list ]
评论 3
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值