标注文件xml和json转yolov5所需的txtb

最新推荐文章于 2024-08-07 11:40:50 发布

空空武士

最新推荐文章于 2024-08-07 11:40:50 发布

阅读量1.5k

点赞数 3

文章标签： python xml svg

本文链接：https://blog.csdn.net/qq_51993578/article/details/114952522

版权

xml转txt

import os
import xml.etree.ElementTree as ET
 
dirpath = r'C:\c\internet download\NEU-DET\NEU-DET\ANNOTATIONS'     #原来存放xml文件的目录
newdir = r'C:\c\internet download\NEU-DET\NEU-DET\yolo'  #修改label后形成的txt目录
 
if not os.path.exists(newdir):
    os.makedirs(newdir)
 
for fp in os.listdir(dirpath):
 
    root = ET.parse(os.path.join(dirpath,fp)).getroot()
 
    xmin, ymin, xmax, ymax = 0,0,0,0
    sz = root.find('size')
    
    width = float(sz[0].text)
    height = float(sz[1].text)
    filename = root.find('filename').text
    for child in root.findall('object'):         #找到图片中的所有框
        #print(child.find('name').text)
    
        sub = child.find('bndbox')               #找到框的标注值并进行读取
        label = 0
        xmin = float(sub[0].text)
        ymin = float(sub[1].text)
        xmax = float(sub[2].text)
        ymax = float(sub[3].text)
        try:                                     #转换成yolov3的标签格式，需要归一化到（0-1）的范围内
            x_center = (xmin + xmax) / (2 * width)
            y_center = (ymin + ymax) / (2 * height)
            w = (xmax - xmin) / width
            h = (ymax - ymin) / height
        except ZeroDivisionError:
            print(filename,'的 width有问题')
 
        with open(os.path.join(newdir, fp.split('.')[0]+'.txt'), 'a+') as f:
            f.write(' '.join([str(label), str(x_center), str(y_center), str(w), str(h) + '\n']))
 
print('ok')

json转txt

import json
import numpy as np

with open('train_annos.json', 'r') as fp:
     results=json.load(fp)

def get_yolo_box(dict_data):
    fname=dict_data['name'].split('.j')[0]
    xy=dict_data['bbox']
    w=dict_data['image_width']
    h=dict_data['image_height']
    out_x=np.mean([xy[0],xy[2]])/w
    out_y=np.mean([xy[1],xy[3]])/h
    out_w=(xy[2]-xy[0])/w
    out_h=(xy[3]-xy[1])/h
    out_string="{} {:.6f} {:.6f} {:.6f} {:.6f}\n".format(dict_data['category'],out_x,out_y,out_w,out_h)
    with open('./tcdata/tile_round1_train_20201231/train_imgs/'+fname+'.txt','a+') as f:
        f.write(out_string)

for dict_data in results:
    get_yolo_box(dict_data)