Converting YOLO-format labels to XML (VOC) and JSON (COCO)

I. YOLO training labels are in txt format; each line is:

class  center_x  center_y  width  height   (all values except the class index are normalized to [0, 1] by the image width/height)
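
As a quick worked example with a made-up label line and image size, one line converts to pixel corner coordinates like this (the same arithmetic the script in the next section applies):

# Hypothetical example: one YOLO label line and a 640x480 image
line = "0 0.5 0.5 0.25 0.5"            # class cx cy w h (normalized)
img_w, img_h = 640, 480

cls, cx, cy, w, h = line.split()
cx, cy, w, h = float(cx), float(cy), float(w), float(h)

xmin = int(img_w * (cx - w / 2.0))     # 240
ymin = int(img_h * (cy - h / 2.0))     # 120
xmax = int(img_w * (cx + w / 2.0))     # 400
ymax = int(img_h * (cy + h / 2.0))     # 360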

II. VOC dataset labels are xml files: converting txt to xml

(1) yolo_txt_2voc_xmltxt(): generates an index of the txt label files, which is then used to build the xml files. Each line of the index file has the format:

        filename  class  xmin  ymin  xmax  ymax   (top-left and bottom-right corners in pixels)

import os
import cv2

# Class-index -> class-name mapping used when writing the index file.
classname = ['class0', 'class1']  # placeholder: replace with the class names from your coco.names / label_list.txt, in index order

def yolo_txt_2voc_xmltxt():
    k = 0
    g = os.walk("/data/my_docker/lyy/wj_dataset/WJ_DATA/labels/test/")  # directory of YOLO txt labels
    txtpath = "/data/my_docker/lyy/wj_dataset/WJ_DATA/voc_xml_txt.txt"  # index file to generate
    imgpath = '/data/my_docker/lyy/wj_dataset/WJ_DATA/images/test/'     # image directory
    with open(txtpath, 'w') as txtfile:
        for path, d, filelist in g:
            for filename in filelist:
                if filename.endswith('txt'):
                    print(k)
                    imgname = imgpath + filename.split('.')[0] + '.png'
                    img = cv2.imread(imgname)
                    height, wide = img.shape[0], img.shape[1]
                    ttfile = os.path.join(path, filename)
                    with open(ttfile, 'r') as fi:
                        for i in fi.readlines():
                            if len(i) > 0:
                                box = i.split(' ')
                                class_id = int(box[0])
                                # YOLO stores normalized center/size; convert to pixel corner coordinates
                                x = float(box[1])
                                y = float(box[2])
                                wp = float(box[3])
                                hp = float(box[4])
                                xmin = int(wide * (x - wp / 2.0))
                                ymin = int(height * (y - hp / 2.0))
                                xmax = int(wide * (x + wp / 2.0))
                                ymax = int(height * (y + hp / 2.0))

                                txtfile.writelines(str(imgname) + ' ' + str(classname[class_id]) + ' ' + str(xmin) + ' ' + str(ymin)
                                                   + ' ' + str(xmax) + ' ' + str(ymax) + '\n')
                k = k + 1
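
Each line of the generated voc_xml_txt.txt index then looks like this (hypothetical image path and class name):

/data/my_docker/lyy/wj_dataset/WJ_DATA/images/test/0001.png car 240 120 400 360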

(2) txt2xml(): reads the voc_xml_txt.txt index line by line and, following the anno.xml template, writes the xml file corresponding to each txt label into the Annotations folder.

import copy
import cv2
from xml.etree.ElementTree import ElementTree

def txt2xml():
    template_file = '/data/my_docker/lyy/wj_dataset/WJ_DATA/anno.xml'  # xml template
    target_dir = '/data/my_docker/lyy/wj_dataset/WJ_DATA/Annotations/'
    train_file = '/data/my_docker/lyy/wj_dataset/WJ_DATA/voc_xml_txt.txt'  # index file with the box info
    path = '/data/my_docker/lyy/wj_dataset/WJ_DATA/images/test/'  # image directory

    with open(train_file) as f:
        trainfiles = f.readlines()  # annotation lines, format: filename label x_min y_min x_max y_max

    file_names = []
    tree = ElementTree()

    for line in trainfiles:
        trainFile = line.split()
        file_name = trainFile[0]

        file_name = file_name.split('/')[-1]
        print(file_name)
        # First time this image appears: fill in a fresh copy of the template.
        # (Each box of an image sits on its own line in the index, so a repeated
        # filename means an additional box for an image already processed.)
        if file_name not in file_names:

            file_names.append(file_name)
            label = trainFile[1]
            xmin = trainFile[2]
            ymin = trainFile[3]
            xmax = trainFile[4]
            ymax = trainFile[5]

            tree.parse(template_file)
            root = tree.getroot()
            root.find('filename').text = file_name
            # path
            root.find('path').text = path + file_name

            # size
            sz = root.find('size')
            im = cv2.imread(path + file_name)  # read the image to get its dimensions

            sz.find('height').text = str(im.shape[0])
            sz.find('width').text = str(im.shape[1])
            sz.find('depth').text = str(im.shape[2])

            # object: the template contains exactly one object node
            obj = root.find('object')

            obj.find('name').text = label
            bb = obj.find('bndbox')
            bb.find('xmin').text = xmin
            bb.find('ymin').text = ymin
            bb.find('xmax').text = xmax
            bb.find('ymax').text = ymax
        # Image seen before: append another object node to the xml written earlier.
        else:
            label = trainFile[1]
            xmin = trainFile[2]
            ymin = trainFile[3]
            xmax = trainFile[4]
            ymax = trainFile[5]
            # Compare as numbers (not strings) and skip degenerate boxes,
            # otherwise the stale tree from the previous iteration would be rewritten.
            if float(xmin) >= float(xmax) or float(ymin) >= float(ymax):
                continue
            xml_file = file_name.replace('png', 'xml')
            tree.parse(target_dir + xml_file)  # reload the xml already written for this image
            root = tree.getroot()

            obj_ori = root.find('object')

            obj = copy.deepcopy(obj_ori)  # deep copy so the existing object node is untouched

            obj.find('name').text = label
            bb = obj.find('bndbox')
            bb.find('xmin').text = xmin
            bb.find('ymin').text = ymin
            bb.find('xmax').text = xmax
            bb.find('ymax').text = ymax
            root.append(obj)

        xml_file = file_name.replace('png', 'xml')
        tree.write(target_dir + xml_file, encoding='utf-8')
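
Assuming both functions and the imports above sit in one script, a minimal driver sketch just calls them in order:

if __name__ == '__main__':
    yolo_txt_2voc_xmltxt()   # step 1: build the voc_xml_txt.txt index from the YOLO txt labels
    txt2xml()                # step 2: write one Pascal VOC xml per image into Annotations/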

anno.xml template format (copy this file into the corresponding directory):

<annotation verified="yes">
    <folder>train_small</folder>
    <filename>slipper0-113.jpg</filename>
    <path>/home/hesongze/PycharmProjects/keras-yolo2-master/raccoon_dataset-master/train_small/slipper0-113.jpg</path>
    <source>
        <database>Unknown</database>
    </source>
    <size>
        <width>1280</width>
        <height>1280</height>
        <depth>3</depth>
    </size>
    <segmented>0</segmented>
    <object>
        <name>slipper</name>
        <pose>Unspecified</pose>
        <truncated>0</truncated>
        <difficult>0</difficult>
        <bndbox>
            <xmin>79</xmin>
            <ymin>351</ymin>
            <xmax>1279</xmax>
            <ymax>961</ymax>
        </bndbox>
    </object>
</annotation>

III. Converting the xml files to a COCO-style json file

(1) voc_filetxt(): reads the xml files under Annotations and generates voc_train.txt, whose lines have the format:

    image_path  xml_path

def voc_filetxt():
    k = 0
    xml_file = os.walk("/data/my_docker/lyy/wj_dataset/WJ_DATA/Annotations/")  # xml directory
    txtpath = "/data/my_docker/lyy/wj_dataset/WJ_DATA/voc_train.txt"  # index file: image_path xml_path
    imgpath = '/data/my_docker/lyy/wj_dataset/WJ_DATA/images/test/'   # image directory
    with open(txtpath, 'w') as txtfile:
        for path, d, filelist in xml_file:
            for filename in filelist:
                if filename.endswith('xml'):
                    print(k)
                    imgname = imgpath + filename.split('.')[0] + '.png'
                    xmlfile = os.path.join(path, filename)
                    txtfile.writelines(imgname + ' ' + xmlfile + '\n')
                k = k + 1
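
Each line of the generated voc_train.txt then pairs an image with its xml file (hypothetical filenames):

/data/my_docker/lyy/wj_dataset/WJ_DATA/images/test/0001.png /data/my_docker/lyy/wj_dataset/WJ_DATA/Annotations/0001.xml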

(2) x2coco.py: loads the files and converts the xml annotations into voc.json. Run:

python x2coco.py --dataset_type voc --voc_anno_dir /your_path/Annotations/ --voc_anno_list /your_path/voc_train.txt --voc_label_list /your_path/label_list.txt

/your_path/Annotations/: directory containing the xml files

/your_path/voc_train.txt: the image-xml index file generated in the previous step

/your_path/label_list.txt: the training category file, i.e. the coco.names used for YOLO training; note that class names must not contain spaces. An example is shown below.
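
label_list.txt simply holds one class name per line, for example (made-up classes):

car
person
truck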

The x2coco.py script:

import argparse
import glob
import json
import os
import os.path as osp
import shutil
import xml.etree.ElementTree as ET
from tqdm import tqdm

import numpy as np
import PIL.ImageDraw

label_to_num = {}
categories_list = []
labels_list = []


class MyEncoder(json.JSONEncoder):
    def default(self, obj):
        if isinstance(obj, np.integer):
            return int(obj)
        elif isinstance(obj, np.floating):
            return float(obj)
        elif isinstance(obj, np.ndarray):
            return obj.tolist()
        else:
            return super(MyEncoder, self).default(obj)


def images_labelme(data, num):
    image = {}
    image['height'] = data['imageHeight']
    image['width'] = data['imageWidth']
    image['id'] = num + 1
    if '\\' in data['imagePath']:
        image['file_name'] = data['imagePath'].split('\\')[-1]
    else:
        image['file_name'] = data['imagePath'].split('/')[-1]
    return image


def images_cityscape(data, num, img_file):
    image = {}
    image['height'] = data['imgHeight']
    image['width'] = data['imgWidth']
    image['id'] = num + 1
    image['file_name'] = img_file
    return image


def categories(label, labels_list):
    category = {}
    category['supercategory'] = 'component'
    category['id'] = len(labels_list) + 1
    category['name'] = label
    return category


def annotations_rectangle(points, label, image_num, object_num, label_to_num):
    annotation = {}
    seg_points = np.asarray(points).copy()
    seg_points[1, :] = np.asarray(points)[2, :]
    seg_points[2, :] = np.asarray(points)[1, :]
    annotation['segmentation'] = [list(seg_points.flatten())]
    annotation['iscrowd'] = 0
    annotation['image_id'] = image_num + 1
    annotation['bbox'] = list(
        map(float, [
            points[0][0], points[0][1], points[1][0] - points[0][0], points[1][
                1] - points[0][1]
        ]))
    annotation['area'] = annotation['bbox'][2] * annotation['bbox'][3]
    annotation['category_id'] = label_to_num[label]
    annotation['id'] = object_num + 1
    return annotation


def annotations_polygon(height, width, points, label, image_num, object_num,
                        label_to_num):
    annotation = {}
    annotation['segmentation'] = [list(np.asarray(points).flatten())]
    annotation['iscrowd'] = 0
    annotation['image_id'] = image_num + 1
    annotation['bbox'] = list(map(float, get_bbox(height, width, points)))
    annotation['area'] = annotation['bbox'][2] * annotation['bbox'][3]
    annotation['category_id'] = label_to_num[label]
    annotation['id'] = object_num + 1
    return annotation


def get_bbox(height, width, points):
    polygons = points
    mask = np.zeros([height, width], dtype=np.uint8)
    mask = PIL.Image.fromarray(mask)
    xy = list(map(tuple, polygons))
    PIL.ImageDraw.Draw(mask).polygon(xy=xy, outline=1, fill=1)
    mask = np.array(mask, dtype=bool)
    index = np.argwhere(mask == 1)
    rows = index[:, 0]
    clos = index[:, 1]
    left_top_r = np.min(rows)
    left_top_c = np.min(clos)
    right_bottom_r = np.max(rows)
    right_bottom_c = np.max(clos)
    return [
        left_top_c, left_top_r, right_bottom_c - left_top_c,
        right_bottom_r - left_top_r
    ]


def deal_json(ds_type, img_path, json_path):
    data_coco = {}
    images_list = []
    annotations_list = []
    image_num = -1
    object_num = -1
    for img_file in os.listdir(img_path):
        img_label = os.path.splitext(img_file)[0]
        if img_file.split('.')[
                -1] not in ['bmp', 'jpg', 'jpeg', 'png', 'JPEG', 'JPG', 'PNG']:
            continue
        label_file = osp.join(json_path, img_label + '.json')
        print('Generating dataset from:', label_file)
        image_num = image_num + 1
        with open(label_file) as f:
            data = json.load(f)
            if ds_type == 'labelme':
                images_list.append(images_labelme(data, image_num))
            elif ds_type == 'cityscape':
                images_list.append(images_cityscape(data, image_num, img_file))
            if ds_type == 'labelme':
                for shapes in data['shapes']:
                    object_num = object_num + 1
                    label = shapes['label']
                    if label not in labels_list:
                        categories_list.append(categories(label, labels_list))
                        labels_list.append(label)
                        label_to_num[label] = len(labels_list)
                    p_type = shapes['shape_type']
                    if p_type == 'polygon':
                        points = shapes['points']
                        annotations_list.append(
                            annotations_polygon(data['imageHeight'], data[
                                'imageWidth'], points, label, image_num,
                                                object_num, label_to_num))

                    if p_type == 'rectangle':
                        (x1, y1), (x2, y2) = shapes['points']
                        x1, x2 = sorted([x1, x2])
                        y1, y2 = sorted([y1, y2])
                        points = [[x1, y1], [x2, y2], [x1, y2], [x2, y1]]
                        annotations_list.append(
                            annotations_rectangle(points, label, image_num,
                                                  object_num, label_to_num))
            elif ds_type == 'cityscape':
                for shapes in data['objects']:
                    object_num = object_num + 1
                    label = shapes['label']
                    if label not in labels_list:
                        categories_list.append(categories(label, labels_list))
                        labels_list.append(label)
                        label_to_num[label] = len(labels_list)
                    points = shapes['polygon']
                    annotations_list.append(
                        annotations_polygon(data['imgHeight'], data[
                            'imgWidth'], points, label, image_num, object_num,
                                            label_to_num))
    data_coco['images'] = images_list
    data_coco['categories'] = categories_list
    data_coco['annotations'] = annotations_list
    return data_coco


def voc_get_label_anno(ann_dir_path, ann_ids_path, labels_path):
    with open(labels_path, 'r') as f:
        labels_str = f.read().split()
    labels_ids = list(range(1, len(labels_str) + 1))

    with open(ann_ids_path, 'r') as f:
        ann_ids = [lin.strip().split(' ')[-1] for lin in f.readlines()]

    ann_paths = []
    for aid in ann_ids:
        if aid.endswith('xml'):
            ann_path = os.path.join(ann_dir_path, aid)
        else:
            ann_path = os.path.join(ann_dir_path, aid + '.xml')
        ann_paths.append(ann_path)

    return dict(zip(labels_str, labels_ids)), ann_paths


def voc_get_image_info(annotation_root, im_id):
    filename = annotation_root.findtext('filename')
    assert filename is not None
    img_name = os.path.basename(filename)
    # print(filename)
    size = annotation_root.find('size')
    width = float(size.findtext('width'))
    height = float(size.findtext('height'))

    image_info = {
        'file_name': filename,
        'height': height,
        'width': width,
        'id': im_id
    }
    return image_info


def voc_get_coco_annotation(obj, label2id):
    label = obj.findtext('name')
    # print(label)
    assert label in label2id, "label is not in label2id."
    category_id = label2id[label]
    bndbox = obj.find('bndbox')
    xmin = float(bndbox.findtext('xmin'))
    ymin = float(bndbox.findtext('ymin'))
    xmax = float(bndbox.findtext('xmax'))
    ymax = float(bndbox.findtext('ymax'))
    assert xmax >= xmin and ymax >= ymin, "Box size error."
    # if xmax > xmin and ymax > ymin:
    o_width = xmax - xmin
    o_height = ymax - ymin
    anno = {
        'area': o_width * o_height,
        'iscrowd': 0,
        'bbox': [xmin, ymin, o_width, o_height],
        'category_id': category_id,
        'ignore': 0,
    }
    return anno


def voc_xmls_to_cocojson(annotation_paths, label2id, output_dir, output_file):
    output_json_dict = {
        "images": [],
        "type": "instances",
        "annotations": [],
        "categories": []
    }
    bnd_id = 1  # bounding box start id
    im_id = 0
    print('Start converting !')
    for a_path in tqdm(annotation_paths):
        # Read annotation xml

        ann_tree = ET.parse(a_path)
        ann_root = ann_tree.getroot()

        img_info = voc_get_image_info(ann_root, im_id)
        output_json_dict['images'].append(img_info)
        print(im_id)
        for obj in ann_root.findall('object'):
            ann = voc_get_coco_annotation(obj=obj, label2id=label2id)
            ann.update({'image_id': im_id, 'id': bnd_id})
            output_json_dict['annotations'].append(ann)
            bnd_id = bnd_id + 1
        im_id += 1

    for label, label_id in label2id.items():
        category_info = {'supercategory': 'none', 'id': label_id, 'name': label}
        output_json_dict['categories'].append(category_info)
    output_file = os.path.join(output_dir, output_file)
    with open(output_file, 'w') as f:
        output_json = json.dumps(output_json_dict)
        f.write(output_json)


def main():
    parser = argparse.ArgumentParser(
        formatter_class=argparse.ArgumentDefaultsHelpFormatter)
    parser.add_argument(
        '--dataset_type',
        help='the type of dataset, can be `voc`, `labelme` or `cityscape`')
    parser.add_argument('--json_input_dir', help='input annotated directory')
    parser.add_argument('--image_input_dir', help='image directory')
    parser.add_argument(
        '--output_dir', help='output dataset directory', default='./')
    parser.add_argument(
        '--train_proportion',
        help='the proportion of train dataset',
        type=float,
        default=1.0)
    parser.add_argument(
        '--val_proportion',
        help='the proportion of validation dataset',
        type=float,
        default=0.0)
    parser.add_argument(
        '--test_proportion',
        help='the proportion of test dataset',
        type=float,
        default=0.0)
    parser.add_argument(
        '--voc_anno_dir',
        help='In Voc format dataset, path to annotation files directory.',
        type=str,
        default=None)
    parser.add_argument(
        '--voc_anno_list',
        help='In Voc format dataset, path to annotation files ids list.',
        type=str,
        default=None)
    parser.add_argument(
        '--voc_label_list',
        help='In Voc format dataset, path to label list. The content of each line is a category.',
        type=str,
        default=None)
    parser.add_argument(
        '--voc_out_name',
        type=str,
        default='voc.json',
        help='In Voc format dataset, path to output json file')
    args = parser.parse_args()
    try:
        assert args.dataset_type in ['voc', 'labelme', 'cityscape']
    except AssertionError as e:
        print(
            'Only the voc, cityscape and labelme dataset formats are supported!')
        os._exit(0)

    if args.dataset_type == 'voc':
        assert args.voc_anno_dir and args.voc_anno_list and args.voc_label_list
        label2id, ann_paths = voc_get_label_anno(
            args.voc_anno_dir, args.voc_anno_list, args.voc_label_list)
        print(label2id)
        voc_xmls_to_cocojson(
            annotation_paths=ann_paths,
            label2id=label2id,
            output_dir=args.output_dir,
            output_file=args.voc_out_name)
    else:
        try:
            assert os.path.exists(args.json_input_dir)
        except AssertionError as e:
            print('The json folder does not exist!')
            os._exit(0)
        try:
            assert os.path.exists(args.image_input_dir)
        except AssertionError as e:
            print('The image folder does not exist!')
            os._exit(0)
        try:
            assert abs(args.train_proportion + args.val_proportion \
                    + args.test_proportion - 1.0) < 1e-5
        except AssertionError as e:
            print(
                'The sum of proportions of training, validation and test datasets must be 1!'
            )
            os._exit(0)

        # Allocate the dataset.
        total_num = len(glob.glob(osp.join(args.json_input_dir, '*.json')))
        if args.train_proportion != 0:
            train_num = int(total_num * args.train_proportion)
            out_dir = args.output_dir + '/train'
            if not os.path.exists(out_dir):
                os.makedirs(out_dir)
        else:
            train_num = 0
        if args.val_proportion == 0.0:
            val_num = 0
            test_num = total_num - train_num
            out_dir = args.output_dir + '/test'
            if args.test_proportion != 0.0 and not os.path.exists(out_dir):
                os.makedirs(out_dir)
        else:
            val_num = int(total_num * args.val_proportion)
            test_num = total_num - train_num - val_num
            val_out_dir = args.output_dir + '/val'
            if not os.path.exists(val_out_dir):
                os.makedirs(val_out_dir)
            test_out_dir = args.output_dir + '/test'
            if args.test_proportion != 0.0 and not os.path.exists(test_out_dir):
                os.makedirs(test_out_dir)
        count = 1
        for img_name in os.listdir(args.image_input_dir):
            if count <= train_num:
                if osp.exists(args.output_dir + '/train/'):
                    shutil.copyfile(
                        osp.join(args.image_input_dir, img_name),
                        osp.join(args.output_dir + '/train/', img_name))
            else:
                if count <= train_num + val_num:
                    if osp.exists(args.output_dir + '/val/'):
                        shutil.copyfile(
                            osp.join(args.image_input_dir, img_name),
                            osp.join(args.output_dir + '/val/', img_name))
                else:
                    if osp.exists(args.output_dir + '/test/'):
                        shutil.copyfile(
                            osp.join(args.image_input_dir, img_name),
                            osp.join(args.output_dir + '/test/', img_name))
            count = count + 1

        # Deal with the json files.
        if not os.path.exists(args.output_dir + '/annotations'):
            os.makedirs(args.output_dir + '/annotations')
        if args.train_proportion != 0:
            train_data_coco = deal_json(args.dataset_type,
                                        args.output_dir + '/train',
                                        args.json_input_dir)
            train_json_path = osp.join(args.output_dir + '/annotations',
                                       'instance_train.json')
            json.dump(
                train_data_coco,
                open(train_json_path, 'w'),
                indent=4,
                cls=MyEncoder)
        if args.val_proportion != 0:
            val_data_coco = deal_json(args.dataset_type,
                                      args.output_dir + '/val',
                                      args.json_input_dir)
            val_json_path = osp.join(args.output_dir + '/annotations',
                                     'instance_val.json')
            json.dump(
                val_data_coco,
                open(val_json_path, 'w'),
                indent=4,
                cls=MyEncoder)
        if args.test_proportion != 0:
            test_data_coco = deal_json(args.dataset_type,
                                       args.output_dir + '/test',
                                       args.json_input_dir)
            test_json_path = osp.join(args.output_dir + '/annotations',
                                      'instance_test.json')
            json.dump(
                test_data_coco,
                open(test_json_path, 'w'),
                indent=4,
                cls=MyEncoder)


if __name__ == '__main__':
    main()

Problems:

1. In the generated json file, the image names are not absolute paths. To output absolute paths, modify the dictionary built in voc_get_image_info():

image_info = {
    'file_name': filename,  # change this to the absolute path of the image
    'height': height,
    'width': width,
    'id': im_id
}
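
A minimal sketch of that change, reusing the imports already in x2coco.py (IMG_DIR is a hypothetical constant pointing at your image folder):

IMG_DIR = '/data/my_docker/lyy/wj_dataset/WJ_DATA/images/test/'  # hypothetical image folder

def voc_get_image_info(annotation_root, im_id):
    filename = annotation_root.findtext('filename')
    assert filename is not None
    size = annotation_root.find('size')
    width = float(size.findtext('width'))
    height = float(size.findtext('height'))

    image_info = {
        'file_name': os.path.join(IMG_DIR, os.path.basename(filename)),  # absolute path instead of the bare filename
        'height': height,
        'width': width,
        'id': im_id
    }
    return image_info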
