【数据预处理】CoCo数据集标注文件.json转yolov5标注文件.txt格式

最新推荐文章于 2023-12-06 09:52:38 发布

Huang3stone

最新推荐文章于 2023-12-06 09:52:38 发布

阅读量3.6k

点赞数 1

分类专栏： yolov5 文章标签： python 人工智能深度学习

本文链接：https://blog.csdn.net/lafsca5/article/details/123925910

版权

yolov5 专栏收录该内容

9 篇文章 2 订阅

订阅专栏

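先安装 pycocotools 包（用于解析 COCO 格式的 .json 标注文件），例如：pip install pycocotools。
然后把下面脚本中的 annotation_path（标注文件路径）和 save_base_path（txt 输出目录）改成自己的路径，直接运行即可。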

import argparse
import os

import numpy as np
import tqdm
from pycocotools.coco import COCO


def arg_parser(argv=None):
    """Parse the converter's command-line options.

    Args:
        argv: Optional list of argument strings to parse. When ``None``
            (the default) the process command line is parsed.

    Returns:
        argparse.Namespace with two string attributes:
        ``annotation_path`` (the COCO ``.json`` annotation file to read) and
        ``save_base_path`` (the directory that receives the ``.txt`` files).
    """
    parser = argparse.ArgumentParser('code by rbj')
    parser.add_argument('--annotation_path', type=str,
                        default='D:/project/project-use/yolov5-6.0/utils/annotations_5_custom_classes.json')
    # Directory where the generated .txt files are saved.
    parser.add_argument('--save_base_path', type=str, default='D:/project/project-use/yolov5-6.0/utils/labels/')
    # The script previously called parse_args(args=[]) because plain
    # parse_args() raised an error in the author's environment (presumably a
    # notebook/IDE that injects extra arguments -- TODO confirm). That
    # workaround silently discarded every flag the user passed.
    # parse_known_args() honours real flags and ignores unrecognised ones.
    args, _unknown = parser.parse_known_args(argv)
    return args


def coco_bbox_to_yolo(bbox, img_width, img_height):
    """Convert one COCO box to a normalised centre-format box.

    Args:
        bbox: Sequence whose first four items are
            ``top_x, top_y, width, height`` in pixels.
        img_width: Image width in pixels, used to normalise x and width.
        img_height: Image height in pixels, used to normalise y and height.

    Returns:
        A tuple ``(cen_x, cen_y, width, height)`` with every value divided by
        the image size and rounded to 6 decimals, or ``None`` when the box is
        narrower or shorter than one pixel. ``bbox`` itself is not modified.
    """
    top_x, top_y, box_w, box_h = bbox[:4]
    # Some annotations have basically no width / height; skip them.
    if box_w < 1 or box_h < 1:
        return None
    return (
        round((top_x + box_w / 2) / img_width, 6),
        round((top_y + box_h / 2) / img_height, 6),
        round(box_w / img_width, 6),
        round(box_h / img_height, 6),
    )


def label_file_stem(image_file_name):
    """Return ``image_file_name`` without its final extension.

    Only the last suffix is removed, so ``'img.v2.jpg'`` becomes ``'img.v2'``.
    """
    return os.path.splitext(image_file_name)[0]


if __name__ == '__main__':
    # Script entry point: write one label .txt file per image listed in the
    # COCO annotation file, one "<class> <cen_x> <cen_y> <w> <h>" line per box.
    args = arg_parser()
    annotation_path = args.annotation_path
    save_base_path = args.save_base_path

    data_source = COCO(annotation_file=annotation_path)
    categories = data_source.loadCats(data_source.getCatIds())
    categories.sort(key=lambda x: x['id'])

    # Map each COCO category id to a 0-based class index, assigned in
    # ascending category-id order.
    classes = {}
    coco_labels_inverse = {}
    for c in categories:
        coco_labels_inverse[c['id']] = len(classes)
        classes[c['name']] = len(classes)

    img_ids = data_source.getImgIds()
    count = 0
    # Iterating the list directly (not enumerate) lets tqdm know the total.
    for img_id in tqdm.tqdm(img_ids, desc='change .json file to .txt file'):
        img_info = data_source.loadImgs(img_id)[0]
        height = img_info['height']
        width = img_info['width']

        save_path = os.path.join(
            save_base_path, label_file_stem(img_info['file_name']) + '.txt')
        # Create the output directory (and any sub-directory carried by
        # file_name) so open() below does not fail on a fresh run.
        parent_dir = os.path.dirname(save_path)
        if parent_dir:
            os.makedirs(parent_dir, exist_ok=True)

        annotation_ids = data_source.getAnnIds(img_id)
        lines = []
        for annotation in data_source.loadAnns(annotation_ids):
            yolo_box = coco_bbox_to_yolo(annotation['bbox'], width, height)
            if yolo_box is None:
                continue
            label = coco_labels_inverse[annotation['category_id']]
            lines.append(' '.join(str(v) for v in (label, *yolo_box)) + '\n')

        # An image without usable boxes still gets an (empty) label file.
        with open(save_path, mode='w') as fp:
            fp.writelines(lines)

        # As before, only images that have annotation ids are counted.
        if annotation_ids:
            count += 1
            print(f'succeed {count}')
    print('finish')

Huang3stone

关注

1
点赞
踩
6

收藏

觉得还不错? 一键收藏
2
评论
【数据预处理】CoCo数据集标注文件.json转yolov5标注文件.txt格式

下载pycocotools包（用于解析coco.json文件），直接运行即可。代码开头：from pycocotools.coco import COCO；import numpy as np；import tqdm；import argparse；def arg_parser(): parser = argparse.ArgumentParser('code by rbj')；parser.add_argument('--annotation_path', type=str, …
复制链接

扫一扫