v-coco数据集转换

妖怪书生

于 2024-07-14 17:48:29 发布

阅读量71

点赞数 2

分类专栏：机器学习和深度学习实验运行文章标签： python 开发语言

本文链接：https://blog.csdn.net/weixin_45177424/article/details/140419878

版权

机器学习和深度学习同时被 2 个专栏收录

16 篇文章 0 订阅

订阅专栏

实验运行

3 篇文章 0 订阅

订阅专栏

文章目录

- 整体架构流程
- 技术细节

整体架构流程

对于我们的实现，注释文件必须转换为 HOIA 格式。转换可以按如下方式进行。

PYTHONPATH=data/v-coco
python convert_vcoco_annotations.py
–load_path data/v-coco/data
–prior_path data/v-coco/prior.pickle
–save_path data/v-coco/annotations
请注意，只有 Python2 可用于此转换，因为在 v-coco 存储库中显示 Python3 错误。vsrl_utils.py

具有 HOIA 格式的 V-COCO 注解，，和将生成到目录中。corre_vcoco.npytest_vcoco.jsontrainval_vcoco.jsonannotations

技术细节

1.打开convert_vcoco_annotations.py，发现import vsrl_utils as vu，错误
原因：vsul只支持python2，不支持python3
解决：不需要下载python2,后续安装环境可麻烦了，你只需要在python3上改
没有这个vsul,直接在coco上面搜到vsrl_utils.py

# AUTORIGHTS
# ---------------------------------------------------------
# Copyright (c) 2016, Saurabh Gupta
#
# This file is part of the VCOCO dataset hooks and is available
# under the terms of the Simplified BSD License provided in
# LICENSE. Please retain this notice and LICENSE if you use
# this file (or any portion of it) in your project.
# ---------------------------------------------------------

# vsrl_data is a dictionary for each action class:
# image_id       - Nx1
# ann_id         - Nx1
# label          - Nx1
# action_name    - string
# role_name      - ['agent', 'obj', 'instr']
# role_object_id - N x K matrix, obviously [:,0] is same as ann_id

import numpy as np
from pycocotools.coco import COCO
import os, json

coco = []


def get_data_dir():
    this_dir = os.path.dirname(__file__)
    dir_name = os.path.join(this_dir, 'data')
    return dir_name


def load_coco(dir_name=None):
    global coco
    if dir_name is None:
        dir_name = get_data_dir()
    if coco == []:
        coco = COCO(os.path.join(dir_name, 'instances_vcoco_all_2014.json'))
    return coco


def load_vcoco(imset, dir_name=None):
    if dir_name is None:
        dir_name = get_data_dir()
    with open(os.path.join(dir_name, 'v-coco/data', imset + '.json'), 'rt') as f:
        vsrl_data = json.load(f)
    # vsrl_data = unicode_to_str(vsrl_data)
    for i in range(len(vsrl_data)):
        vsrl_data[i]['role_object_id'] = \
            np.array(vsrl_data[i]['role_object_id']).reshape((len(vsrl_data[i]['role_name']), -1)).T
        for j in ['ann_id', 'label', 'image_id']:
            vsrl_data[i][j] = np.array(vsrl_data[i][j]).reshape((-1, 1))
    return vsrl_data


def coco_ann_id_to_image_id(ann_id, coco):
    ann = coco.loadAnns(ann_id);
    ann_id_r = [a['id'] for a in ann]
    image_id_r = [a['image_id'] for a in ann]
    assert ann_id_r == ann_id, \
        'oops coco returned different ann_id''s in different order'
    return image_id_r


# Attach relevant boxes
def all_relevant_objects(vsrl_data_all, coco):
    vsrl_relevant_objects = []
    for i in xrange(len(vsrl_data_all)):
        v_i = vsrl_data_all[i]
        bbox = [];
        image_id = [];
        num_roles = len(v_i['role_name'])
        for j in range(num_roles):
            # print v_i['action_name'], v_i['include'][j];
            bbox_j = np.NaN * np.ones((0, 4 * num_roles));
            image_id_j = np.NaN * np.ones((0, 1))
            if v_i['include'][j] != []:
                cat_ids = coco.getCatIds(catNms=v_i['include'][j])
                ann_list = coco.getAnnIds(imgIds=np.unique(v_i['image_id'] * 1).tolist(),
                                          iscrowd=False, catIds=cat_ids)
                anns = coco.loadAnns(ann_list)
                bbox_j = np.NaN * np.zeros((len(anns), 4 * num_roles))
                bbox_j[:, 4 * j:4 * j + 4] = xyhw_to_xyxy(
                    np.vstack([np.array(a['bbox']).reshape((1, 4)) for a in anns]))
                image_id_j = np.array(coco_ann_id_to_image_id(ann_list, coco)).reshape(-1, 1)
            bbox.append(bbox_j)
            image_id.append(image_id_j)
        image_id = np.concatenate(image_id, axis=0)
        bbox = np.concatenate(bbox, axis=0)
        vsrl_relevant_objects.append({'image_id': image_id, 'bbox': bbox})
    return vsrl_relevant_objects


def attach_unlabelled(vsrl_data, coco):
    """
    def vsrl_data = attach_unlabelled(vsrl_data, coco)
    """
    anns = coco.loadAnns(
        coco.getAnnIds(imgIds=np.unique(vsrl_data['image_id']).tolist(),
                       iscrowd=False, catIds=1));
    ann_id = [a['id'] for a in anns]
    hard_ann_id = list(set(ann_id) - set(vsrl_data['ann_id'].ravel().tolist()))
    hard_image_id = coco_ann_id_to_image_id(hard_ann_id, coco);

    vsrl_data['image_id'] = np.vstack((vsrl_data['image_id'],
                                       np.array(hard_image_id).reshape((-1, 1))))
    vsrl_data['ann_id'] = np.vstack((vsrl_data['ann_id'],
                                     np.array(hard_ann_id).reshape((-1, 1))))
    vsrl_data['role_object_id'] = np.vstack((vsrl_data['role_object_id'],
                                             np.zeros((len(hard_image_id), vsrl_data['role_object_id'].shape[1]))))
    vsrl_data['role_object_id'][vsrl_data['label'].shape[0]:, 0] = np.array(hard_ann_id).reshape((-1))
    vsrl_data['label'] = np.vstack((vsrl_data['label'],
                                    -1 * np.ones((len(hard_image_id), vsrl_data['label'].shape[1]))))
    return vsrl_data


def remove_negative(vsrl_data):
    """
    def vsrl_data = remove_negative(vsrl_data)
    Remove things that are labelled as a negative
    """
    to_keep = vsrl_data['label'] != 0
    for i in vsrl_data.keys():
        if type(vsrl_data[i]) == np.ndarray:
            vsrl_data[i] = vsrl_data[i][to_keep, :]
    return vsrl_data


def xyhw_to_xyxy(bbox):
    out = bbox.copy()
    out[:, [2, 3]] = bbox[:, [0, 1]] + bbox[:, [2, 3]];
    return out


def attach_gt_boxes(vsrl_data, coco):
    """
    def vsrl_data = attach_gt_boxes(vsrl_data, coco)
    """
    anns = coco.loadAnns(vsrl_data['ann_id'].ravel().tolist());
    bbox = np.vstack([np.array(a['bbox']).reshape((1, 4)) for a in anns])

    vsrl_data['bbox'] = xyhw_to_xyxy(bbox)
    vsrl_data['role_bbox'] = \
        np.nan * np.zeros((vsrl_data['role_object_id'].shape[0], \
                           4 * vsrl_data['role_object_id'].shape[1]), dtype=np.float)

    # Get boxes for the role objects
    for i in range(vsrl_data['role_object_id'].shape[1]):
        has_role = np.where(vsrl_data['role_object_id'][:, i] > 0)[0]
        if has_role.size > 0:
            anns = coco.loadAnns(vsrl_data['role_object_id'][has_role, i].ravel().tolist());
            bbox = np.vstack([np.array(a['bbox']).reshape((1, 4)) for a in anns])
            bbox = xyhw_to_xyxy(bbox)
            vsrl_data['role_bbox'][has_role, 4 * i:4 * (i + 1)] = bbox;
    return vsrl_data


# def unicode_to_str(input):
#     if isinstance(input, dict):
#         return {unicode_to_str(key): unicode_to_str(value) for key, value in input.items()}
#     elif isinstance(input, list):
#         return [unicode_to_str(element) for element in input]
#     elif isinstance(input, unicode):
#         return input.encode('utf-8')
#     else:
#         return input

def unicode_to_str(input):
    if isinstance(input, dict):
        return {unicode_to_str(key): unicode_to_str(value) for key, value in input.items()}
    elif isinstance(input, list):
        return [unicode_to_str(element) for element in input]
    elif isinstance(input, str):
        return input.encode('utf-8')
    else:
        return input

这个

这个已经是修改过后的
需要修改：
1. AttributeError: 'dict' object has no attribute 'iteritems'
问题出现在 vsrl_utils.py 文件的 unicode_to_str 函数中。错误提示是 AttributeError: ‘dict’ object has no attribute ‘iteritems’，这表明在 Python 3 中，字典对象不再有 iteritems() 方法，而是使用 items() 方法。
在 Python 2 中，dict.iteritems() 用于返回字典中的键和值的迭代器。但在 Python 3 中，这个方法被重命名为 items()。因此，你需要将 iteritems() 替换为 items() 来修复这个错误、

找到以下代码行：

python

for key, value in input.iteritems()

将其替换为：

for key, value in input.items()

2. elif isinstance(input, unicode): 这行unicode爆红线'
在 Python 3 中，unicode 类型已经不存在，所有的字符串默认都是 Unicode 字符串，即 str 类型。因此，如果你在 Python 3 环境中看到 unicode 这个词，它应该被替换为 str

elif isinstance(input, str):

妖怪书生

关注

2
点赞
踩
3

收藏

觉得还不错? 一键收藏
0
评论
v-coco数据集转换

错误提示是 AttributeError: ‘dict’ object has no attribute ‘iteritems’，这表明在 Python 3 中，字典对象不再有 iteritems() 方法，而是使用 items() 方法。在 Python 3 中，unicode 类型已经不存在，所有的字符串默认都是 Unicode 字符串，即 str 类型。1.打开convert_vcoco_annotations.py，发现import vsrl_utils as vu，错误。这个已经是修改过后的。
复制链接

扫一扫