json文件的批量转化（亲测有效）

最新推荐文章于 2023-05-31 16:20:59 发布

爱学习滴好青年

最新推荐文章于 2023-05-31 16:20:59 发布

阅读量3k

点赞数

分类专栏： python编程问题（亲测有效）文章标签：神经网络机器学习 tensorflow pytorch

本文链接：https://blog.csdn.net/qq_40287633/article/details/112201448

版权

python编程问题（亲测有效）专栏收录该内容

10 篇文章 0 订阅

订阅专栏

在进行图像分割时，我们需要自备数据集，一般选择labelme进行图像的标注，在标注过后我们会得到很多的json文件。一般我们可以使用labelme自带的脚本文件将其转化为图像格式，即：

激活labelme的环境
运行labelme_json_to_dataset <文件名>.json，例如：labelme_json_to_dataset test.json

但是这种方式每次只能转换一个json文件，而实际中我们一般需要大量的数据集，所以这时我们采用以下方法进行json文件的批量转化。注意：请在用labelme将所有图片标注完后，再进行以下操作。

找到json_to_dataset.py文件，位置位于D:\install\anaconda3\envs\labelme\Lib\site-packages\labelme\cli，其中前面的D:\install\anaconda3部分以读者自己的安装路径为准。
将json_to_dataset.py全选删除后替换为：

import argparse
import json
import os
import os.path as osp
import warnings
import copy

import numpy as np
import PIL.Image
from skimage import io
import yaml

from labelme import utils

# Label name -> integer class id written into the ground-truth mask.
# Replace the names below with the label names used in your own dataset.
# main() stores the mask as int8, so keep the ids below 128.
NAME_LABEL_MAP = {
    '_background_': 0,
    "name_1": 1,
    "name_2": 2,
    "name_3": 3,
}

# Class id -> label name. Derived from NAME_LABEL_MAP so the two tables can
# never drift apart; nothing needs to be edited here.
LABEL_NAME_MAP = {value: name for name, value in NAME_LABEL_MAP.items()}


def main():
    """Batch-convert every labelme ``.json`` annotation found in a directory.

    Command line:
        json_file   directory that holds the labelme ``.json`` files
        -o, --out   optional directory under which the per-file output
                    folders are created (default: current working directory)

    For each ``<name>.json`` a folder ``<name>_json`` is created containing
    ``<name>.png`` (the image), ``<name>_gt.png`` (the label mask renumbered
    through NAME_LABEL_MAP), ``<name>_viz.png`` (a visualisation),
    ``label_names.txt`` and ``info.yaml``.

    Raises:
        KeyError: if an annotation uses a label name that is missing from
            NAME_LABEL_MAP.
    """
    import base64  # function scope: only the imageData fallback needs it

    parser = argparse.ArgumentParser()
    parser.add_argument('json_file')
    parser.add_argument('-o', '--out', default=None)
    args = parser.parse_args()

    json_dir = args.json_file
    # Without -o the output folders are created relative to the current
    # working directory, exactly as before.
    out_root = args.out if args.out is not None else ''

    # draw_label() selects colours and legend entries by list position, so
    # the caption list has to be indexed by the global label value rather
    # than by the order in which labels happen to appear in one file.
    captions = [str(value) for value in range(max(NAME_LABEL_MAP.values()) + 1)]
    for name, value in NAME_LABEL_MAP.items():
        captions[value] = '%d: %s' % (value, name)

    for entry in sorted(os.listdir(json_dir)):
        path = os.path.join(json_dir, entry)
        filename, ext = osp.splitext(entry)
        # Skip sub-directories and anything that is not a .json annotation.
        if ext.lower() != '.json' or not os.path.isfile(path):
            continue

        with open(path) as f:
            data = json.load(f)

        image_data = data.get('imageData')
        if not image_data:
            # The annotation carries no embedded image; load the file that
            # 'imagePath' points to (resolved relative to the JSON folder).
            image_path = os.path.join(json_dir, data['imagePath'])
            with open(image_path, 'rb') as f:
                image_data = base64.b64encode(f.read()).decode('utf-8')
        img = utils.image.img_b64_to_arr(image_data)
        lbl, lbl_names = utils.shape.labelme_shapes_to_label(img.shape, data['shapes'])

        unknown = [name for name in lbl_names if name not in NAME_LABEL_MAP]
        if unknown:
            raise KeyError(
                '%s: label(s) %s are missing from NAME_LABEL_MAP' % (entry, unknown)
            )

        # Renumber the per-file label values to the global ids. The masks are
        # computed on the untouched `lbl` so a value that was already
        # rewritten can never be remapped a second time.
        lbl_tmp = copy.copy(lbl)
        for key_name, old_lbl_val in lbl_names.items():
            lbl_tmp[lbl == old_lbl_val] = NAME_LABEL_MAP[key_name]
        lbl = np.array(lbl_tmp, dtype=np.int8)
        lbl_names = {key_name: NAME_LABEL_MAP[key_name] for key_name in lbl_names}

        lbl_viz = utils.draw.draw_label(lbl, img, captions)

        out_dir = osp.join(out_root, entry.replace('.', '_'))
        if not osp.isdir(out_dir):
            os.makedirs(out_dir)

        PIL.Image.fromarray(img).save(osp.join(out_dir, '{}.png'.format(filename)))
        PIL.Image.fromarray(lbl).save(osp.join(out_dir, '{}_gt.png'.format(filename)))
        PIL.Image.fromarray(lbl_viz).save(osp.join(out_dir, '{}_viz.png'.format(filename)))

        with open(osp.join(out_dir, 'label_names.txt'), 'w') as f:
            for lbl_name in lbl_names:
                f.write(lbl_name + '\n')

        warnings.warn('info.yaml is being replaced by label_names.txt')
        info = dict(label_names=lbl_names)
        with open(osp.join(out_dir, 'info.yaml'), 'w') as f:
            yaml.safe_dump(info, f, default_flow_style=False)

        print('Saved to: %s' % out_dir)


if __name__ == '__main__':
    main()

请注意里面需要根据自身情况更改的两个部分，代码中已给出相关注释。

激活labelme的环境，进入到文件保存路径，这个路径将保存转换后的文件
输入命令：labelme_json_to_dataset E:\data\json，请把所有的json文件存入E:\data\json这个文件夹中。

在输入上述命令后可能会提示缺少库，请安装相关库。安装相关库后运行，可能会出现以下错误提示：AttributeError: module 'labelme.utils' has no attribute 'draw'，解决方式：

更改labelme的版本：

pip install labelme==3.16.7

查找路径D:\install\anaconda3\envs\labelme\Lib\site-packages\labelme\utils中有无draw.py，若无请在此文件夹下新建draw.py文件，内容如下：

import io
import os.path as osp
 
import numpy as np
import PIL.Image
import PIL.ImageDraw
import PIL.ImageFont
 
 
def label_colormap(N=256):
    """Return an ``(N, 3)`` float32 table of RGB colours scaled to [0, 1].

    For row ``i`` the bits of ``i`` are consumed three at a time (one bit
    each for red, green and blue) and written into the channels from the
    most significant bit downwards.
    """

    def _bit(value, position):
        # 1 when bit `position` of `value` is set, otherwise 0.
        return (value >> position) & 1

    table = np.zeros((N, 3))
    for index in range(N):
        remaining = index
        red = green = blue = 0
        for shift in range(7, -1, -1):
            red |= _bit(remaining, 0) << shift
            green |= _bit(remaining, 1) << shift
            blue |= _bit(remaining, 2) << shift
            remaining >>= 3
        table[index] = (red, green, blue)
    return table.astype(np.float32) / 255
 
 
def _validate_colormap(colormap, n_labels):
    """Return a usable colormap, generating one when none is supplied.

    colormap: array with ``.shape``/``.min()``/``.max()``, or None
        When None, ``label_colormap(n_labels)`` is returned instead.
    n_labels: int
        Number of rows requested when the colormap has to be generated.

    A supplied colormap must be two-dimensional with three columns and have
    all values inside [0, 1]; otherwise an AssertionError is raised.
    """
    if colormap is None:
        return label_colormap(n_labels)

    n_rows = colormap.shape[0]
    assert colormap.shape == (n_rows, 3), \
        'colormap must be sequence of RGB values'
    assert 0 <= colormap.min() and colormap.max() <= 1, \
        'colormap must ranges 0 to 1'
    return colormap
 
 
# similar function as skimage.color.label2rgb
def label2rgb(
    lbl, img=None, n_labels=None, alpha=0.5, thresh_suppress=0, colormap=None,
):
    """Colourise a label array, optionally blending it over an image.

    lbl: integer ndarray
        Label values; they are used directly as row indices into the
        colormap, and pixels equal to -1 are painted black.
    img: ndarray, optional
        When given, it is converted to greyscale and blended with the
        coloured labels.
    n_labels: int, optional
        Colormap size; defaults to the number of distinct values in `lbl`.
    alpha: float
        Weight of the label colours in the blend (the image gets 1 - alpha).
    thresh_suppress:
        Accepted but not used by this function.
    colormap: ndarray, optional
        Table of RGB rows in [0, 1]; generated when omitted.

    Returns a uint8 array holding one RGB triple per label pixel.
    """
    if n_labels is None:
        n_labels = len(np.unique(lbl))

    palette = _validate_colormap(colormap, n_labels)
    palette = (palette * 255).astype(np.uint8)

    colored = palette[lbl]
    colored[lbl == -1] = (0, 0, 0)  # unlabeled

    if img is None:
        return colored

    # Round-trip through 'LA' to obtain a grey version of the image that
    # still has three channels for the blend below.
    gray = PIL.Image.fromarray(img).convert('LA').convert('RGB')
    gray = np.asarray(gray)
    blended = alpha * colored + (1 - alpha) * gray
    return blended.astype(np.uint8)
 
 
def draw_label(label, img=None, label_names=None, colormap=None, **kwargs):
    """Draw pixel-wise label with colorization and label names.

    label: ndarray, (H, W)
        Pixel-wise labels to colorize.
    img: ndarray, (H, W, 3), optional
        Image on which the colorized label will be drawn.
    label_names: iterable
        List of label names; position ``i`` names label value ``i``.
        Defaults to the stringified values ``0 .. label.max()``.
    colormap: ndarray, optional
        RGB rows in [0, 1]; generated from the number of label names
        when omitted.
    **kwargs:
        Forwarded to ``label2rgb``.

    Returns an RGB uint8 ndarray with the same height and width as the
    colourised label, including a legend for the label values present.
    """
    import matplotlib.pyplot as plt

    backend_org = plt.rcParams['backend']
    plt.switch_backend('agg')

    # Everything that touches pyplot's global state runs inside try/finally
    # so the figure is closed and the caller's backend restored even when
    # rendering fails part-way through.
    try:
        plt.subplots_adjust(left=0, right=1, top=1, bottom=0,
                            wspace=0, hspace=0)
        plt.margins(0, 0)
        plt.gca().xaxis.set_major_locator(plt.NullLocator())
        plt.gca().yaxis.set_major_locator(plt.NullLocator())

        if label_names is None:
            label_names = [str(l) for l in range(label.max() + 1)]

        colormap = _validate_colormap(colormap, len(label_names))

        label_viz = label2rgb(
            label, img, n_labels=len(label_names), colormap=colormap, **kwargs
        )
        plt.imshow(label_viz)
        plt.axis('off')

        # Legend: one coloured patch per label value that actually occurs.
        plt_handlers = []
        plt_titles = []
        for label_value, label_name in enumerate(label_names):
            if label_value not in label:
                continue
            fc = colormap[label_value]
            p = plt.Rectangle((0, 0), 1, 1, fc=fc)
            plt_handlers.append(p)
            plt_titles.append('{value}: {name}'
                              .format(value=label_value, name=label_name))
        plt.legend(plt_handlers, plt_titles, loc='lower right', framealpha=.5)

        # Render into memory instead of a temporary file.
        f = io.BytesIO()
        plt.savefig(f, bbox_inches='tight', pad_inches=0)
    finally:
        plt.cla()
        plt.close()
        plt.switch_backend(backend_org)

    # The saved figure generally differs in size from the input, so scale it
    # back to the label's width and height.
    out_size = (label_viz.shape[1], label_viz.shape[0])
    out = PIL.Image.open(f).resize(out_size, PIL.Image.BILINEAR).convert('RGB')
    out = np.asarray(out)
    return out
 
 
def draw_instances(
    image=None,
    bboxes=None,
    labels=None,
    masks=None,
    captions=None,
):
    """Draw labelled bounding boxes with captions onto a copy of an image.

    image: ndarray
        Image to draw on (required).
    bboxes: iterable of (xmin, ymin, xmax, ymax)
        One box per instance (required).
    labels: iterable of int
        Label value per instance; selects the outline colour (required).
    masks:
        Must be None; the function asserts this.
    captions: iterable of str
        Text drawn at the top-left corner of each box (required).

    Returns the annotated image as an ndarray.
    """
    import matplotlib

    # TODO(wkentaro)
    assert image is not None
    assert bboxes is not None
    assert labels is not None
    assert masks is None
    assert captions is not None

    canvas = PIL.Image.fromarray(image)
    pen = PIL.ImageDraw.ImageDraw(canvas)

    # Use the DejaVu Sans font that sits inside the matplotlib package.
    ttf_path = osp.join(
        osp.dirname(matplotlib.__file__),
        'mpl-data/fonts/ttf/DejaVuSans.ttf'
    )
    font = PIL.ImageFont.truetype(ttf_path)

    palette = label_colormap(255)
    for box, label_id, text in zip(bboxes, labels, captions):
        # Colormap rows are floats in [0, 1]; PIL wants integer channels.
        rgb = tuple((palette[label_id] * 255).astype(np.uint8).tolist())

        left, top, right, bottom = box
        pen.rectangle((left, top, right, bottom), outline=rgb)
        pen.text((left, top), text, font=font)

    return np.asarray(canvas)

在该文件夹下找到__init__.py，添加：

from .draw import label_colormap
from .draw import _validate_colormap
from .draw import label2rgb
from .draw import draw_label
from .draw import draw_instances

至此，即可成功运行。

爱学习滴好青年

关注

0
点赞
踩
7

收藏

觉得还不错? 一键收藏
2
评论
json文件的批量转化（亲测有效）

在进行图像分割时，我们需要自备数据集，一般选择labelme进行图像的标注，在标注过后我们会得到很多的json文件。一般我们可以使用labelme自带的脚本文件将其转化为图像格式，即：激活labelme的环境运行labelme_json_to_dataset <文件名>.json，例如：labelme_json_to_dataset test.json但是这里仅仅对于一个json文件进行。一般的需要大量的数据集，所以这时我们采用以下方法进行json文件的批量转化。注意：请在用label
复制链接

扫一扫