实现将json文件批量转化成同名xml文件。
json文件名为“1.josn”,json文件内容如下:
{
"lables": [
{
"grid_corners": [
89.07,
310.22,
23.33,
16.23
],
"types": "car",
"scores": 0.89
},
{
"grid_corners": [
227.33,
493.16,
15.33,
21.59
],
"types": "car",
"scores": 0.25
},
{
"grid_corners": [
242.82,
488.91,
18.96,
14.02
],
"types": "car",
"scores": 0.22
},
{
"grid_corners": [
556.86,
289.67,
15.54,
20.44
],
"types": "bus",
"scores": 0.45
}
],
"img_name": "1"
}
生成同名xml文件“1.xml”,xml文件内容如下:
<annotation>
<folder>WH_data</folder>
<filename>1.jpg</filename>
<path>1.jpg</path>
<source>
<database>WH Data</database>
</source>
<size>
<width>1936</width>
<height>1216</height>
<depth>3</depth>
</size>
<segmented>0</segmented>
<object>
<name>car</name>
<pose>Unspecified</pose>
<truncated>1</truncated>
<difficult>0</difficult>
<bndbox>
<xmin>234</xmin>
<ymin>553</ymin>
<xmax>304</xmax>
<ymax>602</ymax>
</bndbox>
</object>
<object>
<name>car</name>
<pose>Unspecified</pose>
<truncated>1</truncated>
<difficult>0</difficult>
<bndbox>
<xmin>664</xmin>
<ymin>1099</ymin>
<xmax>710</xmax>
<ymax>1164</ymax>
</bndbox>
</object>
<object>
<name>car</name>
<pose>Unspecified</pose>
<truncated>1</truncated>
<difficult>0</difficult>
<bndbox>
<xmin>705</xmin>
<ymin>1097</ymin>
<xmax>763</xmax>
<ymax>1140</ymax>
</bndbox>
</object>
<object>
<name>bus</name>
<pose>Unspecified</pose>
<truncated>1</truncated>
<difficult>0</difficult>
<bndbox>
<xmin>1660</xmin>
<ymin>485</ymin>
<xmax>1708</xmax>
<ymax>547</ymax>
</bndbox>
</object>
</annotation>
代码如下:
# -*- coding: utf-8 -*-
import os
from typing import List, Any
import numpy as np
import codecs
import json
from glob import glob
import cv2
import shutil
#文件路径不能有中文
# json文件路径 joson文件名称要与jpg文件名称一致
labelme_path = "C:/json/"
# json文件对应图片路径
img_path = "C:/jpg/"
# 根据json文件生成的xml文件存放路径
saved_path = "C:/xml/"
files1 = os.listdir(labelme_path)
files = [i.split("/")[-1].split(".json")[0] for i in files1]
for json_file_ in files:
json_filename = labelme_path + json_file_ + ".json"
#解决了json文件中的数量太多导致的报错
file = open(json_filename, 'r', encoding='utf-8')
papers = []
for line in file.readlines():
dic = json.loads(line)
papers.append(dic)
#获取图片的高、宽、深度。
height, width, channels = cv2.imread(img_path + json_file_ + ".jpg").shape
with codecs.open(saved_path + json_file_ + ".xml", "w", "utf-8") as xml:
print(papers)
xml.write('<annotation>\n')
xml.write('\t<folder>' + 'WH_data' + '</folder>\n')
xml.write('\t<filename>' + json_file_ + ".jpg" + '</filename>\n')
xml.write('\t<path>' + json_file_ + ".jpg" + '</path>\n')
xml.write('\t<source>\n')
xml.write('\t\t<database>WH Data</database>\n')
xml.write('\t</source>\n')
xml.write('\t<size>\n')
xml.write('\t\t<width>' + str(width) + '</width>\n')
xml.write('\t\t<height>' + str(height) + '</height>\n')
xml.write('\t\t<depth>' + str(channels) + '</depth>\n')
xml.write('\t</size>\n')
xml.write('\t<segmented>0</segmented>\n')
for multi in papers[0]["lables"]:
print(papers)
points = np.array(multi["grid_corners"])
labelName = multi["types"]
# 以下是json中的grid_corners中的四个数据按照我的逻辑转成xml中两个坐标数。只能做参考,你们可以改成你们的逻辑。
#"grid_corners":[439.63,365.73,20.43,19.92],我的grid_corners地四个值表示[xmin,ymin,宽,高],是有比例缩放的。
r_w = 640 / width
r_h = 640 / height
if ( r_h > r_w):
l = points[0] - points[2] / 2
r = points[0] + points[2] / 2
t = points[1] - points[3] / 2 - (640 - r_w * height) / 2
b = points[1] + points[3] / 2 - (640 - r_w * height) / 2
xmin = abs(l / r_w)
ymin = abs(t / r_w)
xmax = abs(r / r_w)
ymax = abs(b / r_w)
else:
l=points[0] - points[2] / 2 - ( 640 - r_h * width )/2
r=points[0] + points[2] / 2 - ( 640 - r_h * width )/2
t= points[1] - points[3] / 2
b= points[1] + points[3] / 2
xmin = abs(l / r_w)
ymin = abs(t / r_w)
xmax = abs(r / r_w)
ymax = abs(b / r_w)
#标框超过图片宽度或高度做处理
if(xmax>width):
xmax=width
if(ymax>height):
ymax=height
#print(labelName, xmin, xmax, ymin, ymax)
label = multi["types"]
xml.write('\t<object>\n')
xml.write('\t\t<name>' + labelName + '</name>\n')
xml.write('\t\t<pose>Unspecified</pose>\n')
xml.write('\t\t<truncated>1</truncated>\n')
xml.write('\t\t<difficult>0</difficult>\n')
xml.write('\t\t<bndbox>\n')
xml.write('\t\t\t<xmin>' + str(int(xmin)) + '</xmin>\n')
xml.write('\t\t\t<ymin>' + str(int(ymin)) + '</ymin>\n')
xml.write('\t\t\t<xmax>' + str(int(xmax)) + '</xmax>\n')
xml.write('\t\t\t<ymax>' + str(int(ymax)) + '</ymax>\n')
xml.write('\t\t</bndbox>\n')
xml.write('\t</object>\n')
xml.write('</annotation>')
代码运行需要三个路径:json文件路径,同名图片路径,需要保存的xml文件路径。