数据来源:https://cg.cs.tsinghua.edu.cn/traffic-sign/
原始标注文件为 JSON 格式,使用 json.load 解析后得到一个字典(dict)。
Pascal VOC 的 XML 标注格式示例如下:
<?xml version="1.0" encoding="utf-8"?>
<annotation>
<folder>VOC2007</folder>
<filename>36319.jpg</filename>
<path>/Users/chenhonghu/Downloads/data/image/36319.jpg</path>
<source>
<database>Unknown</database>
</source>
<size>
<width>2048</width>
<height>2048</height>
<depth>3</depth>
</size>
<segmented>0</segmented>
<object>
<name>pne</name>
<pose>Unspecified</pose>
<truncated>1</truncated>
<difficult>0</difficult>
<bndbox>
<xmin>1140.0</xmin>
<ymin>906.0</ymin>
<xmax>1164.0</xmax>
<ymax>930.0</ymax>
</bndbox>
</object>
<object>
<name>i4</name>
<pose>Unspecified</pose>
<truncated>1</truncated>
<difficult>0</difficult>
<bndbox>
<xmin>1273.0</xmin>
<ymin>912.0</ymin>
<xmax>1296.0</xmax>
<ymax>934.0</ymax>
</bndbox>
</object>
<object>
<name>pl70</name>
<pose>Unspecified</pose>
<truncated>1</truncated>
<difficult>0</difficult>
<bndbox>
<xmin>1440.0</xmin>
<ymin>929.0</ymin>
<xmax>1457.0</xmax>
<ymax>949.0</ymax>
</bndbox>