# Random image cropping
# -*- coding: utf-8 -*-
import os
import tensorlayer as tl
import xml.etree.cElementTree as ET
from lxml.etree import Element, SubElement, tostring
from xml.dom.minidom import parseString
from PIL import Image
# Convert the annotation data into ann_list format: ann_list = [class, position info (a list)]
def trans_img(img,img_xml,classes_dict):
ann_list=[]
class_list=[]
tree = ET.parse(img_xml)
root = tree.getroot()
#找到图像的w,h
size = root.find('size')
xml_width = int(size.find('width').text)
xml_height = int(size.find('height').text)
for obj in root.iter('object'):
position=[]
#类别信息
xml_name = str(obj.find('name').text)
if xml_name in classes_dict.keys():
xml_class=classes_dict[xml_name]
xml_box = obj.find('bndbox')
_xmin = int(xml_box.find('xmin').text)
_xmax = int(xml_box.find('xmax').text)
_ymin = int(xml_box.find('ymin').text)
_ymax = int(xml_box.find('ymax').text)
c_x=((_xmin