统一数据集大小

最新推荐文章于 2023-06-07 15:33:30 发布

Walk Off the Earth

最新推荐文章于 2023-06-07 15:33:30 发布

阅读量314

点赞数

文章标签： python opencv 开发语言

原文链接：https://blog.csdn.net/Jimy_Lin/article/details/128182763?ops_request_misc=&request_id=&biz_id=102&utm_term=%E6%89%B9%E9%87%8F%E8%B0%83%E6%95%B4%E6%95%B0%E6%8D%AE%E9%9B%86%E5%9B%BE%E7%89%87%E5%92%8Cxml%E5%A4%A7%E5%B0%8F&utm_medium=distribute.pc_search_resu

版权

该Python脚本用于批量处理图像及其对应的XML标注文件。它首先读取原始图像和XML文件；当图像的长边超过目标尺寸时，按长边等比例缩小图像，否则保持原始大小，然后将图像贴到目标尺寸的全黑画布左上角。同时，脚本会把XML文件中的图像尺寸改为目标尺寸，并按相同比例调整每个目标的边界框坐标。最后，将处理后的图像和XML文件按五位数字序号重新命名并保存到新目录下。

摘要由CSDN通过智能技术生成

import os
import cv2
import numpy as np
import xml.etree.ElementTree as ET

# Input/output locations and target size used by the rest of the script.
img_path_old = r'E:\data\statistical_distribution\JPEGImages'  # folder with the original images
img_path_new = r'E:\data\statistical_distribution\image_resize'  # folder for the resized images
xml_path_old = r'E:\data\statistical_distribution\Annotations'  # folder with the original xml files
xml_path_new = r'E:\data\statistical_distribution\xml_resize'  # folder for the rewritten xml files
# exist_ok=True creates the folder only when needed, without the
# check-then-create race of a separate os.path.exists() test.
os.makedirs(img_path_new, exist_ok=True)
os.makedirs(xml_path_new, exist_ok=True)
c_w, c_h = 640, 640  # target image size (width, height) in pixels


def edit_xml(xml_file, ratio, i, *, src_dir=None, dst_dir=None, size=None):
    """Rescale one annotation XML file and save it under a numbered name.

    The file is expected to contain a ``size`` element with ``width`` and
    ``height`` children, and ``object`` elements that each hold a ``bndbox``
    with ``xmin``/``ymin``/``xmax``/``ymax``.  The size is overwritten with
    the target canvas size and every box coordinate is multiplied by
    *ratio* and rounded to an integer.

    Args:
        xml_file: File name of the annotation inside the source folder.
        ratio: Scale factor that was applied to the matching image.
        i: Running index; the result is written as ``'%05d.xml' % i``.
        src_dir: Folder to read from.  Defaults to the module-level
            ``xml_path_old``.
        dst_dir: Folder to write to.  Defaults to the module-level
            ``xml_path_new``.
        size: ``(width, height)`` stored in the ``size`` element.  Defaults
            to the module-level ``(c_w, c_h)``.

    Raises:
        ValueError: If the file has no ``size`` element with both ``width``
            and ``height`` children.
    """
    if src_dir is None:
        src_dir = xml_path_old
    if dst_dir is None:
        dst_dir = xml_path_new
    width, height = (c_w, c_h) if size is None else size

    tree = ET.parse(os.path.join(src_dir, xml_file))

    # Record the new canvas size.  Compare with None explicitly: an Element
    # without children is falsy, so a plain truth test would be wrong here.
    size_node = tree.find('size')
    width_node = None if size_node is None else size_node.find('width')
    height_node = None if size_node is None else size_node.find('height')
    if width_node is None or height_node is None:
        raise ValueError(
            '%s has no <size> element with <width> and <height>' % xml_file)
    width_node.text = str(width)
    height_node.text = str(height)

    # Scale the bounding box of every annotated object.
    for obj in tree.findall('object'):
        bndbox = obj.find('bndbox')
        if bndbox is None:
            # Nothing to rescale for an object that carries no box.
            continue
        for tag in ('xmin', 'ymin', 'xmax', 'ymax'):
            node = bndbox.find(tag)
            node.text = str(round(float(node.text) * ratio))

    newfile = os.path.join(dst_dir, '%05d.xml' % i)
    tree.write(newfile, method='xml', encoding='utf-8')


def letterbox_scale(w, h, target_w, target_h):
    """Return the factor that shrinks a ``w`` x ``h`` image into the target.

    The aspect ratio is preserved and images are never enlarged, so the
    result is at most 1.
    """
    return min(1.0, target_w / w, target_h / h)


def main():
    """Resize every PNG in ``img_path_old`` and rewrite its annotation.

    Each image is shrunk (if needed) to fit a ``c_w`` x ``c_h`` canvas,
    pasted into the top-left corner of an all-black canvas and saved as a
    numbered ``.jpg`` in ``img_path_new``.  The matching XML is rescaled by
    ``edit_xml`` and saved under the same number.  Images that cannot be
    read, or that have no annotation file, are reported and skipped.
    """
    # os.listdir order is arbitrary; sorting keeps the numbering reproducible.
    files = sorted(
        name for name in os.listdir(img_path_old)
        if name.lower().endswith('.png')
    )
    i = 0
    for file in files:
        imgName = os.path.join(img_path_old, file)
        # splitext swaps only the real extension, unlike str.replace which
        # would also rewrite '.png' occurring elsewhere in the name.
        xml_file = os.path.splitext(file)[0] + '.xml'
        if not os.path.isfile(os.path.join(xml_path_old, xml_file)):
            print('skipped, annotation not found: ' + imgName)
            continue

        img = cv2.imread(imgName)
        if img is None:  # cv2.imread signals failure by returning None
            print('skipped, image could not be read: ' + imgName)
            continue

        h, w = img.shape[:2]
        ratio = letterbox_scale(w, h, c_w, c_h)
        if ratio < 1:
            # Keep each side within [1, target] so rounding can neither
            # produce an empty image nor overflow the canvas.
            new_w = min(c_w, max(1, round(w * ratio)))
            new_h = min(c_h, max(1, round(h * ratio)))
            img = cv2.resize(img, (new_w, new_h))  # dsize is (width, height)
        else:
            new_w, new_h = w, h

        # NumPy image arrays are indexed (rows, cols) = (height, width).
        img_zeros = np.zeros((c_h, c_w, 3), np.uint8)
        img_zeros[0:new_h, 0:new_w] = img
        edit_xml(xml_file, ratio, i)

        newName = os.path.join(img_path_new, '%05d' % i + '.jpg')
        print(newName)
        cv2.imwrite(newName, img_zeros)
        i += 1


if __name__ == '__main__':
    main()