深度学习模型训练之数据增强

最新推荐文章于 2024-07-06 21:27:32 发布

知行SUN

最新推荐文章于 2024-07-06 21:27:32 发布

阅读量705

点赞数

分类专栏：图像算法 深度学习 python 文章标签：深度学习 python

本文链接：https://blog.csdn.net/excellent_sun/article/details/108866359

版权

图像算法同时被 3 个专栏收录

20 篇文章 0 订阅

订阅专栏

python

13 篇文章 0 订阅

订阅专栏

深度学习

9 篇文章 0 订阅

订阅专栏

数据增强

import random
import numpy as np
import cv2
from PIL import Image
import os

# Module-level switches read by augmentation().

# Target length (pixels) of the longer image side for the resize stage;
# a falsy value skips resizing altogether.
base_size = 1024
# When True, the longer side is drawn at random from
# [0.5 * base_size, 2.0 * base_size] instead of being exactly base_size.
scale = True
# When True, rotate by a random integer angle in [-10, 10] degrees.
rotate = True
# Side length (pixels) of the square random crop; smaller inputs are padded
# on the bottom/right with zeros first. A falsy value skips pad + crop.
crop_size = 1200
# When True, mirror image and label left-right when random.random() > 0.5.
flip = True
# When True, apply a Gaussian blur with a random sigma in [0, 1) to the image only.
blur = False

def augmentation(pp_path, image, label):
    """Run a random resize / rotate / pad-and-crop / flip / blur chain on an image-label pair.

    Each stage is switched by the module-level settings ``base_size``,
    ``scale``, ``rotate``, ``crop_size``, ``flip`` and ``blur``. The geometric
    stages are applied to both arrays (linear interpolation for ``image``,
    nearest-neighbour for ``label``); the blur is applied to ``image`` only.

    Side effect: after the resize, rotate, crop and flip stages the current
    image is written into ``pp_path`` as ``rgb_resize.jpg``, ``rgb_rotate.jpg``,
    ``rgb_crop.jpg`` and ``rgb_flip.jpg``. The files are written even when the
    corresponding stage is disabled.

    Args:
        pp_path: Directory that receives the intermediate JPEG snapshots.
        image: Array whose shape unpacks as (height, width, channels).
        label: Array transformed in lock-step with ``image``
            (presumably a per-pixel annotation of the same height/width;
            verify against the caller).

    Returns:
        The tuple ``(image, label)`` holding the augmented arrays.
    """

    def _snapshot(array, file_name):
        # Persist the current stage so the pipeline can be inspected visually.
        Image.fromarray(array).save(os.path.join(pp_path, file_name))

    rows, cols, _ = image.shape

    # Stage 1 - resize: the longer side becomes `long_side`, the shorter side
    # is rounded to keep the aspect ratio.
    if base_size:
        long_side = (
            random.randint(int(base_size * 0.5), int(base_size * 2.0))
            if scale
            else base_size
        )
        if rows > cols:
            rows, cols = long_side, int(1.0 * long_side * cols / rows + 0.5)
        else:
            rows, cols = int(1.0 * long_side * rows / cols + 0.5), long_side
        target = (cols, rows)  # OpenCV sizes are (width, height)
        image = cv2.resize(image, target, interpolation=cv2.INTER_LINEAR)
        label = cv2.resize(label, target, interpolation=cv2.INTER_NEAREST)
    _snapshot(image, "rgb_resize.jpg")

    # Stage 2 - rotate about the image centre by an integer angle in [-10, 10].
    # No borderMode is passed, so OpenCV's default border handling applies.
    rows, cols, _ = image.shape
    if rotate:
        degrees = random.randint(-10, 10)
        warp = cv2.getRotationMatrix2D((cols / 2, rows / 2), degrees, 1.0)
        canvas = (cols, rows)
        image = cv2.warpAffine(image, warp, canvas, flags=cv2.INTER_LINEAR)
        label = cv2.warpAffine(label, warp, canvas, flags=cv2.INTER_NEAREST)
    _snapshot(image, "rgb_rotate.jpg")

    # Stage 3 - zero-pad on the bottom/right up to crop_size, then take a
    # random crop_size x crop_size window from both arrays.
    if crop_size:
        extra_rows = max(crop_size - rows, 0)
        extra_cols = max(crop_size - cols, 0)
        if extra_rows > 0 or extra_cols > 0:
            border = dict(
                top=0,
                bottom=extra_rows,
                left=0,
                right=extra_cols,
                borderType=cv2.BORDER_CONSTANT,
                value=0,
            )
            image = cv2.copyMakeBorder(image, **border)
            label = cv2.copyMakeBorder(label, **border)

        rows, cols, _ = image.shape
        top = random.randint(0, rows - crop_size)
        left = random.randint(0, cols - crop_size)
        window = (slice(top, top + crop_size), slice(left, left + crop_size))
        image = image[window]
        label = label[window]
    _snapshot(image, "rgb_crop.jpg")

    # Stage 4 - horizontal flip, taken when the random draw exceeds 0.5.
    if flip and random.random() > 0.5:
        image = np.fliplr(image).copy()
        label = np.fliplr(label).copy()
    _snapshot(image, "rgb_flip.jpg")

    # Stage 5 - Gaussian blur (image only) with sigma drawn from [0, 1).
    if blur:
        sigma = random.random()
        kernel = int(3.3 * sigma)
        if kernel % 2 == 0:
            kernel += 1  # bump even sizes (including 0) to the next odd value
        image = cv2.GaussianBlur(
            image,
            (kernel, kernel),
            sigmaX=sigma,
            sigmaY=sigma,
            borderType=cv2.BORDER_REFLECT_101,
        )
    return image, label


if __name__ == '__main__':
    # Demo run on one hard-coded sample directory: the RGB picture is
    # "rgb_image_align.jpg" and the label picture is named after the
    # directory's last path component with a ".png" suffix.
    sample_dir = "/data/realseeData/test/pano-surface/73de190196212982ee0ed55ef3686496/derived/1552296451"
    rgb_file = os.path.join(sample_dir, "rgb_image_align.jpg")
    label_file = os.path.join(sample_dir, sample_dir.split("/")[-1] + ".png")
    rgb_pixels = np.array(Image.open(rgb_file))
    label_pixels = np.array(Image.open(label_file))
    image, label = augmentation(sample_dir, rgb_pixels, label_pixels)

知行SUN

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
打赏
0
评论
深度学习模型训练之数据增强

数据增强 import random import numpy as np import cv2 from PIL import Image import os base_size = 1024 scale = True rotate = True crop_size = 1200 flip = True blur = False def augmentation(pp_path, image, label): h, w, _ = image.shape # Scaling, we se…
复制链接

扫一扫