Tensorflow---利用Tensorflow对图像进行处理

最新推荐文章于 2024-08-20 19:06:15 发布

进我的收藏吃灰吧~~

最新推荐文章于 2024-08-20 19:06:15 发布

阅读量843

点赞数 2

分类专栏： tensorflow、目标检测--小细节问题
文章标签： python opencv 深度学习 java 计算机视觉

本文链接：https://blog.csdn.net/weixin_42206075/article/details/111387473

版权

tensorflow 同时被 2 个专栏收录

40 篇文章 3 订阅

订阅专栏

目标检测--小细节问题

18 篇文章 2 订阅

订阅专栏

Tensorflow—利用Tensorflow对图像进行处理

读取图像数据

import numpy as np
import matplotlib.pyplot as plt
import tensorflow as tf

def show_image(image):
    """Display an image array with matplotlib.

    Arrays shaped (height, width, 1) are drawn as grayscale from their single
    channel; any other 3-D array is handed to ``imshow`` unchanged. Arrays
    that are not 3-D are ignored and nothing is drawn.
    """
    dims = np.shape(image)
    if len(dims) != 3:
        # Only (height, width, channels) arrays are handled.
        return

    if dims[2] == 1:
        # Single-channel image: drop the channel axis and use a gray colormap.
        plt.imshow(image[:, :, 0], cmap='gray')
    else:
        # Multi-channel (colour) image.
        plt.imshow(image)
    plt.show()


# 1. Start an interactive session so tensors can be evaluated with `.eval()`.
sess = tf.InteractiveSession()

# 2. Read the raw bytes of the image file.
image_path = "./xiaoren.png"

file_contents = tf.read_file(image_path)
print(file_contents.eval())

# 3. Decode the PNG bytes into an image tensor shaped [height, width, channels].
#    `channels` selects how many channels the decoded tensor has:
#      0 - keep the number of channels stored in the file
#      1 - grayscale
#      3 - RGB
#      4 - RGBA
#    (tf.image.decode_image is the format-agnostic variant; for GIF input it
#    returns [num_frames, height, width, channels].)
#    RGB is requested explicitly: the colour-space steps later in this script
#    (rgb_to_grayscale, rgb_to_hsv) need exactly three channels, and with
#    channels=0 an RGBA or grayscale PNG would produce a different count.
image_tensor = tf.image.decode_png(contents=file_contents, channels=3, dtype=tf.uint8)

图像大小的重置

# tf.image.resize_images(images, size, method=ResizeMethod.BILINEAR, align_corners=False)
# Resize (enlarge or shrink) images.
#   images: tensor to resize, shaped [batch_size, height, width, channel] or
#           [height, width, channel] - a batch of images or a single image.
#   size:   2-tuple (new_height, new_width).
#   method: how the new pixel values are produced, one of tf.image.ResizeMethod:
#             BILINEAR = 0          default, bilinear interpolation
#             NEAREST_NEIGHBOR = 1  take the value of the neighbouring pixel
#             BICUBIC = 2           bicubic interpolation (the original notes
#                                   recommend it but say it runs slower)
#             AREA = 3              mean of all values in the source area
# The result has the same layout (3-D or 4-D) as `images`.
resize_image_tensor = tf.image.resize_images(
    image_tensor,
    (128, 80),
    method=tf.image.ResizeMethod.NEAREST_NEIGHBOR,
)

图像的剪切和填充

# Crop and/or pad to a target size: where the target is smaller than the
# image the image is cropped, where it is larger the image is padded.
# tf.image.resize_image_with_crop_or_pad(image, target_height, target_width)
#   image: image tensor to operate on
#   target_height, target_width: height and width of the new image
# Cropping and padding are both computed from the centre of the image.
crop_or_pad_image_tensor = tf.image.resize_image_with_crop_or_pad(image_tensor,
                                                                  target_height=800, target_width=200)
# Evaluate once and reuse the array; every .eval() call runs the graph again.
crop_or_pad_image = crop_or_pad_image_tensor.eval()
print("新的数据形状:{}".format(np.shape(crop_or_pad_image)))
show_image(crop_or_pad_image)

# Crop proportionally around the centre (keep the central 50%).
central_crop_image_tensor = tf.image.central_crop(image_tensor, central_fraction=0.5)
# print("新的数据形状:{}".format(np.shape(central_crop_image_tensor.eval())))
# show_image(central_crop_image_tensor.eval())

# Crop a box given by explicit coordinates.
# tf.image.crop_to_bounding_box(image, offset_height, offset_width,
#                               target_height, target_width)
#   offset_height: row index of the top-left corner of the crop
#   offset_width:  column index of the top-left corner of the crop
crop_to_bounding_box_image_tensor = tf.image.crop_to_bounding_box(image_tensor, 100, 20, 500, 490)
# print("新的数据形状:{}".format(np.shape(crop_to_bounding_box_image_tensor.eval())))
# show_image(crop_to_bounding_box_image_tensor.eval())

# Pad the image, placing it at a given position inside a larger canvas.
# tf.image.pad_to_bounding_box(image, offset_height, offset_width,
#                              target_height, target_width)
pad_to_bounding_box_image_tensor = tf.image.pad_to_bounding_box(image_tensor, 200, 100, 1000, 1000)
# print("新的数据形状:{}".format(np.shape(pad_to_bounding_box_image_tensor.eval())))
# show_image(pad_to_bounding_box_image_tensor.eval())

翻转、转置与旋转

# Flip vertically (swap top and bottom).
flip_up_down_image_tensor = tf.image.flip_up_down(image_tensor)
# print("新的数据形状:{}".format(np.shape(flip_up_down_image_tensor.eval())))
# show_image(flip_up_down_image_tensor.eval())

# Flip horizontally (swap left and right).
flip_left_right_image_tensor = tf.image.flip_left_right(image_tensor)
# print("新的数据形状:{}".format(np.shape(flip_left_right_image_tensor.eval())))
# show_image(flip_left_right_image_tensor.eval())

# Transpose (swap the height and width axes).
transpose_image_tensor = tf.image.transpose_image(image_tensor)
# print("新的数据形状:{}".format(np.shape(transpose_image_tensor.eval())))
# show_image(transpose_image_tensor.eval())


# Rotate in steps of 90 degrees (90, 180, 270, 360); k=3 asks for three steps.
rot90_image_tensor = tf.image.rot90(image_tensor, k=3)
# print("新的数据形状:{}".format(np.shape(rot90_image_tensor.eval())))
# show_image(rot90_image_tensor.eval())

颜色空间的转换

# NOTE: convert the pixel data to float before colour-space conversion
#       (rgb_to_hsv rejects uint8 input, see the TypeError quoted below).
# NOTE: pixel values can be stored as integers in 0~255 or as floats in 0~1.
# print(image_tensor.eval())
float_image_tensor = tf.image.convert_image_dtype(image_tensor, dtype=tf.float32)
# print(float_image_tensor.eval())
# RGB -> Gray
gray_image_tensor = tf.image.rgb_to_grayscale(float_image_tensor)
# print("新的数据形状:{}".format(np.shape(gray_image_tensor.eval())))
# show_image(gray_image_tensor.eval())

# RGB -> HSV
#   RGB describes a colour by its red, green and blue components;
#   HSV describes it by hue (H), saturation (S) and value/brightness (V).
# Passing the uint8 `image_tensor` here instead of the float tensor raises:
# TypeError: Value passed to parameter 'images' has DataType uint8 not in list of allowed values: float32, float64
hsv_image_tensor = tf.image.rgb_to_hsv(float_image_tensor)
# print("新的数据形状:{}".format(np.shape(hsv_image_tensor.eval())))
# # An HSV tensor does not display well when shown as if it were RGB...
# show_image(hsv_image_tensor.eval())

# hsv -> rgb
rgb_image_tensor = tf.image.hsv_to_rgb(hsv_image_tensor)
# print("新的数据形状:{}".format(np.shape(rgb_image_tensor.eval())))
# show_image(rgb_image_tensor.eval())

# gray -> rgb (this rebinds rgb_image_tensor; the hsv -> rgb result above is
# only reachable through the name until this line runs)
rgb_image_tensor = tf.image.grayscale_to_rgb(gray_image_tensor)
# print("新的数据形状:{}".format(np.shape(rgb_image_tensor.eval())))
# show_image(rgb_image_tensor.eval())

# Binarization of the grayscale image (0 is black, 1 is white).
a = gray_image_tensor
# Boolean mask: True where the pixel value is <= 0.9.
b = tf.less_equal(a, 0.9)
# tf.where(condition, x=None, y=None, name=None)
#   condition: boolean tensor
#   x: value taken where condition is True
#   y: value taken where condition is False
#   NOTE: condition, x and y are expected to have the same shape.
# c: pixels > 0.9 become 0, pixels <= 0.9 keep their original value.
c = tf.where(condition=b, x=a, y=tf.zeros_like(a))
# d: pixels <= 0.9 become 1, pixels > 0.9 become 0 (the value c holds there).
d = tf.where(condition=b, x=tf.ones_like(a), y=tf.zeros_like(a))
# print("新的数据形状:{}".format(np.shape(d.eval())))
# show_image(d.eval())

图像的调整

# Brightness adjustment
# tf.image.adjust_brightness(image, delta)
#   image: image tensor to adjust
#   delta: amount added to the pixel values, expected in (-1, 1); positive
#          brightens, negative darkens.
# The image is converted to a float representation, delta is added to every
# component, and the result is converted back to the original dtype (no HSV
# round trip is involved).
adjust_brightness_image_tensor = tf.image.adjust_brightness(image_tensor, delta=-0.5)
# print("新的数据形状:{}".format(np.shape(adjust_brightness_image_tensor.eval())))
# show_image(adjust_brightness_image_tensor.eval())

# Hue adjustment
# delta: amount added to the hue channel, expected in [-1, 1].
# rgb -> hsv -> h+delta,s,v -> rgb
adjust_hue_image_tensor = tf.image.adjust_hue(image_tensor, delta=-0.8)
# print("新的数据形状:{}".format(np.shape(adjust_hue_image_tensor.eval())))
# show_image(adjust_hue_image_tensor.eval())

# Saturation adjustment
# saturation_factor: factor the saturation channel is multiplied by.
# rgb -> hsv -> h,s*saturation_factor,v -> rgb
adjust_saturation_image_tensor = tf.image.adjust_saturation(image_tensor, saturation_factor=20)
# print("新的数据形状:{}".format(np.shape(adjust_saturation_image_tensor.eval())))
# show_image(adjust_saturation_image_tensor.eval())

# Contrast adjustment
# Computed per channel as: (x - mean) * contrast_factor + mean
adjust_contrast_image_tensor = tf.image.adjust_contrast(image_tensor, contrast_factor=20)
# print("新的数据形状:{}".format(np.shape(adjust_contrast_image_tensor.eval())))
# show_image(adjust_contrast_image_tensor.eval())

# Gamma correction (the original notes require a floating-point image, so the
# float tensor is passed here).
adjust_gamma_image_tensor = tf.image.adjust_gamma(float_image_tensor, gamma=100)
# print("新的数据形状:{}".format(np.shape(adjust_gamma_image_tensor.eval())))
# show_image(adjust_gamma_image_tensor.eval())

# Per-image standardization (per the original notes, one image at a time).
per_image_standardization_image_tensor = tf.image.per_image_standardization(image_tensor)
# print("新的数据形状:{}".format(np.shape(per_image_standardization_image_tensor.eval())))
# show_image(per_image_standardization_image_tensor.eval())

# Add Gaussian noise.
# The noise is added in float32 on the 0~255 scale, then the sum is clipped,
# rounded and cast back to uint8. Casting the signed noise straight to uint8
# and adding in uint8 would mangle negative samples and could wrap around.
# The noise takes its shape from the image rather than a fixed [600, 510, 3].
noise_tensor = 5 * tf.random_normal(shape=tf.shape(image_tensor), mean=0, stddev=0.1)
noisy_image_tensor = tf.cast(
    tf.round(tf.clip_by_value(tf.cast(image_tensor, tf.float32) + noise_tensor, 0.0, 255.0)),
    tf.uint8)
# print("新的数据形状:{}".format(np.shape(noisy_image_tensor.eval())))
# show_image(noisy_image_tensor.eval())

# Write the session graph to an event file so it can be inspected in TensorBoard.
writer = tf.summary.FileWriter("./model/test03", sess.graph)
writer.close()