目录
计算机眼中的图像
读取图像
# opencv读取的格式是BGR,正常人眼看到的是RGB
import cv2 #opencv读取的格式是BGR
import matplotlib.pyplot as plt
import numpy as np
%matplotlib inline #jupyter特有的显示图像的函数
img=cv2.imread('cat. jpg')
#图像的显示,也可以创建多个窗口
cv2.imshow('image',img)
# 等待时间,毫秒级,0表示任意键终止
cv2.waitKey(0)
cv2.destroyAllWindows()
def cv_show(name, img):
    """Show *img* in a window titled *name* and block until a key is pressed.

    Args:
        name: Title of the display window.
        img: Image array to display.
    """
    cv2.imshow(name, img)
    # 0 means wait indefinitely for a key press before closing the window.
    cv2.waitKey(0)
    cv2.destroyAllWindows()
查看图像的属性:img.shape 返回【H,W,C】,此处 H=414,W=500,C=3
# Read the image as grayscale instead of colour.
img = cv2.imread('cat.jpg', cv2.IMREAD_GRAYSCALE)
灰度图展示结果
img.shape == (414, 500)【灰度图是二维图像,没有通道维度】
【灰度图展示如下】
# Save the image currently held in img to 'mycat.png'.
cv2.imwrite('mycat.png', img)
数据读取-视频
- cv2.VideoCapture可以捕获摄像头,用数字来控制不同的设备,例如0,1。
- 如果是视频文件,直接指定好路径即可。
vc = cv2.VideoCapture('test.mp4')
# Check that the source opened correctly before entering the display loop.
# The flag is called is_open (not open) so the built-in open() stays usable.
if vc.isOpened():
    # This first read only confirms that a frame can be fetched; its frame is
    # overwritten by the next read inside the loop and is never displayed.
    is_open, frame = vc.read()
else:
    is_open = False

try:
    while is_open:
        ret, frame = vc.read()
        # No frame came back: stop the loop.
        if frame is None:
            break
        if ret:
            # Convert the BGR frame to grayscale before showing it.
            gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
            cv2.imshow('result', gray)
            # Wait 10 ms per frame; key code 27 (Esc) ends playback early.
            if cv2.waitKey(10) & 0xFF == 27:
                break
finally:
    # Always release the capture and close the window, even if the loop raises.
    vc.release()
    cv2.destroyAllWindows()
截取部分图像数据(ROI)
# Reload the colour image. The path previously contained a stray space
# ('cat. jpg'), which does not match the 'cat.jpg' file used elsewhere.
img = cv2.imread('cat.jpg')
# Region of interest: a plain array slice taking rows 0-199 and columns 0-199.
cat = img[0:200, 0:200]
cv_show('cat', cat)
执行代码,切片操作
【cat=img[0:50,0:200]】
颜色通道提取
# Split the image into its three channels; OpenCV returns them in B, G, R order.
b, g, r = cv2.split(img)
# Print the red channel once (the statement was previously duplicated).
print(r)
array([[160, 164, 169, ..., 185, 184, 183], [126, 131, 136, ..., 184, 183, 182], [127, 131, 137, ..., 183, 182, 181], ..., [198, 193, 178, ..., 206, 195, 174], [176, 183, 175, ..., 188, 144, 125], [190, 190, 157, ..., 200, 145, 144]], dtype=uint8)
# Recombine the three single-channel arrays into one image, in B, G, R order.
img=cv2.merge((b,g,r))
# Inspect the dimensions of the merged array.
img.shape
(414, 500, 3)
# Show the image with only one colour channel kept, for R, then G, then B.
# Channels are stored in B, G, R order, so index 0 is blue, 1 is green and
# 2 is red; the two channels that are not kept are set to 0 on a copy.
for keep_index, window_name in ((2, 'R'), (1, 'G'), (0, 'B')):
    cur_img = img.copy()
    for channel_index in range(3):
        if channel_index != keep_index:
            cur_img[:, :, channel_index] = 0
    cv_show(window_name, cur_img)
边界填充
# Pad 50 pixels on every side.
top_size = bottom_size = left_size = right_size = 50

# BORDER_REPLICATE: repeat the outermost edge pixel.
replicate = cv2.copyMakeBorder(
    img, top_size, bottom_size, left_size, right_size,
    borderType=cv2.BORDER_REPLICATE,
)
# BORDER_REFLECT: mirror the image including the edge pixel,
# e.g. fedcba|abcdefgh|hgfedcb
reflect = cv2.copyMakeBorder(
    img, top_size, bottom_size, left_size, right_size,
    borderType=cv2.BORDER_REFLECT,
)
# BORDER_REFLECT_101: mirror around the edge pixel (the edge itself is not
# repeated), e.g. gfedcb|abcdefgh|gfedcba
reflect101 = cv2.copyMakeBorder(
    img, top_size, bottom_size, left_size, right_size,
    borderType=cv2.BORDER_REFLECT_101,
)
# BORDER_WRAP: wrap around to the opposite side, e.g. cdefgh|abcdefgh|abcdefg
wrap = cv2.copyMakeBorder(
    img, top_size, bottom_size, left_size, right_size,
    borderType=cv2.BORDER_WRAP,
)
# BORDER_CONSTANT: fill the border with a constant value (0 here).
constant = cv2.copyMakeBorder(
    img, top_size, bottom_size, left_size, right_size,
    borderType=cv2.BORDER_CONSTANT, value=0,
)
数值计算
# Load the cat and dog sample images.
img_cat=cv2.imread('cat.jpg')
img_dog=cv2.imread('dog.jpg')
# Add 10 to every element of the cat image.
img_cat2= img_cat +10
# Show the first five rows of channel 0 of the original, for comparison.
img_cat[:5,:,0]
array([[142, 146, 151, ..., 156, 155, 154], [107, 112, 117, ..., 155, 154, 153], [108, 112, 118, ..., 154, 153, 152], [139, 143, 148, ..., 156, 155, 154], [153, 158, 163, ..., 160, 159, 158]], dtype=uint8)
# Same slice after the +10 offset: first five rows of channel 0.
img_cat2[:5,:,0]
array([[152, 156, 161, ..., 166, 165, 164], [117, 122, 127, ..., 165, 164, 163], [118, 122, 128, ..., 164, 163, 162], [149, 153, 158, ..., 166, 165, 164], [163, 168, 173, ..., 170, 169, 168]], dtype=uint8)
# Adding the uint8 arrays with + wraps on overflow, i.e. the sum is taken % 256.
(img_cat + img_cat2)[:5,:,0]
越界了(超出了255的范围)就对256做取余操作
array([[ 38, 46, 56, ..., 66, 64, 62], [224, 234, 244, ..., 64, 62, 60], [226, 234, 246, ..., 62, 60, 58], [ 32, 40, 50, ..., 66, 64, 62], [ 60, 70, 80, ..., 74, 72, 70]], dtype=uint8)
# cv2.add saturates instead of wrapping: sums above 255 are clipped to 255.
cv2.add(img_cat,img_cat2)[:5,:,0]
这个函数越界的话,就取255
array([[255, 255, 255, ..., 255, 255, 255], [224, 234, 244, ..., 255, 255, 255], [226, 234, 246, ..., 255, 255, 255], [255, 255, 255, ..., 255, 255, 255], [255, 255, 255, ..., 255, 255, 255]], dtype=uint8)
图像融合
进行resize操作
# Resize the dog image. The target size is given as (width, height), so
# (500, 414) produces an array whose shape is (414, 500, 3).
img_dog = cv2.resize(img_dog, (500, 414))
img_dog.shape
# (414, 500, 3)
# Scale by a factor instead of to a fixed size: the target size is (0, 0) and
# fx / fy give the scale, 4x along x and 4x along y.
res = cv2.resize(img, (0, 0), fx=4, fy=4)
# OpenCV images are in BGR order while matplotlib displays RGB, so convert for
# display only; res itself stays in BGR order.
# NOTE(review): assumes img is a 3-channel BGR image at this point - confirm.
plt.imshow(cv2.cvtColor(res, cv2.COLOR_BGR2RGB))