OpenCV学习的第二天,唐宇迪老师的声音很好听,很温柔,清澈,让我想起了大学时光里曾经的那件白T恤是内心中永远的美好,好好挣钱,好好学习,好好生活,也许人间还是有那么一丝丝的值得。
第三节、图像处理
一、图像阈值
ret, dst = cv2.threshold(src, thresh, maxval, type)
src: 输入图,只能输入单通道图像,通常来说为灰度图
dst: 输出图
thresh: 阈值
maxval: 当像素值超过了阈值(或者小于阈值,根据type来决定),所赋予的值
type:二值化操作的类型,包含以下5种类型:
cv2.THRESH_BINARY 超过阈值部分取maxval(最大值),否则取0
cv2.THRESH_BINARY_INV THRESH_BINARY的反转
cv2.THRESH_TRUNC 大于阈值部分设为阈值,否则不变
cv2.THRESH_TOZERO 大于阈值部分不改变,否则设为0
cv2.THRESH_TOZERO_INV THRESH_TOZERO的反转
import cv2
import matplotlib.pyplot as plt
import numpy as np
# Load the sample image (OpenCV hands back BGR channel order) and derive the
# single-channel grayscale input that the thresholding calls below operate on.
img = cv2.imread('IDCard.jpg')
img_gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
print(img_gray.shape)

# Apply each of the five threshold types with thresh=127 and maxval=255.
ret, thresh1 = cv2.threshold(img_gray, 127, 255, cv2.THRESH_BINARY)
ret, thresh2 = cv2.threshold(img_gray, 127, 255, cv2.THRESH_BINARY_INV)
ret, thresh3 = cv2.threshold(img_gray, 127, 255, cv2.THRESH_TRUNC)
ret, thresh4 = cv2.threshold(img_gray, 127, 255, cv2.THRESH_TOZERO)
ret, thresh5 = cv2.threshold(img_gray, 127, 255, cv2.THRESH_TOZERO_INV)

titles = ['Original Image', 'BINARY', 'BINARY_INV', 'TRUNC', 'TOZERO', 'TOZERO_INV']
# matplotlib interprets 3-channel arrays as RGB, so reorder the channels of
# the original before plotting; otherwise its colours appear swapped.
images = [cv2.cvtColor(img, cv2.COLOR_BGR2RGB), thresh1, thresh2, thresh3, thresh4, thresh5]

# Lay the six images out on a 2x3 grid with titles and no axis ticks.
for i, (title, image) in enumerate(zip(titles, images)):
    plt.subplot(2, 3, i + 1)
    plt.imshow(image, 'gray')
    plt.title(title)
    plt.xticks([])
    plt.yticks([])
plt.show()
二、图像平滑
带噪音点的图片
图像矩阵
3*3的核
图像平滑就是对像素点进行变换
1、均值滤波(简单的平均卷积操作)
与图像矩阵求内积:$(1\times121+1\times75+1\times78+1\times24+1\times204+1\times113+1\times154+1\times104+1\times235)/9$
import cv2
import matplotlib.pyplot as plt
import numpy as np
# Show the noisy input image first.
img = cv2.imread('lenaNoise.png')
cv2.imshow('img', img)
cv2.waitKey(0)  # wait for a key press before continuing
cv2.destroyAllWindows()

# Mean filter: each pixel becomes the average of its 3x3 neighbourhood.
blur = cv2.blur(img, (3, 3))
cv2.imshow('blur', blur)
cv2.waitKey(0)
cv2.destroyAllWindows()
2、方框滤波(基本和均值一样,可以选择归一化,容易越界)
"-1"参数(ddepth)表示输出图像的深度(数据类型)与原始图像一致
"normalize=False":卷积后不做均值处理,直接相加,结果超过255的像素点直接置为255(白色)
import cv2
import matplotlib.pyplot as plt
import numpy as np
# Show the noisy input image first.
img = cv2.imread('lenaNoise.png')
cv2.imshow('img', img)
cv2.waitKey(0)  # wait for a key press before continuing
cv2.destroyAllWindows()

# Box filter with normalisation: the 3x3 window sum is divided by the window
# size. ddepth=-1 keeps the output depth equal to the input depth.
box = cv2.boxFilter(img, -1, (3, 3), normalize=True)
cv2.imshow('box', box)
cv2.waitKey(0)
cv2.destroyAllWindows()

# Without normalisation the window values are only summed, so most results
# exceed the 8-bit range and are clipped to 255 (white).
box = cv2.boxFilter(img, -1, (3, 3), normalize=False)
cv2.imshow('box', box)
cv2.waitKey(0)
cv2.destroyAllWindows()
3、高斯滤波(高斯模糊的卷积核里的数值是满足高斯分布,相当于更重视中间的)
距离越近的像素点取值应该越相似,所以卷积核对应的像素点比重应该越大
import cv2
import matplotlib.pyplot as plt
import numpy as np
# Show the noisy input image first.
img = cv2.imread('lenaNoise.png')
cv2.imshow('img', img)
cv2.waitKey(0)  # wait for a key press before continuing
cv2.destroyAllWindows()

# Gaussian blur with a 5x5 kernel; the third argument is the sigma in X.
# NOTE: the variable keeps its original spelling because the later
# side-by-side comparison snippet reads it under this name.
aussian = cv2.GaussianBlur(img, (5, 5), 1)
cv2.imshow('aussian', aussian)
cv2.waitKey(0)
cv2.destroyAllWindows()
4、中值滤波(相当于用中值代替)
5*5的卷积核,一共25个值,将这25个值从小到大排序(前面12个值,后面12个值),取排在第13位(正中间)的那个值作为该像素点的值
import cv2
import matplotlib.pyplot as plt
import numpy as np
# Show the noisy input image first.
img = cv2.imread('lenaNoise.png')
cv2.imshow('img', img)
cv2.waitKey(0)  # wait for a key press before continuing
cv2.destroyAllWindows()

# Median filter over a 5x5 window.
median = cv2.medianBlur(img, 5)
cv2.imshow('median', median)
cv2.waitKey(0)
cv2.destroyAllWindows()

# Show all results side by side. `blur` and `aussian` must already exist
# from the mean-filter and Gaussian-filter snippets run earlier.
res = np.hstack((blur, aussian, median))
cv2.imshow('median vs average', res)
cv2.waitKey(0)
cv2.destroyAllWindows()
三、形态学-腐蚀操作(前提图像是一个二值图像)
import cv2
import matplotlib.pyplot as plt
import numpy as np
# Show the input image first.
img = cv2.imread('dige.png')
cv2.imshow('img', img)
cv2.waitKey(0)  # wait for a key press before continuing
cv2.destroyAllWindows()

# Erode once with a 3x3 all-ones structuring element.
kernel = np.ones((3, 3), np.uint8)
erosion = cv2.erode(img, kernel, iterations=1)
cv2.imshow('erosion', erosion)
cv2.waitKey(0)
cv2.destroyAllWindows()
注意:毛刺没了的同时,线条也变细了
卷积核内有不同色调的像素点都要被腐蚀掉,随着迭代次数越多,腐蚀越厉害
import cv2
import matplotlib.pyplot as plt
import numpy as np
# Show the input image first.
pie = cv2.imread('pie.png')
cv2.imshow('pie', pie)
cv2.waitKey(0)  # wait for a key press before continuing
cv2.destroyAllWindows()

# Erode with a large 30x30 kernel for 1, 2 and 3 iterations so the growing
# effect of repeated erosion can be compared side by side.
kernel = np.ones((30, 30), np.uint8)
erosion_1 = cv2.erode(pie, kernel, iterations=1)
erosion_2 = cv2.erode(pie, kernel, iterations=2)
erosion_3 = cv2.erode(pie, kernel, iterations=3)
res = np.hstack((erosion_1, erosion_2, erosion_3))
cv2.imshow('res', res)
cv2.waitKey(0)
cv2.destroyAllWindows()
四、形态学-膨胀操作(图像经过腐蚀操作后去掉毛刺,然后通过膨胀操作去弥补腐蚀造成的图片伤害)
import cv2
import matplotlib.pyplot as plt
import numpy as np
# Show the input image first.
img = cv2.imread('dige.png')
cv2.imshow('img', img)
cv2.waitKey(0)  # wait for a key press before continuing
cv2.destroyAllWindows()

# Step 1: erode once with a 3x3 kernel.
kernel = np.ones((3, 3), np.uint8)
dige_erosion = cv2.erode(img, kernel, iterations=1)
cv2.imshow('erosion', dige_erosion)
cv2.waitKey(0)
cv2.destroyAllWindows()

# Step 2: dilate the eroded result with the same 3x3 kernel.
dige_dilate = cv2.dilate(dige_erosion, kernel, iterations=1)
cv2.imshow('dilate', dige_dilate)
cv2.waitKey(0)
cv2.destroyAllWindows()

# Dilate the pie image with a 30x30 kernel for 1, 2 and 3 iterations and
# compare the results side by side.
pie = cv2.imread('pie.png')
kernel = np.ones((30, 30), np.uint8)
dilate_1 = cv2.dilate(pie, kernel, iterations=1)
dilate_2 = cv2.dilate(pie, kernel, iterations=2)
dilate_3 = cv2.dilate(pie, kernel, iterations=3)
res = np.hstack((dilate_1, dilate_2, dilate_3))
cv2.imshow('res', res)
cv2.waitKey(0)
cv2.destroyAllWindows()
五、开运算与闭运算(开:先腐蚀,再膨胀)(闭:先膨胀,再腐蚀)
开:
# Opening (erode, then dilate) with a 5x5 all-ones kernel.
img = cv2.imread('dige.png')
kernel = np.ones((5, 5), np.uint8)
opening = cv2.morphologyEx(img, cv2.MORPH_OPEN, kernel)
cv2.imshow('opening', opening)
cv2.waitKey(0)  # wait for a key press before closing the window
cv2.destroyAllWindows()
闭:
# Closing (dilate, then erode) with a 5x5 all-ones kernel.
img = cv2.imread('dige.png')
kernel = np.ones((5, 5), np.uint8)
closing = cv2.morphologyEx(img, cv2.MORPH_CLOSE, kernel)
cv2.imshow('closing', closing)
cv2.waitKey(0)  # wait for a key press before closing the window
cv2.destroyAllWindows()
六、梯度运算(梯度=膨胀-腐蚀)(轮廓)
import cv2
import matplotlib.pyplot as plt
import numpy as np
# Dilate and erode the same image five times each with a 7x7 kernel and show
# both results next to each other.
pie = cv2.imread('pie.png')
kernel = np.ones((7, 7), np.uint8)
dilate = cv2.dilate(pie, kernel, iterations=5)
erosion = cv2.erode(pie, kernel, iterations=5)
res = np.hstack((dilate, erosion))
cv2.imshow('res', res)
cv2.waitKey(0)  # wait for a key press before continuing
cv2.destroyAllWindows()

# Morphological gradient (dilation minus erosion), which leaves the outline.
gradient = cv2.morphologyEx(pie, cv2.MORPH_GRADIENT, kernel)
cv2.imshow('gradient', gradient)
cv2.waitKey(0)
cv2.destroyAllWindows()
**礼帽与黑帽**
- 礼帽 = 原始输入 - 开运算结果(剩下毛刺)
- 黑帽 = 闭运算结果 - 原始输入(剩下原始图像轮廓)
# Top hat: original input minus its opening.
# NOTE: `kernel` is not defined here; it is whatever the previously run
# snippet left in scope.
img = cv2.imread('dige.png')
tophat = cv2.morphologyEx(img, cv2.MORPH_TOPHAT, kernel)
cv2.imshow('tophat', tophat)
cv2.waitKey(0)  # wait for a key press before closing the window
cv2.destroyAllWindows()
# Black hat: closing of the input minus the original input.
# NOTE: `kernel` is not defined here; it is whatever the previously run
# snippet left in scope.
img = cv2.imread('dige.png')
blackhat = cv2.morphologyEx(img, cv2.MORPH_BLACKHAT, kernel)
cv2.imshow('blackhat ', blackhat)
cv2.waitKey(0)  # wait for a key press before closing the window
cv2.destroyAllWindows()
七、图像梯度-Sobel算子
内外色差才存在梯度,梯度存在水平跟竖直两个方向上
计算时,离中心点越近的像素权重越大;水平方向梯度 = 右边 - 左边,竖直方向梯度 = 下面 - 上面
**dst = cv2.Sobel(src, ddepth, dx, dy, ksize)**
- ddepth:图像的深度
- dx和dy分别表示水平和竖直方向
- ksize是Sobel算子的大小
# Load the pie image as a single-channel grayscale image and display it.
img = cv2.imread('pie.png', cv2.IMREAD_GRAYSCALE)
cv2.imshow("img", img)
cv2.waitKey()  # no delay argument: wait for a key press
cv2.destroyAllWindows()
def cv_show(img, name):
    """Display ``img`` in a window titled ``name`` until a key is pressed.

    Args:
        img: Image array, passed unchanged to ``cv2.imshow``.
        name: Title of the display window.
    """
    cv2.imshow(name, img)
    cv2.waitKey()  # no delay argument: wait for a key press
    cv2.destroyAllWindows()
# Horizontal Sobel gradient (dx=1, dy=0) computed in 64-bit float so negative
# responses are kept in the array; it is displayed here without taking the
# absolute value.
sobelx = cv2.Sobel(img, cv2.CV_64F, 1, 0, ksize=3)
cv_show(sobelx, 'sobelx')
白到黑是正数,黑到白就是负数了,所有的负数会被截断成0,所以要取绝对值
# Horizontal gradient, converted to absolute 8-bit values so edges of either
# sign show up.
sobelx = cv2.Sobel(img, cv2.CV_64F, 1, 0, ksize=3)
sobelx = cv2.convertScaleAbs(sobelx)
cv_show(sobelx, 'sobelx')

# Vertical gradient (dx=0, dy=1), handled the same way.
sobely = cv2.Sobel(img, cv2.CV_64F, 0, 1, ksize=3)
sobely = cv2.convertScaleAbs(sobely)
cv_show(sobely, 'sobely')
分别计算x和y,再求和
# Blend the separately computed x and y gradients with equal weights.
sobelxy = cv2.addWeighted(sobelx, 0.5, sobely, 0.5, 0)
cv_show(sobelxy, 'sobelxy')
# For comparison: request both derivatives (dx=1, dy=1) in a single Sobel
# call instead of computing x and y separately and blending them.
img = cv2.imread('lena.jpg', cv2.IMREAD_GRAYSCALE)
sobelxy = cv2.Sobel(img, cv2.CV_64F, 1, 1, ksize=3)
sobelxy = cv2.convertScaleAbs(sobelxy)
cv_show(sobelxy, 'sobelxy')
直接计算的效果不好
八、图像梯度-Scharr算子(核数值加大,对差异更敏感)
九、图像梯度-laplacian算子(二阶导,变化率的导数,对变化更敏感,对噪音也敏感,效果不好)中间点与周围点的计算,与XY无关
# Differences between the gradient operators.
img = cv2.imread('lena.jpg', cv2.IMREAD_GRAYSCALE)
cv_show(img, 'img')

# Sobel: x and y gradients computed separately, then blended equally.
sobelx = cv2.Sobel(img, cv2.CV_64F, 1, 0, ksize=3)
sobely = cv2.Sobel(img, cv2.CV_64F, 0, 1, ksize=3)
sobelx = cv2.convertScaleAbs(sobelx)
sobely = cv2.convertScaleAbs(sobely)
sobelxy = cv2.addWeighted(sobelx, 0.5, sobely, 0.5, 0)

# Scharr: same procedure with the Scharr operator.
scharrx = cv2.Scharr(img, cv2.CV_64F, 1, 0)
scharry = cv2.Scharr(img, cv2.CV_64F, 0, 1)
scharrx = cv2.convertScaleAbs(scharrx)
scharry = cv2.convertScaleAbs(scharry)
scharrxy = cv2.addWeighted(scharrx, 0.5, scharry, 0.5, 0)

# Laplacian: a single call, no separate x/y passes.
laplacian = cv2.Laplacian(img, cv2.CV_64F)
laplacian = cv2.convertScaleAbs(laplacian)

# Show the three results side by side.
res = np.hstack((sobelxy, scharrxy, laplacian))
cv_show(res, 'res')
不同算子针对差异给出的不同结果
十、Canny边缘检测
图像的边缘是指图像局部区域亮度变化显著的部分,
即从一个灰度值在很小的缓冲区域内急剧变化到另一个相差较大的灰度值。
根据二维灰度矩阵梯度向量来寻找图像灰度矩阵的灰度跃变位置,然后在图像中将这些位置的点连起来就构成了所谓的图像边缘。

Canny边缘检测的步骤:
1. 使用高斯滤波器,以平滑图像,滤除噪声。(导数通常对噪声很敏感,因此必须采用滤波器来改善与噪声有关的边缘检测器的性能)
2. 计算图像中每个像素点的梯度强度和方向。
3. 应用非极大值抑制(Non-Maximum Suppression),以消除边缘检测带来的杂散响应。
4. 应用双阈值(Double-Threshold)检测来确定真实的和潜在的边缘。
5. 通过抑制孤立的弱边缘最终完成边缘检测。
import cv2
import matplotlib.pyplot as plt
import numpy as np
def cv_show(img, name):
    """Display ``img`` in a window titled ``name`` until a key is pressed.

    Args:
        img: Image array, passed unchanged to ``cv2.imshow``.
        name: Title of the display window.
    """
    cv2.imshow(name, img)
    cv2.waitKey()  # no delay argument: wait for a key press
    cv2.destroyAllWindows()
# Canny on lena with two threshold pairs, shown side by side:
# (80, 150) on the left and the lower pair (50, 100) on the right.
img = cv2.imread("lena.jpg", cv2.IMREAD_GRAYSCALE)
v1 = cv2.Canny(img, 80, 150)
v2 = cv2.Canny(img, 50, 100)
res = np.hstack((v1, v2))
cv_show(res, 'res')

# Same comparison on the car image: (120, 250) versus (50, 100).
img = cv2.imread("car.png", cv2.IMREAD_GRAYSCALE)
v1 = cv2.Canny(img, 120, 250)
v2 = cv2.Canny(img, 50, 100)
res = np.hstack((v1, v2))
cv_show(res, 'res')