参考:
1、http://blog.csdn.net/tintinetmilou/article/details/74910558
2、http://blog.csdn.net/tintinetmilou/article/details/75194703
3、https://github.com/davisking/dlib/
4、http://dlib.net
本文主要用到的是 Python API 中的 dlib.correlation_tracker 类,Python API 文档里有关于各个函数的详细介绍。
单目标跟踪
# -*- coding: UTF-8 -*-
import os
import glob
import cv2
import dlib
# Directory that holds the video frames (main() globs it for *.jpg files)
video_folder = os.path.join("..", "examples", "video_frames")

# The correlation tracker has to exist before main() can start a track on it
tracker = dlib.correlation_tracker()

# Mouse-selection state, rewritten by the onmouse() callback:
#   selection    - box currently being dragged, as (xmin, ymin, xmax, ymax)
#   track_window - box confirmed by releasing the left button
#   drag_start   - (x, y) where the current drag began
selection = track_window = drag_start = None
def onmouse(event, x, y, flags, param):
    """Mouse callback that turns a left-button drag into a selection box.

    Updates the module-level ``drag_start``, ``selection`` and
    ``track_window``. ``flags`` and ``param`` are accepted because the
    callback signature requires them; they are not used.
    """
    global selection, track_window, drag_start

    if event == cv2.EVENT_LBUTTONDOWN:
        # A new drag begins: remember its anchor and drop any confirmed box.
        drag_start, track_window = (x, y), None

    if drag_start:
        # Normalise the box so it is valid whichever way the user drags.
        anchor_x, anchor_y = drag_start
        selection = (
            min(x, anchor_x),
            min(y, anchor_y),
            max(x, anchor_x),
            max(y, anchor_y),
        )

    if event == cv2.EVENT_LBUTTONUP:
        # Drag finished: the live selection becomes the confirmed box.
        track_window, selection, drag_start = selection, None, None
def main():
    """Track one mouse-selected object through the JPEG frames in ``video_folder``.

    The first readable frame is displayed until the user has dragged a box
    around the target and pressed Enter. That box seeds ``tracker``; every
    later frame is passed to ``tracker.update`` and the predicted box is
    drawn on the frame before it is shown.
    """
    # Enter may be reported as 10 (LF) or 13 (CR) depending on the platform.
    enter_keys = (10, 13)

    cv2.namedWindow('image', 1)
    cv2.setMouseCallback('image', onmouse)

    # Explicit flag instead of "k == 0": the first file may be unreadable.
    started = False
    try:
        # We will track the frames as we load them off of disk
        for k, f in enumerate(sorted(glob.glob(os.path.join(video_folder, "*.jpg")))):
            print("Processing Frame {}".format(k))
            img_raw = cv2.imread(f)
            if img_raw is None:
                # cv2.imread returns None instead of raising on a bad file.
                print("Could not read frame {}".format(f))
                continue
            image = img_raw.copy()

            if not started:
                # Box the object with the mouse, then press Enter to start.
                while True:
                    img_first = image.copy()
                    box = track_window or selection
                    if box:
                        cv2.rectangle(img_first, (box[0], box[1]), (box[2], box[3]), (0, 0, 255), 1)
                    cv2.imshow('image', img_first)
                    # Mask to the low byte: some builds set higher bits.
                    key = cv2.waitKey(10) & 0xFF
                    # Ignore Enter until a box has actually been confirmed,
                    # otherwise track_window is None and cannot be unpacked.
                    if key in enter_keys and track_window:
                        break
                tracker.start_track(image, dlib.rectangle(*track_window))
                started = True
            else:
                # Else we just attempt to track from the previous frame
                tracker.update(image)

            # get_position() yields float coordinates; OpenCV needs ints.
            box_predict = tracker.get_position()
            cv2.rectangle(
                image,
                (int(box_predict.left()), int(box_predict.top())),
                (int(box_predict.right()), int(box_predict.bottom())),
                (0, 0, 255),
                1,
            )
            cv2.imshow('image', image)
            cv2.waitKey(10)
    finally:
        # Close the window even if tracking raised part-way through.
        cv2.destroyAllWindows()


if __name__ == '__main__':
    main()
该py文件放在此下载,视频文件(其实是每帧的图片)在此下载。
- 程序运行后,会显示出第一帧,用鼠标框一个要跟踪的物体
- 框好后按回车进行跟踪
代码分析
- 用opencv的鼠标GUI操作来在第一帧框住要跟踪的目标,这只需要在显示框上设置一个回调函数,来返回鼠标框到的框的坐标。
- 根据框好的框确定要跟踪的目标物体,并传入tracker.start_track中
- 按回车进行跟踪 ,之后用tracker.update(image)来追踪当前帧。tracker.get_position()返回追踪到的框,但要注意的是返回的这个框的数据类型是Dlib中的drectangle,不能直接传给我们显示所用的Opencv函数,所以我们通过drectangle操作函数来将框的坐标信息读出来(关于dlib.drectangle,详细信息去Python API中查)。
- 最后根据跟踪得到的框在图片显示时框出来就好了。
总结一下,使用 dlib.correlation_tracker分四步:
1. 用dlib.correlation_tracker()创建一个跟踪类
2. start_track中设置图片中的要跟踪物体的框
3. update()中输入要跟踪的下一帧图片
4. get_position()得到跟踪到的目标在新一帧中框的位置
视频跟踪
# -*- coding: UTF-8 -*-
import os
import glob
import cv2
import dlib
import time
# Path to the video
video_folder = os.path.join("vtest.avi")
cap = cv2.VideoCapture(video_folder)
if not cap.isOpened():
    print("Could not open video", video_folder)
    # Raise SystemExit directly: the bare exit() helper is injected by the
    # site module for interactive sessions and is not meant for programs.
    raise SystemExit(-1)
# Create the correlation tracker - the object needs to be initialized before it can be used
tracker = dlib.correlation_tracker()
# Mouse-selection state, rewritten by the onmouse() callback:
selection = None     # box currently being dragged, as (xmin, ymin, xmax, ymax)
track_window = None  # box confirmed by releasing the left button
drag_start = None    # (x, y) where the current drag began
def onmouse(event, x, y, flags, param):
    """Mouse callback that turns a left-button drag into a selection box.

    Updates the module-level ``drag_start``, ``selection`` and
    ``track_window``. ``flags`` and ``param`` are accepted because the
    callback signature requires them; they are not used.
    """
    global selection, track_window, drag_start

    if event == cv2.EVENT_LBUTTONDOWN:
        # A new drag begins: remember its anchor and drop any confirmed box.
        drag_start, track_window = (x, y), None

    if drag_start:
        # Normalise the box so it is valid whichever way the user drags.
        anchor_x, anchor_y = drag_start
        selection = (
            min(x, anchor_x),
            min(y, anchor_y),
            max(x, anchor_x),
            max(y, anchor_y),
        )

    if event == cv2.EVENT_LBUTTONUP:
        # Drag finished: the live selection becomes the confirmed box.
        track_window, selection, drag_start = selection, None, None
def main():
    """Track one mouse-selected object through the video opened in ``cap``.

    The first frame is displayed until the user has dragged a box around the
    target and pressed ESC (or Enter). That box seeds ``tracker``; every
    later frame is passed to ``tracker.update`` and the predicted box is
    drawn on it. Pressing ESC while tracking stops playback.
    """
    esc_key = 27
    # ESC is the original confirm key; Enter (10 or 13, platform dependent)
    # is accepted too, since the on-screen instructions mention it.
    confirm_keys = (esc_key, 10, 13)

    cv2.namedWindow('image', 1)
    cv2.setMouseCallback('image', onmouse)

    k = 0
    try:
        while True:
            ret, frame = cap.read()
            if not ret:
                print("Game over!")
                break
            print("Processing Frame {}".format(k))
            image = frame.copy()

            # We need to initialize the tracker on the first frame
            if k == 0:
                # Box the object with the mouse, then confirm to start.
                while True:
                    img_first = image.copy()
                    box = track_window or selection
                    if box:
                        cv2.rectangle(img_first, (box[0], box[1]), (box[2], box[3]), (0, 0, 255), 1)
                    cv2.imshow('image', img_first)
                    # Mask to the low byte, as the playback check below does.
                    key = cv2.waitKey(10) & 0xFF
                    # Ignore the key until a box has actually been confirmed,
                    # otherwise track_window is None and cannot be unpacked.
                    if key in confirm_keys and track_window:
                        break
                tracker.start_track(image, dlib.rectangle(*track_window))
            else:
                # Else we just attempt to track from the previous frame
                tracker.update(image)

            # get_position() yields float coordinates; OpenCV needs ints.
            box_predict = tracker.get_position()
            cv2.rectangle(
                image,
                (int(box_predict.left()), int(box_predict.top())),
                (int(box_predict.right()), int(box_predict.bottom())),
                (0, 0, 255),
                1,
            )
            cv2.imshow('image', image)
            if (cv2.waitKey(10) & 0xFF) == esc_key:
                break
            k += 1
    finally:
        # Free the capture and close the window on every exit path.
        cap.release()
        cv2.destroyAllWindows()


if __name__ == '__main__':
    main()
多目标跟踪
# -*- coding: UTF-8 -*-
import os
import glob
import cv2
import dlib
import time
# Path to the video
video_folder = os.path.join("vtest.avi")
cap = cv2.VideoCapture(video_folder)
if not cap.isOpened():
    print("Could not open video", video_folder)
    # Raise SystemExit directly: the bare exit() helper is injected by the
    # site module for interactive sessions and is not meant for programs.
    raise SystemExit(-1)
# Create the correlation tracker - the object needs to be initialized before it can be used
# One tracker per target; three targets are tracked
tracker1 = dlib.correlation_tracker()
tracker2 = dlib.correlation_tracker()
tracker3 = dlib.correlation_tracker()
# Mouse-selection state, rewritten by the onmouse() callback:
selection = None     # box currently being dragged, as (xmin, ymin, xmax, ymax)
track_window = None  # box confirmed by releasing the left button
drag_start = None    # (x, y) where the current drag began
# Mouse box selection (the box becomes a tracking target)
def onmouse(event, x, y, flags, param):
    """Mouse callback that turns a left-button drag into a selection box.

    Updates the module-level ``drag_start``, ``selection`` and
    ``track_window``. ``flags`` and ``param`` are accepted because the
    callback signature requires them; they are not used.
    """
    global selection, track_window, drag_start

    if event == cv2.EVENT_LBUTTONDOWN:
        # A new drag begins: remember its anchor and drop any confirmed box.
        drag_start, track_window = (x, y), None

    if drag_start:
        # Normalise the box so it is valid whichever way the user drags.
        anchor_x, anchor_y = drag_start
        selection = (
            min(x, anchor_x),
            min(y, anchor_y),
            max(x, anchor_x),
            max(y, anchor_y),
        )

    if event == cv2.EVENT_LBUTTONUP:
        # Drag finished: the live selection becomes the confirmed box.
        track_window, selection, drag_start = selection, None, None
def main():
    """Track three mouse-selected objects through the video opened in ``cap``.

    On the first frame the user drags a box and presses ESC (or Enter) to
    confirm it, three times in a row; one more key press starts tracking.
    Each confirmed box seeds one of ``tracker1``..``tracker3``. Every later
    frame is passed to all trackers and each predicted box is drawn in that
    tracker's colour. Pressing ESC while tracking stops playback.
    """
    # Cleared after each confirmation so one box cannot seed two trackers.
    global track_window

    esc_key = 27
    # ESC is the original confirm key; Enter (10 or 13, platform dependent)
    # is accepted too, since the on-screen instructions mention it.
    confirm_keys = (esc_key, 10, 13)

    trackers = (tracker1, tracker2, tracker3)
    # Colour per tracker, used for both the confirmed and the tracked box.
    colors = ((0, 255, 255), (0, 255, 100), (200, 0, 200))
    confirmed = []  # boxes accepted so far, in tracker order

    cv2.namedWindow('image', 1)
    cv2.setMouseCallback('image', onmouse)

    k = 0
    try:
        while True:
            ret, frame = cap.read()
            if not ret:
                print("Game over!")
                break
            print("Processing Frame {}".format(k))
            image = frame.copy()

            # We need to initialize the trackers on the first frame
            if k == 0:
                while True:
                    img_first = image.copy()
                    # Box being drawn or awaiting confirmation, in red.
                    pending = track_window or selection
                    if pending:
                        cv2.rectangle(img_first, (pending[0], pending[1]),
                                      (pending[2], pending[3]), (0, 0, 255), 1)
                    # Targets already confirmed, each in its own colour.
                    for box, color in zip(confirmed, colors):
                        cv2.rectangle(img_first, (box[0], box[1]), (box[2], box[3]), color, 1)
                    cv2.imshow('image', img_first)

                    # Mask to the low byte, as the playback check below does.
                    if (cv2.waitKey(10) & 0xFF) not in confirm_keys:
                        continue
                    if len(confirmed) == len(trackers):
                        # All targets chosen: this key press starts tracking.
                        break
                    if track_window:
                        confirmed.append(track_window)
                        track_window = None

                for tracker, box in zip(trackers, confirmed):
                    tracker.start_track(image, dlib.rectangle(*box))
            else:
                # Else we just attempt to track from the previous frame
                for tracker in trackers:
                    tracker.update(image)

            # get_position() yields float coordinates; OpenCV needs ints.
            for tracker, color in zip(trackers, colors):
                predicted = tracker.get_position()
                cv2.rectangle(
                    image,
                    (int(predicted.left()), int(predicted.top())),
                    (int(predicted.right()), int(predicted.bottom())),
                    color,
                    1,
                )
            cv2.imshow('image', image)
            if (cv2.waitKey(10) & 0xFF) == esc_key:
                break
            k += 1
    finally:
        # Free the capture and close the window on every exit path.
        cap.release()
        cv2.destroyAllWindows()


if __name__ == '__main__':
    main()
- 用鼠标框要跟踪的物体,框完按 ESC 键确认(原本用回车键,但回车键的检测有问题,所以代码中改用 ESC),同样的手法连框三个
- 三个目标都确认后,再按一次 ESC 键开始跟踪