Dlib实现目标跟踪

参考:
1、http://blog.csdn.net/tintinetmilou/article/details/74910558
2、http://blog.csdn.net/tintinetmilou/article/details/75194703
3、https://github.com/davisking/dlib/
4、http://dlib.net


本文主要用到的是Python API中的dlib.correlation_tracker类,Python API文档里面有关于各个函数的详细介绍。

单目标跟踪

# -*- coding: UTF-8 -*-

import os
import glob
import cv2
import dlib

# Directory that main() scans for "*.jpg" frame images
video_folder = os.path.join("..", "examples", "video_frames")

# The correlation tracker must exist before start_track()/update() can be called on it
tracker = dlib.correlation_tracker()

# Mouse-selection state shared between onmouse() and main():
#   selection    - box currently being dragged, as (xmin, ymin, xmax, ymax)
#   track_window - box fixed when the left button was released
#   drag_start   - (x, y) where the current drag began
selection = track_window = drag_start = None

def onmouse(event, x, y, flags, param):
    """Mouse callback that maintains the rubber-band selection state.

    Updates the module-level ``drag_start``, ``selection`` and
    ``track_window`` variables:

    * left button down - start a drag at (x, y) and clear ``track_window``;
    * any event while a drag is active - set ``selection`` to the box spanned
      by the drag origin and the current cursor position;
    * left button up - end the drag, move ``selection`` into ``track_window``
      and clear ``selection``.

    ``flags`` and ``param`` are accepted for the callback signature but unused.
    """
    global selection, track_window, drag_start

    if event == cv2.EVENT_LBUTTONDOWN:
        # A new drag starts here; any previously fixed box is discarded.
        drag_start, track_window = (x, y), None

    if drag_start:
        anchor_x, anchor_y = drag_start
        # Order the coordinates so the box is valid for any drag direction.
        left, right = sorted((x, anchor_x))
        top, bottom = sorted((y, anchor_y))
        selection = (left, top, right, bottom)

    if event == cv2.EVENT_LBUTTONUP:
        # The right-hand side is evaluated first, so track_window receives the
        # selection as it was before being reset to None.
        drag_start, track_window, selection = None, selection, None

def main():
    """Track one mouse-selected object through the frames in ``video_folder``.

    The first readable frame is shown until the user has drawn a box with the
    mouse and pressed Enter; that box seeds ``tracker``. Every later frame is
    passed to ``tracker.update`` and the tracked box is drawn on it.
    """
    cv2.namedWindow('image', 1)
    cv2.setMouseCallback('image', onmouse)

    # Enter arrives as LF (10) or CR (13) depending on the GUI backend.
    enter_keys = (10, 13)
    started = False

    try:
        # We will track the frames as we load them off of disk
        for k, f in enumerate(sorted(glob.glob(os.path.join(video_folder, "*.jpg")))):
            print("Processing Frame {}".format(k))
            image = cv2.imread(f)
            if image is None:
                # cv2.imread returns None instead of raising for an unreadable file.
                print("Could not read frame {}, skipping".format(f))
                continue

            if not started:
                # Initialise on the first readable frame: box the object with
                # the mouse, then press Enter to start tracking.
                while True:
                    img_first = image.copy()
                    box = track_window or selection
                    if box:
                        cv2.rectangle(img_first, box[:2], box[2:], (0, 0, 255), 1)
                    cv2.imshow('image', img_first)
                    # Mask to the low byte: some backends set extra high bits.
                    key = cv2.waitKey(10) & 0xFF
                    confirmed = track_window
                    # Ignore Enter until a box exists; otherwise the rectangle
                    # below would be built from None.
                    if key in enter_keys and confirmed:
                        break
                tracker.start_track(image, dlib.rectangle(*confirmed))
                started = True
            else:
                # Else we just attempt to track from the previous frame
                tracker.update(image)

            # Draw the tracker's current box on the frame being shown
            box_predict = tracker.get_position()
            cv2.rectangle(image,
                          (int(box_predict.left()), int(box_predict.top())),
                          (int(box_predict.right()), int(box_predict.bottom())),
                          (0, 0, 255), 1)
            cv2.imshow('image', image)
            cv2.waitKey(10)
    finally:
        # Close the window even if tracking aborts with an error.
        cv2.destroyAllWindows()

# Run the demo only when this file is executed as a script, not on import.
if __name__ == '__main__':
    main()

该py文件放在此下载,视频文件(其实是每帧的图片)在此下载

  • 程序运行后,会显示出第一帧,用鼠标框一个要跟踪的物体
  • 框好后按回车进行跟踪

代码分析

  • 用opencv的鼠标GUI操作来在第一帧框住要跟踪的目标,这只需要在显示框上设置一个回调函数,来返回鼠标框到的框的坐标。
  • 根据框好的框确定要跟踪的目标物体,并传入tracker.start_track中
  • 按回车进行跟踪 ,之后用tracker.update(image)来追踪当前帧。tracker.get_position()返回追踪到的框,但要注意的是返回的这个框的数据类型是Dlib中的drectangle,不能直接传给我们显示所用的Opencv函数,所以我们通过drectangle操作函数来将框的坐标信息读出来(关于dlib.drectangle,详细信息去Python API中查)。
  • 最后根据跟踪得到的框在图片显示时框出来就好了。

总结一下,使用 dlib.correlation_tracker分四步:
1. 用dlib.correlation_tracker()创建一个跟踪类
2. start_track中设置图片中的要跟踪物体的框
3. update()中输入要跟踪的下一帧图片
4. get_position()得到跟踪到的目标在新一帧中框的位置


视频跟踪

# -*- coding: UTF-8 -*-

import os
import glob
import cv2
import dlib
import time

# Path to the video file (the variable keeps its historical name although it
# refers to a file, not a folder)
video_folder = os.path.join("vtest.avi")
cap = cv2.VideoCapture(video_folder)
if not cap.isOpened():
    print("Could not open video", video_folder)
    # Raise SystemExit directly: the bare exit() helper is installed by the
    # site module for interactive use and is not guaranteed to exist.
    raise SystemExit(-1)

# Create the correlation tracker - the object needs to be initialized before it can be used
tracker = dlib.correlation_tracker()

# Mouse-selection state shared between onmouse() and main():
#   selection    - box currently being dragged, as (xmin, ymin, xmax, ymax)
#   track_window - box fixed when the left button was released
#   drag_start   - (x, y) where the current drag began
selection = None
track_window = None
drag_start = None

def onmouse(event, x, y, flags, param):
    """Mouse callback that maintains the rubber-band selection state.

    Updates the module-level ``drag_start``, ``selection`` and
    ``track_window`` variables:

    * left button down - start a drag at (x, y) and clear ``track_window``;
    * any event while a drag is active - set ``selection`` to the box spanned
      by the drag origin and the current cursor position;
    * left button up - end the drag, move ``selection`` into ``track_window``
      and clear ``selection``.

    ``flags`` and ``param`` are accepted for the callback signature but unused.
    """
    global selection, track_window, drag_start

    if event == cv2.EVENT_LBUTTONDOWN:
        # A new drag starts here; any previously fixed box is discarded.
        drag_start, track_window = (x, y), None

    if drag_start:
        anchor_x, anchor_y = drag_start
        # Order the coordinates so the box is valid for any drag direction.
        left, right = sorted((x, anchor_x))
        top, bottom = sorted((y, anchor_y))
        selection = (left, top, right, bottom)

    if event == cv2.EVENT_LBUTTONUP:
        # The right-hand side is evaluated first, so track_window receives the
        # selection as it was before being reset to None.
        drag_start, track_window, selection = None, selection, None

def main():
    """Track one mouse-selected object through the video opened as ``cap``.

    The first frame is shown until the user has drawn a box with the mouse and
    confirmed it with ESC or Enter; that box seeds ``tracker``. Each following
    frame is passed to ``tracker.update`` and the tracked box is drawn on it.
    Pressing ESC during playback stops early. The capture is released and the
    window closed on exit.
    """
    cv2.namedWindow('image', 1)
    cv2.setMouseCallback('image', onmouse)

    esc_key = 27
    # Confirm with ESC, or Enter (LF 10 / CR 13 depending on the GUI backend).
    confirm_keys = (esc_key, 10, 13)

    k = 0
    try:
        while True:
            ret, frame = cap.read()
            if not ret:
                print("Game over!")
                break
            print("Processing Frame {}".format(k))
            image = frame.copy()

            # We need to initialize the tracker on the first frame
            if k == 0:
                # Box the object with the mouse, then confirm to start tracking.
                while True:
                    img_first = image.copy()
                    box = track_window or selection
                    if box:
                        cv2.rectangle(img_first, box[:2], box[2:], (0, 0, 255), 1)
                    cv2.imshow('image', img_first)
                    # Mask to the low byte: some backends set extra high bits.
                    key = cv2.waitKey(10) & 0xFF
                    confirmed = track_window
                    # Ignore the key until a box exists; otherwise the
                    # rectangle below would be built from None.
                    if key in confirm_keys and confirmed:
                        break
                tracker.start_track(image, dlib.rectangle(*confirmed))
            else:
                # Else we just attempt to track from the previous frame
                tracker.update(image)

            # Draw the tracker's current box on the frame being shown
            box_predict = tracker.get_position()
            cv2.rectangle(image,
                          (int(box_predict.left()), int(box_predict.top())),
                          (int(box_predict.right()), int(box_predict.bottom())),
                          (0, 0, 255), 1)
            cv2.imshow('image', image)
            if cv2.waitKey(10) & 0xFF == esc_key:
                break
            k += 1
    finally:
        # Free the capture and close the window even if tracking aborts.
        cap.release()
        cv2.destroyAllWindows()

# Run the demo only when this file is executed as a script, not on import.
if __name__ == '__main__':
    main()

多目标跟踪

# -*- coding: UTF-8 -*-

import os
import glob
import cv2
import dlib
import time

# Path to the video file (the variable keeps its historical name although it
# refers to a file, not a folder)
video_folder = os.path.join("vtest.avi")
cap = cv2.VideoCapture(video_folder)
if not cap.isOpened():
    print("Could not open video", video_folder)
    # Raise SystemExit directly: the bare exit() helper is installed by the
    # site module for interactive use and is not guaranteed to exist.
    raise SystemExit(-1)

# Create the correlation trackers - the objects need to be initialized before they can be used
# Three trackers, one per target to follow
tracker1 = dlib.correlation_tracker()
tracker2 = dlib.correlation_tracker()
tracker3 = dlib.correlation_tracker()

# Mouse-selection state shared between onmouse() and main():
#   selection    - box currently being dragged, as (xmin, ymin, xmax, ymax)
#   track_window - box fixed when the left button was released
#   drag_start   - (x, y) where the current drag began
selection = None
track_window = None
drag_start = None

# Mouse box selection (the box becomes a tracking target)
def onmouse(event, x, y, flags, param):
    """Mouse callback that maintains the rubber-band selection state.

    Updates the module-level ``drag_start``, ``selection`` and
    ``track_window`` variables:

    * left button down - start a drag at (x, y) and clear ``track_window``;
    * any event while a drag is active - set ``selection`` to the box spanned
      by the drag origin and the current cursor position;
    * left button up - end the drag, move ``selection`` into ``track_window``
      and clear ``selection``.

    ``flags`` and ``param`` are accepted for the callback signature but unused.
    """
    global selection, track_window, drag_start

    if event == cv2.EVENT_LBUTTONDOWN:
        # A new drag starts here; any previously fixed box is discarded.
        drag_start, track_window = (x, y), None

    if drag_start:
        anchor_x, anchor_y = drag_start
        # Order the coordinates so the box is valid for any drag direction.
        left, right = sorted((x, anchor_x))
        top, bottom = sorted((y, anchor_y))
        selection = (left, top, right, bottom)

    if event == cv2.EVENT_LBUTTONUP:
        # The right-hand side is evaluated first, so track_window receives the
        # selection as it was before being reset to None.
        drag_start, track_window, selection = None, selection, None

def main():
    """Track three mouse-selected objects through the video opened as ``cap``.

    On the first frame the user draws a box and confirms it with ESC or Enter,
    three times in a row; one more confirmation starts tracking. Each box
    seeds one of ``tracker1``..``tracker3``. Every following frame is passed
    to all trackers and their boxes are drawn in distinct colours. Pressing
    ESC during playback stops early. The capture is released and the window
    closed on exit.
    """
    trackers = (tracker1, tracker2, tracker3)
    # One BGR colour per tracker, used for both the confirmed and tracked boxes.
    colors = ((0, 255, 255), (0, 255, 100), (200, 0, 200))
    confirmed = []  # boxes confirmed so far, in tracker order

    esc_key = 27
    # Confirm with ESC, or Enter (LF 10 / CR 13 depending on the GUI backend).
    confirm_keys = (esc_key, 10, 13)

    cv2.namedWindow('image', 1)
    cv2.setMouseCallback('image', onmouse)

    k = 0
    try:
        while True:
            ret, frame = cap.read()
            if not ret:
                print("Game over!")
                break
            print("Processing Frame {}".format(k))
            image = frame.copy()

            # We need to initialize the trackers on the first frame
            if k == 0:
                while True:
                    img_first = image.copy()
                    # Red: the box being dragged or awaiting confirmation.
                    pending = track_window or selection
                    if pending:
                        cv2.rectangle(img_first, pending[:2], pending[2:], (0, 0, 255), 1)
                    # Already confirmed targets, each in its tracker's colour.
                    for box, color in zip(confirmed, colors):
                        cv2.rectangle(img_first, box[:2], box[2:], color, 1)
                    cv2.imshow('image', img_first)

                    # Mask to the low byte: some backends set extra high bits.
                    if cv2.waitKey(10) & 0xFF not in confirm_keys:
                        continue
                    if len(confirmed) == len(trackers):
                        # All targets chosen: this extra confirmation starts tracking.
                        break
                    if track_window:
                        confirmed.append(track_window)
                    # A confirmation with no box drawn is ignored.

                for trk, box in zip(trackers, confirmed):
                    trk.start_track(image, dlib.rectangle(*box))
            else:
                # Else we just attempt to track from the previous frame
                for trk in trackers:
                    trk.update(image)

            # Draw every tracker's current box on the frame being shown
            for trk, color in zip(trackers, colors):
                pos = trk.get_position()
                cv2.rectangle(image,
                              (int(pos.left()), int(pos.top())),
                              (int(pos.right()), int(pos.bottom())),
                              color, 1)
            cv2.imshow('image', image)
            if cv2.waitKey(10) & 0xFF == esc_key:
                break
            k += 1
    finally:
        # Free the capture and close the window even if tracking aborts.
        cap.release()
        cv2.destroyAllWindows()

# Run the demo only when this file is executed as a script, not on import.
if __name__ == '__main__':
    main()
  • 用鼠标框要跟踪的物体,框完按回车键(回车出问题 这里按ESC)确认,同样的手法连框三个
  • 再次按确认键(原为回车键,上面的代码中用ESC代替)开始跟踪
  • 0
    点赞
  • 20
    收藏
    觉得还不错? 一键收藏
  • 3
    评论
评论 3
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值