yolov8部署ros，stream=True模式，调用摄像头发布坐标信息代码

似苦又甜

已于 2024-03-20 20:17:55 修改

阅读量923

点赞数 6

文章标签： YOLO

于 2024-02-27 14:53:00 首次发布

本文链接：https://blog.csdn.net/qq_44701348/article/details/136322619

版权

本文介绍了如何利用Python编程实现基于YOLOv8的目标检测系统，结合ROS进行通信，用户可以通过鼠标选择并发送选定目标框的坐标。代码展示了如何处理鼠标事件，以及在视频流中实现实时目标框标注和坐标发送。

摘要由CSDN通过智能技术生成

#!/usr/bin/env python
import cv2
from ultralytics import YOLO
import numpy as np
import rospy
from communication_yolo.msg import  yolomsg
 
 
def onMouse(event, x, y, flags, param):
    """Mouse callback: on a left click, select the detection nearest the cursor.

    On a left-button press the box whose centre is closest to the click is
    chosen with ``chooseobj``; its index and tracker id are stored in the
    module globals ``n`` and ``boxes_id`` and ``is_mouse_clicked`` is set so
    the main loop can start publishing that box.

    Args:
        event: OpenCV mouse event code.
        x: Cursor x position reported by OpenCV.
        y: Cursor y position reported by OpenCV.
        flags: Unused; required by the OpenCV callback signature.
        param: Unused; required by the OpenCV callback signature.
    """
    global start_x, start_y, n, is_mouse_clicked, boxes_id
    # The remembered click position is reset on every mouse event.
    start_x, start_y = -1, -1
    if event != cv2.EVENT_LBUTTONDOWN:
        return
    start_x, start_y = x, y
    if not point:
        # No detections in the current frame: there is nothing to select, and
        # chooseobj() would raise on an empty box list.
        return
    # Index of the box nearest to the click among the current frame's boxes.
    n = chooseobj(point, start_x, start_y)
    # `results` is the single per-frame result object (the main loop reads
    # `results.boxes` directly), so its boxes are indexed directly here too.
    # Indexing `results[0]` first would narrow it to one detection and make
    # `boxes[n]` fail for every n > 0.
    boxes_id = results.boxes[n].id
    # Tell the main loop that a target has been selected.
    is_mouse_clicked = True
        
 
 
def chooseobj(p, start_x, start_y):
    """Return the index of the box in ``p`` whose centre is nearest to a point.

    Args:
        p: Sequence of boxes, each indexable as
            ``[x_min, y_min, x_max, y_max]``.
        start_x: X coordinate of the reference point (the mouse click).
        start_y: Y coordinate of the reference point (the mouse click).

    Returns:
        The index into ``p`` of the nearest box. When several boxes are
        equally near, the lowest index is returned.

    Raises:
        ValueError: If ``p`` contains no boxes.
    """
    if len(p) == 0:
        raise ValueError("chooseobj() needs at least one box to choose from")

    def squared_distance(index):
        box = p[index]
        # Box centres are truncated to whole pixels before comparing.
        center_x = int((box[2] - box[0]) / 2 + box[0])
        center_y = int((box[3] - box[1]) / 2 + box[1])
        # The squared distance orders boxes exactly like the Euclidean
        # distance does, so the square root is not needed to find the minimum.
        return (center_x - start_x) ** 2 + (center_y - start_y) ** 2

    # min() keeps the first minimal element, so ties go to the lowest index.
    return min(range(len(p)), key=squared_distance)
 
rospy.init_node("yolo_ros_pub")  # Initialise the ROS node.

# Publisher for the selected box: topic "yolomsg", custom message type yolomsg.
pub = rospy.Publisher("yolomsg", yolomsg, queue_size=10)

# Load the YOLOv8 model weights.
model = YOLO("/home/zzb/yolov8_ws/src/communication_yolo/yolov8_main/yolov8n.pt")
# Open camera device 0.
cap = cv2.VideoCapture(0)

# Selection state shared with the onMouse callback.
is_mouse_clicked = False
n = 0
boxes_id = 0
# Per-frame detection state read by onMouse; refreshed on every iteration.
results = None
point = []

WINDOW_NAME = "YOLOv8 Inference"

# Create the window up front so the mouse callback is registered exactly once
# instead of being re-registered on every frame.
cv2.namedWindow(WINDOW_NAME)
cv2.setMouseCallback(WINDOW_NAME, onMouse)

try:
    # Stop when the camera closes or when ROS is shutting down (e.g. Ctrl+C);
    # publishing after shutdown would otherwise raise on a closed topic.
    while cap.isOpened() and not rospy.is_shutdown():
        # Read one frame from the camera.
        success, frame = cap.read()
        if not success:
            # No frame could be read: leave the loop.
            break

        # Run YOLOv8 tracking on the frame in stream mode and take the single
        # result produced for it.
        results_generator = model.track(source=frame, persist=True, stream=True)
        results = next(results_generator)
        # Convert the xyxy tensor to a list of boxes: one inner list of four
        # coordinates per detected object.
        point = results.boxes.xyxy.tolist()

        # Publish only when (1) index n is still valid for this frame's boxes,
        # (2) the user has clicked a target, and (3) the box now at index n
        # still carries the tracker id recorded at click time.
        if n < len(point) and is_mouse_clicked and results.boxes[n].id == boxes_id:
            msg = yolomsg()  # Custom message carrying the selected box.
            msg.xmin = int(point[n][0])
            msg.ymin = int(point[n][1])
            msg.xmax = int(point[n][2])
            msg.ymax = int(point[n][3])
            pub.publish(msg)

            # Draw only the selected box on a copy of the raw frame.
            annotated_copy = frame.copy()
            x_min, y_min, x_max, y_max = map(int, point[n])
            annotated_results = cv2.rectangle(
                annotated_copy, (x_min, y_min), (x_max, y_max), (0, 255, 0), 2
            )
            cv2.imshow(WINDOW_NAME, annotated_results)
        else:
            # No valid selection: show every detection as drawn by
            # Results.plot() and wait for the next click.
            annotated_frame = results.plot()
            cv2.imshow(WINDOW_NAME, annotated_frame)
            is_mouse_clicked = False

        # Quit when 'q' is pressed; waitKey also lets the window refresh.
        if cv2.waitKey(1) & 0xFF == ord("q"):
            break
finally:
    # Always release the camera and close the window, even after an error.
    cap.release()
    cv2.destroyAllWindows()

注：OpenCV 的 VideoCapture.read() 是逐帧读取图像的，读取 RTSP 视频流时好像会因此变卡。

在 USB 摄像头上好像没有这个问题。

OpenCV 的 imshow 函数后面必须接 waitKey 函数，否则 imshow 显示出来的窗口是黑屏的。参考：https://zhuanlan.zhihu.com/p/251398560

https://www.volcengine.com/theme/7772002-O-7-1