opencv341的ssd_mobilenet应用之cpu65ms

最新推荐文章于 2024-08-16 08:28:43 发布

samylee

最新推荐文章于 2024-08-16 08:28:43 发布

阅读量3k

点赞数 2

分类专栏： caffe 文章标签： ssd_mobilenet

本文链接：https://blog.csdn.net/samylee/article/details/80548323

版权

caffe 专栏收录该内容

21 篇文章 0 订阅

订阅专栏

opencv341可以直接应用ssd_mobilenet（github）前向工程，算法在voc0712上的mAP为0.727，有一定的应用价值！

网上一般公开的是opencv341+python版本，很难找到c++版本，所以博主开源一下，以供交流之用！

注意：网络模型请至ssd_mobilenet(github)下载调用！

测试软件：vs2015、opencv341

测试硬件：i7-4790-4core

测试结果：cpu每帧平均耗时65ms

测试代码：

#include <opencv2/core.hpp>
#include <opencv2/highgui.hpp>
#include <opencv2/imgproc.hpp>
#include <opencv2/dnn.hpp>

#include <chrono>
#include <cstdlib>
#include <iostream>
#include <string>
#include <time.h>

using namespace std;
using namespace cv;
using namespace dnn;

int main()
{
	//Net cvNet = readNetFromTensorflow("frozen_inference_graph.pb", "ssd_mobilenet_v1_coco.pbtxt");
	Net net = readNetFromCaffe("MobileNetSSD_deploy.prototxt", "MobileNetSSD_deploy.caffemodel");

	const char* classNames[] = { "background", "aeroplane", "bicycle", "bird", "boat", "bottle", "bus", "car", "cat", "chair",
		"cow", "diningtable", "dog", "horse", "motorbike", "person", "pottedplant", "sheep", "sofa", "train", "tvmonitor" };

	float detect_thresh = 0.24;

	string test_type = "image";
	if (test_type == "image")
	{
		Mat image = imread("test.jpg");

		clock_t start_t = clock();
		net.setInput(blobFromImage(image, 1.0 / 127.5, Size(300, 300), Scalar(127.5, 127.5, 127.5), true, false));
		Mat cvOut = net.forward();
		cout << "Cost time: " << clock() - start_t << endl;

		Mat detectionMat(cvOut.size[2], cvOut.size[3], CV_32F, cvOut.ptr<float>());
		for (int i = 0; i < detectionMat.rows; i++)
		{
			int obj_class = detectionMat.at<float>(i, 1);
			float confidence = detectionMat.at<float>(i, 2);

			if (confidence > detect_thresh)
			{
				size_t objectClass = (size_t)(detectionMat.at<float>(i, 1));

				int xLeftBottom = static_cast<int>(detectionMat.at<float>(i, 3) * image.cols);
				int yLeftBottom = static_cast<int>(detectionMat.at<float>(i, 4) * image.rows);
				int xRightTop = static_cast<int>(detectionMat.at<float>(i, 5) * image.cols);
				int yRightTop = static_cast<int>(detectionMat.at<float>(i, 6) * image.rows);

				Rect object((int)xLeftBottom, (int)yLeftBottom,
					(int)(xRightTop - xLeftBottom),
					(int)(yRightTop - yLeftBottom));

				rectangle(image, object, Scalar(0, 0, 255), 2);
				putText(image, classNames[obj_class], Point(xLeftBottom, yLeftBottom - 10), 3, 0.5, Scalar(0, 0, 255), 2);
			}
		}

		imshow("test", image);
		cv::waitKey(0);
	}
	else if (test_type == "video")
	{
		VideoCapture cap("test.avi");
		if (!cap.isOpened()) return -1;
		Mat frame;

		while (true)
		{
			cap >> frame;
			if (frame.empty()) break;

			clock_t start_t = clock();
			net.setInput(blobFromImage(frame, 1.0 / 127.5, Size(300, 300), Scalar(127.5, 127.5, 127.5), true, false));
			Mat cvOut = net.forward();
			cout << "Cost time: " << clock() - start_t << endl;

			Mat detectionMat(cvOut.size[2], cvOut.size[3], CV_32F, cvOut.ptr<float>());
			for (int i = 0; i < detectionMat.rows; i++)
			{
				int obj_class = detectionMat.at<float>(i, 1);
				float confidence = detectionMat.at<float>(i, 2);
				
				if (confidence > detect_thresh)
				{
					size_t objectClass = (size_t)(detectionMat.at<float>(i, 1));

					int xLeftBottom = static_cast<int>(detectionMat.at<float>(i, 3) * frame.cols);
					int yLeftBottom = static_cast<int>(detectionMat.at<float>(i, 4) * frame.rows);
					int xRightTop = static_cast<int>(detectionMat.at<float>(i, 5) * frame.cols);
					int yRightTop = static_cast<int>(detectionMat.at<float>(i, 6) * frame.rows);

					Rect object((int)xLeftBottom, (int)yLeftBottom,
						(int)(xRightTop - xLeftBottom),
						(int)(yRightTop - yLeftBottom));

					rectangle(frame, object, Scalar(0, 0, 255), 2);
					putText(frame, classNames[obj_class], Point(xLeftBottom, yLeftBottom - 10), 3, 0.5, Scalar(0, 0, 255), 2);
				}
			}

			imshow("test", frame);
			if (cv::waitKey(1) > 1) break;
		}
	}
	else
	{
		cout << "Unknow type!" << endl;
		system("pause");
	}
	
	return 0;
}

测试效果：