opencv下LDA二分类

最新推荐文章于 2024-07-02 13:47:42 发布

元气少女缘结神

最新推荐文章于 2024-07-02 13:47:42 发布

阅读量2.3k

点赞数

分类专栏： OpenCV Basises ML 文章标签： opencv matlab

本文链接：https://blog.csdn.net/wd1603926823/article/details/51906491

版权

OpenCV Basises 同时被 2 个专栏收录

27 篇文章 0 订阅

订阅专栏

10 篇文章 0 订阅

订阅专栏

根据http://www.cnblogs.com/cfantaisie/archive/2011/03/25/1995849.html这是matlab版本下的LDA分类：

[model,k,ClassLabel]=LDATraining(traindata,trainlabel);
>> outputlabel=LDATesting(testdata,k,model,ClassLabel);
>> accurency=length(find(outputlabel==testlabel))/length(testlabel)

这样即可实现分类，并得到测试样本的准确率，很简洁方便。

测试部分其实就是利用训练得到的model 然后看了下这个model到底是什么怎么来的：

我的是二分类对于二分类而言这个model是这样的：

W是dimsX1的投影矩阵 means是traindata每一类经过投影W后的平均值

在OpenCV里有封装好的LDA类。我知道opencv里有把LDA和Fisher结合好的人脸识别类FaceRecognizer，那个比较好弄；但如果不是用LDA做人脸识别，而是对普通数据分类，就麻烦一点了。

根据http://blog.csdn.net/cjc211322/article/details/26590027?utm_source=tuicool&utm_medium=referral

http://www.tuicool.com/articles/BvuQFr http://www.cnblogs.com/freedomshe/archive/2012/04/24/sift_kmeans_lda_img_classification.html#L6

//LDA http://blog.csdn.net/zhazhiqiang/article/details/21189415 http://www.cnblogs.com/cfantaisie/archive/2011/03/25/1995849.html
#include<opencv2/highgui/highgui.hpp>
#include<opencv2/ml/ml.hpp>
#include <iostream>
#include"contrib.hpp"
using namespace cv;
using namespace std;
int main()
{
//sampledata
double sampledata[6][2] = { { 0, 1 }, { 0, 2 }, { 2, 4 }, { 8, 0 }, { 8, 2 }, { 9, 4 } };
Mat mat = Mat(6, 2, CV_64FC1, sampledata);
//labels
vector<int> labels;
for (int i = 0; i<mat.rows; i++)
{
if (i<mat.rows / 2)
{
labels.push_back(0);
}
else
{
labels.push_back(1);
}
}
//do LDA
LDA lda = LDA(mat, labels);
//get the eigenvector
Mat eivector = lda.eigenvectors().clone();
cout << "The eigenvector is:" << endl;
for (int i = 0; i<eivector.rows; i++)
{
for (int j = 0; j<eivector.cols; j++)
{
cout << eivector.ptr<double>(i)[j] << " ";
}
cout << endl;
}
//针对两类分类问题，计算两个数据集的中心
int classNum = 2;
vector<Mat> classmean(classNum);
vector<int> setNum(classNum);
for (int i = 0; i<classNum; i++)
{
classmean[i] = Mat::zeros(1, mat.cols, mat.type());
setNum[i] = 0;
}
Mat instance;
for (int i = 0; i<mat.rows; i++)
{
instance = mat.row(i);
if (labels[i] == 0)
{
add(classmean[0], instance, classmean[0]);
setNum[0]++;
}
else if (labels[i] == 1)
{
add(classmean[1], instance, classmean[1]);
setNum[1]++;
}
else
{
}
}
for (int i = 0; i<classNum; i++)
{
classmean[i].convertTo(classmean[i], CV_64FC1, 1.0 / static_cast<double>(setNum[i]));
}
vector<Mat> cluster(classNum);
for (int i = 0; i<classNum; i++)
{
cluster[i] = Mat::zeros(1, 1, mat.type());
multiply(eivector.t(), classmean[i], cluster[i]);
}
cout << "The project cluster center is:" << endl;
for (int i = 0; i<classNum; i++)
{
cout << cluster[i].at<double>(0) << endl;
}
system("pause");
return 0;
}

现在想用opencv的LDA来对自己的数据分类。根据 http://blog.csdn.net/cjc211322/article/details/26590027?utm_source=tuicool&utm_medium=referral ，opencv的LDA类有构造函数、投影函数，以及计算特征向量和特征值的函数，可是没有测试函数。不过应该可以参照matlab的版本自己写测试部分：

得到两个类投影后的projectionimg的平均值是0.804454。然而我要的是每一类投影后的平均值，可是第一类投影后的均值怎么是个负数呢？难道是我把projectionimg里第一类的数据存到myimg1里的时候出错了？后来发现自己太蠢了，直接用rowRange就好了。不过我觉得自己原来编得没错，数据怎么就传不到myimg1里去呢？

这样就可以算出两个类分别投影后的均值了。

这样matlab的model在opencv里就有了接下来就根据测试函数写opencv的测试函数了

function target=LDATesting(input,k,model,ClassLabel)
% LDATesting  Label samples by majority vote over pairwise LDA models.
%   input      : n*d matrix, one sample per row
%   k          : total number of classes
%   model      : struct array with one entry per class pair; the fields used
%                here are a, b (the two class indices), W (projection) and
%                means (row 1 / row 2: projected mean compared for a / b)
%   ClassLabel : class name of each class, indexed by class position
%   target     : n*1 matrix holding the winning class name of each sample
numSamples=size(input,1);
votes=zeros(numSamples,k);
numPairs=k*(k-1)/2;
% Every pairwise model casts one vote per sample.
for pairIdx=1:numPairs
    pairModel=model(pairIdx);
    for row=1:numSamples
        projected=input(row,:)*pairModel.W;
        distFirst=norm(projected-pairModel.means(1,:));
        distSecond=norm(projected-pairModel.means(2,:));
        % Ties go to class b, because the comparison is strict.
        if distFirst<distSecond
            winner=pairModel.a;
        else
            winner=pairModel.b;
        end
        votes(row,winner)=votes(row,winner)+1;
    end
end
% The class with the most votes wins; max keeps the first index on ties.
target=zeros(numSamples,1);
for row=1:numSamples
    [~,best]=max(votes(row,:));
    target(row)=ClassLabel(best);
end

发现opencv里的LDA真是矫情：首先，它要求特征维数要小于样本个数，而matlab里的LDA就没有这个规定；其次，样本标签不能像matlab里那样用nX1的向量（如[11111122222]之类），也不能用nX2的矩阵（如[0 1]代表第二类、[1 0]代表第一类），这两种标签我都试过，都报错。后来改成用[0.9 0.1]代表第一类、[0.1 0.9]代表第二类，就不报错了。

#include<opencv2/highgui/highgui.hpp>
#include<opencv2/ml/ml.hpp>
#include <iostream>
#include"contrib.hpp"
using namespace cv;
using namespace std;
int main()
{
//read traindata trainlabel testdata testlabel and make them into Mat
CvMLData trainfeature, testfeature, trainlabelprimer, testlabelprimer;
trainfeature.read_csv("traindata.csv");
Mat traindata = Mat(trainfeature.get_values(), true);
testfeature.read_csv("testdata.csv");
Mat testdata = Mat(testfeature.get_values(), true);
trainlabelprimer.read_csv("trainlabel.csv"); //1th :[1 0] 2th:[0 1]
Mat trainlabel = Mat(trainlabelprimer.get_values(), true);
testlabelprimer.read_csv("testlabel.csv");
Mat testlabel = Mat(testlabelprimer.get_values(), true);
int positivenum_train = 128, negativenum_train = 238;
//make trainlabel into vector<int>
vector<int> labelfortrain;
for (int i = 0; i < trainlabel.rows; ++i)
{
uchar* data = trainlabel.ptr<uchar>(i);
labelfortrain.push_back(data[0]);
}
//do LDA
//这里要求训练样本总数N要大于特征的维数D
cout << "LDA training..." << endl;
LDA lda = LDA(traindata, labelfortrain);
cout << "LDA training done!" << endl;
//get the eigenvector //相当于matlab里LDATraining所得model的W dimsX(num-1)
Mat eivector = lda.eigenvectors().clone();
//get the mean after projection //相当于matlab里LDATraining所得model的means 1X2
Mat projectionimg=lda.project(traindata);
//Scalar mean,stddev;
//meanStdDev(projectionimg, mean, stddev);
//float getmean = mean[0];
//cout << "2 classes mean:" << getmean << endl;
//cout << projectionimg << endl;
Mat myimg1 = projectionimg.rowRange(0,positivenum_train).clone();
//cout << myimg1 << endl;
Mat myimg2 = projectionimg.rowRange(positivenum_train, projectionimg.rows).clone();
//cout << myimg2<< endl;
Scalar mean1, stddev1;
meanStdDev(myimg1, mean1, stddev1);
float getmean1 = mean1[0];
cout << "1th classes sample number:"<<myimg1.rows<<" and its mean:" << getmean1 << endl;
Scalar mean2, stddev2;
meanStdDev(myimg2, mean2, stddev2);
float getmean2 = mean2[0];
cout << "2th classes sample number:"<<myimg2.rows<<" and its mean " << getmean2 << endl;
//test
cout << "LDA Testing..." << endl;
Mat testlabelout(testlabel.size(), testlabel.type()); //for LDA output label //matlab:target
Mat s(testlabel.rows, 2, CV_32F,cv::Scalar(0));
int a = 1, b = 2;
for (int i = 0; i < testdata.rows; i++)
{
float *currentrow = s.ptr<float>(i);
Mat sample = testdata.rowRange(i, i+1).clone();
Mat tmp = lda.project(sample);
if (norm(tmp - getmean1)<norm(tmp - getmean2))
currentrow[a] = currentrow[a] + 1;
else
currentrow[b] = currentrow[b] + 1;
}
//cout << s << endl;
cout << "LDA Test done!" << endl;
///accurency
int correct = 0;
float accurency;
for (int i = 0; i < s.rows; ++i)
{
float* p = s.ptr<float>(i);
float* being = testlabel.ptr<float>(i);
//if (p[0] > p[1])
// cout << 0.9 << " " << 0.1 << " " << being[0] << " " << being[1] << endl;
//else
// cout << 0.1 << " " << 0.9 << " " << being[0] << " " << being[1] << endl;
if (((p[0] > p[1]) && (being[0] > being[1])) || ((p[0] < p[1]) && (being[0] < being[1])))
++correct;
}
cout << endl;
accurency = (float)correct / testlabel.rows;
cout << "whole accurency= " << accurency << endl;
///
int alluseless = 0, uselesserror = 0, alluseful = 0, usefulerror = 0;
float stoneerror = 0, kuangerror = 0;
for (int i = 0; i < s.rows; ++i)
{
float* p = s.ptr<float>(i);
float* being = testlabel.ptr<float>(i);
if (being[0] == (float)0.1)
{
++alluseless;
if (p[0] > p[1])
++uselesserror;
}
}
cout << alluseless << " " << uselesserror << endl;
stoneerror = (float)uselesserror / alluseless;
cout << " 1th class error= " << stoneerror << endl;
for (int i = 0; i < s.rows; ++i)
{
float* p = s.ptr<float>(i);
float* being = testlabel.ptr<float>(i);
if (being[0] == (float)0.9)
{
++alluseful;
if (p[0] < p[1])
++usefulerror;
}
}
cout << alluseful << " " << usefulerror << endl;
kuangerror = (float)usefulerror / alluseful;
cout << " 2th class error= " << kuangerror << endl;
return 0;
}

我随便自创的特征矩阵，所以出来的准确率低。。。不过没关系，重点不是这个。目前是不报错，看起来opencv的LDA初步就是这样了。。。可是第一类120张错45张、第二类64张错22张，总准确率不应该是15%。哦，我知道哪里错了：出来的s竟然有[0 0]和[1 1]的！！！matlab下面就没有这种情况，matlab下面只有[0 1]和[1 0]两种情况，奇怪。改成下面这样就可以算准确率了：

///accurency
// Fragment: expects `s` (one two-column float vote row per test sample) and
// `testlabel` (two-column float ground-truth labels) to be in scope.
// Every vote row is first collapsed into a definite prediction in s2:
// [0.9 0.1] when column 0 of s is strictly larger, [0.1 0.9] in every other
// case (this also covers rows whose two votes are equal).
Mat s2(testlabel.rows, 2, CV_32F, cv::Scalar(0));
int correct = 0;
float accurency;
for (int i = 0; i < s.rows; ++i)
{
    const float* p = s.ptr<float>(i);
    float* p2 = s2.ptr<float>(i);
    const bool firstwins = p[0] > p[1];
    p2[0] = firstwins ? float(0.9) : float(0.1);
    p2[1] = firstwins ? float(0.1) : float(0.9);
}
// Single pass over the predictions: overall hits plus the per-class counts.
int alluseless = 0, uselesserror = 0, alluseful = 0, usefulerror = 0;
float stoneerror = 0, kuangerror = 0;
for (int i = 0; i < s2.rows; ++i)
{
    const float* p2 = s2.ptr<float>(i);
    const float* being = testlabel.ptr<float>(i);
    if (((p2[0] > p2[1]) && (being[0] > being[1])) || ((p2[0] < p2[1]) && (being[0] < being[1])))
        ++correct;
    // The true class is taken from the column order instead of testing for
    // exact float equality with 0.1 / 0.9.
    if (being[0] < being[1])
    {
        // true label is the [0.1 0.9] kind
        ++alluseless;
        if (p2[0] > p2[1])
            ++uselesserror;
    }
    else if (being[0] > being[1])
    {
        // true label is the [0.9 0.1] kind
        ++alluseful;
        if (p2[0] < p2[1])
            ++usefulerror;
    }
}
cout <<testlabel.rows<<" "<<correct<< endl;
// Every ratio falls back to 0 when its denominator is 0.
accurency = testlabel.rows > 0 ? static_cast<float>(correct) / testlabel.rows : 0.0f;
cout << "whole accurency= " << accurency << endl;
///
cout << alluseless << " " << uselesserror << endl;
stoneerror = alluseless > 0 ? static_cast<float>(uselesserror) / alluseless : 0.0f;
cout << " 1th class error= " << stoneerror << endl;
cout << alluseful << " " << usefulerror << endl;
kuangerror = alluseful > 0 ? static_cast<float>(usefulerror) / alluseful : 0.0f;
cout << " 2th class error= " << kuangerror << endl;
return 0;