// LevenshteinDistcance computes the Levenshtein distance (莱文斯坦距离), i.e. the edit distance.
// https://zh.wikipedia.org/wiki/%E8%90%8A%E6%96%87%E6%96%AF%E5%9D%A6%E8%B7%9D%E9%9B%A2
// http://www.cnblogs.com/ivanyb/archive/2011/11/25/2263356.html
#include <algorithm>
#include <cassert>
#include <cstring>
#include <fstream>
#include <iostream>
#include <string>
using namespace std;
// Input buffers: main() fills each one with the first line of a file via
// getline(..., 100), i.e. at most 99 characters plus the terminating NUL.
char s1[100];
char s2[100];
// Dynamic-programming table used by LevenshteinDistcance(); zero-initialized.
// It is indexed up to [s1_len][s2_len].
int dp[105][105] = { 0 };
// Lengths of s1 and s2; written by LevenshteinDistcance() and read by main()
// when it computes the similarity percentage.
int s1_len;
int s2_len;
/*
 * Computes the Levenshtein (edit) distance between the global C strings
 * s1 and s2: the minimum number of single-character insertions, deletions
 * and substitutions needed to turn one string into the other.
 *
 * Preconditions: s1 and s2 are NUL-terminated.
 *
 * Side effects: stores the string lengths in s1_len / s2_len and fills
 * dp[0..s1_len][0..s2_len], where dp[i][j] is the edit distance between the
 * first i characters of s1 and the first j characters of s2.
 *
 * Returns dp[s1_len][s2_len], the edit distance between s1 and s2.
 */
int LevenshteinDistcance()
{
    s1_len = static_cast<int>(std::strlen(s1));
    s2_len = static_cast<int>(std::strlen(s2));

    // Base cases: turning a prefix of length k into the empty string (or the
    // reverse) takes exactly k deletions (or insertions).
    for (int i = 0; i <= s1_len; i++)
        dp[i][0] = i;
    for (int j = 0; j <= s2_len; j++)
        dp[0][j] = j;

    for (int i = 1; i <= s1_len; i++)
    {
        for (int j = 1; j <= s2_len; j++)
        {
            // Equal characters cost nothing; a mismatch costs one substitution.
            const int cost = (s1[i - 1] == s2[j - 1]) ? 0 : 1;

            const int deletion = dp[i - 1][j] + 1;
            const int insertion = dp[i][j - 1] + 1;
            const int substitution = dp[i - 1][j - 1] + cost;
            dp[i][j] = std::min(std::min(deletion, insertion), substitution);
        }
    }
    return dp[s1_len][s2_len];
}
/*
 * Reads the first line of the file at `path` into `buffer`, storing at most
 * `capacity - 1` characters followed by a terminating NUL.
 *
 * A fresh stream is used per call so that a failed read on one file cannot
 * leave error state behind for the next one.
 *
 * Returns false only when the file cannot be opened.
 */
static bool read_first_line(const std::string& path, char* buffer, std::streamsize capacity)
{
    std::ifstream fin(path.c_str());
    if (!fin.is_open())
        return false;
    fin.getline(buffer, capacity);
    return true;
}

/*
 * Reads the first line of "s1.txt" and "s2.txt" into the global buffers s1
 * and s2, then prints their edit distance and a similarity percentage
 * (1 - distance / longer_length) * 100.
 *
 * Returns 0 on success, -1 if either file cannot be opened.
 */
int main()
{
    const std::string file_name1("s1.txt");
    const std::string file_name2("s2.txt");

    if (!read_first_line(file_name1, s1, sizeof(s1)))
    {
        std::cout << file_name1 << " 无法打开\n";
        return -1;
    }
    if (!read_first_line(file_name2, s2, sizeof(s2)))
    {
        std::cout << file_name2 << " 无法打开\n";
        return -1;
    }

    const int lev = LevenshteinDistcance();
    std::cout << "编辑距离为:" << lev << std::endl;

    // Two empty lines are identical; handle them explicitly so the ratio
    // below is never 0/0 (which would print NaN).
    const int longest = std::max(s1_len, s2_len);
    const double similarity = (longest == 0) ? 100.0 : (1 - double(lev) / longest) * 100;
    std::cout << "相似度为:" << similarity << "%\n";
    return 0;
}