KMP: 当出现字符串不匹配时,可以知道一部分之前已经匹配的文本内容,可以利用这些信息避免从头再去做匹配
28. 找出字符串中第一个匹配项的下标
https://leetcode.cn/problems/find-the-index-of-the-first-occurrence-in-a-string/
前缀表(next 数组):记录下标i之前(包括i)的子串中,最长相等前后缀的长度;匹配失败时,根据它决定模式串回退到哪个位置继续匹配。下面的实现将该长度统一减一后存储(next[0] = -1)。
时间复杂度:O (m + n)
// KMP substring search: returns the index of the first occurrence of a
// pattern inside a text, or -1 when the pattern does not occur.
class Solution {
public:
    // Builds the prefix table of `s` in the "minus one" convention:
    // next[i] is (length of the longest proper prefix of s[0..i] that is also
    // a suffix of s[0..i]) - 1, so -1 means "no such prefix".
    //
    // `next` is grown to s.length() entries if it is shorter; an empty `s`
    // leaves `next` untouched.
    void getNext(vector<int>& next, const string& s) {
        const int len = static_cast<int>(s.length());
        if (len == 0) {
            return;  // nothing to describe; avoids writing next[0] out of bounds
        }
        if (next.size() < s.size()) {
            next.resize(s.size());
        }

        int j = -1;  // index of the last character of the current matched prefix
        next[0] = j;
        // Start from index 1: a single character has no proper prefix.
        for (int i = 1; i < len; i++) {
            // On mismatch fall back to the next shorter candidate prefix.
            while (j >= 0 && s[i] != s[j + 1]) {
                j = next[j];
            }
            if (s[i] == s[j + 1]) {
                j++;
            }
            next[i] = j;
        }
    }

    // Returns the index of the first occurrence of `needle` in `haystack`,
    // or -1 if there is none. An empty `needle` matches at index 0.
    int strStr(string haystack, string needle) {
        const int textLen = static_cast<int>(haystack.length());
        const int patLen = static_cast<int>(needle.length());
        if (patLen == 0) {
            return 0;  // empty pattern: would otherwise index an empty table
        }
        if (textLen < patLen) {
            return -1;
        }

        vector<int> next(patLen);
        getNext(next, needle);

        int j = -1;  // index of the last pattern character matched so far
        for (int i = 0; i < textLen; i++) {
            // Reuse the already matched prefix instead of restarting at 0.
            while (j >= 0 && haystack[i] != needle[j + 1]) {
                j = next[j];
            }
            if (haystack[i] == needle[j + 1]) {
                j++;
            }
            if (j == patLen - 1) {
                // Whole pattern matched, ending at text index i.
                return i - patLen + 1;
            }
        }
        return -1;
    }
};
459. 重复的子字符串 (Repeated Substring Pattern)
解法一: 将 s 与自身拼接后去掉首尾各一个字符,若 s 仍然出现在其中,则 s 由重复子串构成。
https://leetcode.cn/problems/repeated-substring-pattern/
// Repeated-substring check via the "doubling" trick.
class Solution {
public:
    // Returns true when `s` can be built by concatenating two or more copies
    // of one of its substrings. An empty string yields false.
    bool repeatedSubstringPattern(string s) {
        if (s.empty()) {
            return false;  // substr(1, ...) on an empty string would throw
        }
        const string doubled = s + s;
        // `s` always occurs in s+s at offset s.size(). Any occurrence found
        // earlier, at an offset in [1, s.size() - 1], means `s` equals a
        // rotation of itself, i.e. it is periodic. Searching from offset 1 is
        // equivalent to stripping the first and last characters and then
        // searching, without making another copy.
        return doubled.find(s, 1) != s.size();
    }
};
解法二 (KMP): 当一个字符串由重复子串组成时,最长相等前后缀不包含的那部分子串就是最小重复子串;因此只需判断最长相等前后缀非空,且字符串长度能被该部分的长度整除。
// Repeated-substring check based on the KMP prefix table.
class Solution {
public:
    // Fills next[0 .. s.size()-1] with the prefix table of `s` in the
    // "minus one" convention: next[i] is (length of the longest proper prefix
    // of s[0..i] that is also a suffix of s[0..i]) - 1; -1 means none.
    //
    // `next` must point to at least s.size() writable ints. Nothing is
    // written when `s` is empty or `next` is null.
    void getNext(int* next, const string& s) {
        const int len = static_cast<int>(s.size());
        if (next == nullptr || len == 0) {
            return;
        }

        next[0] = -1;
        int j = -1;  // index of the last character of the current matched prefix
        for (int i = 1; i < len; i++) {
            // On mismatch fall back to the next shorter candidate prefix.
            while (j >= 0 && s[i] != s[j + 1]) {
                j = next[j];
            }
            if (s[i] == s[j + 1]) {
                j++;
            }
            next[i] = j;
        }
    }

    // Returns true when `s` can be built by concatenating two or more copies
    // of one of its substrings. An empty string yields false.
    bool repeatedSubstringPattern(string s) {
        if (s.empty()) {
            return false;
        }
        const int len = static_cast<int>(s.size());

        // Heap-backed table instead of a variable-length array: VLAs are not
        // standard C++ and would place O(n) data on the stack.
        vector<int> next(len);
        getNext(next.data(), s);

        // Length of the longest proper prefix of `s` that is also its suffix.
        const int border = next[len - 1] + 1;
        // The part not covered by that border is the smallest candidate unit;
        // `s` is periodic iff a border exists and the unit length divides len.
        return border > 0 && len % (len - border) == 0;
    }
};