POJ 3690 Constellations + Gym - 100783J The Big Painting 二维字符串hash

最新推荐文章于 2022-01-19 17:32:34 发布

npugenji

最新推荐文章于 2022-01-19 17:32:34 发布

阅读量540

点赞数

分类专栏：字符串文章标签：字符串

本文链接：https://blog.csdn.net/z631681297/article/details/77681227

版权

字符串专栏收录该内容

0 篇文章 0 订阅

订阅专栏

这次组队赛也出现了同样的题目，然而不会做。所以来学习一波新姿势。
二维字符串hash的原理就是先把每一行横着做普通的一维字符串hash，这样每一行都有一个hash值，再竖着将行与行的hash值再hash一次。原理并不复杂。只需要注意横着和竖着hash取两个不同的大质数就可以了。
把 $x_1$ 当做横着hash的质数，$x_2$ 当做竖着hash的质数。
对于这题来说。
r[i][j] 表示横着hash的时候，第i行从 $j-q+1 ...j$ 的hash值
c[j][i] 则是从左上角的（j-p+1，i-q+1）到（j，i）的二维矩阵的hash值

$$r[i][j] = r[i][j-1] \cdot x_1 + s[i][j] - s[i][j-q] \cdot x_1^{q}$$

$$c[j][i] = c[j-1][i] \cdot x_2 + r[j][i] - r[j-p][i] \cdot x_2^{p}$$
然后给你的模式矩阵可能会相同，所以使用multiset，可以把hash值相同的全部去掉。
最后用总数减去set中剩余的就是匹配上的数量。

#include <iostream>
#include <cstring>
#include <cstdio>
#include <algorithm>
#include <set>

using namespace std;
// All hashes are kept in unsigned 64-bit integers; unsigned arithmetic wraps
// on overflow, so every hash is implicitly taken modulo 2^64.
typedef unsigned long long ull;
// Size of each dimension of the static buffers below.
const int maxn = 1010;
// r[i][j]: hash of the q characters of row i of s that end at column j.
// c[j][i]: hash of the p-by-q window of s whose bottom-right cell is (j, i).
ull r[maxn][maxn],c[maxn][maxn];
// s: the n-row grid that is searched; tt: scratch buffer for one pattern.
char s[maxn][maxn],tt[maxn][maxn];
// Read in main in this order: n, m, t, p, q.
// n x m is the size of s as used by solve, t the number of patterns,
// p x q the size of every pattern.
int n,m,p,q,t;
// Multiplier used when hashing along a row.
const ull x1 = 100000007;
// Multiplier used when combining row hashes down a column.
const ull x2 = 1000000007;
// Hashes of the patterns that have not been found in the grid yet;
// a multiset so that identical patterns are each recorded.
multiset<ull> mp;
// Hashes the p-by-q pattern currently stored in tt and records it in mp.
//
// Each of the first p rows is hashed over its first q characters with
// multiplier x1; the row hashes are then combined top to bottom with
// multiplier x2. All arithmetic wraps modulo 2^64.
//
// Returns the hash that was inserted into mp. (The function is declared to
// return ull, so falling off the end without a return would be undefined
// behaviour.)
ull gethash()
{
    ull grid_hash = 0;
    for (int i = 0; i < p; i++)
    {
        ull row_hash = 0;
        for (int j = 0; j < q; j++)
            row_hash = row_hash * x1 + tt[i][j];
        grid_hash = grid_hash * x2 + row_hash;
    }
    mp.insert(grid_hash);
    return grid_hash;
}

void solve()
{
    ull o = 1,tmp;
    for (int i=0;i<q;i++) o *= x1;
    for (int i=0;i<n;i++)
    {
        tmp = 0;
        for (int j=0;j<q;j++) tmp = tmp*x1 + s[i][j];
        r[i][q-1] = tmp;
        for (int j=q;j<m;j++) r[i][j] = r[i][j-1] * x1 + s[i][j] - s[i][j-q]*o;
    }
    o = 1;
    for (int i=0;i<p;i++) o *= x2;
    for (int i=q-1;i<m;i++)
    {
        tmp = 0;
        for (int j=0;j<p;j++) tmp = tmp*x2 + r[j][i];
        c[p-1][i] = tmp;
        mp.erase(tmp);
        for (int j=p;j<n;j++)
        {
            c[j][i] = c[j-1][i]*x2 + r[j][i] - r[j-p][i]*o;
            mp.erase(c[j][i]);
        }
    }
}


int main()
{
    int ttt=0;
    while (scanf("%d%d%d%d%d",&n,&m,&t,&p,&q), n||m||t||p||q)
    {
        mp.clear();
        for (int i=0;i<n;i++) scanf("%s",s[i]);
        for (int i=0;i<t;i++)
        {
            memset(tt,0,sizeof tt);
            for (int j=0;j<p;j++) scanf("%s",tt[j]);
            gethash();
        }
        solve();
        printf("Case %d: %d\n",++ttt,t-mp.size());
    }
    return 0;
}