CodeForces - 163E e-Government【Fail树&&AC自动机】

niiick

于 2020-09-28 19:03:47 发布

阅读量205

点赞数

分类专栏： AC自动机 Fail树

本文链接：https://blog.csdn.net/niiick/article/details/108855508

版权

AC自动机同时被 2 个专栏收录

11 篇文章 0 订阅

订阅专栏

Fail树

2 篇文章 0 订阅

订阅专栏

CodeForces - 163E

Time limit 1000 ms Memory limit 262144 kB

The best programmers of Embezzland compete to develop a part of the project called “e-Government” — the system of automated statistic collecting and press analysis.

We know that any of the k citizens can become a member of the Embezzland government. The citizens’ surnames are a1, a2, …, ak. All surnames are different. Initially all k citizens from this list are members of the government. The system should support the following options:

Include citizen ai to the government.
Exclude citizen ai from the government.
Given a newspaper article text, calculate how politicized it is. To do this, for every active government member the system counts the number of times his surname occurs in the text as a substring. All occurrences are taken into consideration, including the intersecting ones. The degree of politicization of a text is defined as the sum of these values for all active government members.
Implement this system.

题目大意

给定k个模式串，n次操作
每次操作可能是删除/增加第 i 个模式串（同一操作可能重复出现，例如删除一个已被删除的模式串，此时应直接忽略），或询问当前未被删除的各个模式串在给定文本串中出现次数的总和

题目分析

结合AC自动机和Fail树各自长处的好题

一开始k个模式串构造好Trie，并构造fail指针以及Fail树并求DFS序
对于没有被删除的模式串
利用差分数组（用树状数组维护），在每个模式串结尾结点的dfs序位置权值+1，在其子树中最后一个dfs序编号的下一个位置权值-1

每次询问将文本串送入AC自动机逐位匹配
若当前走到AC自动机结点 $u$ ，令 $ans \mathrel{+}= qsum(1, dfn[u])$ （即差分数组在 $[1, dfn[u]]$ 上的前缀和）
这样即统计了该结点沿fail指针走到根的路径上模式串结尾结点的个数（其他子树内的结点会因为差分数组抵消掉）

这样虽然不能准确统计每个模式串各自出现的次数
但将AC自动机和Fail树各自的特点巧妙地结合起来直接达到了统计总数的目的

#include<iostream>
#include<cstdio>
#include<vector>
#include<queue>
#include<algorithm>
#include<cstring>
using namespace std;
typedef long long lt;
// lowbit(x): value of the lowest set bit of x, computed as x & -x.
// The argument is parenthesised inside the negation as well, so that an
// expression argument such as lowbit(a-b) expands to (a-b)&(-(a-b)) rather
// than (a-b)&(-a-b).
#define lowbit(x) ((x)&(-(x)))

// Reads the next decimal integer from stdin with getchar().
// Every non-digit character before the number is skipped; if a '-' is seen
// while skipping, the result is negated. Returns the parsed value, or 0 when
// end of input is reached before any digit.
int read()
{
    int f=1,x=0;
    // getchar() returns int; keeping it as int lets EOF be told apart from data,
    // so the skip loop terminates at end of input instead of spinning forever.
    int ss=getchar();
    while(ss!=EOF&&(ss<'0'||ss>'9')){if(ss=='-')f=-1;ss=getchar();}
    while(ss>='0'&&ss<='9'){x=x*10+ss-'0';ss=getchar();}
    return x*f;
}

// Capacity shared by every array below.
const int maxn=1000010;

int n;              // first integer read in main(): number of operations processed
int k;              // second integer read in main(): number of patterns inserted
int num;            // not referenced by the code visible in this file

int rem[maxn];      // rem[d]: trie node at which pattern d ends (set by ins())
int cnt;            // id of the most recently created trie node; node 0 is the root

int ch[maxn][26];   // trie children per letter; getf() fills missing entries from the fail node
int fail[maxn];     // fail link of each trie node (computed by getf())

queue<int> q;       // BFS queue used while computing fail links
char pt[maxn];      // shared buffer for every token read with scanf in main()

// Fail-tree adjacency lists: edge id 0 terminates a list.
struct edge{int v,nxt;};
edge E[maxn];
int head[maxn];     // head[u]: id of the first edge leaving u
int tot;            // number of edges created so far

int dfn[maxn];      // DFS preorder index of each node (1-based, assigned by dfs())
int size[maxn];     // number of nodes in each node's fail-tree subtree
int judge[maxn];    // judge[i] is 1 while pattern i is active, 0 otherwise
int sz;             // DFS counter; also the upper index bound used by add()

lt sum[maxn];       // Fenwick-tree storage used by qsum()/add()

// Converts the NUL-terminated string ss to an int by treating every character
// as a decimal digit (no validation is performed). An empty string yields 0.
int get(char* ss)
{
    int value=0;
    for(char* p=ss;*p!='\0';++p)
        value=value*10+*p-'0';
    return value;
}

// Adds the directed edge u -> v at the front of u's adjacency list.
// Edge ids start at 1, so a stored id of 0 marks the end of a list.
void addE(int u,int v)
{
	const int id=++tot;
	E[id].v=v;
	E[id].nxt=head[u];
	head[u]=id;
}

// Fenwick-tree prefix query: accumulates sum[] over x, x-lowbit(x), ... while the index is positive.
lt qsum(int x)
{
	lt res=0;
	while(x>0)
	{
		res+=sum[x];
		x-=lowbit(x);
	}
	return res;
}
// Fenwick-tree point update: adds v to sum[] at x, x+lowbit(x), ... while the index is <= sz.
void add(int x,int v)
{
	while(x<=sz)
	{
		sum[x]+=v;
		x+=lowbit(x);
	}
}
// Range update on the difference array: +v at ll and -v just past rr,
// so a prefix query at any position in [ll, rr] sees the extra v.
void update(int ll,int rr,int v)
{
	const int past=rr+1;
	add(ll,v);
	add(past,-v);
}

// Inserts the first len characters of ss into the trie (letters are mapped
// with c - 'a'), creating nodes as needed, and records the final node as the
// end node of pattern d in rem[d].
void ins(char* ss,int len,int d)
{
	int node=0;
	int i=0;
	while(i<len)
	{
		int& slot=ch[node][ss[i]-'a'];
		if(slot==0) slot=++cnt;   // allocate a fresh node for a missing child
		node=slot;
		++i;
	}
	rem[d]=node;
}

void getf()
{
    for(int i=0;i<26;++i)
    if(ch[0][i]) fail[ch[0][i]]=0,q.push(ch[0][i]);
    
    while(!q.empty())
    {
        int u=q.front(); q.pop();
        for(int i=0;i<26;++i)
        {
            if(!ch[u][i]) ch[u][i]=ch[fail[u]][i];
            else{
                fail[ch[u][i]]=ch[fail[u]][i];
                q.push(ch[u][i]);
            }
        }
    }
    
    for(int i=1;i<=cnt;++i)
    addE(fail[i],i);
}

void dfs(int u)
{
	dfn[u]=++sz; size[u]=1;
	for(int i=head[u];i;i=E[i].nxt)
	{
		int v=E[i].v;
		dfs(v);
		size[u]+=size[v];
	}
}

// Feeds the NUL-terminated text ss through the automaton one character at a
// time (letters mapped with c - 'a') and returns the sum of qsum(dfn[node])
// over every node reached.
lt query(char*ss)
{
	lt total=0;
	int node=0;
	for(char* p=ss;*p!='\0';++p)
	{
		node=ch[node][*p-'a'];
		total+=qsum(dfn[node]);
	}
	return total;
}

int main()
{
	n=read();k=read();
	for(int i=1;i<=k;++i)
	{
		scanf("%s",&pt);
		ins(pt,strlen(pt),i);
	}
	
	getf(); dfs(0);
	for(int i=1;i<=k;++i)
	{
		update(dfn[rem[i]],dfn[rem[i]]+size[rem[i]]-1,1);
		judge[i]=1;
	}
	
	for(int i=1;i<=n;++i)
	{
		scanf("%s",&pt);
		if(pt[0]=='+')
		{
			int x=get(pt+1);
			if(judge[x]) continue;
			update(dfn[rem[x]],dfn[rem[x]]+size[rem[x]]-1,1);
			judge[x]=1;
		}
		else if(pt[0]=='-')
		{
			int x=get(pt+1);
			if(!judge[x]) continue;
			update(dfn[rem[x]],dfn[rem[x]]+size[rem[x]]-1,-1);
			judge[x]=0;
		}
		else if(pt[0]=='?')
		printf("%lld\n",query(pt+1)); 
	}
	
	return 0;
}

niiick

关注

0
点赞
踩
1

收藏

觉得还不错? 一键收藏
0
评论
CodeForces - 163E e-Government【Fail树&&AC自动机】

CodeForces - 163ETime limit 1000 ms Memory limit 262144 kBThe best programmers of Embezzland compete to develop a part of the project called “e-Government” — the system of automated statistic collecting and press analysis.We know that any of the k citiz
复制链接

扫一扫

专栏目录