POJ 3261 Milk Patterns(后缀数组)

题目链接:http://poj.org/problem?id=3261

题意:找出至少出现m次的重复字串。

思路:二分答案,将h分组,同一组中的个数+1就是重复子串的个数。







int r[N],sa[N],wa[N],wb[N],wd[N],rank[N],h[N];





int cmp(int *r,int a,int b,int L)

{

    return r[a]==r[b]&&r[a+L]==r[b+L];

}





void da(int *r,int *sa,int n,int m)

{

    int i,j,p,*x=wa,*y=wb,*t;

    FOR0(i,m) wd[i]=0;

    FOR0(i,n) wd[x[i]=r[i]]++;

    FOR1(i,m-1) wd[i]+=wd[i-1];

    FORL0(i,n-1) sa[--wd[x[i]]]=i;

    for(j=1,p=1;p<n;j<<=1,m=p)

    {

        p=0;

        FOR(i,n-j,n-1) y[p++]=i;

        FOR0(i,n) if(sa[i]>=j) y[p++]=sa[i]-j;

        FOR0(i,m) wd[i]=0;

        FOR0(i,n) wd[x[i]]++;

        FOR1(i,m-1) wd[i]+=wd[i-1];

        FORL0(i,n-1) sa[--wd[x[y[i]]]]=y[i];

        t=x;x=y;y=t;p=1;x[sa[0]]=0;

        FOR1(i,n-1) x[sa[i]]=cmp(y,sa[i-1],sa[i],j)?p-1:p++;

    }

}







void calHeight(int *r,int *sa,int n)

{

    int i,j,k=0;

    FOR1(i,n) rank[sa[i]]=i;

    FOR0(i,n)

    {

        if(k) k--;

        j=sa[rank[i]-1];

        while(i+k<n&&j+k<n&&r[i+k]==r[j+k]) k++;

        h[rank[i]]=k;

    }

}





int n,m;





int OK(int x)

{

    int i=2,j,L,R;

    while(i<=n)

    {

        L=i;

        while(L<=n&&h[L]<x) L++;

        R=L;

        while(R+1<=n&&h[R+1]>=x) R++;

        if(R>n) return 0;

        if(R-L+1+1>=m) return 1;

        i=R+1;

    }

    return 0;

}



void cal()

{

    int low=0,high=n,mid;

    while(low<=high)

    {

        mid=(low+high)>>1;

        if(OK(mid)) low=mid+1;

        else high=mid-1;

    }

    if(low<=n&&OK(low)) PR(low);

    else PR(high);

}



int main()

{

    while(scanf("%d%d",&n,&m)!=-1)

    {

        int i,Max=0;

        FOR0(i,n) RD(r[i]),Max=max(Max,r[i]);

        r[n]=0;

        da(r,sa,n+1,Max+1);

        calHeight(r,sa,n);

        cal();

    }

    return 0;

}

  

 

 

你可能感兴趣的:(Pattern)