Codeforces 432D. Prefixes and Suffixes(后缀数组)

题目链接:

codeforces 432D

题目大意:

给出一个字符串,求有多少种长度,使得该长度的前缀与该长度的后缀相等;并对每个这样的长度,求出对应子串在原字符串中出现的次数。

题目分析:

  • 首先利用后缀数组处理出sa[i]代表排名第i位的后缀的起始位置
  • 处理出rank[i]代表第i个位置起始的后缀的rank
  • 处理出height[i]代表排名第i位的后缀和排名第i-1位的后缀的最长公共前缀的长度。
  • 那么要找与前缀相等的后缀,先找到rank[0](即整个字符串作为后缀的排名),然后按照排名向前、向后遍历。排名为i和j(i<j)的两个后缀的最长公共前缀,就是排名区间(i,j]内所有height的最小值。只要某个后缀与原字符串的公共前缀长度等于该后缀自身的长度,就证明这个后缀与等长的前缀匹配上,于是标记该长度的前缀能够匹配。
  • 统计某一个前缀出现的次数:对每个后缀,求出它和原字符串的最长公共前缀的长度,然后在计数数组的对应位置+1;因为比这个长度短的前缀同样在该位置出现一次,也会得到一个贡献,所以最后对计数数组求一下后缀和即可。

AC代码:

#include <cstring>
#include <cstdio>
#include <algorithm>
#include <cstring>
#define MAX 100007

using namespace std;

// Input string as read by scanf in main.
char s[MAX];  
// r      : integer-encoded copy of s that is passed to da / calheight.
// sa     : suffix array written by da (sa[i] = start index of the suffix with rank i).
// wa, wb : the two key buffers da alternates between while doubling.
// wv, wss: scratch arrays for the counting sorts inside da (keys and bucket counters).
// rank   : inverse of sa, written by calheight (rank[sa[i]] = i).
// height : written by calheight; height[i] is the common-prefix length of the
//          suffixes ranked i-1 and i.
int r[MAX],sa[MAX],wa[MAX],wb[MAX],wv[MAX],wss[MAX],rank[MAX],height[MAX];  
// cnt[k]: in main, first the number of suffixes whose common prefix with the whole
//         string has length exactly k, then turned into a suffix sum.
int cnt[MAX];
// mark[k]: set in main when the prefix of length k was found to equal a suffix.
bool mark[MAX];

/**
 * Tells whether positions a and b carry the same pair of keys.
 *
 * @param r   key array
 * @param a   first position
 * @param b   second position
 * @param len offset of the second key of each pair
 * @return 1 if r[a] == r[b] and r[a+len] == r[b+len], otherwise 0.
 *         The second keys are only read when the first keys are equal.
 */
int cmp ( int *r , int a , int b , int len )
{
    // Different first keys: decide without touching r[a+len] / r[b+len].
    if ( r[a] != r[b] )
        return 0;
    const bool second_keys_equal = ( r[a+len] == r[b+len] );
    return second_keys_equal ? 1 : 0;
}

/**
 * Builds the suffix array of r[0..n-1] by prefix doubling with counting sorts.
 *
 * @param r  input keys; every value must lie in [0, m)
 * @param sa output; after the call sa[k] is the start index of the suffix ranked k
 * @param n  number of entries of r to sort
 * @param m  exclusive upper bound on the key values in r
 *
 * Uses the file-level scratch arrays wa, wb, wv and wss.
 *
 * NOTE(review): cmp reads y[sa[i]+j], which can index past n-1 unless equal
 * first keys imply both positions are at most n-1-j. main passes n = len+1 so
 * that the last entry acts as a terminator, presumably for this reason —
 * confirm before calling da with input that has no unique smallest last key.
 */
void da ( int* r , int* sa , int n , int m )
{
    int i, j, p, *x = wa, *y = wb, *t;

    // Initial counting sort of all suffixes by their first key.
    for ( i = 0 ; i < m ; i++ ) wss[i] = 0;
    for ( i = 0 ; i < n ; i++ ) wss[x[i] = r[i]]++;
    // Prefix sums start at 1: starting at 0 would read wss[-1] (out of bounds).
    for ( i = 1 ; i < m ; i++ ) wss[i] += wss[i-1];
    for ( i = n-1 ; i >= 0 ; i-- ) sa[--wss[x[i]]] = i;

    // Each round sorts by pairs (key at i, key at i+j); p counts the distinct
    // keys produced and becomes the bucket count m of the next round.
    for ( j = 1 , p = 1 ; p < n ; j *= 2 , m = p )
    {
        // y lists positions ordered by second key: positions with no second
        // key (i >= n-j) come first, the rest follow in current sa order.
        for ( p = 0 , i = n - j ; i < n ; i++ ) y[p++] = i;
        for ( i = 0 ; i < n ; i++ ) if ( sa[i] >= j ) y[p++] = sa[i]-j;

        // Stable counting sort of y by first key.
        for ( i = 0 ; i < n ; i++ ) wv[i] = x[y[i]];
        for ( i = 0 ; i < m ; i++ ) wss[i] = 0;
        for ( i = 0 ; i < n ; i++ ) wss[wv[i]]++;
        // Same fix as above: never touch wss[-1].
        for ( i = 1 ; i < m ; i++ ) wss[i] += wss[i-1];
        for ( i = n-1 ; i >= 0 ; i-- ) sa[--wss[wv[i]]] = y[i];

        // Swap the key buffers and assign new keys: neighbours in sa that have
        // equal (first, second) keys share a key value.
        for ( t = x , x = y , y = t , p = 1 , x[sa[0]] = 0 , i = 1 ; i < n ; i++ )
            x[sa[i]] = cmp ( y , sa[i-1] , sa[i] , j ) ? p-1 : p++;
    }
}

void calheight ( int *r , int *sa , int n )
{
    int i , j , k = 0;
    for ( int i = 1 ; i <= n ; i++ ) rank[sa[i]] = i;
    for ( int i = 0 ; i < n ; height[rank[i++]] = k )
        for ( k?k--:0 , j = sa[rank[i]-1] ; r[i+k] == r[j+k] ; k++ );
}

int main ( )
{
    while ( ~scanf ( "%s" , s ) )
    {
        memset ( cnt , 0 , sizeof ( cnt ) );
        memset ( mark , 0 , sizeof ( mark ) );
        int len = strlen ( s );
        for ( int i = 0 ; i < len ; i++ )
            r[i] = s[i] - 'A' + 1;
        da ( r , sa , len+1 , 27 );
        calheight ( r , sa, len );
        int x = rank[0];
        int temp = 1<<29;
        for ( int i = x + 1 ; i <= len;i ++ )
        {
            temp = min ( temp , height[i] );
            int id = sa[i];
            if ( sa[i]+temp >= len ) 
                mark[temp] = true;  
            cnt[temp]++;
        }
        temp = height[x];
        for ( int i = x-1 ; i >= 1; i -- )
        {
            cnt[temp]++;
            int id = sa[i];
            if ( sa[i]+temp >= len )
                mark[temp] = true;
            temp = min ( temp , height[i] );
        }
        mark[len] = true;
        cnt[len] = 1;
        int ans = 0;
        for ( int i = len-1 ;i > 0 ; i-- )
            cnt[i] += cnt[i+1];
        for ( int i = 1 ; i <= len ; i ++ )
            if ( mark[i] )  ans++;
        printf ( "%d\n" , ans );
        for  ( int i = 1 ; i <= len ; i++ )
        {
            if ( !mark[i] ) continue;
            printf ( "%d %d\n" , i , cnt[i] );
        }
    }
}

你可能感兴趣的:(后缀数组,codeforces)