• HDU 5769 Substring 后缀数组


    Substring




    Problem Description
    ?? is practicing his program skill, and now he is given a string, he has to calculate the total number of its distinct substrings. 
    But ?? thinks that is too easy, he wants to make this problem more interesting. 
    ?? likes a character X very much, so he wants to know the number of distinct substrings which contains at least one X. 
    However, ?? is unable to solve it, please help him.
     
    Input
     
    The first line of the input gives the number of test cases T;T test cases follow. 
    Each test case is consist of 2 lines: 
    First line is a character X, and second line is a string S. 
    X is a lowercase letter, and S contains lowercase letters(‘a’-‘z’) only.

    T<=30 
    1<=|S|<=10^5 
    The sum of |S| in all the test cases is no more than 700,000.
     
    Output
     
    For each test case, output one line containing “Case #x: y”(without quotes), where x is the test case number(starting from 1) and y is the answer you get for that case.
     
    Sample Input
     
    2 a abc b bbb
     
    Sample Output
     
    Case #1: 3 Case #2: 3
    Hint
    In first case, all distinct substrings containing at least one a: a, ab, abc. In second case, all distinct substrings containing at least one b: b, bb, bbb.
     
    题意:
      给你一个字符c和一个字符串s
      问你 s的所有有多少个不同的子串是包含c的
    题解:
      考虑后缀数组
      我们对S建立出SA,Height
      在sa中,我们想要知道当前sa[i] 的后缀中是否含有字符c,这个可以预处理呀
      处理后,假设对于当前sa[i],的最前一个字符c的位置存在设为pre[sa[i]],那么我们可以更新答案 n - sa[i]
      但题目要求得是不同子串,那么我们对于每一位sa[i],利用height数组去重就可以了,自己想想把
    #include<set>
    #include<cmath>
    #include<queue>
    #include<bitset>
    #include<math.h>
    #include<vector>
    #include<string>
    #include<stdio.h>
    #include<cstring>
    #include<iostream>
    #include<algorithm>
    using namespace std;
    #pragma comment(linker, "/STACK:102400000,102400000")
    #define ls i<<1
    #define rs ls | 1
    #define mid ((ll+rr)>>1)
    #define pii pair<int,int>
    #define MP make_pair
    typedef long long LL;
    const long long INF = 1e18+1LL;
    const double Pi = acos(-1.0);
    const int N = 2e5+10, M = 2e5+20, mod = 1e9+7, inf = 2e9;
    
    ///heght[i] 表示 Suffix(sa[i-1])和Suffix(sa[i]) 的最长公共前缀:
    ///rk[i] 表示 开头为i的后缀的等级:
    ///sa[i] 表示 排名为i的后缀 的开头位置:
    
    int *rk,r[N],sa[N],height[N],wa[N],wb[N],wm[N];
    bool cmp(int *r,int a,int b,int l) {
        return r[a] == r[b] && r[a+l] == r[b+l];
    }
    void SA(int *r,int *sa,int n,int m) {
        int *x=wa,*y=wb,*t;
        for(int i=0;i<m;++i)wm[i]=0;
        for(int i=0;i<n;++i)wm[x[i]=r[i]]++;
        for(int i=1;i<m;++i)wm[i]+=wm[i-1];
        for(int i=n-1;i>=0;--i)sa[--wm[x[i]]]=i;
        for(int i=0,j=1,p=0;p<n;j=j*2,m=p){
            for(p=0,i=n-j;i<n;++i)y[p++]=i;
            for(i=0;i<n;++i)if(sa[i]>=j)y[p++]=sa[i]-j;
            for(i=0;i<m;++i)wm[i]=0;
            for(i=0;i<n;++i)wm[x[y[i]]]++;
            for(i=1;i<m;++i)wm[i]+=wm[i-1];
            for(i=n-1;i>=0;--i)sa[--wm[x[y[i]]]]=y[i];
            for(t=x,x=y,y=t,i=p=1,x[sa[0]]=0;i<n;++i) {
                x[sa[i]]=cmp(y,sa[i],sa[i-1],j)?p-1:p++;
            }
        }
        rk=x;
    }
    void Height(int *r,int *sa,int n) {
        for(int i=0,j=0,k=0;i<n;height[rk[i++]]=k)
        for(k?--k:0,j=sa[rk[i]-1];r[i+k] == r[j+k];++k);
    }
    
    int pre[N];
    LL ans;
    char ch[2],s[N];
    int main() {
            int T,cas = 1;
            scanf("%d",&T);
            while(T--) {
                scanf("%s%s",ch,s);
                int n = strlen(s);
                for(int i = 0; i < n; ++i) r[i] = s[i] - 'a' + 1;
                r[n] = 0;
                SA(r,sa,n+1,256);
                Height(r,sa,n);
                pre[n] = -1;
                for(int i = n-1; i >= 0; --i) {
                    if(ch[0] == s[i]) pre[i] = i;
                    else pre[i] = pre[i+1];
                }
                ans = 0;
                for(int i = 1; i <= n; ++i) {
                    if(pre[sa[i]] == -1) continue;
                    ans = ans + (n - pre[sa[i]]) -  max(0,height[i]  -  pre[sa[i]] + sa[i]);
                }
                printf("Case #%d: %I64d
    ",cas++,ans);
            }
            return 0;
    }
  • 相关阅读:
    字符编码
    IO流技术
    TreeMap使用和Comparable比较
    Collections工具类
    使用迭代器进行遍历时
    238. 除自身以外数组的乘积
    python 字典按键、值排序
    collections.Counter用法
    442. 数组中重复的数据
    1395. 统计作战单位数
  • 原文地址:https://www.cnblogs.com/zxhl/p/6002089.html
Copyright © 2020-2023  润新知