[USACO5.1]乐曲主题Musical Themes - 后缀数组

Description

求字符串的最长不可重叠重复子串。

Solution

如果有两个子串相同,那么也就是有两个后缀的 \(lcp\) 相同。

所以考虑二分答案 \(K\),如果有连续一段的 \(height\) 都不小于 \(K\),那么这一段区间内,两两后缀的 \(lcp\) 都不小于 \(K\),那么记录一下区间的 \(\max\{sa_i\}\)\(\min\{sa_i\}\),如果 \(\max\{sa_i\}-\min\{sa_i\}\le K\),那么就说明两个子串不重叠。

另外这题有一个“转调”的问题,只要差分一下就可以解决。不过需要注意的是,差分之后二分时的判断条件应该是 \(\max\{sa_i\}-\min\{sa_i\}< K\)

Code

#include <bits/stdc++.h>
using namespace std;

inline int ty() {
    char ch = getchar(); int x = 0, f = 1;
    while (ch < '0' || ch > '9') { if (ch == '-') f = -1; ch = getchar(); }
    while (ch >= '0' && ch <= '9') { x = x * 10 + ch - '0'; ch = getchar(); }
    return x * f;
}

const int _ = 5000 + 10;
const int INF = 0x3f3f3f3f;
int N, s[_], rnk[_], sa[_], height[_];

void SA() {
    static int t[_], a[_], buc[_], fir[_], sec[_], tmp[_];
    copy(s + 1, s + N + 1, t + 1);
    sort(t + 1, t + N + 1);
    int *end = unique(t + 1, t + N + 1);
    for (int i = 1; i <= N; ++i) a[i] = lower_bound(t + 1, end, s[i]) - t;
    for (int i = 1; i <= N; ++i) ++buc[a[i]];
    for (int i = 1; i <= N; ++i) buc[i] += buc[i - 1];
    for (int i = 1; i <= N; ++i) rnk[i] = buc[a[i] - 1] + 1;
    for (int len = 1; len <= N; len <<= 1) {
        for (int i = 1; i <= N; ++i) {
            fir[i] = rnk[i];
            sec[i] = i + len > N ? 0 : rnk[i + len];
        }
        fill(buc + 1, buc + N + 1, 0);
        for (int i = 1; i <= N; ++i) ++buc[sec[i]];
        for (int i = 1; i <= N; ++i) buc[i] += buc[i - 1];
        for (int i = 1; i <= N; ++i) tmp[N - --buc[sec[i]]] = i;
        fill(buc + 1, buc + N + 1, 0);
        for (int i = 1; i <= N; ++i) ++buc[fir[i]];
        for (int i = 1; i <= N; ++i) buc[i] += buc[i - 1];
        for (int i, j = 1; j <= N; ++j) {
            i = tmp[j];
            sa[buc[fir[i]]--] = i;
        }
        bool same = false;
        for (int i, j = 1, last = 0; j <= N; ++j) {
            i = sa[j];
            if (!last) rnk[i] = 1;
            else if (fir[i] == fir[last] && sec[i] == sec[last]) rnk[i] = rnk[last], same = true;
            else rnk[i] = rnk[last] + 1;
            last = i;
        }
        if (!same) break;
    }
    for (int i = 1, k = 0; i <= N; ++i) {
        if (rnk[i] == 1) k = 0;
        else {
            if (k > 0) --k;
            int j = sa[rnk[i] - 1];
            while (i + k <= N && j + k <= N && a[i + k] == a[j + k]) ++k;
        }
        height[rnk[i]] = k;
    }
}

bool check(int mid) {
    int minsa = INF, maxsa = -1;
    for (int i = 1; i <= N; ++i) {
        if (height[i] < mid) minsa = maxsa = sa[i];
        else {
            minsa = min(minsa, sa[i]);
            maxsa = max(maxsa, sa[i]);
            if (maxsa - minsa > mid) return true;
        }
    }
 return false;
}

int main() {
#ifndef ONLINE_JUDGE
    freopen("theme.in", "r", stdin);
    freopen("theme.out", "w", stdout);
#endif
    N = ty();
    for (int i = 1; i <= N; ++i) s[i] = ty();
    for (int i = 1; i <= N; ++i) s[i] = s[i + 1] - s[i] + 100;
    SA();
    // for (int i = 1; i <= N; ++i) printf("%d ", height[i]);
    int l = 0, r = N;
    while (l < r) {
        int mid = (l + r + 1) >> 1;
        if (check(mid)) l = mid;
        else r = mid - 1;
    }
    printf("%d\n", l >= 4 ? l + 1 : 0);
    return 0;
}

猜你喜欢

转载自www.cnblogs.com/newbielyx/p/12160165.html
今日推荐