-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsuffix_array.cpp
113 lines (98 loc) · 2.54 KB
/
suffix_array.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
///O(nlogn)
/*
source : https://cp-algorithms.web.app/string/suffix-array.html
S = abaab
0. abaab
1. baab
2. aab
3. ab
4. b
[2, 3, 0, 4, 1] -> suffix array
LCP (each sorted suffix compared with the suffix just before it; 0 for the first):
---
aab -> 0
ab -> 1
abaab -> 2
b -> 0
baab -> 1
***No. of distinct substrings = (n*(n+1))/2 - sum(lcp[i])
*/
/// Sorts all cyclic shifts of `s` in lexicographic order using prefix doubling
/// with counting sort: O(log n) rounds, each doing O(n + 256) work.
///
/// Characters are ranked by their unsigned byte value (0..255), so the result
/// does not depend on whether plain `char` is signed on the target platform.
///
/// @param s  String whose cyclic shifts are sorted; may be empty.
/// @return   Vector `p` of size n where p[i] is the starting index of the i-th
///           smallest cyclic shift. Empty when `s` is empty.
vector<int> sort_cyclic_shifts(string const& s) {
    int n = s.size();
    // Nothing to sort; the code below reads p[0], which does not exist for n == 0.
    if (n == 0)
        return vector<int>();

    const int alphabet = 256;
    // cnt is reused: first indexed by byte value, later by equivalence class (< n).
    vector<int> p(n), c(n), cnt(max(alphabet, n), 0);

    // Round 0: counting sort by the first character. Index through unsigned char
    // because a signed char >= 0x80 would otherwise produce a negative index.
    for (int i = 0; i < n; i++)
        cnt[static_cast<unsigned char>(s[i])]++;
    for (int i = 1; i < alphabet; i++)
        cnt[i] += cnt[i - 1];
    for (int i = 0; i < n; i++)
        p[--cnt[static_cast<unsigned char>(s[i])]] = i;

    // c[i] = equivalence class of the shift starting at i (equal prefixes share a class).
    c[p[0]] = 0;
    int classes = 1;
    for (int i = 1; i < n; i++) {
        if (s[p[i]] != s[p[i - 1]])
            classes++;
        c[p[i]] = classes - 1;
    }

    vector<int> pn(n), cn(n);
    for (int h = 0; (1 << h) < n; ++h) {
        const int len = 1 << h;

        // Shifting every start back by len makes pn ordered by the second half
        // of the 2*len-long prefix (p was ordered by the first len characters).
        for (int i = 0; i < n; i++) {
            pn[i] = p[i] - len;
            if (pn[i] < 0)
                pn[i] += n;
        }

        // Stable counting sort of pn by the class of the first half.
        fill(cnt.begin(), cnt.begin() + classes, 0);
        for (int i = 0; i < n; i++)
            cnt[c[pn[i]]]++;
        for (int i = 1; i < classes; i++)
            cnt[i] += cnt[i - 1];
        // Walk backwards so equal keys keep their relative (second-half) order.
        for (int i = n - 1; i >= 0; i--)
            p[--cnt[c[pn[i]]]] = pn[i];

        // Recompute classes for prefixes of length 2*len from the pair of half classes.
        cn[p[0]] = 0;
        classes = 1;
        for (int i = 1; i < n; i++) {
            pair<int, int> cur = {c[p[i]], c[(p[i] + len) % n]};
            pair<int, int> prev = {c[p[i - 1]], c[(p[i - 1] + len) % n]};
            if (cur != prev)
                ++classes;
            cn[p[i]] = classes - 1;
        }
        c.swap(cn);
    }
    return p;
}
/// Builds the suffix array of `s` by sorting the cyclic shifts of `s` plus a
/// sentinel and then dropping the sentinel's entry.
///
/// The sentinel must be strictly smaller than every character of `s`, otherwise
/// cyclic-shift order and suffix order disagree. '\0' is used instead of '$'
/// so that inputs containing characters below '$' (space, '!', '"', '#') are
/// handled as well. `s` itself must not contain '\0' bytes.
///
/// @param s  Input string (taken by value because the sentinel is appended).
/// @return   Starting indices of the suffixes of `s` in lexicographic order;
///           empty when `s` is empty.
vector<int> suffix_array_construction(string s) {
    // Must be a char literal: `s += "\0"` would append an empty C-string.
    s += '\0';
    vector<int> sorted_shifts = sort_cyclic_shifts(s);
    // The shift that starts at the sentinel sorts first; it is not a suffix of the input.
    sorted_shifts.erase(sorted_shifts.begin());
    return sorted_shifts;
}
/// Computes the longest-common-prefix array for `s` given its suffix array `p`.
///
/// @param s  The string the suffix array was built from.
/// @param p  Suffix array of `s`: p[i] is the start of the i-th smallest suffix.
/// @return   Vector of size n where entry i (i >= 1) is the length of the common
///           prefix of the suffixes starting at p[i-1] and p[i]; entry 0 is 0.
vector<int> lcp_construction(string const& s, vector<int> const& p) {
    int n = s.size();

    // position[start] = index in p of the suffix beginning at `start`.
    vector<int> position(n, 0);
    for (int idx = 0; idx < n; ++idx)
        position[p[idx]] = idx;

    vector<int> lcp(n, 0);
    int matched = 0;
    for (int start = 0; start < n; ++start) {
        const int slot = position[start];
        if (slot + 1 == n) {
            // Last suffix in sorted order has no successor to compare against.
            matched = 0;
            continue;
        }

        const int next_start = p[slot + 1];
        // Extend the match carried over from the previous starting position.
        while (start + matched < n && next_start + matched < n &&
               s[start + matched] == s[next_start + matched]) {
            ++matched;
        }
        lcp[slot + 1] = matched;

        // Dropping the first character shortens the known match by at most one.
        if (matched > 0)
            --matched;
    }
    return lcp;
}
/// Returns n*(n+1)/2 minus the sum of the values in `p`.
///
/// @param n  Length used for the n*(n+1)/2 term.
/// @param p  Values to subtract; per the formula in the file header this is
///           presumably the LCP array — confirm against callers.
/// @return   The difference as `ll`.
ll count_substring(int n, vector<int> const& p) {
    ll subtracted = 0;
    for (vector<int>::const_iterator it = p.begin(); it != p.end(); ++it)
        subtracted += *it;

    // Widen before multiplying so the product is computed in ll.
    const ll all_pairs = (static_cast<ll>(n) * static_cast<ll>(n + 1)) / 2LL;
    return all_pairs - subtracted;
}