-
Notifications
You must be signed in to change notification settings - Fork 4
Expand file tree
/
Copy pathsuffix_array.cpp
More file actions
104 lines (92 loc) · 1.62 KB
/
suffix_array.cpp
File metadata and controls
104 lines (92 loc) · 1.62 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
//Suffix array construction by prefix doubling with a comparison sort, O(n * log n * log n)
//Kasai's algorithm for computing the longest common prefix (LCP) array in O(n)
//Solution to the SPOJ problem DISUBSTR - Distinct Substrings
#include<bits/stdc++.h>
using namespace std;
// Comparator used while sorting suffixes; defined after main().
long cmp(long i, long j);

// Capacity of every per-position work array below.
const long MAX_LEN = 1000007;

// Text of the current test case and its length.
std::string str;
long n;

// Prefix length already reflected in pos[] during the doubling rounds.
long gap = 1;

// sa[r]  : start index of the suffix placed at sorted position r.
// pos[s] : current rank (sort key) of the suffix starting at s.
// tmp[r] : scratch rank assigned to sorted position r within a round.
// lcp[r] : common-prefix length of the suffixes at sorted positions r and r+1.
long sa[MAX_LEN];
long pos[MAX_LEN];
long tmp[MAX_LEN];
long lcp[MAX_LEN];
// Sorts the suffixes of the global `str` (length n, n >= 1) into `sa` by
// prefix doubling. When it returns, pos[s] is the final rank of suffix s.
static void build_suffix_array()
{
    for (long i = 0; i < n; i++) {
        sa[i] = i;
        pos[i] = str[i];  // round 0: a suffix is ranked by its first character
        tmp[i] = 0;       // tmp[0] must stay 0; it is the base of the prefix sums below
    }
    for (gap = 1;; gap *= 2) {
        // cmp orders suffixes by their first 2*gap characters using pos[].
        std::sort(sa, sa + n, cmp);
        // Neighbours that compare strictly less start a new rank class.
        for (long i = 0; i + 1 < n; i++)
            tmp[i + 1] = tmp[i] + cmp(sa[i], sa[i + 1]);
        for (long i = 0; i < n; i++)
            pos[sa[i]] = tmp[i];
        // n distinct ranks means every suffix is fully ordered.
        if (tmp[n - 1] == n - 1)
            break;
    }
}

// Kasai's algorithm: fills lcp[r] with the length of the common prefix of the
// suffixes at sorted positions r and r+1; lcp[n-1] is left at 0.
static void build_lcp_array()
{
    for (long r = 0; r < n; r++) {
        lcp[r] = 0;
        pos[sa[r]] = r;  // inverse permutation of sa
    }
    long matched = 0;
    for (long i = 0; i < n; i++) {
        if (pos[i] == n - 1) {
            // Last suffix in sorted order has no successor to compare with.
            matched = 0;
            continue;
        }
        const long j = sa[pos[i] + 1];
        while (i + matched < n && j + matched < n && str[i + matched] == str[j + matched])
            matched++;
        lcp[pos[i]] = matched;
        // Dropping the first character can shorten the match by at most one.
        if (matched > 0)
            matched--;
    }
}

// Number of distinct substrings: every suffix contributes its length minus
// the prefix it shares with its neighbour in sorted order. Accumulated in
// long long so the total cannot overflow where long is only 32 bits wide.
static long long count_distinct_substrings()
{
    long long total = 0;
    for (long r = 0; r < n; r++)
        total += n - sa[r] - lcp[r];
    return total;
}

// Reads a test-case count followed by one word per test case and prints, for
// each word, its suffix array, its LCP array and its number of distinct
// substrings. Stops early when the input runs out; words that do not fit in
// the fixed-size work arrays are reported on stderr and skipped.
int main()
{
    const std::size_t capacity = sizeof(sa) / sizeof(sa[0]);

    int t = 0;
    std::cout << "Enter the no of Test cases\n";
    std::cin >> t;
    while (t-- > 0) {  // "> 0" so a negative count does not loop
        if (!(std::cin >> str))
            break;     // input exhausted: str is empty and there is nothing to process
        if (str.length() > capacity) {
            std::cerr << "Input of length " << str.length()
                      << " exceeds the supported maximum of " << capacity << "\n";
            continue;
        }
        n = static_cast<long>(str.length());

        build_suffix_array();
        std::cout << "Suffix Array :\n";
        for (long r = 0; r < n; r++)
            std::cout << sa[r] << " ";
        std::cout << '\n';

        build_lcp_array();
        std::cout << "Longest Common Prefix :\n";
        for (long r = 0; r < n; r++)
            std::cout << lcp[r] << " ";
        std::cout << '\n';

        //Counting no of distinct substrings
        std::cout << "No of Distinct Substrings : " << count_distinct_substrings() << "\n\n";
    }
    return 0;
}
// Strict "comes before" test for the suffixes starting at i and j, judged on
// their first 2*gap characters. Returns 1 when suffix i sorts before suffix j
// and 0 otherwise. Reads the globals pos, gap and n.
long cmp(long i,long j)
{
    const long head_i = pos[i];
    const long head_j = pos[j];
    if (head_i == head_j) {
        // First halves tie: decide on the halves that start gap positions later.
        const long tail_i = i + gap;
        const long tail_j = j + gap;
        const bool both_inside = tail_i < n && tail_j < n;
        // If a second half runs past the end of the text, the suffix that
        // starts later (the shorter one) is ordered first.
        return both_inside ? pos[tail_i] < pos[tail_j] : tail_i > tail_j;
    }
    return head_i < head_j;
}
/*
Explanation for the testcase with string ABABA:
len=1 : A,B
len=2 : AB,BA
len=3 : ABA,BAB
len=4 : ABAB,BABA
len=5 : ABABA
Thus, total number of distinct substrings is 9.
*/