-
Notifications
You must be signed in to change notification settings - Fork 1.9k
/
Copy pathCompactSuffixTrie.java
149 lines (138 loc) · 4.42 KB
/
CompactSuffixTrie.java
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
package com.jwetherell.algorithms.data_structures;
import java.util.Set;
import java.util.TreeSet;
/**
* A suffix trie is a data structure that presents the suffixes of a given
* string in a way that allows for a particularly fast implementation of many
* important string operations. This implementation is based upon a patricia
* trie which IS a compact trie.
* <p>
* @see <a href="https://en.wikipedia.org/wiki/Suffix_trie">Suffix Trie (Wikipedia)</a>
* <br>
* @author Justin Wetherell <phishman3579@gmail.com>
*/
@SuppressWarnings("unchecked")
public class CompactSuffixTrie<C extends CharSequence> {
private PatriciaTrie<C> tree = null;
/**
* Create a compact suffix trie from sequence
*
* @param sequence
* to create a suffix trie from.
*/
public CompactSuffixTrie(C sequence) {
tree = new PatriciaTrie<C>();
int length = sequence.length();
for (int i = 0; i < length; i++) {
CharSequence seq = sequence.subSequence(i, length);
tree.add((C) seq);
}
}
/**
* Add character sequence to the trie.
*
* @param sequence
* to add to trie.
* @return True if added successfully.
*/
public boolean add(C sequence) {
int length = sequence.length();
for (int i = 0; i < length; i++) {
CharSequence seq = sequence.subSequence(i, length);
tree.add((C) seq);
}
return true;
}
/**
* Does the sequence exists in the trie.
*
* @param sequence
* to locate in the trie.
* @return True if sequence exists in trie.
*/
public boolean doesSubStringExist(C sequence) {
char[] chars = sequence.toString().toCharArray();
int length = chars.length;
PatriciaTrie.Node current = tree.root;
int index = 0;
for (int i = 0; i < length; i++) {
int innerStringLength = (current.string != null) ? current.string.length : 0;
char c = chars[i];
if (innerStringLength > index) {
boolean inThis = current.partOfThis(c, index++);
if (!inThis)
return false;
} else {
int idx = current.childIndex(c);
if (idx < 0)
return false;
current = current.getChild(idx);
index = 1;
}
}
return true;
}
/**
* Get all suffixes in the trie.
*
* @return set of suffixes in trie.
*/
public Set<String> getSuffixes() {
return this.getSuffixes(tree.root);
}
/**
* Get all suffixes at node.
*
* @param node
* to get all suffixes at.
* @return set of suffixes in trie at node.
*/
private Set<String> getSuffixes(PatriciaTrie.Node node) {
StringBuilder builder = new StringBuilder();
if (node.string != null)
builder.append(node.string);
Set<String> set = new TreeSet<String>();
if (node.type == PatriciaTrie.WHITE) {
set.add(builder.toString());
}
for (int i = 0; i < node.getChildrenSize(); i++) {
PatriciaTrie.Node c = node.getChild(i);
set.addAll(getSuffixes(c, builder.toString()));
}
return set;
}
/**
* Get all suffixes at node and prepend the prefix.
*
* @param node
* to get all suffixes from.
* @param prefix
* to prepend to suffixes.
* @return set of suffixes in trie at node.
*/
private Set<String> getSuffixes(PatriciaTrie.Node node, String prefix) {
StringBuilder builder = new StringBuilder(prefix);
if (node.string != null)
builder.append(node.string);
Set<String> set = new TreeSet<String>();
if (node.type == PatriciaTrie.WHITE) {
set.add(builder.toString());
}
for (int i = 0; i < node.getChildrenSize(); i++) {
PatriciaTrie.Node c = node.getChild(i);
set.addAll(getSuffixes(c, builder.toString()));
}
return set;
}
/**
* {@inheritDoc}
*/
@Override
public String toString() {
return PatriciaTrie.PatriciaTriePrinter.getString(tree);
}
public boolean equals(CompactSuffixTrie<C> trie){
if(this.getSuffixes().equals(trie.getSuffixes())) return true;
return false;
}
}