-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathignored_stopwords.py
49 lines (43 loc) · 1.98 KB
/
ignored_stopwords.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
# Frequently occurring nouns treated as stopwords.
# Part-of-speech tags covered: NN, NNS, NNP. Entries are kept alphabetical.
nouns = {
    "anybody", "anyone", "anything", "causes", "changes", "course",
    "everybody", "everyone", "everything", "example", "help", "matter",
    "nobody", "none", "noone", "nothing", "order", "somebody", "someone",
    "something", "time", "value", "way",
}
# Frequently occurring adjectives treated as stopwords.
# Part-of-speech tag covered: JJ. Entries are kept alphabetical.
adjectives = {
    "able", "available", "brief", "certain", "different", "entire",
    "immediate", "likely", "necessary", "new", "old", "particular",
    "possible", "present", "ready", "recent", "second", "third", "unlikely",
    "useful", "whole", "willing",
}
# Frequently occurring prepositions treated as stopwords.
# Part-of-speech tag covered: IN. Entries are kept alphabetical.
prepositions = {
    "about", "above", "across", "after", "against", "along", "among",
    "amongst", "around", "as", "at", "before", "behind", "below", "beneath",
    "beside", "besides", "between", "beyond", "by", "despite", "during",
    "except", "for", "from", "in", "inside", "into", "like", "near", "of",
    "off", "on", "onto", "out", "outside", "over", "since", "through",
    "throughout", "till", "to", "toward", "towards", "under", "underneath",
    "until", "up", "upon", "with", "within", "without",
}
# Stopword nouns; judging by the name, presumably collected from spaCy's
# stopword list (NOTE(review): confirm the source). Entries are alphabetical.
spacy_nouns = {
    "amount", "anyone", "anything", "bottom", "everyone", "everything",
    "front", "name", "nobody", "none", "nothing", "part", "side", "someone",
    "something", "top",
}
# Adjectives (part-of-speech tag JJ) taken from the spaCy stopword list.
# Entries are kept alphabetical.
spacy_adjectives = {
    "empty", "former", "full", "latter", "next", "other", "same", "serious",
    "various", "whole",
}
# Prepositions (part-of-speech tag IN) taken from the spaCy stopword list.
# Entries are kept alphabetical.
spacy_prepositions = {
    "about", "above", "across", "after", "against", "along", "among",
    "amongst", "at", "before", "behind", "below", "beside", "besides",
    "between", "beyond", "by", "during", "except", "for", "from", "in",
    "into", "of", "off", "on", "onto", "over", "per", "since", "through",
    "throughout", "thru", "to", "toward", "towards", "under", "until", "up",
    "upon", "via", "with", "within", "without",
}