-
Notifications
You must be signed in to change notification settings - Fork 1
/
config.py
executable file
·33 lines (29 loc) · 1.92 KB
/
config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
import nltk
from nltk import SnowballStemmer
# Module-level English Snowball stemmer, built once when this module is
# imported so that other code can reuse the same instance.
stemmer = SnowballStemmer("english")
# Tokens treated as punctuation.  The element order is exactly that of the
# original flat list; the plain slash and the backslash-star token each
# occur twice, and both copies are kept so the list contents are unchanged.
punctuations = [
    # single-character marks and opening/closing brackets
    '(', '-lrb-', '.', ',', '-', '?', '!', ';', '_', ':',
    '{', '}', '[', '/', ']',
    # ellipsis and quote marks
    '...', '"', '``', '`', "'",
    ')', '-rrb-', "''",
    # slashes, bare and backslash-escaped
    '\\', '/', '\\/',
    # runs of dots and dashes
    '..', '....', '--', '---', '----',
    # runs of question / exclamation marks
    '?!', '!?', '??', '???', '????', '!!', '!!!', '!!!!',
    '\\*', '|',
    # bracket placeholder tokens (presumably tokenizer escapes -- confirm)
    '-lcb-', '-rcb-', '-lsb-', '-rsb-',
    # operators and symbols, bare and backslash-escaped
    '>>', '<<', '+', '\\+', '*', '\\*', '^', '\\^', '#',
]
# Stop-word list.  Per the original note, the base vocabulary comes from
# NLTK's English stop words; a few extra tokens are appended afterwards.
# The element order is identical to the original list.
stop_words = [
    # personal, possessive and reflexive pronouns
    "i", "me", "my", "myself", "we", "our", "ours", "ourselves",
    "you", "your", "yours", "yourself", "yourselves",
    "he", "him", "his", "himself", "she", "her", "hers", "herself",
    "it", "its", "itself",
    "they", "them", "their", "theirs", "themselves",
    # interrogatives and demonstratives
    "what", "which", "who", "whom", "this", "that", "these", "those",
    # forms of be / have / do
    "am", "is", "are", "was", "were", "be", "been", "being",
    "have", "has", "had", "having", "do", "does", "did", "doing",
    # articles and conjunctions
    "a", "an", "the", "and", "but", "if", "or", "because",
    "as", "until", "while",
    # prepositions and directional particles
    "of", "at", "by", "for", "with", "about", "against", "between",
    "into", "through", "during", "before", "after", "above", "below",
    "to", "from", "up", "down", "in", "out", "on", "off", "over", "under",
    # adverbs and question words
    "again", "further", "then", "once", "here", "there",
    "when", "where", "why", "how",
    # quantifiers, negation and degree words
    "all", "any", "both", "each", "few", "more", "most", "other",
    "some", "such", "no", "nor", "not", "only", "own", "same",
    "so", "than", "too", "very",
    # contraction fragments, modals and leftovers
    "s", "t", "can", "will", "just", "don", "should", "now",
]

# Additions beyond the base list: apostrophe-led clitics, the ampersand and
# two Latin abbreviations.
stop_words.extend([
    "'s", "'ll", "'d", "'ve", "'re", "'m", "n't",
    "&", "i.e.", "e.g.",
])
# Numeric settings, both 0.9.
# NOTE(review): their exact roles are not visible in this file -- from the
# names, theta1 is presumably a threshold and ppdbSim a similarity score
# tied to ppdbDict entries; confirm against the code that reads them.
theta1 = 0.9
ppdbSim = 0.9

# Starts out empty; presumably populated elsewhere at runtime -- TODO confirm
# the key/value layout against whichever module fills it.
ppdbDict = dict()