-
Notifications
You must be signed in to change notification settings - Fork 4
/
stop_words.py
24 lines (23 loc) · 1.8 KB
/
stop_words.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
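# NOTE(review): the literal set below appears to have been produced by running
# the following snippet against NLTK's English stop-word corpus (confirm); it
# is kept commented out so that importing this module does not require nltk.
# from nltk.corpus import stopwords
# stop_words = set(stopwords.words('english'))
# print(stop_words)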
# Hard-coded English stop words, all lower-case, for O(1) membership tests.
# Besides whole words, the set holds the fragments left over when contractions
# are split on the apostrophe ("ll", "ve", "re", "s", "t", "d", "m", ...) as
# well as the intact contractions themselves ("don't", "you'll", ...).
# Despite the name this is a mutable ``set`` (177 entries), not a list.
# NOTE(review): "no" and "not" are absent -- presumably on purpose so that
# negations survive filtering; confirm before adding them.
# Entries are alphabetised, grouped by first letter, to ease auditing.
sw_list = {
    # a
    "a", "about", "above", "after", "again", "against", "ain", "all", "am",
    "an", "and", "any", "are", "aren", "aren't", "as", "at",
    # b
    "be", "because", "been", "before", "being", "below", "between", "both",
    "but", "by",
    # c
    "can", "couldn", "couldn't",
    # d
    "d", "did", "didn", "didn't", "do", "does", "doesn", "doesn't", "doing",
    "don", "don't", "down", "during",
    # e
    "each",
    # f
    "few", "for", "from", "further",
    # h
    "had", "hadn", "hadn't", "has", "hasn", "hasn't", "have", "haven",
    "haven't", "having", "he", "her", "here", "hers", "herself", "him",
    "himself", "his", "how",
    # i
    "i", "if", "in", "into", "is", "isn", "isn't", "it", "it's", "its",
    "itself",
    # j
    "just",
    # l
    "ll",
    # m
    "m", "ma", "me", "mightn", "mightn't", "more", "most", "mustn", "mustn't",
    "my", "myself",
    # n
    "needn", "needn't", "nor", "now",
    # o
    "o", "of", "off", "on", "once", "only", "or", "other", "our", "ours",
    "ourselves", "out", "over", "own",
    # r
    "re",
    # s
    "s", "same", "shan", "shan't", "she", "she's", "should", "should've",
    "shouldn", "shouldn't", "so", "some", "such",
    # t
    "t", "than", "that", "that'll", "the", "their", "theirs", "them",
    "themselves", "then", "there", "these", "they", "this", "those",
    "through", "to", "too",
    # u
    "under", "until", "up",
    # v
    "ve", "very",
    # w
    "was", "wasn", "wasn't", "we", "were", "weren", "weren't", "what", "when",
    "where", "which", "while", "who", "whom", "why", "will", "with", "won",
    "won't", "wouldn", "wouldn't",
    # y
    "y", "you", "you'd", "you'll", "you're", "you've", "your", "yours",
    "yourself", "yourselves",
}