Contact
CoCalc Logo Icon
StoreFeaturesDocsShareSupport News AboutSign UpSign In
| Download

nltk stopwords

Views: 360
Kernel: Python 3 (Ubuntu Linux)
from nltk.tokenize import sent_tokenize, word_tokenize from nltk.corpus import stopwords
data = "All work and no play makes jack dull boy. All work and no play makes jack a dull boy." stopWords = set(stopwords.words('english')) words = word_tokenize(data) wordsFiltered = []
for w in words: if w not in stopWords: wordsFiltered.append(w) print(wordsFiltered)
['All', 'work', 'play', 'makes', 'jack', 'dull', 'boy', '.', 'All', 'work', 'play', 'makes', 'jack', 'dull', 'boy', '.']