Removing common words / stopwords

From Media Design: Networked & Lens-Based wiki
Jump to navigation Jump to search
from nltk.corpus import stopwords
# Build the stopword collection as a set once, so every membership test in
# the filter below is a constant-time lookup instead of a list scan.
english_stops = set(stopwords.words("english"))

# Naive whitespace tokenization of the sample sentence (punctuation would
# stay attached to words; acceptable for this demonstration).
words = "Stopwords are common words that are often handy to remove or ignore when processing text".split()

# NLTK's English stopword list is lowercase, so compare on the lowercased
# token; otherwise capitalized stopwords (e.g. a sentence-initial "The")
# would slip through. The surviving words keep their original casing.
words = [w for w in words if w.lower() not in english_stops]

# Call form of print: valid on Python 3 and prints the same list on Python 2.
print(words)