# Build a bag-of-words vectorizer that drops common English stop words
# (e.g. "the", "of", "and"), which usually add little information.
# NOTE(review): CountVectorizer is assumed to be imported elsewhere in this
# file (presumably from sklearn.feature_extraction.text) -- confirm.
count_vectorizer = CountVectorizer(stop_words="english")