In [3]:
import os
from nltk.tokenize import word_tokenize
from nltk.corpus import stopwords
from nltk import ngrams
import string
from nltk.stem import PorterStemmer
import matplotlib.pyplot as plt
from wordcloud import WordCloud
from collections import Counter
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.svm import LinearSVC
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.svm import LinearSVC
from pprint import pprint
from sklearn.preprocessing import MultiLabelBinarizer
from sklearn.multiclass import OneVsRestClassifier
from sklearn.metrics import f1_score, precision_score, recall_score
from nltk.corpus import reuters
from operator import itemgetter
# Smoke test for the setup above: call into the Reuters corpus, the English
# stop-word list and the word tokenizer once each. The results are discarded;
# the calls are made only so that a failed import or an NLTK resource that has
# not been downloaded raises here instead of later in the notebook.
sanity_checks = (
    lambda: reuters.fileids(),
    lambda: stopwords.words('english'),
    lambda: word_tokenize('This is just a test'),
)
for run_check in sanity_checks:
    run_check()
print('You are all set')
You are all set
In [2]:
! pip install wordcloud
Requirement already satisfied: wordcloud in /Users/tarrysingh/anaconda/lib/python3.6/site-packages Requirement already satisfied: numpy>=1.6.1 in /Users/tarrysingh/anaconda/lib/python3.6/site-packages (from wordcloud) Requirement already satisfied: pillow in /Users/tarrysingh/anaconda/lib/python3.6/site-packages (from wordcloud) Requirement already satisfied: matplotlib in /Users/tarrysingh/anaconda/lib/python3.6/site-packages (from wordcloud) Requirement already satisfied: olefile in /Users/tarrysingh/anaconda/lib/python3.6/site-packages (from pillow->wordcloud) Requirement already satisfied: six>=1.10 in /Users/tarrysingh/anaconda/lib/python3.6/site-packages (from matplotlib->wordcloud) Requirement already satisfied: python-dateutil in /Users/tarrysingh/anaconda/lib/python3.6/site-packages (from matplotlib->wordcloud) Requirement already satisfied: pytz in /Users/tarrysingh/anaconda/lib/python3.6/site-packages (from matplotlib->wordcloud) Requirement already satisfied: cycler>=0.10 in /Users/tarrysingh/anaconda/lib/python3.6/site-packages (from matplotlib->wordcloud) Requirement already satisfied: pyparsing!=2.0.4,!=2.1.2,!=2.1.6,>=1.5.6 in /Users/tarrysingh/anaconda/lib/python3.6/site-packages (from matplotlib->wordcloud)
In [ ]: