In [51]:
import nltk
import nltk.corpus
import nltk.tokenize
import nltk.stem
import nltk.sentiment.vader

In [22]:
text = "John went to the mall to buy some shoes. He went to many different stores. He returned home with a blue pair of shoes."

In [45]:
sentences = nltk.tokenize.sent_tokenize(text)

In [16]:
stop_words = set(nltk.corpus.stopwords.words("english"))
tokens = nltk.tokenize.word_tokenize(text)

In [20]:
text_filtered = []
for word in tokens:
    if word not in stop_words:
        text_filtered.append(word)

In [28]:
print(str(100 - (len(tokens) - len(text_filtered) / len(tokens))) + "% of text remains")

73.7037037037037% of text remains


In [34]:
stemmer = nltk.stem.PorterStemmer()
words = ["ride", "riding", "rider"]
for word in words:
    print(stemmer.stem(word))

ride
ride
rider


In [36]:
for word in text_filtered:
    print(stemmer.stem(word))

john
went
mall
buy
shoe
.
he
went
mani
differ
store
.
he
return
home
blue
pair
shoe
.


In [42]:
print(nltk.pos_tag(text_filtered))

[('John', 'NNP'), ('went', 'VBD'), ('mall', 'JJ'), ('buy', 'NN'), ('shoes', 'NNS'), ('.', '.'), ('He', 'PRP'), ('went', 'VBD'), ('many', 'JJ'), ('different', 'JJ'), ('stores', 'NNS'), ('.', '.'), ('He', 'PRP'), ('returned', 'VBD'), ('home', 'NN'), ('blue', 'NN'), ('pair', 'NN'), ('shoes', 'NNS'), ('.', '.')]


In [53]:
text_positive = "John went to watch the new Cars movie. He enjoyed it greatly. He taught that the cars were very fast and he really likes that."
text_neutral = "John watched the Cars movie. He thinks that it is okay. He felt it wasn't bad."
text_negative = "John went to watch the new Cars movie. He hated it and felt like it should never have been made. He went to the front desk to get his money back."

In [60]:
sentences = nltk.tokenize.sent_tokenize(" ".join([text_positive, text_neutral, text_negative]))
analyzer = nltk.sentiment.vader.SentimentIntensityAnalyzer()

In [64]:
for sentence in sentences:
    print(sentence)
    scores = analyzer.polarity_scores(sentence)
    print(f"\tnegative: {scores['neg']}")
    print(f"\tneutral: {scores['neu']}")
    print(f"\tpositive: {scores['pos']}")

John went to watch the new Cars movie.
	negative: 0.0
	neutral: 1.0
	positive: 0.0
He enjoyed it greatly.
	negative: 0.0
	neutral: 0.476
	positive: 0.524
He taught that the cars were very fast and he really likes that.
	negative: 0.0
	neutral: 0.795
	positive: 0.205
John watched the Cars movie.
	negative: 0.0
	neutral: 1.0
	positive: 0.0
He thinks that it is okay.
	negative: 0.0
	neutral: 0.725
	positive: 0.275
He felt it wasn't bad.
	negative: 0.0
	neutral: 0.584
	positive: 0.416
John went to watch the new Cars movie.
	negative: 0.0
	neutral: 1.0
	positive: 0.0
He hated it and felt like it should never have been made.
	negative: 0.251
	neutral: 0.599
	positive: 0.15
He went to the front desk to get his money back.
	negative: 0.0
	neutral: 1.0
	positive: 0.0
