# Analyze Product Sentiment

In [1]:
import turicreate 

# Read product review data

In [2]:
products =  turicreate.SFrame('amazon_baby.sframe')

# Exploring the Data we have

In [3]:
products

name,review,rating
Planetwise Flannel Wipes,"These flannel wipes are OK, but in my opinion ...",3.0
Planetwise Wipe Pouch,it came early and was not disappointed. i love ...,5.0
Annas Dream Full Quilt with 2 Shams ...,Very soft and comfortable and warmer than it ...,5.0
Stop Pacifier Sucking without tears with ...,This is a product well worth the purchase. I ...,5.0
Stop Pacifier Sucking without tears with ...,All of my kids have cried non-stop when I tried to ...,5.0
Stop Pacifier Sucking without tears with ...,"When the Binky Fairy came to our house, we didn't ...",5.0
A Tale of Baby's Days with Peter Rabbit ...,"Lovely book, it's bound tightly so you may no ...",4.0
"Baby Tracker&reg; - Daily Childcare Journal, ...",Perfect for new parents. We were able to keep ...,5.0
"Baby Tracker&reg; - Daily Childcare Journal, ...",A friend of mine pinned this product on Pinte ...,5.0
"Baby Tracker&reg; - Daily Childcare Journal, ...",This has been an easy way for my nanny to record ...,4.0


In [4]:
# count how many times a product has been reviewed
products.groupby('name',operations={'count':turicreate.aggregate.COUNT()}).sort('count',ascending=False)

name,count
Vulli Sophie the Giraffe Teether ...,785
"Simple Wishes Hands-Free Breastpump Bra, Pink, ...",562
Infant Optics DXR-5 2.4 GHz Digital Video Baby ...,561
Baby Einstein Take Along Tunes ...,547
Cloud b Twilight Constellation Night ...,520
"Fisher-Price Booster Seat, Blue/Green/Gray ...",489
Fisher-Price Rainforest Jumperoo ...,450
"Graco Nautilus 3-in-1 Car Seat, Matrix ...",419
Leachco Snoogle Total Body Pillow ...,388
"Regalo Easy Step Walk Thru Gate, White ...",374


## Examining the reivews for the most-reviewed product

In [5]:
# making another sframe with the only giraffe_teether product rows
giraffe_reviews = products[products['name']=='Vulli Sophie the Giraffe Teether']

In [6]:
giraffe_reviews

name,review,rating
Vulli Sophie the Giraffe Teether ...,He likes chewing on all the parts especially the ...,5.0
Vulli Sophie the Giraffe Teether ...,My son loves this toy and fits great in the diaper ...,5.0
Vulli Sophie the Giraffe Teether ...,There really should be a large warning on the ...,1.0
Vulli Sophie the Giraffe Teether ...,All the moms in my moms' group got Sophie for ...,5.0
Vulli Sophie the Giraffe Teether ...,I was a little skeptical on whether Sophie was ...,5.0
Vulli Sophie the Giraffe Teether ...,I have been reading about Sophie and was going ...,5.0
Vulli Sophie the Giraffe Teether ...,My neice loves her sophie and has spent hours ...,5.0
Vulli Sophie the Giraffe Teether ...,What a friendly face! And those mesmerizing ...,5.0
Vulli Sophie the Giraffe Teether ...,We got this just for my son to chew on instea ...,5.0
Vulli Sophie the Giraffe Teether ...,"My baby seems to like this toy, but I could ...",3.0


In [7]:
len(giraffe_reviews)

785

In [8]:
giraffe_reviews['rating'].show()

## Building word count vectors

In [9]:
products['word_count'] = turicreate.text_analytics.count_words(products['review'])

In [10]:
products

name,review,rating,word_count
Planetwise Flannel Wipes,"These flannel wipes are OK, but in my opinion ...",3.0,"{'handles': 1.0, 'stripping': 1.0, ..."
Planetwise Wipe Pouch,it came early and was not disappointed. i love ...,5.0,"{'recommend': 1.0, 'highly': 1.0, ..."
Annas Dream Full Quilt with 2 Shams ...,Very soft and comfortable and warmer than it ...,5.0,"{'quilt': 1.0, 'of': 1.0, 'the': 1.0, 'than': 1.0, ..."
Stop Pacifier Sucking without tears with ...,This is a product well worth the purchase. I ...,5.0,"{'tool': 1.0, 'clever': 1.0, 'approach': 2.0, ..."
Stop Pacifier Sucking without tears with ...,All of my kids have cried non-stop when I tried to ...,5.0,"{'rock': 1.0, 'many': 1.0, 'headaches': 1.0, ..."
Stop Pacifier Sucking without tears with ...,"When the Binky Fairy came to our house, we didn't ...",5.0,"{'thumb': 1.0, 'or': 1.0, 'break': 1.0, 'trying': ..."
A Tale of Baby's Days with Peter Rabbit ...,"Lovely book, it's bound tightly so you may no ...",4.0,"{'for': 1.0, 'barnes': 1.0, 'at': 1.0, 'is': ..."
"Baby Tracker&reg; - Daily Childcare Journal, ...",Perfect for new parents. We were able to keep ...,5.0,"{'right': 1.0, 'because': 1.0, 'questions': 1.0, ..."
"Baby Tracker&reg; - Daily Childcare Journal, ...",A friend of mine pinned this product on Pinte ...,5.0,"{'like': 1.0, 'and': 1.0, 'changes': 1.0, 'the': ..."
"Baby Tracker&reg; - Daily Childcare Journal, ...",This has been an easy way for my nanny to record ...,4.0,"{'in': 1.0, 'pages': 1.0, 'out': 1.0, 'run': 1.0, ..."


## Define what is positive and negative sentiment

In [11]:
products['rating'].show()

In [12]:
# as the above chart shows most reviews are either 5 or 4*
# also it shows that 1 and 2* are thumbs down and 5 or 4*  are thumbs up
# As 3* is neutral rating 
# so we are going to ignore 3* rating for now
products = products[products['rating']!= 3]

In [13]:
# fromabove we got a table with the reviews having 4 or 5* and also the ones having 1 or 2* rating
# adding sentiment column to the table 
# if rating is 4 or > than 4 than sentiment = 1(or + or thumbs up)
# if rating is less than 4 than sentiment = 0(or - or thumbs down)
products['sentiment'] = products['rating'] >= 4

In [14]:
products

name,review,rating,word_count,sentiment
Planetwise Wipe Pouch,it came early and was not disappointed. i love ...,5.0,"{'recommend': 1.0, 'highly': 1.0, ...",1
Annas Dream Full Quilt with 2 Shams ...,Very soft and comfortable and warmer than it ...,5.0,"{'quilt': 1.0, 'of': 1.0, 'the': 1.0, 'than': 1.0, ...",1
Stop Pacifier Sucking without tears with ...,This is a product well worth the purchase. I ...,5.0,"{'tool': 1.0, 'clever': 1.0, 'approach': 2.0, ...",1
Stop Pacifier Sucking without tears with ...,All of my kids have cried non-stop when I tried to ...,5.0,"{'rock': 1.0, 'many': 1.0, 'headaches': 1.0, ...",1
Stop Pacifier Sucking without tears with ...,"When the Binky Fairy came to our house, we didn't ...",5.0,"{'thumb': 1.0, 'or': 1.0, 'break': 1.0, 'trying': ...",1
A Tale of Baby's Days with Peter Rabbit ...,"Lovely book, it's bound tightly so you may no ...",4.0,"{'for': 1.0, 'barnes': 1.0, 'at': 1.0, 'is': ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",Perfect for new parents. We were able to keep ...,5.0,"{'right': 1.0, 'because': 1.0, 'questions': 1.0, ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",A friend of mine pinned this product on Pinte ...,5.0,"{'like': 1.0, 'and': 1.0, 'changes': 1.0, 'the': ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",This has been an easy way for my nanny to record ...,4.0,"{'in': 1.0, 'pages': 1.0, 'out': 1.0, 'run': 1.0, ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",I love this journal and our nanny uses it ...,4.0,"{'tracker': 1.0, 'now': 1.0, 'its': 1.0, 'sti ...",1


In [15]:
products['sentiment'].show()

# Train our sentiment classifier

In [16]:
train_data,test_data = products.random_split(.8,seed=0)

In [18]:
sentiment_model = turicreate.logistic_classifier.create(train_data,target='sentiment', features=['word_count'], validation_set=test_data)

# Evaluate the sentiment classifier

In [20]:
sentiment_model.evaluate(test_data,metric='roc_curve')

{'roc_curve': Columns:
 	threshold	float
 	fpr	float
 	tpr	float
 	p	int
 	n	int
 
 Rows: 100001
 
 Data:
 +-----------+--------------------+--------------------+-------+------+
 | threshold |        fpr         |        tpr         |   p   |  n   |
 +-----------+--------------------+--------------------+-------+------+
 |    0.0    |        1.0         |        1.0         | 27976 | 5328 |
 |   1e-05   | 0.847972972972973  | 0.9975693451529882 | 27976 | 5328 |
 |   2e-05   | 0.829954954954955  | 0.9971761509865599 | 27976 | 5328 |
 |   3e-05   | 0.818506006006006  | 0.9969616814412353 | 27976 | 5328 |
 |   4e-05   | 0.8109984984984985 | 0.9967472118959108 | 27976 | 5328 |
 |   5e-05   | 0.8057432432432432 | 0.9966042321990277 | 27976 | 5328 |
 |   6e-05   | 0.7991741741741741 | 0.9962825278810409 | 27976 | 5328 |
 |   7e-05   | 0.7952327327327328 | 0.9961752931083786 | 27976 | 5328 |
 |   8e-05   | 0.7920420420420421 | 0.9961038032599371 | 27976 | 5328 |
 |   9e-05   | 0.7882882882882

# Apply the sentiment classifier to better understand the Giraffe reviews

In [21]:
products['predicted_sentiment'] = sentiment_model.predict(products, output_type = 'probability')

In [22]:
products

name,review,rating,word_count,sentiment
Planetwise Wipe Pouch,it came early and was not disappointed. i love ...,5.0,"{'recommend': 1.0, 'highly': 1.0, ...",1
Annas Dream Full Quilt with 2 Shams ...,Very soft and comfortable and warmer than it ...,5.0,"{'quilt': 1.0, 'of': 1.0, 'the': 1.0, 'than': 1.0, ...",1
Stop Pacifier Sucking without tears with ...,This is a product well worth the purchase. I ...,5.0,"{'tool': 1.0, 'clever': 1.0, 'approach': 2.0, ...",1
Stop Pacifier Sucking without tears with ...,All of my kids have cried non-stop when I tried to ...,5.0,"{'rock': 1.0, 'many': 1.0, 'headaches': 1.0, ...",1
Stop Pacifier Sucking without tears with ...,"When the Binky Fairy came to our house, we didn't ...",5.0,"{'thumb': 1.0, 'or': 1.0, 'break': 1.0, 'trying': ...",1
A Tale of Baby's Days with Peter Rabbit ...,"Lovely book, it's bound tightly so you may no ...",4.0,"{'for': 1.0, 'barnes': 1.0, 'at': 1.0, 'is': ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",Perfect for new parents. We were able to keep ...,5.0,"{'right': 1.0, 'because': 1.0, 'questions': 1.0, ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",A friend of mine pinned this product on Pinte ...,5.0,"{'like': 1.0, 'and': 1.0, 'changes': 1.0, 'the': ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",This has been an easy way for my nanny to record ...,4.0,"{'in': 1.0, 'pages': 1.0, 'out': 1.0, 'run': 1.0, ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",I love this journal and our nanny uses it ...,4.0,"{'tracker': 1.0, 'now': 1.0, 'its': 1.0, 'sti ...",1

predicted_sentiment
0.9997307390047092
0.9985083368316608
0.999748904249988
0.9999916625399972
0.9999999514462168
0.9999146735569904
0.9999916615904652
0.9999938843594008
0.9961247617006423
0.9999999920460632


In [23]:
giraffe_reviews = products[products['name']=='Vulli Sophie the Giraffe Teether']

In [24]:
giraffe_reviews

name,review,rating,word_count,sentiment
Vulli Sophie the Giraffe Teether ...,He likes chewing on all the parts especially the ...,5.0,"{'purchase': 1.0, 'teething': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,My son loves this toy and fits great in the diaper ...,5.0,"{'a': 1.0, 'is': 1.0, 'when': 1.0, 'him': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,There really should be a large warning on the ...,1.0,"{'made': 1.0, 'of': 1.0, 'packaging': 1.0, 'no': ...",0
Vulli Sophie the Giraffe Teether ...,All the moms in my moms' group got Sophie for ...,5.0,"{'another': 1.0, 'out': 1.0, 'run': 1.0, 'lost': ...",1
Vulli Sophie the Giraffe Teether ...,I was a little skeptical on whether Sophie was ...,5.0,"{'disappointed': 1.0, 'will': 1.0, 'take': ...",1
Vulli Sophie the Giraffe Teether ...,I have been reading about Sophie and was going ...,5.0,"{'late': 1.0, 'perfect': 1.0, 'pack': 1.0, 'on ...",1
Vulli Sophie the Giraffe Teether ...,My neice loves her sophie and has spent hours ...,5.0,"{'delight': 1.0, 'in': 1.0, 'other': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,What a friendly face! And those mesmerizing ...,5.0,"{'inside': 1.0, 'water': 1.0, 'don': 1.0, 'up': ...",1
Vulli Sophie the Giraffe Teether ...,We got this just for my son to chew on instea ...,5.0,"{'its': 1.0, 'fine': 1.0, 'is': 1.0, 'which': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,This product is without a doubt the best on the ...,5.0,"{'belongs': 1.0, 'dog': 1.0, 'if': 1.0, 'bewa ...",1

predicted_sentiment
0.999365536568231
0.999863379168963
0.2545268197812222
0.9165688083915248
0.6855768205886384
0.99999994452112
0.9979351181093526
0.9999745004834384
0.9460144428357122
0.9999999721665868


# Sort the Giraffe reviews according to predicted sentiment

In [25]:
giraffe_reviews = giraffe_reviews.sort('predicted_sentiment', ascending=False)

In [26]:
giraffe_reviews

name,review,rating,word_count,sentiment
Vulli Sophie the Giraffe Teether ...,"Sophie, oh Sophie, your time has come. My ...",5.0,"{'11': 1.0, 'prisrob': 1.0, '12': 1.0, 'who': ...",1
Vulli Sophie the Giraffe Teether ...,I'll be honest...I bought this toy because all the ...,4.0,"{'around': 1.0, 'explore': 1.0, 'they': ...",1
Vulli Sophie the Giraffe Teether ...,As a mother of 16month old twins; I bought ...,5.0,"{'will': 1.0, '15months': 1.0, 'would': 2.0, ...",1
Vulli Sophie the Giraffe Teether ...,We got this little giraffe as a gift from a ...,5.0,"{'out': 1.0, 'would': 1.0, 've': 1.0, 'enou ...",1
Vulli Sophie the Giraffe Teether ...,"As every mom knows, you always want to give your ...",5.0,"{'whether': 1.0, 'neutral': 1.0, 'gend ...",1
Vulli Sophie the Giraffe Teether ...,My Mom-in-Law bought Sophie for my son whe ...,5.0,"{'penny': 1.0, 'little': 1.0, 'perfect': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,"My 4 month old son is teething, and I've tried ...",4.0,"{'worth': 1.0, 'works': 1.0, 'teether': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,Let me just start off by addressing the choking ...,5.0,"{'question': 1.0, 'must': 1.0, 'overall': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,I'm not sure why Sophie is such a hit with the ...,4.0,"{'makers': 1.0, 'or': 1.0, 'take': 1.0, 'can': ...",1
Vulli Sophie the Giraffe Teether ...,"I admit, I didn't get Sophie the Giraffe at ...",4.0,"{'dye': 1.0, 'of': 1.0, 'cause': 1.0, 'fade': ...",1

predicted_sentiment
1.0
1.0
1.0
0.9999999999998376
0.9999999999998284
0.9999999999997958
0.9999999999994914
0.9999999999941254
0.999999999987423
0.9999999999829476


In [27]:
giraffe_reviews.tail()

name,review,rating,word_count,sentiment
Vulli Sophie the Giraffe Teether ...,My 7 1/2 month old grandbaby was sittng up ...,1.0,"{'sopie': 1.0, 'with': 1.0, 'be': 1.0, 'shou ...",0
Vulli Sophie the Giraffe Teether ...,I was so looking forward to getting this for my ...,1.0,"{'amazon': 1.0, 'back': 1.0, 'by': 1.0, 'more': ...",0
Vulli Sophie the Giraffe Teether ...,Received the product and smells like cheap rub ...,1.0,"{'was': 1.0, 'as': 1.0, 'still': 1.0, 'but': ...",0
Vulli Sophie the Giraffe Teether ...,I got one of these as a showe gift that my baby ...,1.0,"{'typical': 1.0, 'paint': 1.0, 'came': 1.0, 'mi ...",0
Vulli Sophie the Giraffe Teether ...,When we first got it I thought did my ...,2.0,"{'mom': 1.0, 'teethers': 1.0, 'btw': 1.0, 'oth ...",0
Vulli Sophie the Giraffe Teether ...,When I received this the paint was peeling off in ...,1.0,"{'risk': 1.0, 'but': 1.0, 'help': 1.0, 'terrible': ...",0
Vulli Sophie the Giraffe Teether ...,"""Sophie the Giraffe"" has tested positive for ...",1.0,"{'ingest': 1.0, 'they': 1.0, 'naturally': 1.0, ...",0
Vulli Sophie the Giraffe Teether ...,"My son (now 2.5) LOVED his Sophie, and I bought ...",1.0,"{'exaggerated': 1.0, 'are': 1.0, 'a': 3.0, ...",0
Vulli Sophie the Giraffe Teether ...,I wanted to love this product and was excited ...,1.0,"{'risk': 1.0, 'ready': 1.0, 'bummed': 1.0, ...",0
Vulli Sophie the Giraffe Teether ...,This children's toy is nostalgic and very cute. ...,1.0,"{'amazon': 1.0, 'from': 1.0, 'one': 1.0, 'by': ...",0

predicted_sentiment
1.9110740195673068e-06
6.547801686064591e-07
3.864236397443623e-07
2.2378225159413762e-07
1.935395528183046e-07
1.6900753980993737e-07
1.1748826795726907e-07
5.364933427024891e-11
3.1090352704675415e-13
4.119269639403062e-15


## Show the most positive reviews

In [28]:
giraffe_reviews[0]['review']

"Sophie, oh Sophie, your time has come. My granddaughter, Violet is 5 months old and starting to teeth. What joy little Sophie brings to Violet. Sophie is made of a very pliable rubber that is sturdy but not tough. It is quite easy for Violet to twist Sophie into unheard of positions to get Sophie into her mouth. The little nose and hooves fit perfectly into small mouths, and the drooling has purpose. The paint on Sophie is food quality.Sophie was born in 1961 in France. The maker had wondered why there was nothing available for babies and made Sophie from the finest rubber, phthalate-free on St Sophie's Day, thus the name was born. Since that time millions of Sophie's populate the world. She is soft and for babies little hands easy to grasp. Violet especially loves the bumpy head and horns of Sophie. Sophie has a long neck that easy to grasp and twist. She has lovely, sizable spots that attract Violet's attention. Sophie has happy little squeaks that bring squeals of delight from Viol

In [29]:
giraffe_reviews[1]['review']

'I\'ll be honest...I bought this toy because all the hip parents seem to have one too and I wanted to be a part of the "hip parent" crowd. The price-tag was somewhat of a deterent but I prevailed and purchased this teether for my daughter.At first, Lily didn\'t know what to make of of Sophie and showed little interest in the polka-dotted creature. I continued to introduce Lily to Sophie and kept the toy in the carrier so that it was on-hand during transitions. Eventually, Lily discovered what a wonderful experience it was to gnaw on the hooves and ears and these two have never been far apart since.Lily really enjoys gumming all the different parts of Sophie like no other teether we have. The size of the toy is great as it is somewhat substantial and so easy for a little one to grasp and hold onto. Lily really enjoys hearing Sophie squeak and will smile whenever Sophie makes a noise or pops her head up from Mommy\'s lap to say hello.People have stopped and commented on Sophie and to the

# Most negative reivews

In [30]:
giraffe_reviews[-1]['review']

"This children's toy is nostalgic and very cute. However, there is a distinct rubber smell and a very odd taste, yes I tried it, that my baby did not enjoy. Also, if it is soiled it is extremely difficult to clean as the rubber is a kind of porus material and does not clean well. The final thing is the squeaking device inside which stopped working after the first couple of days. I returned this item feeling I had overpaid for a toy that was defective and did not meet my expectations. Please do not be swayed by the cute packaging and hype surounding it as I was. One more thing, I was given a full refund from Amazon without any problem."

In [31]:
giraffe_reviews[-2]['review']

'I wanted to love this product and was excited to buy it when I became pregnant but am now hesitant to let my baby use it after reading about the recall in Europe. Apparently, as I understand it, their toxin standards of measurement are lower than ours so they have not been recalled here (apparently we are OK with low levels of nitrates in the toys our children put in their mouths, but Europeans are not...hmmm)...Be that as it may, toxins registering even CLOSE to a dangerous level made me nervous about using. After digging around online I did discover that the company claims to have changed the product after a certain date and lists manufacturing codes so you can check yours (those listed were made after a certain date and are said to be safer). Sadly mine was not made after the &#34;improved&#34; date but I could not return it because there was no formal recall in our country. I considered returning it and hunting for one with an approved manufacturing date but man that was just too 

# ASSIGNMENT

## TASK 1
## Finding word count for all selected words

In [69]:
def awesome_count(word_count):
    if 'awesome' in word_count:
        return word_count['awesome']
    else:
        return 0

In [70]:
def great_count(word_count):
    if 'great' in word_count:
        return word_count['great']
    else:
        return 0

In [71]:
def fantastic_count(word_count):
    if 'fantastic' in word_count:
        return word_count['fantastic']
    else:
        return 0

In [72]:
def amazing_count(word_count):
    if 'amazing' in word_count:
        return word_count['amazing']
    else:
        return 0

In [73]:
def love_count(word_count):
    if 'love' in word_count:
        return word_count['love']
    else:
        return 0

In [74]:
def horrible_count(word_count):
    if 'horrible' in word_count:
        return word_count['horrible']
    else:
        return 0

In [75]:
def bad_count(word_count):
    if 'bad' in word_count:
        return word_count['bad']
    else:
        return 0

In [76]:
def terrible_count(word_count):
    if 'terrible' in word_count:
        return word_count['terrible']
    else:
        return 0

In [77]:
def awful_count(word_count):
    if 'awful' in word_count:
        return word_count['awful']
    else:
        return 0

In [78]:
def wow_count(word_count):
    if 'wow' in word_count:
        return word_count['wow']
    else:
        return 0

In [79]:
def hate_count(word_count):
    if 'hate' in word_count:
        return word_count['hate']
    else:
        return 0

In [80]:
products['awesome'] = products['word_count'].apply(awesome_count)

In [81]:
products['great'] = products['word_count'].apply(great_count)

In [82]:
products['fantastic'] = products['word_count'].apply(fantastic_count)

In [83]:
products['amazing'] = products['word_count'].apply(amazing_count)

In [84]:
products['love'] = products['word_count'].apply(love_count)

In [85]:
products['horrible'] = products['word_count'].apply(horrible_count)

In [86]:
products['bad'] = products['word_count'].apply(bad_count)

In [87]:
products['terrible'] = products['word_count'].apply(terrible_count)

In [88]:
products['awful'] = products['word_count'].apply(awful_count)

In [89]:
products['wow'] = products['word_count'].apply(wow_count)

In [90]:
products['hate'] = products['word_count'].apply(hate_count)

In [91]:
print(products['awesome'].sum())

3892.0


In [92]:
print(products['great'].sum())

55791.0


In [93]:
print(products['fantastic'].sum())

1664.0


In [94]:
print(products['amazing'].sum())

2628.0


In [95]:
print(products['love'].sum())

41994.0


In [96]:
print(products['horrible'].sum())

1110


In [97]:
print(products['bad'].sum())

4183


In [98]:
print(products['terrible'].sum())

1146.0


In [99]:
print(products['awful'].sum())

687


In [100]:
print(products['wow'].sum())

425


In [101]:
print(products['hate'].sum())

1107


## TASK 2
## Create a new sentiment analysis model using only the selected_words as features

In [102]:
selected_words = ['awesome', 'great', 'fantastic', 'amazing', 'love', 'horrible', 'bad', 'terrible', 'awful', 'wow', 'hate']

In [103]:
train_data,test_data = products.random_split(.8,seed=0)

In [104]:
selected_words_model = turicreate.logistic_classifier.create(train_data,target='sentiment', features=selected_words, validation_set=test_data)

In [106]:
selected_words_model.coefficients

name,index,class,value,stderr
(intercept),,1,1.3365913848877726,0.0089299697876559
awesome,,1,1.133534666034134,0.0839964398318756
great,,1,0.8630655001196439,0.0189550524443766
fantastic,,1,0.88580475688142,0.1116759129339965
amazing,,1,1.100093311366018,0.0995477626046598
love,,1,1.359268866922504,0.0280683001520995
horrible,,1,-2.251335236759102,0.0802024938878842
bad,,1,-0.9914778800650664,0.0384842866469906
terrible,,1,-2.2236614360851346,0.0773173620378574
awful,,1,-2.05290820403136,0.1009973543525924


## TASK 3
## Comparing the accuracy of different sentiment analysis model

In [107]:
print(sentiment_model.evaluate(test_data))

{'accuracy': 0.9176975738650012, 'auc': 0.9342357833151299, 'confusion_matrix': Columns:
	target_label	int
	predicted_label	int
	count	int

Rows: 4

Data:
+--------------+-----------------+-------+
| target_label | predicted_label | count |
+--------------+-----------------+-------+
|      0       |        1        |  1397 |
|      1       |        0        |  1344 |
|      0       |        0        |  3931 |
|      1       |        1        | 26632 |
+--------------+-----------------+-------+
[4 rows x 3 columns]
, 'f1_score': 0.951057941255245, 'log_loss': 0.33047871872320644, 'precision': 0.9501587641371436, 'recall': 0.9519588218472976, 'roc_curve': Columns:
	threshold	float
	fpr	float
	tpr	float
	p	int
	n	int

Rows: 100001

Data:
+-----------+--------------------+--------------------+-------+------+
| threshold |        fpr         |        tpr         |   p   |  n   |
+-----------+--------------------+--------------------+-------+------+
|    0.0    |        1.0         |        

In [109]:
print(selected_words_model.evaluate(test_data))

{'accuracy': 0.8463848186404036, 'auc': 0.6936022046674926, 'confusion_matrix': Columns:
	target_label	int
	predicted_label	int
	count	int

Rows: 4

Data:
+--------------+-----------------+-------+
| target_label | predicted_label | count |
+--------------+-----------------+-------+
|      1       |        0        |  159  |
|      0       |        0        |  371  |
|      0       |        1        |  4957 |
|      1       |        1        | 27817 |
+--------------+-----------------+-------+
[4 rows x 3 columns]
, 'f1_score': 0.9157860082304526, 'log_loss': 0.39622654670876317, 'precision': 0.8487520595594068, 'recall': 0.9943165570488991, 'roc_curve': Columns:
	threshold	float
	fpr	float
	tpr	float
	p	int
	n	int

Rows: 100001

Data:
+-----------+--------------------+-----+-------+------+
| threshold |        fpr         | tpr |   p   |  n   |
+-----------+--------------------+-----+-------+------+
|    0.0    |        1.0         | 1.0 | 27976 | 5328 |
|   1e-05   |        1.0      

## TASK 4
## Interpreting the difference in performance between the models

In [113]:
#products['predicted_sentiment'] = sentiment_model.predict(products, output_type = 'probability')

In [114]:
#products

name,review,rating,word_count,sentiment
Planetwise Wipe Pouch,it came early and was not disappointed. i love ...,5.0,"{'recommend': 1.0, 'highly': 1.0, ...",1
Annas Dream Full Quilt with 2 Shams ...,Very soft and comfortable and warmer than it ...,5.0,"{'quilt': 1.0, 'of': 1.0, 'the': 1.0, 'than': 1.0, ...",1
Stop Pacifier Sucking without tears with ...,This is a product well worth the purchase. I ...,5.0,"{'tool': 1.0, 'clever': 1.0, 'approach': 2.0, ...",1
Stop Pacifier Sucking without tears with ...,All of my kids have cried non-stop when I tried to ...,5.0,"{'rock': 1.0, 'many': 1.0, 'headaches': 1.0, ...",1
Stop Pacifier Sucking without tears with ...,"When the Binky Fairy came to our house, we didn't ...",5.0,"{'thumb': 1.0, 'or': 1.0, 'break': 1.0, 'trying': ...",1
A Tale of Baby's Days with Peter Rabbit ...,"Lovely book, it's bound tightly so you may no ...",4.0,"{'for': 1.0, 'barnes': 1.0, 'at': 1.0, 'is': ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",Perfect for new parents. We were able to keep ...,5.0,"{'right': 1.0, 'because': 1.0, 'questions': 1.0, ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",A friend of mine pinned this product on Pinte ...,5.0,"{'like': 1.0, 'and': 1.0, 'changes': 1.0, 'the': ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",This has been an easy way for my nanny to record ...,4.0,"{'in': 1.0, 'pages': 1.0, 'out': 1.0, 'run': 1.0, ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",I love this journal and our nanny uses it ...,4.0,"{'tracker': 1.0, 'now': 1.0, 'its': 1.0, 'sti ...",1

predicted_sentiment,awesome,great,fantastic,amazing,love,horrible,bad,awful,wow,hate,terrible
0.9997307390047092,0.0,0.0,0.0,0.0,1.0,0,0,0,0,0,0.0
0.9985083368316608,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.999748904249988,0.0,0.0,0.0,0.0,2.0,0,0,0,0,0,0.0
0.9999916625399972,0.0,1.0,0.0,0.0,1.0,0,0,0,0,0,0.0
0.9999999514462168,0.0,1.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999146735569904,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999916615904652,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999938843594008,0.0,0.0,1.0,0.0,0.0,0,0,0,0,0,0.0
0.9961247617006423,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999999920460632,0.0,0.0,0.0,0.0,2.0,0,0,0,0,0,0.0


In [120]:
diaper_champ_reviews = products[products['name']=='Baby Trend Diaper Champ']

In [121]:
diaper_champ_reviews

name,review,rating,word_count,sentiment
Baby Trend Diaper Champ,Ok - newsflash. Diapers are just smelly. We've ...,4.0,"{'convenient': 1.0, 'more': 1.0, 'trash': ...",1
Baby Trend Diaper Champ,"My husband and I selected the Diaper ""Champ"" ma ...",1.0,"{'system': 1.0, 'try': 1.0, 're': 1.0, 'still': ...",0
Baby Trend Diaper Champ,Excellent diaper disposal unit. I used it in ...,5.0,"{'nose': 1.0, 'for': 2.0, 'investment': 1.0, ...",1
Baby Trend Diaper Champ,We love our diaper champ. It is very easy to use ...,5.0,"{'out': 1.0, 'pull': 1.0, 'open': 1.0, 'pail': ...",1
Baby Trend Diaper Champ,Two girlfriends and two family members put me ...,5.0,"{'winter': 1.0, 'outside': 1.0, 'day': ...",1
Baby Trend Diaper Champ,I waited to review this until I saw how it ...,4.0,"{'mom': 1.0, 'my': 1.0, 'empty': 2.0, 'poop': ...",1
Baby Trend Diaper Champ,I have had a diaper genie for almost 4 years since ...,1.0,"{'yuck': 1.0, 'clean': 1.0, 'all': 1.0, 'tra ...",0
Baby Trend Diaper Champ,I originally put this item on my baby registry ...,5.0,"{'price': 1.0, 'suggestions': 1.0, ...",1
Baby Trend Diaper Champ,I am so glad I got the Diaper Champ instead of ...,5.0,"{'best': 1.0, 'that': 1.0, 'handle': 1.0, ' ...",1
Baby Trend Diaper Champ,We had 2 diaper Genie's both given to us as a ...,4.0,"{'no': 1.0, 'regular': 1.0, 'part': 1.0, ...",1

predicted_sentiment,awesome,great,fantastic,amazing,love,horrible,bad,awful,wow,hate,terrible
0.9950122935569564,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
5.90141453456435e-13,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999996193960344,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999567191544844,0.0,0.0,0.0,0.0,1.0,0,0,0,0,0,0.0
0.9999997013199228,0.0,0.0,0.0,1.0,0.0,1,0,0,1,0,0.0
0.9999920758179406,0.0,0.0,0.0,0.0,0.0,0,1,0,0,0,0.0
0.0017908398242648,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999999999465672,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.980117441355887,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999454483919004,0.0,0.0,0.0,0.0,2.0,0,0,0,0,0,0.0


In [122]:
diaper_champ_reviews = diaper_champ_reviews.sort('predicted_sentiment', ascending=False)

In [123]:
diaper_champ_reviews

name,review,rating,word_count,sentiment
Baby Trend Diaper Champ,I read a review below that can explain exactly ...,4.0,"{'key': 1.0, 'have': 1.0, 'pieces': 1.0, 'betwe ...",1
Baby Trend Diaper Champ,I have never written a review for Amazon but I ...,5.0,"{'priceless': 1.0, 'knows': 1.0, 'parent': ...",1
Baby Trend Diaper Champ,I originally put this item on my baby registry ...,5.0,"{'price': 1.0, 'suggestions': 1.0, ...",1
Baby Trend Diaper Champ,Baby Luke can turn a clean diaper to a dirty ...,5.0,"{'around': 1.0, 'any': 1.0, 't': 1.0, 'isn': ...",1
Baby Trend Diaper Champ,Diaper Champ or Diaper Genie? That was my ...,5.0,"{'either': 1.0, 'be': 1.0, 't': 1.0, 'not': ...",1
Baby Trend Diaper Champ,I am one of those super- critical shoppers who ...,5.0,"{'hope': 1.0, 'make': 1.0, 'slower': 1.0, ...",1
Baby Trend Diaper Champ,I LOOOVE this diaper pail! Its the easies ...,5.0,"{'buy': 1.0, 'product': 1.0, 'recommend': 1.0, ...",1
Baby Trend Diaper Champ,"As a first time mother, I wanted to get the best ...",5.0,"{'ll': 1.0, 'baby': 1.0, 'recommended': 1.0, ' ...",1
Baby Trend Diaper Champ,I see that there are complaints of stinkiness ...,5.0,"{'very': 1.0, 'told': 1.0, 'all': 1.0, ...",1
Baby Trend Diaper Champ,I have a 10 year old daughter and an 8 month ...,5.0,"{'sorry': 1.0, 'be': 1.0, 'you': 2.0, 'sell': 1.0, ...",1

predicted_sentiment,awesome,great,fantastic,amazing,love,horrible,bad,awful,wow,hate,terrible
0.999999999989594,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999999999868132,0.0,0.0,0.0,0.0,1.0,0,0,0,0,0,0.0
0.9999999999465672,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999999999302822,0.0,1.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999999999174132,0.0,1.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.9999999998430964,0.0,0.0,0.0,0.0,1.0,0,0,0,0,0,0.0
0.9999999997360196,0.0,0.0,0.0,0.0,1.0,0,0,0,0,0,0.0
0.9999999995664316,0.0,0.0,0.0,0.0,1.0,0,0,0,0,0,0.0
0.9999999985015902,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
0.999999998056851,0.0,0.0,0.0,0.0,2.0,0,0,0,0,0,0.0


In [124]:
diaper_champ_reviews.tail()

name,review,rating,word_count,sentiment
Baby Trend Diaper Champ,"Like other reviewers, I put this diaper pail on ...",5.0,"{'plastic': 1.0, 'recycled': 1.0, ...",1
Baby Trend Diaper Champ,This product is nice in theory but not all that ...,1.0,"{'a': 1.0, 'else': 1.0, 'buy': 1.0, 'save': 1.0, ...",0
Baby Trend Diaper Champ,I am really disappointed with the Diaper Champ. ...,2.0,"{'pails': 1.0, 'look': 1.0, 'will': 1.0, 'ba ...",0
Baby Trend Diaper Champ,My 8 year old yellow lab was able to get the top ...,1.0,"{'prevent': 1.0, 'literature': 1.0, ...",0
Baby Trend Diaper Champ,"Well, the first three months were odor free!! ...",2.0,"{'have': 1.0, 'don': 1.0, 'they': 1.0, ...",0
Baby Trend Diaper Champ,This is the worst diaper pail ever! It was great ...,1.0,"{'not': 1.0, 'does': 1.0, 'well': 1.0, 'hopeful': ...",0
Baby Trend Diaper Champ,This thing freakin' stinks. Literally. I ...,1.0,"{'them': 1.0, 'to': 1.0, 'listened': 1.0, 'have': ...",0
Baby Trend Diaper Champ,Worst diaper pale ever!! I've had mine for 2 y ...,1.0,"{'this': 1.0, 'unexpectedly': 1.0, ...",0
Baby Trend Diaper Champ,I LOVED my Champ for the first year as it was all ...,2.0,"{'time': 1.0, 'due': 1.0, 'duty': 1.0, 'fails': ...",0
Baby Trend Diaper Champ,"My husband and I selected the Diaper ""Champ"" ma ...",1.0,"{'system': 1.0, 'try': 1.0, 're': 1.0, 'still': ...",0

predicted_sentiment,awesome,great,fantastic,amazing,love,horrible,bad,awful,wow,hate,terrible
3.6475019655728993e-06,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
1.0510930238978092e-06,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
7.27701628358055e-07,0.0,1.0,0.0,0.0,0.0,0,0,0,0,0,0.0
6.072573910977713e-07,0.0,0.0,0.0,0.0,0.0,1,0,0,0,0,0.0
4.863991442647668e-07,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
3.421249220727012e-07,0.0,1.0,0.0,0.0,0.0,0,0,0,0,0,0.0
5.6482290150888015e-09,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
1.7767402456397432e-10,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
2.7479419193443168e-11,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
5.90141453456435e-13,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0


In [125]:
diaper_champ_reviews[0]['review']

"I read a review below that can explain exactly what we experienced. We've had it for 16 months and it has worked wonderful for us. No smells, change it out once a week, easy to clean. Then a diaper snagged this foam material in the head part, so I pulled the rest of the foam out. Big mistake!!! Now it can no loner retain the stinkiness and we're looking for a replacement. Be careful of overloading and never take out that foam piece that is cushioned between pieces. I have figured out that it is key to keeping the stink out."

In [127]:
sentiment_model.predict(diaper_champ_reviews[0:1], output_type='probability')

dtype: float
Rows: 1
[0.9999999999895941]

In [128]:
selected_words_model.predict(diaper_champ_reviews[0:1], output_type='probability')

dtype: float
Rows: 1
[0.7919288370624482]