# Analyze Product Sentiment

In [1]:
import turicreate
import zipfile

# Read product review data

In [2]:
# Load the product-review table (columns: name, review, rating) from the local 'amazon_baby.sframe' SFrame.
products = turicreate.SFrame('amazon_baby.sframe')

# Explore data

In [3]:
products

name,review,rating
Planetwise Flannel Wipes,"These flannel wipes are OK, but in my opinion ...",3.0
Planetwise Wipe Pouch,it came early and was not disappointed. i love ...,5.0
Annas Dream Full Quilt with 2 Shams ...,Very soft and comfortable and warmer than it ...,5.0
Stop Pacifier Sucking without tears with ...,This is a product well worth the purchase. I ...,5.0
Stop Pacifier Sucking without tears with ...,All of my kids have cried non-stop when I tried to ...,5.0
Stop Pacifier Sucking without tears with ...,"When the Binky Fairy came to our house, we didn't ...",5.0
A Tale of Baby's Days with Peter Rabbit ...,"Lovely book, it's bound tightly so you may no ...",4.0
"Baby Tracker&reg; - Daily Childcare Journal, ...",Perfect for new parents. We were able to keep ...,5.0
"Baby Tracker&reg; - Daily Childcare Journal, ...",A friend of mine pinned this product on Pinte ...,5.0
"Baby Tracker&reg; - Daily Childcare Journal, ...",This has been an easy way for my nanny to record ...,4.0


In [4]:
# Number of reviews per product name, most-reviewed products first.
(
    products
    .groupby('name', operations={'count': turicreate.aggregate.COUNT()})
    .sort('count', ascending=False)
)

name,count
Vulli Sophie the Giraffe Teether ...,785
"Simple Wishes Hands-Free Breastpump Bra, Pink, ...",562
Infant Optics DXR-5 2.4 GHz Digital Video Baby ...,561
Baby Einstein Take Along Tunes ...,547
Cloud b Twilight Constellation Night ...,520
"Fisher-Price Booster Seat, Blue/Green/Gray ...",489
Fisher-Price Rainforest Jumperoo ...,450
"Graco Nautilus 3-in-1 Car Seat, Matrix ...",419
Leachco Snoogle Total Body Pillow ...,388
"Regalo Easy Step Walk Thru Gate, White ...",374


In [5]:
products['name'].show()

# Examine the reviews for the most-reviewed product

In [6]:
# Exact-match filter on the product name; this is the product with the highest review count above.
giraffe_reviews = products[products['name']=='Vulli Sophie the Giraffe Teether']

In [7]:
giraffe_reviews

name,review,rating
Vulli Sophie the Giraffe Teether ...,He likes chewing on all the parts especially the ...,5.0
Vulli Sophie the Giraffe Teether ...,My son loves this toy and fits great in the diaper ...,5.0
Vulli Sophie the Giraffe Teether ...,There really should be a large warning on the ...,1.0
Vulli Sophie the Giraffe Teether ...,All the moms in my moms' group got Sophie for ...,5.0
Vulli Sophie the Giraffe Teether ...,I was a little skeptical on whether Sophie was ...,5.0
Vulli Sophie the Giraffe Teether ...,I have been reading about Sophie and was going ...,5.0
Vulli Sophie the Giraffe Teether ...,My neice loves her sophie and has spent hours ...,5.0
Vulli Sophie the Giraffe Teether ...,What a friendly face! And those mesmerizing ...,5.0
Vulli Sophie the Giraffe Teether ...,We got this just for my son to chew on instea ...,5.0
Vulli Sophie the Giraffe Teether ...,"My baby seems to like this toy, but I could ...",3.0


In [8]:
len(giraffe_reviews)

785

In [9]:
giraffe_reviews['rating'].show()

# Building a sentiment classifier

## Build word count vectors

In [10]:
# Add a 'word_count' column: for each review, a dict mapping each word to the number of times it occurs.
products['word_count'] = turicreate.text_analytics.count_words(products['review'])

In [11]:
products

name,review,rating,word_count
Planetwise Flannel Wipes,"These flannel wipes are OK, but in my opinion ...",3.0,"{'handles': 1.0, 'stripping': 1.0, ..."
Planetwise Wipe Pouch,it came early and was not disappointed. i love ...,5.0,"{'recommend': 1.0, 'highly': 1.0, ..."
Annas Dream Full Quilt with 2 Shams ...,Very soft and comfortable and warmer than it ...,5.0,"{'quilt': 1.0, 'of': 1.0, 'the': 1.0, 'than': 1.0, ..."
Stop Pacifier Sucking without tears with ...,This is a product well worth the purchase. I ...,5.0,"{'tool': 1.0, 'clever': 1.0, 'approach': 2.0, ..."
Stop Pacifier Sucking without tears with ...,All of my kids have cried non-stop when I tried to ...,5.0,"{'rock': 1.0, 'many': 1.0, 'headaches': 1.0, ..."
Stop Pacifier Sucking without tears with ...,"When the Binky Fairy came to our house, we didn't ...",5.0,"{'thumb': 1.0, 'or': 1.0, 'break': 1.0, 'trying': ..."
A Tale of Baby's Days with Peter Rabbit ...,"Lovely book, it's bound tightly so you may no ...",4.0,"{'for': 1.0, 'barnes': 1.0, 'at': 1.0, 'is': ..."
"Baby Tracker&reg; - Daily Childcare Journal, ...",Perfect for new parents. We were able to keep ...,5.0,"{'right': 1.0, 'because': 1.0, 'questions': 1.0, ..."
"Baby Tracker&reg; - Daily Childcare Journal, ...",A friend of mine pinned this product on Pinte ...,5.0,"{'like': 1.0, 'and': 1.0, 'changes': 1.0, 'the': ..."
"Baby Tracker&reg; - Daily Childcare Journal, ...",This has been an easy way for my nanny to record ...,4.0,"{'in': 1.0, 'pages': 1.0, 'out': 1.0, 'run': 1.0, ..."


# Define what is positive and negative sentiment

In [12]:
products['rating'].show()

In [13]:
# Ignore all 3-star reviews: the sentiment label defined below only separates ratings >= 4 from the rest,
# so mid-scale reviews are removed rather than forced into either class.
products = products[products['rating']!= 3]

In [14]:
# Positive sentiment (1) = 4-star or 5-star reviews; every remaining review (rating below 4) gets 0.
products['sentiment'] = products['rating'] >= 4

In [15]:
products

name,review,rating,word_count,sentiment
Planetwise Wipe Pouch,it came early and was not disappointed. i love ...,5.0,"{'recommend': 1.0, 'highly': 1.0, ...",1
Annas Dream Full Quilt with 2 Shams ...,Very soft and comfortable and warmer than it ...,5.0,"{'quilt': 1.0, 'of': 1.0, 'the': 1.0, 'than': 1.0, ...",1
Stop Pacifier Sucking without tears with ...,This is a product well worth the purchase. I ...,5.0,"{'tool': 1.0, 'clever': 1.0, 'approach': 2.0, ...",1
Stop Pacifier Sucking without tears with ...,All of my kids have cried non-stop when I tried to ...,5.0,"{'rock': 1.0, 'many': 1.0, 'headaches': 1.0, ...",1
Stop Pacifier Sucking without tears with ...,"When the Binky Fairy came to our house, we didn't ...",5.0,"{'thumb': 1.0, 'or': 1.0, 'break': 1.0, 'trying': ...",1
A Tale of Baby's Days with Peter Rabbit ...,"Lovely book, it's bound tightly so you may no ...",4.0,"{'for': 1.0, 'barnes': 1.0, 'at': 1.0, 'is': ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",Perfect for new parents. We were able to keep ...,5.0,"{'right': 1.0, 'because': 1.0, 'questions': 1.0, ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",A friend of mine pinned this product on Pinte ...,5.0,"{'like': 1.0, 'and': 1.0, 'changes': 1.0, 'the': ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",This has been an easy way for my nanny to record ...,4.0,"{'in': 1.0, 'pages': 1.0, 'out': 1.0, 'run': 1.0, ...",1
"Baby Tracker&reg; - Daily Childcare Journal, ...",I love this journal and our nanny uses it ...,4.0,"{'tracker': 1.0, 'now': 1.0, 'its': 1.0, 'sti ...",1


In [16]:
products['sentiment'].show()

# Train our sentiment classifier

In [17]:
# Random split: roughly 80% of the reviews for training, the rest for testing; the fixed seed keeps it reproducible.
train_data,test_data = products.random_split(.8,seed=0)

In [18]:
# Logistic-regression sentiment classifier trained on the full bag-of-words column.
# NOTE(review): test_data is passed as the validation set and is also used for the final
# evaluation further down — confirm that reusing the same rows for both is intended.
sentiment_model = turicreate.logistic_classifier.create(
    train_data,
    target='sentiment',
    features=['word_count'],
    validation_set=test_data,
)

# Evaluation of Sentiment Model

In [19]:
sentiment_model_performance = sentiment_model.evaluate(test_data)

In [20]:
sentiment_model_performance['accuracy']

0.9176975738650012

In [21]:
test_data['sentiment'].show()

In [22]:
test_data_majority = test_data[test_data['sentiment'] == 1]

In [23]:
# Share of positive reviews in the test set, i.e. the accuracy obtained by always predicting "positive".
len(test_data_majority)/len(test_data)

0.8400192169108815

# Apply the sentiment classifier to better understand the Giraffe reviews

In [24]:
# Re-select the giraffe reviews from the current `products`, which now has the 'word_count' and
# 'sentiment' columns and no 3-star rows (the earlier selection predates those changes).
giraffe_reviews = products[products['name']== 'Vulli Sophie the Giraffe Teether']

In [25]:
# Score every giraffe review with the full word-count model; output_type='probability' requests a
# probability instead of a hard class label (presumably P(sentiment == 1) — low-rated reviews score near 0).
giraffe_reviews['predicted_sentiment'] = sentiment_model.predict(giraffe_reviews, output_type = 'probability')

In [26]:
giraffe_reviews

name,review,rating,word_count,sentiment
Vulli Sophie the Giraffe Teether ...,He likes chewing on all the parts especially the ...,5.0,"{'purchase': 1.0, 'teething': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,My son loves this toy and fits great in the diaper ...,5.0,"{'a': 1.0, 'is': 1.0, 'when': 1.0, 'him': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,There really should be a large warning on the ...,1.0,"{'made': 1.0, 'of': 1.0, 'packaging': 1.0, 'no': ...",0
Vulli Sophie the Giraffe Teether ...,All the moms in my moms' group got Sophie for ...,5.0,"{'another': 1.0, 'out': 1.0, 'run': 1.0, 'lost': ...",1
Vulli Sophie the Giraffe Teether ...,I was a little skeptical on whether Sophie was ...,5.0,"{'disappointed': 1.0, 'will': 1.0, 'take': ...",1
Vulli Sophie the Giraffe Teether ...,I have been reading about Sophie and was going ...,5.0,"{'late': 1.0, 'perfect': 1.0, 'pack': 1.0, 'on ...",1
Vulli Sophie the Giraffe Teether ...,My neice loves her sophie and has spent hours ...,5.0,"{'delight': 1.0, 'in': 1.0, 'other': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,What a friendly face! And those mesmerizing ...,5.0,"{'inside': 1.0, 'water': 1.0, 'don': 1.0, 'up': ...",1
Vulli Sophie the Giraffe Teether ...,We got this just for my son to chew on instea ...,5.0,"{'its': 1.0, 'fine': 1.0, 'is': 1.0, 'which': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,This product is without a doubt the best on the ...,5.0,"{'belongs': 1.0, 'dog': 1.0, 'if': 1.0, 'bewa ...",1

predicted_sentiment
0.9993655365682312
0.9998633791689632
0.2545268197809084
0.916568808391505
0.6855768205885338
0.99999994452112
0.997935118109352
0.9999745004834384
0.9460144428356856
0.9999999721665868


# Sort the Giraffe reviews according to predicted sentiment

In [27]:
# Highest predicted probability first: the most positive reviews lead and the most negative ones trail.
giraffe_reviews = giraffe_reviews.sort('predicted_sentiment', ascending=False)

In [28]:
giraffe_reviews

name,review,rating,word_count,sentiment
Vulli Sophie the Giraffe Teether ...,"Sophie, oh Sophie, your time has come. My ...",5.0,"{'11': 1.0, 'prisrob': 1.0, '12': 1.0, 'who': ...",1
Vulli Sophie the Giraffe Teether ...,I'll be honest...I bought this toy because all the ...,4.0,"{'around': 1.0, 'explore': 1.0, 'they': ...",1
Vulli Sophie the Giraffe Teether ...,As a mother of 16month old twins; I bought ...,5.0,"{'will': 1.0, '15months': 1.0, 'would': 2.0, ...",1
Vulli Sophie the Giraffe Teether ...,We got this little giraffe as a gift from a ...,5.0,"{'out': 1.0, 'would': 1.0, 've': 1.0, 'enou ...",1
Vulli Sophie the Giraffe Teether ...,"As every mom knows, you always want to give your ...",5.0,"{'whether': 1.0, 'neutral': 1.0, 'gend ...",1
Vulli Sophie the Giraffe Teether ...,My Mom-in-Law bought Sophie for my son whe ...,5.0,"{'penny': 1.0, 'little': 1.0, 'perfect': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,"My 4 month old son is teething, and I've tried ...",4.0,"{'worth': 1.0, 'works': 1.0, 'teether': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,Let me just start off by addressing the choking ...,5.0,"{'question': 1.0, 'must': 1.0, 'overall': 1.0, ...",1
Vulli Sophie the Giraffe Teether ...,I'm not sure why Sophie is such a hit with the ...,4.0,"{'makers': 1.0, 'or': 1.0, 'take': 1.0, 'can': ...",1
Vulli Sophie the Giraffe Teether ...,"I admit, I didn't get Sophie the Giraffe at ...",4.0,"{'dye': 1.0, 'of': 1.0, 'cause': 1.0, 'fade': ...",1

predicted_sentiment
1.0
1.0
1.0
0.9999999999998376
0.9999999999998284
0.9999999999997958
0.9999999999994914
0.9999999999941254
0.999999999987423
0.9999999999829476


In [29]:
giraffe_reviews.tail()

name,review,rating,word_count,sentiment
Vulli Sophie the Giraffe Teether ...,My 7 1/2 month old grandbaby was sittng up ...,1.0,"{'sopie': 1.0, 'with': 1.0, 'be': 1.0, 'shou ...",0
Vulli Sophie the Giraffe Teether ...,I was so looking forward to getting this for my ...,1.0,"{'amazon': 1.0, 'back': 1.0, 'by': 1.0, 'more': ...",0
Vulli Sophie the Giraffe Teether ...,Received the product and smells like cheap rub ...,1.0,"{'was': 1.0, 'as': 1.0, 'still': 1.0, 'but': ...",0
Vulli Sophie the Giraffe Teether ...,I got one of these as a showe gift that my baby ...,1.0,"{'typical': 1.0, 'paint': 1.0, 'came': 1.0, 'mi ...",0
Vulli Sophie the Giraffe Teether ...,When we first got it I thought did my ...,2.0,"{'mom': 1.0, 'teethers': 1.0, 'btw': 1.0, 'oth ...",0
Vulli Sophie the Giraffe Teether ...,When I received this the paint was peeling off in ...,1.0,"{'risk': 1.0, 'but': 1.0, 'help': 1.0, 'terrible': ...",0
Vulli Sophie the Giraffe Teether ...,"""Sophie the Giraffe"" has tested positive for ...",1.0,"{'ingest': 1.0, 'they': 1.0, 'naturally': 1.0, ...",0
Vulli Sophie the Giraffe Teether ...,"My son (now 2.5) LOVED his Sophie, and I bought ...",1.0,"{'exaggerated': 1.0, 'are': 1.0, 'a': 3.0, ...",0
Vulli Sophie the Giraffe Teether ...,I wanted to love this product and was excited ...,1.0,"{'risk': 1.0, 'ready': 1.0, 'bummed': 1.0, ...",0
Vulli Sophie the Giraffe Teether ...,This children's toy is nostalgic and very cute. ...,1.0,"{'amazon': 1.0, 'from': 1.0, 'one': 1.0, 'by': ...",0

predicted_sentiment
1.9110740195652222e-06
6.547801686046981e-07
3.86423639743923e-07
2.237822515934467e-07
1.9353955281812584e-07
1.6900753980978605e-07
1.1748826795730037e-07
5.3649334270185817e-11
3.109035270461179e-13
4.119269639396916e-15


## Show the most positive reviews

In [30]:
giraffe_reviews[0]['review']

"Sophie, oh Sophie, your time has come. My granddaughter, Violet is 5 months old and starting to teeth. What joy little Sophie brings to Violet. Sophie is made of a very pliable rubber that is sturdy but not tough. It is quite easy for Violet to twist Sophie into unheard of positions to get Sophie into her mouth. The little nose and hooves fit perfectly into small mouths, and the drooling has purpose. The paint on Sophie is food quality.Sophie was born in 1961 in France. The maker had wondered why there was nothing available for babies and made Sophie from the finest rubber, phthalate-free on St Sophie's Day, thus the name was born. Since that time millions of Sophie's populate the world. She is soft and for babies little hands easy to grasp. Violet especially loves the bumpy head and horns of Sophie. Sophie has a long neck that easy to grasp and twist. She has lovely, sizable spots that attract Violet's attention. Sophie has happy little squeaks that bring squeals of delight from Viol

In [31]:
giraffe_reviews[1]['review']

'I\'ll be honest...I bought this toy because all the hip parents seem to have one too and I wanted to be a part of the "hip parent" crowd. The price-tag was somewhat of a deterent but I prevailed and purchased this teether for my daughter.At first, Lily didn\'t know what to make of of Sophie and showed little interest in the polka-dotted creature. I continued to introduce Lily to Sophie and kept the toy in the carrier so that it was on-hand during transitions. Eventually, Lily discovered what a wonderful experience it was to gnaw on the hooves and ears and these two have never been far apart since.Lily really enjoys gumming all the different parts of Sophie like no other teether we have. The size of the toy is great as it is somewhat substantial and so easy for a little one to grasp and hold onto. Lily really enjoys hearing Sophie squeak and will smile whenever Sophie makes a noise or pops her head up from Mommy\'s lap to say hello.People have stopped and commented on Sophie and to the

# Most negative reviews

In [32]:
giraffe_reviews[-1]['review']

"This children's toy is nostalgic and very cute. However, there is a distinct rubber smell and a very odd taste, yes I tried it, that my baby did not enjoy. Also, if it is soiled it is extremely difficult to clean as the rubber is a kind of porus material and does not clean well. The final thing is the squeaking device inside which stopped working after the first couple of days. I returned this item feeling I had overpaid for a toy that was defective and did not meet my expectations. Please do not be swayed by the cute packaging and hype surounding it as I was. One more thing, I was given a full refund from Amazon without any problem."

In [33]:
giraffe_reviews[-2]['review']

'I wanted to love this product and was excited to buy it when I became pregnant but am now hesitant to let my baby use it after reading about the recall in Europe. Apparently, as I understand it, their toxin standards of measurement are lower than ours so they have not been recalled here (apparently we are OK with low levels of nitrates in the toys our children put in their mouths, but Europeans are not...hmmm)...Be that as it may, toxins registering even CLOSE to a dangerous level made me nervous about using. After digging around online I did discover that the company claims to have changed the product after a certain date and lists manufacturing codes so you can check yours (those listed were made after a certain date and are said to be safer). Sadly mine was not made after the &#34;improved&#34; date but I could not return it because there was no formal recall in our country. I considered returning it and hunting for one with an approved manufacturing date but man that was just too 

# Task 1
## Using .apply() to build a new feature with the counts for each of the selected_words:

In [34]:
# Sentiment-bearing words that serve as the only features of the simpler model.
selected_words = ['awesome', 'great', 'fantastic', 'amazing', 'love', 'horrible', 'bad', 'terrible', 'awful', 'wow', 'hate']

# Add one numeric column per selected word holding that word's count in each review.
for word in selected_words:
    # `word=word` binds the current word into the lambda at definition time, so the function
    # never depends on the loop variable's later value. The 0.0 default together with the
    # explicit float dtype gives every column the same type; with an integer default and no
    # dtype, some columns were inferred as int and others as float.
    products[word] = products['word_count'].apply(
        lambda counts, word=word: counts.get(word, 0.0), dtype=float
    )

## Using .sum() method to find most used and least used word:

In [35]:
# Total occurrences of each selected word across all reviews, in the same order as selected_words.
sum_words = [products[word].sum() for word in selected_words]

In [36]:
# Pair every selected word with its total number of occurrences.
selected_words_total = dict(zip(selected_words, sum_words))

# Iterating the dict yields its keys; ranking them by their stored total picks the extremes.
word_max = max(selected_words_total, key=selected_words_total.get)
word_min = min(selected_words_total, key=selected_words_total.get)

print('Most used word is, %s = %d' % (word_max, selected_words_total[word_max]))
print('Least used word is, %s = %d' % (word_min, selected_words_total[word_min]))

Most used word is, great = 55791
Least used word is, wow = 425


# Task 2
## Create a new sentiment analysis model using only the selected_words as features:

In [37]:
# Split again with the same fraction and seed so that both sets carry the newly added per-word columns.
train_data,test_data = products.random_split(.8,seed=0)

In [38]:
# Same classifier type as the full model, but restricted to the per-word count columns as features.
selected_words_model = turicreate.logistic_classifier.create(
    train_data,
    target='sentiment',
    features=selected_words,
    validation_set=test_data,
)

In [39]:
weights = selected_words_model.coefficients

In [40]:
# Largest coefficient first: weights[0] is the most positive term and weights[-1] the most negative.
weights = weights.sort('value', ascending=False)

In [41]:
weights[0]

{'name': 'love',
 'index': None,
 'class': 1,
 'value': 1.359268866922504,
 'stderr': 0.02806830015209953}

In [42]:
weights[-1]

{'name': 'horrible',
 'index': None,
 'class': 1,
 'value': -2.251335236759102,
 'stderr': 0.08020249388788425}

# Task 3
## Comparing the accuracy of the different sentiment analysis models:

In [43]:
selected_words_model_performance = selected_words_model.evaluate(test_data)

In [44]:
selected_words_model_performance['accuracy']

0.8463848186404036

In [45]:
test_data['sentiment'].show()

In [46]:
# Majority-class baseline, computed the same way as for the first model: the fraction of test
# reviews labelled positive is the accuracy of a classifier that always predicts "positive".
test_data_majority = test_data[test_data['sentiment'] == 1]

len(test_data_majority)/len(test_data)

0.8400192169108815

# Task 4
## Interpreting the difference in performance between the models:

In [47]:
diaper_champ_reviews = products[products['name'] == 'Baby Trend Diaper Champ']

In [48]:
# Score the Diaper Champ reviews with the full word-count model (sentiment_model), not the selected-words model.
diaper_champ_reviews['predicted_sentiment'] = sentiment_model.predict(diaper_champ_reviews, output_type = 'probability')

In [49]:
diaper_champ_reviews = diaper_champ_reviews.sort('predicted_sentiment', ascending=False)

In [50]:
diaper_champ_reviews[0:1]

name,review,rating,word_count,sentiment,awesome
Baby Trend Diaper Champ,I read a review below that can explain exactly ...,4.0,"{'key': 1.0, 'have': 1.0, 'pieces': 1.0, 'betwe ...",1,0.0

great,fantastic,amazing,love,horrible,bad,terrible,awful,wow,hate,predicted_sentiment
0.0,0.0,0.0,0.0,0,0,0.0,0,0,0,0.999999999989594


In [51]:
diaper_champ_reviews[0]['review']

"I read a review below that can explain exactly what we experienced. We've had it for 16 months and it has worked wonderful for us. No smells, change it out once a week, easy to clean. Then a diaper snagged this foam material in the head part, so I pulled the rest of the foam out. Big mistake!!! Now it can no loner retain the stinkiness and we're looking for a replacement. Be careful of overloading and never take out that foam piece that is cushioned between pieces. I have figured out that it is key to keeping the stink out."

In [52]:
# Score the same top-ranked review with the selected-words model to compare it against the full model.
selected_words_model.predict(diaper_champ_reviews[0:1], output_type='probability')

dtype: float
Rows: 1
[0.7919288370624482]

In [53]:
diaper_champ_reviews[0]['word_count']

{'key': 1.0,
 'have': 1.0,
 'pieces': 1.0,
 'between': 1.0,
 'cushioned': 1.0,
 'piece': 1.0,
 'take': 1.0,
 'overloading': 1.0,
 'be': 1.0,
 'looking': 1.0,
 're': 1.0,
 'stinkiness': 1.0,
 'retain': 1.0,
 'now': 1.0,
 'wonderful': 1.0,
 'worked': 1.0,
 '16': 1.0,
 'and': 3.0,
 'months': 1.0,
 've': 1.0,
 'in': 1.0,
 'i': 3.0,
 'experienced': 1.0,
 'read': 1.0,
 'easy': 1.0,
 'for': 3.0,
 'to': 2.0,
 'has': 1.0,
 'review': 1.0,
 'keeping': 1.0,
 'replacement': 1.0,
 'out': 5.0,
 'loner': 1.0,
 'clean': 1.0,
 'we': 3.0,
 'a': 4.0,
 'mistake': 1.0,
 'big': 1.0,
 'pulled': 1.0,
 'it': 5.0,
 'this': 1.0,
 'is': 2.0,
 'explain': 1.0,
 'material': 1.0,
 'exactly': 1.0,
 'that': 4.0,
 'had': 1.0,
 'what': 1.0,
 'part': 1.0,
 'us': 1.0,
 'no': 2.0,
 'smells': 1.0,
 'can': 2.0,
 'change': 1.0,
 'figured': 1.0,
 'week': 1.0,
 'then': 1.0,
 'snagged': 1.0,
 'diaper': 1.0,
 'careful': 1.0,
 'the': 5.0,
 'never': 1.0,
 'foam': 3.0,
 'head': 1.0,
 'so': 1.0,
 'below': 1.0,
 'rest': 1.0,
 'stink': 1

In [54]:
word_count = diaper_champ_reviews[0]['word_count']

In [55]:
# Keep only the entries of this review's word counts whose word is one of selected_words.
selected_word_count = {
    key: value for key, value in word_count.items() if key in selected_words
}

In [56]:
selected_word_count

{}