In [1]:
# import the neccesory modules
import pandas as pd
import numpy as np

In [2]:
# get the data from csv file
df=pd.read_csv('sen.csv', encoding='latin-1')

In [3]:
# see the number of rows and columns
df.shape

(20491, 3)

In [4]:
# see the data of top 5 rows
df.head()

Unnamed: 0,S.No.,Review,Rating
0,1,nice hotel expensive parking got good deal sta...,4
1,2,ok nothing special charge diamond member hilto...,2
2,3,nice rooms not 4* experience hotel monaco seat...,3
3,4,unique \tgreat stay \twonderful time hotel mon...,5
4,5,great stay great stay \twent seahawk game awes...,5


In [5]:
# delete the unwanted columns
df.drop(['S.No.'], axis=1)

Unnamed: 0,Review,Rating
0,nice hotel expensive parking got good deal sta...,4
1,ok nothing special charge diamond member hilto...,2
2,nice rooms not 4* experience hotel monaco seat...,3
3,unique \tgreat stay \twonderful time hotel mon...,5
4,great stay great stay \twent seahawk game awes...,5
...,...,...
20486,best kept secret 3rd time staying charm \tnot ...,5
20487,great location price view hotel great quick pl...,4
20488,ok just looks nice modern outside \tdesk staff...,2
20489,hotel theft ruined vacation hotel opened sept ...,1


In [6]:
# check for null values 
df.isnull().count()

S.No.     20491
Review    20491
Rating    20491
dtype: int64

In [7]:
#count the number of unique ratings
df["Rating"].value_counts()

5    9054
4    6039
3    2184
2    1793
1    1421
Name: Rating, dtype: int64

In [8]:
#create dataframe for bad ratings or negative ratings
df_neg=df.loc[df["Rating"]<3]
df_neg= df_neg.reset_index(drop= True)
df_neg.head()

Unnamed: 0,S.No.,Review,Rating
0,2,ok nothing special charge diamond member hilto...,2
1,11,poor value stayed monaco seattle july \tnice h...,2
2,16,horrible customer service hotel stay february ...,1
3,17,disappointed say anticipating stay hotel monac...,2
4,25,great location need internally upgrade advanta...,2


In [9]:
#create dataframe for bad ratings or negative ratings
df_five=df.loc[df["Rating"]==5]
df_five= df_five.reset_index(drop= True)

In [10]:
#see the number of bad ratings
print(len(df_neg))

3214


In [11]:
#see the number of good ratings
print(len(df_five))

9054


In [12]:
#equalise both ratings
df_pos=df_five.loc[:len(df_neg)]
len(df_pos)

3215

In [13]:
# merge the dataframe
df_all=pd.concat([df_neg,df_pos],axis=0)
df_all=df_all.reset_index(drop =True)

In [14]:
df_all["Sentiment"]=np.where(df_all["Rating"]==5,"Positive","Negative")

In [15]:
df_all=df_all.sample(frac=1)
df_all=df_all.reset_index(drop= True)

In [16]:
df_all.shape

(6429, 4)

In [17]:
df_all.head(10)
df_all.drop(['S.No.'], axis=1)

Unnamed: 0,Review,Rating,Sentiment
0,nice place family great enjoyable hotel stay \...,5,Positive
1,loved minute \tspent 1 week riu taino \tno com...,5,Positive
2,loved westin read reviews daily westin ca n't ...,5,Positive
3,paradise \tfamily went punta cana days \ttrip ...,5,Positive
4,wow n't worry like did \tno fear \tway bad tim...,5,Positive
...,...,...,...
6424,wonderful vacation travelled 15-22 wonderful v...,5,Positive
6425,good location problems hotel good location clo...,2,Negative
6426,clean great location not worth money hotel fri...,2,Negative
6427,wonderful stay highly recommend stayed omni 21...,5,Positive


In [18]:
#split the dataset for training and testing 
from sklearn.model_selection import train_test_split
x_train,x_test,y_train,y_test=train_test_split(df_all.Review,df_all.Sentiment)

In [19]:
#create model
from sklearn.feature_extraction.text import TfidfVectorizer 
# create object
tfidf = TfidfVectorizer()
# get tf-df values
result = tfidf.fit_transform(x_train)
x_train_vec=tfidf.fit_transform(x_train)
x_test_vec=tfidf.transform(x_test)

In [22]:
# get idf values
print('\nidf values:')
for ele1, ele2 in zip(tfidf.get_feature_names(), tfidf.idf_):
    print(ele1, ':', ele2)


idf values:
00 : 3.8179835786051703
000 : 6.113648228754642
000hope : 8.78779687818117
00a : 8.78779687818117
00am : 6.185107192736787
00dollars : 8.78779687818117
00for : 8.78779687818117
00p : 8.382331770073007
00pm : 5.79206460462718
00us : 8.78779687818117
00usd : 8.78779687818117
01 : 7.871506146307016
02 : 7.871506146307016
03 : 7.283719481404897
04 : 6.6477307146849
05 : 6.436421621017693
050700 : 8.78779687818117
06 : 6.6477307146849
0600 : 8.382331770073007
0645 : 8.78779687818117
06there : 8.78779687818117
07 : 6.079746677078961
0705 : 8.78779687818117
08 : 6.302890228393171
0800 : 8.382331770073007
0810 : 8.78779687818117
0820 : 8.78779687818117
0840 : 8.78779687818117
0850 : 8.78779687818117
08if : 8.78779687818117
09 : 8.094649697621225
0900 : 8.382331770073007
0915 : 8.78779687818117
0920 : 8.78779687818117
0930 : 8.78779687818117
0kay : 8.78779687818117
10 : 3.0593217909345984
100 : 4.3629502463243615
1000 : 6.079746677078961
10000 : 8.78779687818117
100am : 8.787796878



8.78779687818117
45min : 8.382331770073007
45mins : 8.78779687818117
45p : 8.78779687818117
45pm : 8.094649697621225
45th : 8.094649697621225
46 : 7.6891845895130615
460 : 8.78779687818117
46th : 8.78779687818117
47 : 7.871506146307016
470 : 8.78779687818117
4701 : 8.78779687818117
4702 : 8.78779687818117
475 : 8.78779687818117
476 : 8.78779687818117
47am : 8.78779687818117
48 : 7.083048785942746
480 : 8.382331770073007
485 : 8.78779687818117
4865 : 8.78779687818117
488 : 8.78779687818117
489 : 8.78779687818117
48hrs : 8.78779687818117
48th : 8.78779687818117
49 : 7.401502517061281
499 : 8.78779687818117
49ers : 8.78779687818117
49th : 8.382331770073007
4__ç : 8.78779687818117
4am : 6.6477307146849
4feet : 8.78779687818117
4h : 8.78779687818117
4hkd : 8.78779687818117
4m2 : 8.78779687818117
4night : 8.78779687818117
4o : 8.78779687818117
4pm : 6.079746677078961
4s : 8.78779687818117
4season : 8.78779687818117
4star : 7.535033909685803
4th : 5.437892790906567
4we : 8.78779687818117
4x4 

adorable : 7.283719481404897
adore : 8.78779687818117
adored : 8.094649697621225
adorning : 8.78779687818117
adres : 8.78779687818117
adress : 8.78779687818117
adrian : 8.78779687818117
adrienne : 8.094649697621225
adrift : 8.78779687818117
ads : 8.094649697621225
adult : 5.696754424822855
adults : 5.0742248114768636
advace : 8.382331770073007
advance : 4.7804636929487
advance__ç : 8.78779687818117
advanced : 7.6891845895130615
advances : 8.78779687818117
advantage : 5.150210718454785
advantages : 7.6891845895130615
adventerous : 8.382331770073007
adventours : 8.78779687818117
adventure : 6.302890228393171
adventurer : 8.382331770073007
adventures : 7.871506146307016
adventurous : 7.083048785942746
adventursome : 8.78779687818117
adverse : 8.78779687818117
advert : 8.382331770073007
advertise : 6.6477307146849
advertised : 5.437892790906567
advertisement : 7.871506146307016
advertisements : 8.382331770073007
advertises : 6.996037408953116
advertising : 6.841886729125858
advertize : 8.7

any : 7.283719481404897
anybody : 6.046956854255971
anybodys : 8.78779687818117
anyday : 8.78779687818117
anyhoo : 8.78779687818117
anymore : 5.84335789901473
anyone : 7.871506146307016
anyone__ç_é_ : 8.78779687818117
anyones : 8.78779687818117
anyopne : 8.78779687818117
anyother : 8.78779687818117
anyplace : 8.78779687818117
anything : 6.996037408953116
anythying : 8.78779687818117
anytime : 5.925595997251703
anytimesoon : 8.78779687818117
anyting : 8.78779687818117
anyway : 6.485211785187126
anyways : 6.5905723008449515
anywere : 8.382331770073007
anywhere : 7.6891845895130615
aol : 7.871506146307016
aortic : 8.78779687818117
aorund : 8.78779687818117
aournd : 8.78779687818117
ap : 8.78779687818117
aparantly : 8.78779687818117
aparatus : 8.78779687818117
aparently : 8.78779687818117
apart : 5.098917424067235
aparthotel : 8.382331770073007
apartment : 6.148739548565913
apartments : 6.708355336501335
apathetic : 8.78779687818117
apathy : 8.78779687818117
apatio : 8.78779687818117
apeac

awoke : 7.535033909685803
awoken : 7.283719481404897
aword : 8.78779687818117
awry : 8.78779687818117
awsome : 6.772893857638906
ay : 7.871506146307016
aybe : 8.78779687818117
ayu : 8.78779687818117
az : 8.382331770073007
azie : 8.78779687818117
aziza : 8.78779687818117
azul : 8.78779687818117
azure : 8.382331770073007
b12 : 8.78779687818117
b4 : 8.382331770073007
b__ç_èû : 8.78779687818117
ba : 7.535033909685803
babies : 7.283719481404897
baby : 5.81738241261147
babylon : 8.382331770073007
babylon__ç : 8.78779687818117
babysat : 8.78779687818117
babysit : 8.382331770073007
babysitters : 8.78779687818117
babysitting : 7.535033909685803
bacalaitos : 8.78779687818117
bacall : 8.78779687818117
bacardi : 7.535033909685803
bacco : 8.382331770073007
bachata : 7.871506146307016
bachelor : 7.871506146307016
bachelorette : 8.78779687818117
bacially : 8.78779687818117
bacically : 8.78779687818117
bacillary : 8.78779687818117
bacio : 8.78779687818117
back : 5.743274440457748
backache : 8.38233177

berchielli : 8.78779687818117
bergdorf : 8.78779687818117
berkshire : 7.401502517061281
berlin : 5.5689210533129705
bermuda : 7.871506146307016
bermudas : 8.78779687818117
berna : 8.78779687818117
bernadins : 8.78779687818117
bernard : 8.382331770073007
bernardins : 8.78779687818117
bernice : 8.78779687818117
berries : 8.78779687818117
bershire : 8.78779687818117
bert : 8.78779687818117
berth : 8.382331770073007
bertold : 8.78779687818117
beside : 8.78779687818117
besideand : 8.78779687818117
besides : 7.6891845895130615
besite : 8.78779687818117
beso : 8.78779687818117
besos : 8.78779687818117
besotted : 8.78779687818117
bessie : 8.78779687818117
best : 2.5475210330104017
bestbeachwonderful : 8.78779687818117
bestial : 8.78779687818117
bestowed : 8.78779687818117
bestti : 8.78779687818117
bet : 5.870026146096892
beth : 8.78779687818117
bets : 8.78779687818117
bette : 8.78779687818117
better : 2.6852382835676023
betters : 8.78779687818117
bettert : 8.78779687818117
betting : 8.78779687

brothers : 8.78779687818117
brought : 4.255197385027915
broussard : 8.78779687818117
brow : 8.382331770073007
browlio : 8.78779687818117
brown : 5.767371992036809
brownie : 8.094649697621225
browns : 7.401502517061281
browse : 8.382331770073007
bruce : 8.78779687818117
brugal : 8.094649697621225
bruised : 8.78779687818117
bruises : 8.78779687818117
bruising : 8.78779687818117
brulee : 8.78779687818117
brum : 8.78779687818117
brunch : 7.178358965747071
brunches : 8.78779687818117
brune : 8.78779687818117
brunelleschi : 8.78779687818117
brunswick : 8.78779687818117
bruschetta : 8.382331770073007
bruse : 8.78779687818117
brush : 6.113648228754642
brushed : 7.283719481404897
brushing : 7.083048785942746
brusque : 8.78779687818117
brussels : 8.78779687818117
brutal : 8.382331770073007
brutalism : 8.78779687818117
brutally : 8.78779687818117
bryant : 6.5905723008449515
bs : 7.871506146307016
bsic : 8.78779687818117
bstaff : 8.78779687818117
bt : 8.78779687818117
bts : 8.78779687818117
btw : 

caters : 6.302890228393171
catfish : 8.78779687818117
cathartic : 8.78779687818117
cathdreal : 8.78779687818117
cathederal : 8.382331770073007
cathedral : 6.185107192736787
cathedrals : 8.382331770073007
catherdal : 8.78779687818117
catherdral : 8.78779687818117
catherine : 8.382331770073007
cathi : 8.78779687818117
cathing : 8.78779687818117
catie : 8.382331770073007
catolonia : 8.78779687818117
cats : 7.178358965747071
catted : 8.78779687818117
cattle : 8.382331770073007
catty : 8.78779687818117
catwalk : 8.78779687818117
caucasian : 8.78779687818117
caucasians : 8.78779687818117
caught : 6.01520815594139
cauldron : 8.78779687818117
caulked : 8.78779687818117
caulking : 8.094649697621225
cause : 5.84335789901473
caused : 5.870026146096892
causes : 7.535033909685803
causing : 7.283719481404897
causions : 8.78779687818117
caution : 6.436421621017693
cautious : 7.6891845895130615
cava : 8.382331770073007
cavalier : 8.78779687818117
cave : 6.772893857638906
caveat : 7.535033909685803
cav

clipped : 8.78779687818117
clipper : 8.382331770073007
clipping : 8.78779687818117
clippings : 8.094649697621225
clips : 8.78779687818117
clipssheets : 8.78779687818117
clock : 5.549118426016791
clocks : 7.871506146307016
clog : 8.78779687818117
clogged : 6.91599470127958
clone : 8.78779687818117
clorox : 8.78779687818117
closable : 8.78779687818117
close : 3.169209249588202
closeby : 7.871506146307016
closed : 4.374998584840536
closed__ç : 8.78779687818117
closely : 7.401502517061281
closeness : 8.382331770073007
closer : 5.3220609753814445
closes : 6.485211785187126
closest : 6.185107192736787
closet : 4.80811522427921
closets : 6.772893857638906
closing : 5.84335789901473
closness : 8.78779687818117
clost : 8.78779687818117
clostrophobic : 8.78779687818117
closure : 8.78779687818117
closures : 8.78779687818117
cloth : 6.536505079574676
clothed : 8.094649697621225
clothes : 4.855971245456845
clothespins : 8.78779687818117
clothing : 6.345449842811966
cloths : 6.185107192736787
cloud 

constuction : 7.871506146307016
consulate : 8.78779687818117
consultant : 8.382331770073007
consultation : 8.094649697621225
consulted : 8.382331770073007
consulting : 8.382331770073007
consults : 8.78779687818117
consumables : 8.78779687818117
consume : 7.871506146307016
consumed : 8.094649697621225
consumer : 8.094649697621225
consuming : 7.871506146307016
consummables : 8.78779687818117
consumption : 8.382331770073007
cont : 8.382331770073007
contact : 5.0382928022508
contacted : 5.5106521451889945
contacting : 6.996037408953116
contagious : 8.094649697621225
contain : 7.283719481404897
contained : 6.708355336501335
container : 6.996037408953116
containers : 7.401502517061281
containing : 7.401502517061281
contains : 7.6891845895130615
contamination : 8.78779687818117
contemplated : 8.78779687818117
contemplating : 8.382331770073007
contemporaneously : 8.78779687818117
contemporary : 6.113648228754642
contempt : 7.871506146307016
contending : 8.78779687818117
content : 7.40150251706

cutter : 7.283719481404897
cutters : 8.78779687818117
cutting : 7.083048785942746
cuz : 7.283719481404897
cycle : 8.78779687818117
cycled : 8.78779687818117
cycling : 8.78779687818117
cylpso : 8.78779687818117
cynical : 8.78779687818117
d__ç_ : 8.78779687818117
d__ç_é : 8.78779687818117
da : 8.382331770073007
daas : 8.78779687818117
dab : 8.382331770073007
dabbed : 8.78779687818117
dad : 7.535033909685803
dadeland : 8.78779687818117
daft : 8.78779687818117
dahlia : 8.78779687818117
dailey : 8.78779687818117
dailly : 8.78779687818117
daily : 4.244502095911168
daiquiri : 8.78779687818117
daiquiris : 8.78779687818117
dairy : 8.094649697621225
daisy : 8.78779687818117
daiy : 8.78779687818117
dakota : 8.78779687818117
dallas : 6.113648228754642
daly : 8.78779687818117
dam : 6.389901605382801
damage : 6.772893857638906
damaged : 6.772893857638906
damages : 8.094649697621225
damario : 8.78779687818117
damarios : 8.78779687818117
dame : 7.283719481404897
damian : 8.78779687818117
damm : 8.0946

diego : 7.401502517061281
dieing : 8.382331770073007
diem : 8.78779687818117
dier : 8.78779687818117
dierctly : 8.78779687818117
dies : 8.78779687818117
diesel : 8.094649697621225
diet : 6.262068233872916
dietary : 8.382331770073007
dietiry : 8.78779687818117
diets : 8.78779687818117
diferance : 8.78779687818117
diferent : 8.78779687818117
diff : 8.78779687818117
diffarent : 8.78779687818117
diffently : 8.78779687818117
differ : 8.094649697621225
differant : 8.78779687818117
difference : 5.0382928022508
differences : 7.535033909685803
differenet : 8.78779687818117
different : 3.4241600455124916
differentiate : 8.78779687818117
differently : 6.841886729125858
differing : 8.382331770073007
differnt : 8.094649697621225
differs : 8.78779687818117
difficult : 4.67692301400786
difficulties : 7.401502517061281
difficulty : 6.222847520719634
diffuse : 8.78779687818117
diffused : 8.78779687818117
difiicult : 8.382331770073007
difo : 8.78779687818117
dig : 8.382331770073007
digestive : 8.0946496

dousing : 8.78779687818117
douvers : 8.78779687818117
dover : 8.382331770073007
doves : 8.78779687818117
dowdy : 8.382331770073007
dowel : 8.78779687818117
down : 5.719743943047554
downand : 8.78779687818117
downed : 8.78779687818117
downer : 7.871506146307016
downers : 8.382331770073007
downfall : 6.91599470127958
downfalls : 8.382331770073007
downgrade : 7.871506146307016
downgraded : 7.871506146307016
downgrading : 8.382331770073007
downhill : 6.5905723008449515
downi : 8.78779687818117
download : 8.382331770073007
downloaded : 8.78779687818117
downpour : 8.382331770073007
downpours : 8.78779687818117
downright : 6.345449842811966
downs : 8.382331770073007
downside : 5.81738241261147
downside__ç : 8.78779687818117
downsides : 7.535033909685803
downstair : 8.78779687818117
downstairs : 4.927067167140576
downtown : 4.525117001139856
downward : 8.382331770073007
downwards : 8.78779687818117
doze : 8.78779687818117
dozen : 6.6477307146849
dozens : 7.083048785942746
dr : 5.00360724426291

encrusted : 8.78779687818117
end : 3.570147414700589
endearing : 8.094649697621225
ended : 4.304794326167287
ending : 6.772893857638906
endless : 7.083048785942746
endlessly : 8.094649697621225
endorse : 8.382331770073007
endorsement : 8.78779687818117
ends : 6.222847520719634
endulge : 8.78779687818117
endulged : 8.78779687818117
endure : 7.535033909685803
endured : 8.094649697621225
enemies : 8.78779687818117
enemy : 8.382331770073007
energetic : 7.535033909685803
energizing : 8.78779687818117
energy : 6.485211785187126
enertainment : 8.78779687818117
enfolded : 8.78779687818117
enforce : 7.6891845895130615
enforced : 8.094649697621225
enfuriated : 8.78779687818117
engage : 7.871506146307016
engaged : 7.178358965747071
engagement : 8.78779687818117
engaging : 7.6891845895130615
engagment : 8.78779687818117
engand : 8.78779687818117
engine : 7.6891845895130615
engineer : 7.535033909685803
engineered : 8.382331770073007
engineering : 7.6891845895130615
engines : 8.094649697621225
engla

extreemly : 8.78779687818117
extreme : 7.083048785942746
extremeley : 8.78779687818117
extremely : 3.3941693318288095
extrememly : 8.382331770073007
extremes : 8.382331770073007
extremlely : 8.78779687818117
extremley : 8.382331770073007
extremly : 7.6891845895130615
extrodinary : 8.78779687818117
extrordinary : 8.78779687818117
extroverted : 8.78779687818117
extrremely : 8.78779687818117
extrusion : 8.78779687818117
exude : 8.78779687818117
exudes : 8.78779687818117
ey : 8.78779687818117
eye : 5.437892790906567
eyeballing : 8.78779687818117
eyebrow : 8.78779687818117
eyed : 8.78779687818117
eyeglasses : 8.78779687818117
eyelash : 8.78779687818117
eyes : 5.984436497274636
eyesore : 8.382331770073007
eyewitness : 8.78779687818117
eyyyeee : 8.78779687818117
eze : 8.78779687818117
f1 : 8.78779687818117
fa : 8.382331770073007
fab : 6.113648228754642
fabienne : 8.094649697621225
fabric : 7.6891845895130615
fabrics : 7.871506146307016
fabulours : 8.78779687818117
fabulous : 4.110306030613454

flamingo : 7.871506146307016
flamingoes : 8.094649697621225
flamingos : 6.345449842811966
flammable : 8.78779687818117
flammatory : 8.78779687818117
flank : 8.78779687818117
flanked : 8.78779687818117
flannel : 8.78779687818117
flapping : 8.78779687818117
flare : 8.78779687818117
flash : 6.996037408953116
flashed : 8.78779687818117
flashing : 8.094649697621225
flashlight : 8.78779687818117
flashy : 8.094649697621225
flask : 8.78779687818117
flat : 4.762445187446022
flatly : 8.382331770073007
flats : 8.78779687818117
flatscreen : 7.283719481404897
flatter : 8.382331770073007
flattering : 8.78779687818117
flatware : 8.382331770073007
flavio : 8.78779687818117
flavor : 6.485211785187126
flavor__çî_ : 8.78779687818117
flavored : 8.382331770073007
flavorful : 8.382331770073007
flavors : 8.094649697621225
flavour : 7.871506146307016
flavours : 8.78779687818117
flaw : 7.871506146307016
flawed : 7.871506146307016
flawless : 6.91599470127958
flawlessly : 8.382331770073007
flaws : 7.535033909685

fustrating : 8.78779687818117
futile : 8.382331770073007
futon : 8.78779687818117
futons : 8.78779687818117
futur : 8.78779687818117
future : 4.885824208606526
futureabsolutely : 8.78779687818117
futuristic : 8.78779687818117
fuzz : 8.78779687818117
fuzzy : 7.871506146307016
fw : 8.78779687818117
fwd : 8.78779687818117
fwe : 8.78779687818117
fx : 8.78779687818117
fyi : 6.536505079574676
fyi__çî__he : 8.78779687818117
g0 : 8.78779687818117
g208 : 8.78779687818117
ga : 8.78779687818117
gabi : 7.871506146307016
gables : 8.78779687818117
gabriel : 8.094649697621225
gabrielle : 8.78779687818117
gaby : 7.283719481404897
gabys : 8.78779687818117
gadets : 8.78779687818117
gadgets : 8.78779687818117
gads : 8.78779687818117
gag : 8.78779687818117
gaggle : 8.78779687818117
gahr : 8.78779687818117
gail : 8.78779687818117
gain : 6.841886729125858
gained : 7.6891845895130615
gaining : 8.094649697621225
gaiting : 8.78779687818117
gal : 8.094649697621225
gala : 8.382331770073007
gale : 8.3823317700730

gratis : 8.094649697621225
gratitude : 8.78779687818117
gratuities : 7.6891845895130615
gratuity : 7.178358965747071
gratutities : 8.78779687818117
grauman : 8.382331770073007
grave : 8.094649697621225
gravel : 8.382331770073007
gravely : 8.78779687818117
graveyard : 8.094649697621225
gravina : 8.78779687818117
gravol : 8.382331770073007
gravy : 8.78779687818117
gray : 8.094649697621225
grayish : 8.78779687818117
grayline : 8.78779687818117
graze : 8.382331770073007
grazie : 8.382331770073007
greaaaat : 8.78779687818117
gread : 8.78779687818117
grease : 7.535033909685803
greasy : 6.5905723008449515
great : 1.810049227378999
great4 : 8.78779687818117
great__ç : 8.382331770073007
great__çî_ : 8.78779687818117
great__çî_êarge : 8.78779687818117
greated : 7.6891845895130615
greater : 7.283719481404897
greatest : 5.870026146096892
greatful : 8.094649697621225
greatfun : 8.78779687818117
greatgood : 8.78779687818117
greaticed : 8.78779687818117
greatjapanese : 8.78779687818117
greatly : 6.01

heritage : 8.78779687818117
herman : 8.78779687818117
hermes : 8.78779687818117
hermetically : 8.78779687818117
hernandez : 8.78779687818117
hero : 8.382331770073007
heroic : 8.78779687818117
heroin : 8.382331770073007
herpack : 8.78779687818117
hertz : 8.78779687818117
hesitant : 6.841886729125858
hesitantly : 8.78779687818117
hesitate : 5.529700340159689
hesitated : 8.094649697621225
hesitating : 8.78779687818117
hesitation : 6.113648228754642
hesitations : 8.382331770073007
hestitation : 8.78779687818117
heterosexual : 8.382331770073007
heven : 8.78779687818117
hey : 5.696754424822855
hey__ç : 8.78779687818117
hgc : 8.78779687818117
hh : 8.382331770073007
hhonor : 8.78779687818117
hhonors : 7.6891845895130615
hi : 6.185107192736787
hibacchi : 8.78779687818117
hibachi : 7.871506146307016
hibatchi : 8.78779687818117
hibiscus : 7.6891845895130615
hiccaps : 8.78779687818117
hiccups : 8.78779687818117
hickson : 8.78779687818117
hid : 8.382331770073007
hidden : 5.954583534124955
hiddeous 

iceskating : 8.78779687818117
icing : 7.178358965747071
ick : 8.094649697621225
icon : 8.78779687818117
iconic : 8.78779687818117
id : 6.389901605382801
idea : 4.621131654379444
idead : 8.78779687818117
ideal : 5.026596762487609
ideally : 6.485211785187126
ideas : 7.283719481404897
identical : 7.401502517061281
identicial : 8.78779687818117
identifiable : 8.78779687818117
identification : 8.78779687818117
identified : 8.094649697621225
identifies : 8.78779687818117
identify : 7.871506146307016
identifying : 8.094649697621225
identity : 8.382331770073007
idiocrincies : 8.78779687818117
idiosyncrasies : 8.78779687818117
idiot : 8.094649697621225
idiotic : 8.78779687818117
idiots : 8.78779687818117
idling : 8.382331770073007
ido : 8.78779687818117
idyllic : 8.78779687818117
ie : 8.094649697621225
if : 4.598142136154745
ifa : 8.094649697621225
ifc : 8.78779687818117
iffy : 7.535033909685803
ifound : 8.78779687818117
ight : 8.78779687818117
ignacio : 8.78779687818117
ignasio : 8.78779687818

inter : 8.78779687818117
interact : 7.871506146307016
interacted : 8.382331770073007
interacting : 8.382331770073007
interaction : 7.6891845895130615
interactions : 8.382331770073007
interactive : 8.094649697621225
intercepted : 8.78779687818117
interchange : 8.78779687818117
interconnecting : 8.094649697621225
intercontential : 8.382331770073007
interconti : 8.78779687818117
intercontinental : 5.870026146096892
intercontis : 8.78779687818117
interconty : 8.78779687818117
interesed : 8.78779687818117
interested : 5.353809673696025
interesting : 5.2182641816998006
interestingly : 8.78779687818117
interests : 8.382331770073007
interfer : 8.78779687818117
interfere : 8.78779687818117
interfered : 8.78779687818117
interferences : 8.78779687818117
interferes : 8.382331770073007
interfering : 8.78779687818117
interim : 8.78779687818117
interior : 5.5689210533129705
interiors : 8.78779687818117
interlude : 8.78779687818117
interminable : 8.78779687818117
intermixed : 8.78779687818117
internal

kahala : 6.996037408953116
kailua : 8.78779687818117
kaiser : 8.78779687818117
kaiulani : 8.78779687818117
kalakaua : 8.78779687818117
kalakeua : 8.78779687818117
kalekahua : 8.78779687818117
kalia : 8.78779687818117
kalika : 8.78779687818117
kamil : 8.78779687818117
kamlyn : 8.78779687818117
kande : 8.78779687818117
kanji : 8.78779687818117
kannapali : 8.78779687818117
kansas : 8.094649697621225
kantstrasse : 8.78779687818117
kapahulu : 8.382331770073007
kapiolani : 7.871506146307016
karaoke : 7.401502517061281
karaoked : 8.78779687818117
karen : 8.094649697621225
kareoke : 8.78779687818117
kareokee : 8.78779687818117
karima : 8.78779687818117
karissa : 8.78779687818117
karoke : 7.535033909685803
karona : 8.78779687818117
karstadt : 8.78779687818117
kasalta : 8.382331770073007
kat : 8.78779687818117
kate : 8.094649697621225
katerina : 8.78779687818117
katherine : 8.78779687818117
kathleen : 8.382331770073007
kathy : 8.78779687818117
katie : 8.382331770073007
katrina : 6.34544984281196

letter : 5.81738241261147
letters : 7.6891845895130615
letting : 6.389901605382801
lettuce : 6.996037408953116
level : 4.276937371664321
level5 : 8.78779687818117
levels : 6.079746677078961
lever : 8.78779687818117
leverage : 8.78779687818117
lewers : 8.094649697621225
lex : 8.78779687818117
lexington : 7.871506146307016
leyva : 8.78779687818117
lg : 8.78779687818117
lga : 8.78779687818117
lhow : 8.78779687818117
lhw : 8.78779687818117
liability : 7.871506146307016
liable : 8.094649697621225
liars : 8.78779687818117
liberal : 8.78779687818117
liberally : 8.78779687818117
liberty : 6.841886729125858
library : 5.79206460462718
libres : 8.78779687818117
lice : 8.382331770073007
licence : 8.78779687818117
license : 8.78779687818117
licensing : 8.382331770073007
licey : 8.094649697621225
licience : 8.78779687818117
lick : 7.401502517061281
licking : 8.78779687818117
lid : 8.094649697621225
lidl : 8.78779687818117
lido : 8.094649697621225
lids : 8.78779687818117
lie : 5.984436497274636
lied 

makeoverat : 8.78779687818117
maker : 5.652302662252021
makers : 8.094649697621225
makes : 4.3629502463243615
makeshift : 8.78779687818117
makesone : 8.78779687818117
maketh : 8.78779687818117
makeup : 7.283719481404897
making : 4.064843656536697
makinig : 8.78779687818117
malaise : 8.78779687818117
malaria : 7.6891845895130615
malasadas : 8.78779687818117
malave : 8.78779687818117
malaysia : 8.382331770073007
malaysian : 8.382331770073007
maldives : 8.382331770073007
male : 6.485211785187126
maleria : 8.78779687818117
males : 8.382331770073007
maleteros : 8.78779687818117
malfunctioned : 8.094649697621225
malfunctioning : 7.535033909685803
malibu : 8.78779687818117
mall : 5.4919600121768415
mallorca : 8.382331770073007
mallorquina : 8.78779687818117
malls : 7.535033909685803
malmaison : 8.78779687818117
maltreated : 8.78779687818117
malts : 8.78779687818117
mama : 7.535033909685803
mamajuana : 8.094649697621225
mamas : 8.382331770073007
mambas : 8.78779687818117
mambo : 8.787796878181

mingle : 7.535033909685803
mingles : 8.78779687818117
mini : 4.239197043681473
miniature : 8.382331770073007
miniba : 8.78779687818117
minibar : 5.3700701945678055
minibars : 8.78779687818117
minibus : 8.78779687818117
miniclub : 8.78779687818117
minifridge : 7.871506146307016
minifridges : 8.78779687818117
minifrig : 8.78779687818117
minifrige : 8.78779687818117
minimal : 6.222847520719634
minimalism : 8.78779687818117
minimalist : 6.841886729125858
minimalistic : 8.094649697621225
minimally : 8.78779687818117
minimarket : 8.382331770073007
minimilist : 8.78779687818117
minimised : 8.78779687818117
minimises : 8.78779687818117
minimize : 8.78779687818117
minimo : 8.78779687818117
minimum : 6.046956854255971
minimumly : 8.78779687818117
minimums : 8.78779687818117
miniscule : 7.535033909685803
ministry : 8.78779687818117
minites : 8.78779687818117
miniutes : 8.78779687818117
minivan : 7.871506146307016
minmim : 8.78779687818117
minnesota : 8.094649697621225
minoirity : 8.78779687818117

natural : 5.84335789901473
naturally : 7.283719481404897
naturapark : 8.78779687818117
nature : 6.389901605382801
natureproblems : 8.78779687818117
naught : 8.382331770073007
naughty : 8.78779687818117
nausea : 8.094649697621225
nauseous : 8.78779687818117
nauseously : 8.78779687818117
nauseus : 8.78779687818117
nautical : 8.382331770073007
navel : 8.78779687818117
navera : 8.78779687818117
naviete : 8.78779687818117
navigate : 6.996037408953116
navigating : 7.6891845895130615
navy : 8.78779687818117
nawlins : 8.78779687818117
nazi : 8.382331770073007
nazionale : 8.78779687818117
nb : 8.78779687818117
nba : 8.78779687818117
nbc : 8.78779687818117
nbot : 8.78779687818117
nc : 8.382331770073007
ncp : 8.382331770073007
ne : 8.78779687818117
neaby : 8.78779687818117
neagtive : 8.78779687818117
nealry : 8.78779687818117
near : 3.6201578352752506
nearby : 4.3629502463243615
nearbye : 8.78779687818117
nearer : 7.178358965747071
nearest : 6.436421621017693
nearly : 5.0742248114768636
neat : 5.

oder : 8.78779687818117
odor : 5.925595997251703
odors : 8.094649697621225
odour : 7.871506146307016
odours : 8.78779687818117
odyssey : 8.382331770073007
oenophile : 8.78779687818117
oerurves : 8.78779687818117
oeuvre : 8.78779687818117
oeuvres : 7.535033909685803
of : 6.536505079574676
ofbeautiful : 8.78779687818117
ofcommunication : 8.78779687818117
off : 5.549118426016791
off__ç : 8.78779687818117
offale : 8.78779687818117
offend : 8.78779687818117
offended : 7.6891845895130615
offending : 8.78779687818117
offends : 8.78779687818117
offensive : 7.6891845895130615
offer : 4.047222055186877
offerd : 8.382331770073007
offered : 3.9202624277255884
offeres : 8.78779687818117
offering : 6.079746677078961
offerings : 7.178358965747071
offerred : 8.78779687818117
offers : 5.0382928022508
offfered : 8.78779687818117
offhand : 8.78779687818117
offi : 8.78779687818117
offical : 8.78779687818117
office : 5.176878965536947
officemax : 8.78779687818117
officer : 7.6891845895130615
officers : 8.3

owe : 7.871506146307016
owed : 8.094649697621225
owes : 8.78779687818117
owl : 8.094649697621225
own : 7.401502517061281
own_ : 8.78779687818117
owned : 6.079746677078961
owner : 5.652302662252021
owners : 5.696754424822855
ownership : 7.401502517061281
owns : 7.401502517061281
oxfam : 8.78779687818117
oxford : 7.535033909685803
oxidized : 8.78779687818117
oyster : 8.382331770073007
oysters : 8.78779687818117
oz : 7.6891845895130615
pa : 7.871506146307016
pablo : 8.094649697621225
pac : 8.78779687818117
pace : 7.083048785942746
paced : 8.78779687818117
paces : 8.78779687818117
pacha : 8.382331770073007
pacient : 8.78779687818117
pacific : 6.6477307146849
pack : 5.58912376063049
package : 4.644662151789639
package__ç : 8.78779687818117
packaged : 8.094649697621225
packages : 6.708355336501335
packed : 5.353809673696025
packer : 8.78779687818117
packers : 8.382331770073007
packet : 7.401502517061281
packets : 7.6891845895130615
packing : 7.178358965747071
packs : 7.283719481404897
pad : 

phillip : 8.78779687818117
phillipe : 8.78779687818117
phillips : 8.78779687818117
philly : 8.094649697621225
philosophies : 8.78779687818117
philosophy : 8.382331770073007
philthy : 8.78779687818117
phobe : 8.78779687818117
phobia : 8.78779687818117
phobic : 8.78779687818117
phoenician : 7.871506146307016
phoenix : 6.436421621017693
phone : 3.9554911196093325
phonecall : 8.78779687818117
phonecalls : 8.78779687818117
phoned : 6.485211785187126
phones : 6.302890228393171
phoning : 7.871506146307016
phony : 8.382331770073007
phosphorus : 8.78779687818117
photgrapher : 8.78779687818117
photgraphy : 8.78779687818117
photo : 6.436421621017693
photocopies : 8.78779687818117
photogenic : 8.78779687818117
photograper : 8.78779687818117
photograph : 8.78779687818117
photographer : 7.401502517061281
photographers : 8.78779687818117
photographing : 8.78779687818117
photographs : 8.094649697621225
photograpy : 8.78779687818117
photons : 8.78779687818117
photos : 5.925595997251703
phrase : 7.40150

premo : 8.78779687818117
preoccupied : 8.094649697621225
preordered : 8.78779687818117
prep : 8.094649697621225
prepackaged : 8.78779687818117
prepaid : 6.5905723008449515
preparation : 7.178358965747071
prepard : 8.78779687818117
prepare : 6.185107192736787
prepared : 4.598142136154745
preparing : 7.871506146307016
prepay : 8.382331770073007
prepaying : 8.78779687818117
prepayment : 8.382331770073007
preperation : 8.78779687818117
preplanning : 8.78779687818117
prepositioned : 8.78779687818117
preprared : 8.78779687818117
pres : 7.401502517061281
prescription : 8.382331770073007
presdential : 8.78779687818117
presedente : 8.094649697621225
presence : 6.841886729125858
present : 6.046956854255971
presentable : 8.094649697621225
presentation : 5.954583534124955
presentations : 7.535033909685803
presented : 5.870026146096892
presenters : 8.78779687818117
presenting : 8.094649697621225
presents : 8.094649697621225
preservance : 8.78779687818117
preservation : 8.78779687818117
preserve : 8

rainstorm : 8.78779687818117
rainy : 6.996037408953116
raise : 8.094649697621225
raised : 7.283719481404897
raisin : 8.78779687818117
raising : 7.6891845895130615
raisins : 8.382331770073007
raj : 8.78779687818117
rake : 8.094649697621225
raked : 7.401502517061281
rakes : 8.78779687818117
raking : 8.094649697621225
rallies : 8.78779687818117
ralph : 8.382331770073007
ramada : 7.401502517061281
ramadas : 8.78779687818117
rambla : 6.91599470127958
ramblas : 6.01520815594139
rambles : 8.78779687818117
rambling : 8.78779687818117
ramlas : 8.78779687818117
ramon : 8.382331770073007
ramone : 8.78779687818117
ramp : 7.401502517061281
rampage : 8.78779687818117
rampant : 8.094649697621225
ramps : 8.382331770073007
ran : 5.0382928022508
ranch : 7.6891845895130615
rancho : 8.382331770073007
rancid : 8.094649697621225
random : 6.772893857638906
randomly : 7.535033909685803
rang : 6.185107192736787
range : 5.3220609753814445
ranged : 6.708355336501335
ranges : 7.871506146307016
rangetop : 8.787796

replaces : 8.78779687818117
replacing : 7.083048785942746
replanted : 8.78779687818117
replellent : 8.78779687818117
replenish : 7.535033909685803
replenished : 6.6477307146849
replenishes : 8.78779687818117
replete : 8.78779687818117
replica : 8.78779687818117
replicate : 8.78779687818117
replicated : 8.78779687818117
replied : 6.345449842811966
reply : 6.302890228393171
repond : 8.78779687818117
reponded : 8.78779687818117
report : 5.652302662252021
reported : 5.719743943047554
reporting : 7.535033909685803
reports : 6.536505079574676
repremand : 8.78779687818117
represent : 8.094649697621225
representable : 8.78779687818117
representative : 6.148739548565913
representatives : 7.6891845895130615
represented : 7.401502517061281
representing : 8.382331770073007
represents : 8.78779687818117
reprobate : 8.78779687818117
reproduce : 8.78779687818117
reproductive : 8.78779687818117
reprogram : 8.78779687818117
reprogrammed : 8.094649697621225
reproted : 8.78779687818117
reps : 6.647730714

rocky : 7.178358965747071
rod : 7.535033909685803
rode : 6.841886729125858
rodent : 8.78779687818117
rodeo : 7.6891845895130615
rodriguez : 8.78779687818117
rods : 8.78779687818117
roemer : 8.78779687818117
roger : 8.78779687818117
rogers : 8.78779687818117
roh : 8.78779687818117
roland : 8.78779687818117
rolando : 8.78779687818117
role : 7.535033909685803
roles : 8.78779687818117
roll : 5.897425120285006
rollaway : 7.178358965747071
rolled : 6.708355336501335
roller : 7.871506146307016
rollers : 8.78779687818117
rolling : 7.401502517061281
rolls : 6.222847520719634
rolls__çî_ : 8.78779687818117
roma : 8.382331770073007
romaine : 8.382331770073007
roman : 8.78779687818117
romana : 7.283719481404897
romance : 7.871506146307016
romancecons : 8.78779687818117
romancing : 8.78779687818117
romano : 8.78779687818117
romantic : 4.8365531595997435
romantice : 8.78779687818117
romantico : 7.083048785942746
romantics : 8.78779687818117
romantique : 8.78779687818117
romas : 8.78779687818117
romat

scotia : 8.78779687818117
scotland : 7.401502517061281
scott : 8.78779687818117
scottish : 8.78779687818117
scotts : 7.871506146307016
scottsdale : 7.178358965747071
scoured : 8.78779687818117
scout : 8.78779687818117
scouted : 8.78779687818117
scouting : 8.78779687818117
scrabble : 8.78779687818117
scrambed : 8.78779687818117
scramble : 7.871506146307016
scrambled : 6.436421621017693
scrape : 8.78779687818117
scraped : 8.382331770073007
scrapes : 8.78779687818117
scraps : 8.382331770073007
scratch : 7.6891845895130615
scratched : 7.283719481404897
scratches : 7.871506146307016
scratching : 7.401502517061281
scratchy : 7.6891845895130615
screaching : 8.78779687818117
scream : 7.6891845895130615
screamed : 7.6891845895130615
screaming : 6.262068233872916
screaminig : 8.78779687818117
screams : 7.871506146307016
screeching : 8.382331770073007
screen : 4.970084552224266
screened : 8.78779687818117
screens : 6.996037408953116
screming : 8.78779687818117
screw : 6.91599470127958
screwed : 6

sill : 8.78779687818117
silly : 6.302890228393171
silver : 6.389901605382801
silverjet : 8.78779687818117
silvermine : 8.78779687818117
silversmith : 8.78779687818117
silverware : 7.083048785942746
sily : 8.78779687818117
sim : 8.78779687818117
similar : 5.204277939725062
similarities : 8.78779687818117
similarly : 7.535033909685803
similiar : 7.871506146307016
simlar : 8.78779687818117
simmering : 8.78779687818117
simmilar : 8.78779687818117
simone : 8.382331770073007
simple : 5.026596762487609
simpler : 8.78779687818117
simplest : 7.871506146307016
simplicity : 8.78779687818117
simply : 4.553690373583912
simpply : 8.78779687818117
simpsons : 8.78779687818117
simular : 8.78779687818117
simultaneously : 7.871506146307016
sin : 8.094649697621225
since : 7.535033909685803
sincerely : 6.996037408953116
sincerity : 8.78779687818117
sine : 8.78779687818117
sing : 7.083048785942746
singapore : 5.79206460462718
singaporean : 8.78779687818117
singaporeans : 8.382331770073007
singaporei : 8.787

specatacular : 8.78779687818117
specatcular : 8.78779687818117
special : 3.882522099742742
specialised : 8.78779687818117
specialist : 8.094649697621225
specialists : 8.382331770073007
specialities : 7.871506146307016
speciality : 6.996037408953116
specializing : 8.78779687818117
specially : 7.178358965747071
specials : 6.996037408953116
specialthe : 8.78779687818117
specialties : 8.382331770073007
specialty : 6.046956854255971
specialy : 8.78779687818117
species : 8.094649697621225
specifcally : 8.78779687818117
specific : 6.185107192736787
specifically : 5.767371992036809
specification : 8.78779687818117
specifichotel : 8.78779687818117
specified : 7.6891845895130615
specify : 8.382331770073007
specilaity : 8.78779687818117
specilist : 8.78779687818117
specks : 8.78779687818117
spectaclar : 8.78779687818117
spectacle : 8.78779687818117
spectactular : 8.78779687818117
spectacular : 5.050127259897803
spectacularl : 8.78779687818117
spectular : 8.094649697621225
speculate : 8.7877968781

stretches : 8.094649697621225
stretching : 7.535033909685803
strewn : 7.871506146307016
strewth : 8.78779687818117
strick : 8.78779687818117
stricken : 8.78779687818117
strict : 7.535033909685803
strictly : 7.6891845895130615
stride : 8.78779687818117
strident : 8.78779687818117
strides : 8.78779687818117
strike : 7.6891845895130615
strikes : 8.094649697621225
striking : 7.6891845895130615
string : 7.6891845895130615
stringent : 8.78779687818117
strings : 8.78779687818117
stringy : 8.78779687818117
strip : 5.897425120285006
stripe : 8.78779687818117
striped : 8.78779687818117
stripey : 8.78779687818117
stripped : 7.871506146307016
stripping : 8.78779687818117
strips : 8.382331770073007
strive : 8.094649697621225
strives : 8.78779687818117
striving : 8.78779687818117
stroh : 8.78779687818117
strokes : 8.78779687818117
strole : 8.78779687818117
stroll : 6.079746677078961
strolled : 8.78779687818117
stroller : 8.382331770073007
strollers : 8.78779687818117
strolling : 8.382331770073007
st

tax : 5.954583534124955
taxed : 8.78779687818117
taxes : 5.984436497274636
taxi : 4.381077630916918
taxicab : 8.78779687818117
taxies : 8.78779687818117
taxing : 8.382331770073007
taxis : 5.652302662252021
tay : 8.382331770073007
taylor : 8.78779687818117
tazo : 8.78779687818117
tbr : 8.78779687818117
tc : 8.78779687818117
tchoupitoulas : 8.78779687818117
tcm : 8.78779687818117
te : 8.78779687818117
tea : 4.532184168362948
teabags : 8.78779687818117
teach : 6.996037408953116
teacher : 8.382331770073007
teachers : 8.78779687818117
teaching : 8.382331770073007
teak : 8.78779687818117
teal : 8.78779687818117
team : 5.5689210533129705
team__ç_é_ : 8.78779687818117
teams : 8.382331770073007
teapot : 8.78779687818117
tear : 6.996037408953116
tears : 7.283719481404897
teas : 6.91599470127958
teaspoon : 8.78779687818117
tech : 7.283719481404897
techical : 8.78779687818117
techie : 8.78779687818117
technical : 7.6891845895130615
technically : 7.871506146307016
technican : 8.78779687818117
techn

tiolet : 8.78779687818117
tip : 4.0827813572233635
tipers : 8.78779687818117
tipped : 5.098917424067235
tipper : 8.094649697621225
tipping : 5.549118426016791
tippled : 8.78779687818117
tippy : 8.78779687818117
tips : 4.927067167140576
tipsthe : 8.78779687818117
tipsy : 8.78779687818117
tipthe : 8.78779687818117
tiramisu : 8.78779687818117
tire : 7.6891845895130615
tired : 4.405770243507289
tirelessly : 8.094649697621225
tires : 8.382331770073007
tiring : 7.178358965747071
tissue : 7.178358965747071
tissues : 8.094649697621225
tissume : 8.78779687818117
title : 7.6891845895130615
titled : 8.78779687818117
titles : 8.382331770073007
tito : 8.78779687818117
tix : 8.78779687818117
tjhoroughfare : 8.78779687818117
tlc : 8.094649697621225
tmb : 8.78779687818117
tneed : 8.78779687818117
tnt : 7.871506146307016
to : 5.455592368005967
to4 : 8.78779687818117
to8 : 8.78779687818117
toady : 8.78779687818117
toast : 5.5689210533129705
toasted : 8.382331770073007
toaster : 7.178358965747071
toastin

uconn : 8.78779687818117
ucsf : 8.78779687818117
udge : 8.78779687818117
udine : 8.78779687818117
uds : 8.78779687818117
ueno : 8.78779687818117
ufff : 8.78779687818117
uffizi : 6.485211785187126
uffizzi : 8.382331770073007
uffzi : 8.78779687818117
ufizzi : 8.382331770073007
ugggg : 8.78779687818117
ugh : 7.283719481404897
ughh : 8.78779687818117
uglier : 8.78779687818117
ugly : 5.81738241261147
uglyiest : 8.78779687818117
ugraded : 8.78779687818117
uh : 8.382331770073007
uhm : 8.78779687818117
uht : 8.78779687818117
ujs : 8.78779687818117
uk : 5.529700340159689
ultimate : 7.401502517061281
ultimately : 7.283719481404897
ultra : 6.389901605382801
um : 7.6891845895130615
umberella : 8.78779687818117
umbrealla : 8.78779687818117
umbrella : 6.302890228393171
umbrellas : 6.222847520719634
umm : 8.382331770073007
ummmm : 8.78779687818117
umms : 8.78779687818117
umo : 8.78779687818117
umpleseant : 8.78779687818117
umpteen : 8.78779687818117
ums : 8.78779687818117
un : 7.083048785942746
unaba

useful : 5.925595997251703
usefull : 8.78779687818117
useing : 8.78779687818117
useless : 6.345449842811966
uselessly : 8.78779687818117
uselessness : 8.78779687818117
user : 7.178358965747071
users : 7.178358965747071
uses : 6.996037408953116
usfrom : 8.78779687818117
usher : 8.78779687818117
ushered : 8.382331770073007
ushering : 8.78779687818117
using : 4.628913794821499
usopen : 8.78779687818117
uss : 8.78779687818117
ussr : 8.78779687818117
ussual : 8.78779687818117
ust : 8.382331770073007
usthe : 8.78779687818117
usual : 5.086494904068678
usually : 4.437518941821869
usuals : 8.78779687818117
usualy : 8.382331770073007
ususal : 8.382331770073007
uswe : 8.78779687818117
utell : 8.78779687818117
utencils : 8.78779687818117
utensils : 6.708355336501335
utentils : 8.78779687818117
utilitarian : 8.78779687818117
utilities : 8.382331770073007
utility : 7.871506146307016
utilization : 8.78779687818117
utilize : 8.094649697621225
utilized : 7.401502517061281
utilizing : 8.78779687818117
u

waters : 6.302890228393171
waterside : 8.78779687818117
waterslide : 7.6891845895130615
watersport : 8.382331770073007
watersports : 7.083048785942746
watertown : 8.382331770073007
watery : 7.871506146307016
watford : 8.78779687818117
wathc : 8.78779687818117
watied : 8.78779687818117
watmmense : 8.78779687818117
watt : 8.382331770073007
wave : 6.91599470127958
waved : 7.6891845895130615
waverunners : 8.78779687818117
waves : 5.27625143935015
wavied : 8.78779687818117
waving : 8.382331770073007
wavy : 8.78779687818117
wax : 8.094649697621225
waxy : 8.78779687818117
way : 2.689722596014931
wayall : 8.78779687818117
wayne : 8.094649697621225
ways : 5.870026146096892
wayscamp : 8.78779687818117
wayward : 8.78779687818117
waywith : 8.78779687818117
wayy : 8.78779687818117
wayyyyy : 8.78779687818117
wayyyyyyyyyyyy : 8.78779687818117
wc : 7.871506146307016
wd : 8.78779687818117
we : 3.3540748746269315
we__ç_é : 7.6891845895130615
we__ç_éèe : 7.401502517061281
we__ç_éö : 7.283719481404897
wea

yoou : 8.78779687818117
yor : 8.78779687818117
yore : 8.78779687818117
york : 4.345145621690854
yorker : 7.871506146307016
yorkers : 7.871506146307016
yorks : 8.78779687818117
yory : 8.78779687818117
yosemite : 8.78779687818117
you : 5.026596762487609
you__ç : 8.78779687818117
you__ç_é : 8.094649697621225
you__ç_éèe : 6.5905723008449515
you__ç_éêl : 6.996037408953116
you__ç_éö : 7.6891845895130615
you__çî_ : 8.78779687818117
you__çî_à__ç_é : 8.78779687818117
youall : 8.78779687818117
youd : 8.78779687818117
youg : 8.78779687818117
yougert : 8.78779687818117
youll : 7.871506146307016
young : 4.553690373583912
younger : 6.345449842811966
youngest : 7.6891845895130615
youngsters : 8.382331770073007
younow : 8.78779687818117
youomewhere : 8.78779687818117
your : 7.6891845895130615
youre : 8.094649697621225
yourfeet : 8.78779687818117
yours : 8.78779687818117
yourself : 7.283719481404897
youself : 8.382331770073007
youth : 7.401502517061281
youthful : 8.78779687818117
youths : 8.78779687818

In [23]:
print('\ntf-idf value:')
print(result)
 
# in matrix form
print('\ntf-idf values in matrix form:')
print(result.toarray())


tf-idf value:
  (0, 4208)	0.10309075931174097
  (0, 5287)	0.12737951594411567
  (0, 13129)	0.11026591478477563
  (0, 6575)	0.1621409594416718
  (0, 6683)	0.12720359198079154
  (0, 21169)	0.12327196637399938
  (0, 25759)	0.24443716765882353
  (0, 22944)	0.1413831924033372
  (0, 14311)	0.18739852244486097
  (0, 24536)	0.12063662141488016
  (0, 3828)	0.06535240107253559
  (0, 2675)	0.08493198751799264
  (0, 3631)	0.07961679229004627
  (0, 10171)	0.14882288528308396
  (0, 23398)	0.0902321274164432
  (0, 13230)	0.2490488632447211
  (0, 7257)	0.05615492900097509
  (0, 10662)	0.0725440056242383
  (0, 4805)	0.11391661682438758
  (0, 10597)	0.08597715815240092
  (0, 4902)	0.09983223254537006
  (0, 10991)	0.1334385807641101
  (0, 9150)	0.1122956791343086
  (0, 24487)	0.15193146983787312
  (0, 21997)	0.04697628475379618
  :	:
  (4820, 6338)	0.09281359161937072
  (4820, 6093)	0.06242455269708887
  (4820, 3010)	0.07474169226624384
  (4820, 17478)	0.03323440105081049
  (4820, 17132)	0.0717697656653

In [20]:
# create the model 
from sklearn import svm
clf_svm= svm.SVC(kernel="linear")
clf_svm.fit(x_train_vec,y_train)

SVC(kernel='linear')

In [21]:
# see accuracy
clf_svm.score(x_test_vec,y_test)

0.9639303482587065

In [22]:
from sklearn.metrics import f1_score
f1_score(y_test,clf_svm.predict(x_test_vec),average= None)

array([0.96375   , 0.96410891])

In [29]:
#test the model with sample text
rev=["this hotel is nice.I just love it, highly recommended"]
rec_vec=tfidf.transform(rev)
clf_svm.predict(rec_vec)

array(['Positive'], dtype=object)

In [27]:
#test the model with sample text
rev=["absolulatey hated this hotel, horrible food"]
rec_vec=tfidf.transform(rev)
clf_svm.predict(rec_vec)

array(['Negative'], dtype=object)

In [25]:
#test the model with sample text
r=["I like the hotel.It is beautiful.Must visit"]
rec_v=tfidf.transform(r)
clf_svm.predict(rec_v)

array(['Positive'], dtype=object)