In [8]:
import pandas as pd
import numpy as np
import torch
from torchtext import datasets
import random
import nltk
from nltk.corpus import stopwords
from  nltk.stem import SnowballStemmer
import re
from sklearn.model_selection import train_test_split


SEED=42
TEST_SIZE=0.2

In [2]:
DATASET_COLUMNS = ["target", "ids", "date", "flag", "user", "text"]
DATASET_ENCODING = "ISO-8859-1"



df = pd.read_csv("../data/training.1600000.processed.noemoticon.csv", encoding =DATASET_ENCODING , names=DATASET_COLUMNS)

data=pd.DataFrame()
data["text"]=df["text"]
data["target"]=df["target"]

### Equal Number of Negative and Positive Tweet

In [3]:
df.groupby("target").size()

target
0    800000
4    800000
dtype: int64

In [4]:
nltk.download('stopwords')
torch.manual_seed(SEED)
torch.backends.cudnn.deterministic = True

[nltk_data] Downloading package stopwords to
[nltk_data]     /Users/shaunkim/nltk_data...
[nltk_data]   Package stopwords is already up-to-date!


In [5]:
decode_map = {0: "NEGATIVE", 2: "NEUTRAL", 4: "POSITIVE"}

def decode_sentiment(label):
    return decode_map[int(label)]
data.target = data.target.apply(lambda x: decode_sentiment(x))

In [12]:
stop_words = stopwords.words("english")
stemmer = SnowballStemmer("english")

TEXT_CLEANING_RE = "@\S+|https?:\S+|http?:\S|[^A-Za-z0-9]+"


def preprocess(text, stem=False):
    text = re.sub(TEXT_CLEANING_RE, ' ', str(text).lower()).strip()
    tokens = []
    for token in text.split():
        if token not in stop_words:
            if stem:
                tokens.append(stemmer.stem(token))
            else:
                tokens.append(token)
            print(token)
    return " ".join(tokens)

data.text = data.text.apply(lambda x: preprocess(x))

awww
bummer
shoulda
got
david
carr
third
day
upset
update
facebook
texting
might
cry
result
school
today
also
blah
dived
many
times
ball
managed
save
50
rest
go
bounds
whole
body
feels
itchy
like
fire
behaving
mad
see
whole
crew
need
hug
hey
long
time
see
yes
rains
bit
bit
lol
fine
thanks
nope
que
muera
spring
break
plain
city
snowing
pierced
ears
bear
watch
thought
ua
loss
embarrassing
counts
idk
either
never
talk
anymore
would
first
gun
really
though
zac
snyder
doucheclown
wish
got
watch
miss
iamlilnicki
premiere
hollis
death
scene
hurt
severely
watch
film
wry
directors
cut
file
taxes
ahh
ive
always
wanted
see
rent
love
soundtrack
oh
dear
drinking
forgotten
table
drinks
day
get
much
done
one
friend
called
asked
meet
mid
valley
today
time
sigh
baked
cake
ated
week
going
hoped
blagh
class
8
tomorrow
hate
call
wake
people
going
cry
sleep
watching
marley
im
sad
miss
lilly
ooooh
lol
leslie
ok
leslie
get
mad
meh
almost
lover
exception
track
gets
depressed
every
time
some1
hacked
account
ai

forget
8th
april
amp
13th
july
dierks
bentley
comin
columbus
oh
wanna
go
bad
take
sidekick
back
congrats
totally
jealous
wish
xm
working
gr8t
face
itchy
poor
socks
luvvvvv
golden
retriever
want
one
sighhhh
saw
found
tracy
girl
piece
luggage
fucking
terrible
aaaaand
nausea
back
ooh
excited
even
going
2
long
love
youtube
spent
1
hour
reach
axis
bank
find
today
holiday
mahavir
jayanti
contd
agree
jobros
dont
update
theres
often
hilarious
linked
clip
lj
time
ago
went
back
dead
link
oooooooo
im
neither
thats
need
study
tweeted
nearly
day
posted
website
tonight
hopefully
goes
well
night
time
miss
bentley
seriously
needs
finish
job
applications
son
vincas
sick
stay
home
three
tense
days
work
back
holiday
kids
whinging
client
amp
boss
understand
english
well
rewrote
text
unreadable
written
v
good
writer
amp
reviewed
correctly
want
ever
punch
sooo
sick
snow
ughh
work
fan
upset
would
like
apologize
repeated
video
games
live
related
tweets
going
stern
discussion
koodo
soon
stern
cant
figure
get
b

drain
fired
haz
1
job
2
amp
iz
fail
got
drano
ass
amp
iz
still
draining
wanna
shower
dangit
stuck
home
mine
1
10
get
duckling
famous
children
book
stolen
boston
public
garden
boston
globe
via
sharethis
oh
thank
however
hate
list
includes
2
convicts
heading
altrincham
hours
install
morning
good
im
bloody
knackered
work
today
helppp
xxx
garage
park
driveway
happened
quot
popular
music
quot
w
adorno
probably
difficult
reading
ever
prescribed
actually
struggling
continue
cant
see
flowers
falling
dont
camera
cellphone
good
liking
snow
right
getting
used
nice
spring
like
weather
pity
youtube
currently
blocked
china
see
vids
happened
show
hightlight
life
best
leather
sofa
world
office
though
means
still
working
still
3
days
internet
gets
uncapped
get
better
days
could
something
lodged
belly
love
atekinzz
much
amp
amp
soo
miss
wanna
sneak
zoo
play
kitties
oh
hope
getting
sick
dont
think
cause
cousins
birthday
party
sweet
little
man
fell
asleep
waiting
daddy
big
brother
get
home
poor
baby
misse

everytime
click
twitter
thing
myspace
goes
dude
page
horrible
sorryto
hear
cant
find
says
dtmafiaofficial
doesnt
exist
jus
1
dtmafia
found
n
u
dun
seem
b
followin
wht
thought
would
support
augh
eff
sarth
stole
mil
nail
polish
pretty
wishes
spring
fling
tour
dawn
amp
neecee
sigh
g
knight
hoyts
distribution
nz
website
working
great
like
need
like
first
movie
cillian
murphy
hot
wishes
good
old
cartoons
come
back
ie
captain
planet
wally
daria
sadness
feeling
v
good
abt
got
text
sarah
another
day
centre
point
time
early
start
guessing
train
rammed
commuters
four
games
fall
modern
warfare
2
halo
3
odst
brutal
legend
bioshock
2
need
cash
ugh
disconcerting
actually
whole
site
finally
taken
damn
russians
tweets
arent
going
finished
delicious
breakfast
last
paris
miss
milk
europe
tastiest
milk
world
drink
us
ilearn
great
considering
finals
week
stressed
outttt
also
shouldve
bern
asleep
hour
ago
trying
figure
twitter
thing
none
friends
yet
soo
much
see
pinging
kyle44
custom
icons
made
look
cool
e

much
sodding
m25
oh
thought
pirate
bay
trial
verdict
today
apparently
10
days
call
back
study
hall
log
immediately
tired
im
crying
reason
im
try
get
hour
half
tonight
half
got
last
night
totally
like
four
girl
options
none
seem
viable
far
311
veiws
sites
put
together
checking
updates
made
listening
bjork
full
love
crying
omg
hills
love
money2
aww
think
becky
buckwild
goes
craving
tantan
nabe
c
mon
sean
man
watching
quot
league
quot
makes
miss
mint
chocolate
ice
cream
cones
grand
fuck
lost
phone
maybe
grass
long
hope
rain
hope
referring
say
hello
new
stalker
lol
u
sleeping
ur
gonna
night
ur
bike
ride
wanna
listen
masters
looking
good
stuff
write
also
loads
uni
work
feel
unloved
dropped
2
tweeters
london
day
thursday
gonna
raining
oh
fab
see
much
london
eye
still
robbie
care
bless
completely
wiped
reloaded
8900
lost
bbm
contacts
going
bed
sad
sayyyy
whaaaa
invited
sleep
bad
considering
workshop
starting
today
beginnings
sore
throat
though
oh
gosh
made
emotional
haha
idk
dont
want
get
old

ouch
running
morning
help
smart
shower
hope
wake
last
oh
synth
experiments
yielded
nothing
last
night
really
bored
really
sleepy
mad
find
custom
lanyard
maker
wont
make
buy
1000000
minimum
ooh
nice
williams
sonoma
already
got
finally
given
malaysian
restaurant
waiting
nasi
lemak
teh
tarik
mereka
tak
faham
bm
waitin
4
theory
test
centre
2
open
got
woken
mornng
7am
damn
lorry
van
car
accident
outside
main
road
also
causing
car
alarms
go
think
need
get
laid
sad
revolution
earlier
rofl
sudden
want
amanita
someone
made
feel
unliving
hahahahhha
hows
food
poisening
going
gone
away
heard
hannah
yet
disappointing
everything
alright
procrastinating
feel
ill
want
go
bed
gonna
try
find
sports
bar
watch
got
chance
though
think
wants
go
home
watch
hills
guess
funny
aww
moe
planning
leaving
tomorrow
evening
gonna
town
chance
wanna
write
cool
enough
make
storylineee
agreed
love
sound
hates
everyone
knows
art
tomorrow
nice
see
joined
twitter
sigh
think
pms
making
mind
totally
analyse
things
making
sad


tom
cruise
quot
jerry
maguire
got
fired
right
yo
lol
worst
dream
abt
turd
face
used
date
ugh
awful
ouch
imagine
toothpic
eye
something
uh
feel
lonely
wish
bffwiamc
best
friend
forever
also
cousin
twitter
people
keep
following
randomly
stop
makes
sad
still
feeling
bleh
spew
burps
hot
deadline
return
shirt
bought
topshop
bc
50
bank
account
last
rest
month
life
sucks
woke
6am
far
early
coffee
tooooooooo
cold
raining
tomorrow
night
sooo
nice
today
guess
thankful
able
enjoy
least
michael
crichton
curse
slow
internet
miss
youtube
feels
headache
coming
one
letter
alway
koreans
use
quot
x
quot
hope
working
holy
week
haha
nope
guess
nothing
original
days
lots
revision
tonight
final
assessments
assessments
today
well
90
pass
mark
harsh
thats
stapling
chipped
nails
cold
passed
border
chewie
update
ocd
left
legs
fixed
possible
ocd
right
leg
well
worse
still
hip
dysplasia
hips
good
got
back
hospital
bf
nephew
might
meningitis
chi
u
nay
h
p
chu
n
b
ch
c
ki
n
tr
ng
bao
nhi
u
vi
c
coldd
please
watch
v

orders
catch
blogged
since
31st
enough
hrs
day
right
got
stinking
headache
need
run
happy
bunny
sorry
say
vid
hits
hard
please
beware
last
2
minutes
especially
wondering
gamebattles
much
traffic
a2
wait
till
10
lanes
ready
2010
slept
11
hours
awake
since
5
30am
yesterday
still
late
exam
gotta
wake
5
tomoro
onwards
almost
finished
new
moon
work
tomorrow
would
totally
finish
tonight
geez
ok
wonder
twitpix
option
new
phone
got
win
leave
photos
cuz
guess
usually
make
zzzz
today
macbook
froze
luckily
able
take
screen
shot
paper
retyped
end
submitted
paper
1
min
late
faffing
actually
reading
work
feel
productive
forcasters
believed
lucky
lasts
till
afternoon
hard
thanks
rebuilders
rebuilding
tip
trying
help
mom
thru
divorce
thru
breakup
left
head
phone
died
morning
1
head
phone
keep
company
journey
drizzling
day
u
going
rain
might
well
pour
cant
sleep
ugghhh
got
work
ravenous
eaten
gipton
steak
amp
branston
sarnies
buy
something
lunch
doh
new
iphone
yay
restoring
backup
stupid
apple
catering

home
today
usually
sleep
4
hours
night
going
bed
get
5am
good
morning
tom
send
message
short
question
well
bad
guess
guess
dad
pregnant
lol
nah
doctor
give
epidural
chronic
back
pain
though
yeah
good
news
combinator
interview
next
week
dunno
bout
oyster
suck
guess
wont
let
play
doh
keeps
saying
user
valid
would
knew
ed
si
que
se
duerme
temprano
lol
awwww
sorry
stuck
n
bored
yes
hun
thought
trying
keep
entertained
easy
knowwwwww
sukkkk
take
care
gurls
arrrggghhh
seen
last
night
episode
yet
pity
lose
though
early
morning
meetings
ugh
depressing
want
punch
something
still
understand
setup
subversion
website
brahbrah
ugh
bed
hour
money
yet
dont
know
anyone
maybe
lie
hes
us
like
little
bit
lol
sat
work
fair
fair
whoh
day
shut
part
hydraulics
assignment
time
oh
wtf
house
cool
brain
hurty
squishy
mess
ahh
ai
dreptate
pixar
woke
early
watching
tv
trying
sleep
working
part
freeview
get
sports
channel
way
gonna
sleep
tonight
travoradio
morning
blipfm
took
entire
walk
train
station
undo
thats
rea

people
home
town
using
irl
connect
ritz
lol
ok
gig
got
planned
work
xx
need
old
world
misses
hanging
awkward
amazes
men
like
actually
exist
hope
find
someone
someday
love
value
going
school
dt
yaaaay
maybe
gone
guess
counting
sheep
work
hope
get
sleep
really
need
clean
sensor
slr
spot
removal
several
hundred
pictures
woken
someone
hammering
gt
lt
stopped
get
back
sleep
hangover
stuck
traffic
haha
yeah
thought
would
much
complicated
well
ive
got
home
school
got
holidays
x
think
tonsillitis
would
meant
spending
day
heaven
w
mom
getting
see
clean
resulted
soft
top
beaing
soaked
wet
open
dry
mhbigcatch
8oz
golem
finally
got
wight
3oz
time
warcraft
yes
simple
game
group
fans
let
us
know
u
figure
want
prize
sure
tell
u
truth
long
since
seen
ask
sumo
daddy
paulskratch
full
custody
lol
really
wish
could
see
eddie
izzard
tour
damn
stupid
expensive
tickets
cake
death
sleep
stressing
jpc
lt
3
think
im
insomniac
cant
sleep
birthday
5
days
oh
yay
cough
cough
cough
seem
right
confusing
hour
life
ano

back
going
nice
baby
bath
back
nappies
go
anger
getting
bigger
every
minute
goes
got
uglycomments
one
videos
today
day
government
kills
us
talk
aaliyah
love
miss
wife
says
thank
mags
sent
us
awwwww
ur
gunna
make
cry
miss
much
blessed
w
much
love
memories
lol
still
gotta
work
always
finished
everything
needs
work
tonight
ugh
three
hours
nothing
coming
wish
easier
got
hint
booooo
good
morning
believe
last
week
london
back
marketingworld
london
sure
im
boring
really
dont
understand
use
thank
nothing
contribute
discussion
angels
airwaves
vs
blink
182
want
go
remembered
forgotten
best
friends
birthday
awww
ellie
sounds
sick
poor
thing
baby
miss
much
writing
article
video
converters
test
take
long
time
good
luck
enduring
tiring
journey
start
epic
drive
glasgow
alton
towers
looks
like
rainy
days
work
tired
reports
fun
really
maya
spayed
today
nervous
thats
im
folding
getting
tweetie
iphone
twitteriffic
taking
toooo
long
update
need
grouping
amp
replies
tired
mac
going
long
week
funeral
work
t

going
die
soon
good
start
day
woppygook
omniaaaa
said
crackberrryyy
time
depart
flip
phone
hermes
packetdienst
sucks
much
fun
last
night
paying
going
go
fry
egg
squirrels
today
must
hiding
yeah
ploughed
around
last
night
nothing
happening
omg
daughter
come
home
last
night
huge
worry
would
mind
poor
bought
car
impending
fatherhood
affecting
judgement
plans
330ci
rav
4
even
aust
gov
rolls
43
bln
100mb
b
band
still
way
behind
rest
worlds
b
band
speeds
dan
grabbed
yardhouse
earlier
pirate
disappointed
work
early
team
meeting
forgot
lunch
worried
cutting
hours
start
10
00am
every
day
except
may
give
morning
starbucks
sorry
hear
bike
ms
xp
im
afriad
laptop
3yrs
old
think
bit
messed
well
going
rpm
vespa
needs
oil
going
anywhere
fast
remains
un
broken
year
since
mark
speight
died
year
goes
fast
exactly
cities
burn
worries
quot
cities
burn
third
likely
final
outing
quot
new
album
review
like
9
5
malarky
seeing
friends
seen
months
stupid
work
aw
balls
new
shirt
got
aerie
today
fit
wear
medium
sm

sucks
flickr
letting
view
says
private
bet
remember
easter
kid
excited
great
day
wow
welcome
home
eh
well
shit
especially
coming
back
holiday
fucking
people
excellent
missed
saturday
night
good
coz
bad
coz
get
paid
going
sunny
today
right
forecasters
always
put
hopes
fb
carousella
another
doctors
appointment
9
another
one
11
sucks
still
bit
sick
working
2
articles
today
last
2
days
nice
little
office
dont
wanna
move
want
go
college
want
cuddle
babyyy
hmm
shoulder
making
bad
noises
move
arm
back
forth
know
fear
return
physio
may
required
welcome
back
sorry
hear
ants
pest
grr
spam
oh
yesses
quot
road
rash
quot
hip
lovely
ay
rock
welcome
home
sounds
like
hell
journey
back
got
offer
go
camping
fraser
island
weekend
would
jump
offer
without
2nd
thought
forecast
rain
sadly
feed
wordpress
feed
usually
would
bla
com
feed
bla
com
feed
rss2
two
exist
fiuhh
nice
get
info
one
fans
indonesia
still
waiting
movie
country
thanx
want
leave
college
cant
give
smoking
tried
easy
see
moved
dwsr
3am
btw
con

2
ish
alright
late
got
go
college
today
holidays
yeah
get
spraying
going
pay
spray
m3
point
dont
e46
m3
white
europe
would
love
ill
next
week
dude
pay
innocent
happened
last
night
twits
gone
run
away
internet
still
thinks
going
traffic
light
night
haha
edict
announced
social
networking
using
office
system
ok
tweet
evening
chaps
bored
tec
wish
could
seasons
change
365
days
year
heyxboxlive
probably
mention
show
drew
carey
considering
done
major
nelson
man
im
fucked
work
still
business
plan
meeting
many
back
back
presentations
sitting
outside
doctor
surgery
turn
bah
holiday
well
pishing
sun
looks
like
wants
break
hope
dows
kids
head
finally
home
sooo
tired
omg
breech
sob
whitout
friends
pisses
legs
feet
loads
pain
running
old
man
tryed
trash
tent
going
swimming
things
never
get
old
miss
maya
wants
go
shopping
making
short
video
windows
movie
maker
crashed
20th
time
middle
name
perseverence
p
finish
video
soon
tommcfly
good
morning
guys
know
frustrating
never
get
reply
hugs
hope
day
gets


music
dude
called
andy
hull
afew
blokes
even
hear
playing
ldn
tomorrow
snoo
snoo
computers
might
operational
still
much
think
wifi
iphone
broken
quot
connect
quot
actually
use
another
story
oh
pants
hanging
old
folks
back
england
defo
b
4
1
get
back
tho
watching
death
race
found
sandra
cantu
dead
pizza
night
feel
sick
playing
basketball
today
lol
wanna
go
pub
antibiotics
root
canal
take
polaramine
tonight
hives
symptoms
gone
thank
goodness
impressed
rain
wanted
go
market
shopping
bleh
wish
could
link
things
good
yep
6
weeks
lady
church
watching
ah
pox
say
raining
outside
looks
like
snow
raining
cry
im
still
awake
lol
cant
sleep
glad
tho
yep
6
weeks
lady
church
watching
advertised
blog
career
sites
used
agencies
sure
else
go
last
week
got
bike
minus
saddle
great
license
wish
got
rest
back
pissed
coz
friend
busy
see
me2day
coffee
33
turning
starbucks
feral
children
wise
yeah
infact
spray
paint
mutt
got
real
delayed
problems
finished
either
yet
mama
ji
place
everybody
keeps
giving
new
opt

last
week
cant
eat
drink
breath
thanks
bad
throat
infection
cant
eat
drink
breath
properly
thanks
bad
throat
infection
shattered
nanna
passed
away
delay
1500
uni
sucks
leave
home
12
00
attend
lecture
14
30
16
30
amp
roadworks
everywhere
mt
installing
fibre
cables
started
12
week
training
going
tobbr
tough
many
birthdays
currently
work
upsetting
ami
agony
vet
see
6pm
poor
little
thing
know
ping
site
load
trying
contact
dreamhost
body
ever
replys
thanks
good
luck
alas
good
enough
really
want
explain
thanks
everything
lt
3
cannot
stop
coughing
much
sleeeping
wet
hair
eyes
bro
sis
young
mums
working
today
thought
would
help
sun
coffee
going
twitter
facebook
social
networks
seems
become
full
time
job
keep
gets
speak
boyfriend
til
3
happy
cant
speak
til
may
may
hurt
little
im
problem
never
drive
anymore
still
sad
lost
followers
sad
day
morn
awesome
car
ok
think
finally
done
work
yester
day
beer
tv
hitting
sack
back
around
9am
working
life
away
examz
coming
really
feeling
helplessssss
creepy


fed
pain
permanent
earache
almost
yr
fun
liking
new
itunes
pricing
mean
seen
several
songs
1
29
one
0
69
would
great
havin
crappy
day
seem
get
good
mood
sun
would
help
god
pls
tryna
good
gal
u
noe
best
dun
n
dun
n
dun
wana
deep
shit
help
omg
hate
new
facebook
look
either
messy
everything
place
want
old
one
back
yeah
rubbish
think
bill
gone
well
filter
crap
water
deal
murph
pliplup
whatever
water
one
barely
level
20
someone
somewhere
like
sheepish
stuck
chapter
3
incineration
destination
3
days
6
days
work
missing
daughter
went
away
yesterday
week
course
help
teach
gymnastics
house
quiet
yippee
skype
app
available
phone
whatever
next
xcept
cant
use
video
liking
new
itunes
pricing
mean
seen
several
songs
1
29
one
0
69
feeling
really
sick
today
webview
one
control
iphone
sdk
slow
even
loading
local
custom
page
takes
marginal
time
cant
eat
drink
breath
properly
thanks
bad
throat
infection
depends
going
though
dont
want
hanging
around
town
ages
ooo
aisha
tune
doreta
beach
would
rock
x
breat

kelly
fault
know
cakestand
full
cupcakes
getting
hooked
haha
snot
power
1
week
counting
whats
world
ppl
decide
shoot
others
watching
news
depressing
sure
anymore
much
flash
guestbook
outdated
many
updates
twitter
able
follow
everything
situation
write
internals
write
dmw
want
go
town
really
feel
like
walking
got
really
bad
throat
gonna
see
got
yoghurt
pls
pls
photos
gonna
sign
facebook
see
photos
put
flickr
something
good
morning
work
wanna
fuckit
another
day
another
dollar
good
movie
premier
would
cheer
actually
2
blankets
control
poor
guy
bad
head
sims
2
shut
hey
good
thanks
lunch
hehe
noon
overhere
belgium
raining
eric
get
twitter
lol
sorry
teeth
getting
dentists
anything
money
thoughts
prayers
go
people
affected
earthquake
italy
heard
somebody
going
killed
csi
ny
noooooo
sad
eating
cold
dinner
know
mean
drop
start
getting
complaints
win
feel
sorry
women
lost
husband
disgusting
thugs
hearing
story
made
cry
gets
kinda
annoyed
apparent
reason
religion
homework
english
still
reconcilli

lost
first
ten
minutes
maybe
even
first
five
congrats
enjoyed
wrestlemania
would
much
rather
home
stuck
work
mornin
babes
hella
pissed
hungry
op
2h
food
since
9pm
feel
bad
fully
dug
empty
outta
recycle
lookin
like
wats
good
sorry
hope
feel
better
soon
get
ready
work
awww
maaaaan
beautiful
day
cant
watch
twitchhiker
streaming
banned
work
hope
someone
records
mp4
email
cutting
grass
dad
hayfever
grandad
know
mam
stop
crying
occupy
mind
poor
gran
goodbye
watching
buffy
sob
sad
responsible
adult
aw
man
know
tyra
feels
slept
late
go
run
morning
liverpool
get
jealous
going
london
thursdaiii
fed
stir
crazy
bought
lovely
new
clothes
lst
wk
even
got
bag
check
pman
kicking
moldova
hope
people
ok
save
shekels
weekend
plus
tonne
work
responsibilities
ruin
everything
really
wish
could
sleep
mean
oh
hope
everything
turns
alright
sound
like
easy
fix
seem
black
tops
wtf
miss
chai
latte
expresso
house
suffered
writers
block
entire
day
yesterday
midnight
ideas
started
hitting
havnt
yet
sleep
5
37
oh
god

needa
replace
one
asap
maybe
sign
listen
snot
love
ya
x
bad
time
hooked
twilight
11
assignments
due
may
29th
lost
voice
anyone
finds
please
let
know
super
taco
walk
school
im
testing
today
dx
come
never
reply
little
sleep
please
sorry
hear
reivanna
chronic
ones
assume
first
timtam
year
gone
verrrrry
well
miss
australia
getting
ready
head
cousins
hair
dentist
ugh
yet
another
tooth
yanked
lord
help
lol
flat
iron
melted
glasses
found
got
ripped
fraudster
bookseller
us
signed
1st
ed
john
irving
novel
arse
tell
something
hmm
long
charging
sleep
last
nite
wif
nightmares
one
last
night
medan
pine
imap
slow
gmail
inbox
gets
closed
time
time
big
hassle
going
school
enjoying
last
day
16
year
old
let
give
hug
cold
worried
robert
englund
good
loved
movie
dreams
speak
night
honoring
michelle
obama
fashion
icon
wearing
clothes
got
pee
changing
g
mornin
dont
wanna
go
work
2day
think
might
still
sick
pretty
last
week
btw
end
fed
hr1207
yeah
internet
shaped
anything
wish
tech
guy
cannot
unlock
espresso

miss
much
feeling
ecstatic
met
james
matthews
josh
wilkinson
got
james
towel
xd
maan
ears
still
ringing
throat
hurts
kennymeyers
post
playcode
victor
previously
banned
god
blizzard
really
ugh
todays
going
bad
great
started
rain
tired
crying
ohnoes
bansal
trainer
calls
go
sport
aww
thank
much
want
see
make
stop
fu
headache
cold
hell
come
wrong
times
bahah
two
days
birthday
shittest
mood
ever
beware
seb
28th
april
well
im
someone
bitch
cant
say
cause
feel
guilty
even
though
hate
arms
sore
moving
fixtures
far
much
going
today
wait
see
today
brings
guess
another
yucky
day
though
omg
slept
2
hours
sucks
school
5
30
memorize
french
oral
study
exams
much
early
work
till
6
30pm
bleh
late
work
wondering
smells
else
would
two
best
friends
world
leave
woke
need
sleep
funeral
12
got
call
s2bx
little
one
sick
wants
stay
home
today
nawww
love
dont
like
yeah
gotta
find
way
okay
buttercup
cheer
snow
still
chicken
sarnies
makes
sick
oh
ill
get
heinz
big
soup
later
jquery
bringing
gonna
go
dig
stumps
ye

morning
awake
since
4
2nd
born
night
happy
camper
wch
tired
needs
tlc
hey
finished
homework
b
tired
aww
thats
beautiful
sad
way
true
riddle
answer
romeo
juliet
fish
broken
glass
water
fishbowl
breaking
early
morning
flights
sooo
tired
know
find
someone
play
anyone
playing
violin
mozart
sonate
lol
poor
msu
feel
bad
taco
bell
sounds
really
freaking
good
right
thanks
might
get
yeah
got
4
5
cm
snow
newmarket
yesterday
seems
following
ugh
studying
today
need
study
place
study
buddy
anyone
also
lovely
fuck
leaving
cert
disappointed
missing
music
video
lead
role
back
new
york
wants
go
back
badly
much
overtime
work
quite
bad
break
drop
mobile
fair
bit
reading
news
seems
keep
getting
worse
terrible
back
india
feels
good
resumed
office
caught
cold
excel
2003
handle
7
nested
statements
much
pics
wanted
post
room
drum
kit
proven
beyond
impossible
since
bedroom
light
blew
soo
tired
sigh
grumpy
ones
bestest
friend
msu
fans
one
thing
ohio
state
fan
relate
losing
national
championship
feel
loss
feel
b

love
money
baston
sucks
dude
sending
happy
thoughts
way
ew
meatloaf
go
pie
wow
said
like
2
hours
ago
omg
soon
logged
got
typical
mr
twitter
r
u
send
direct
messages
anymore
sick
little
dudes
mucinex
commerials
throwing
party
chest
pet
society
aint
working
cried
blair
got
expelled
poooooor
blair
okay
going
yale
everything
okay
stuck
home
watch
way
many
border
patrol
programs
watching
new
zeland
one
hell
maf
ahh
food
class
hdd
dvd
died
picked
new
topfield
tf71000hdpvrt
wife
permission
course
good
morning
wish
nicer
outside
boston
spring
go
gonna
go
school
40min
know
people
put
lack
spelling
ability
looked
couple
posts
messed
word
get
taking
breakers
getting
ready
school
tooo
early
got
home
taking
lynsey
airport
cold
snowing
hear
think
said
high
today
20
hate
student
teacher
mrs
rolls
unproductive
morning
thanks
link
keep
next
time
already
ordered
glasses
sitting
office
colleagues
abandoned
cold
still
understand
get
date
please
sound
wrong
say
miss
already
cuz
gaaah
monty
streaming
head
t

web
site
listen
work
blocked
playlist
com
meant
getting
ready
see
sophie
half
past
havent
even
got
dressed
yet
xd
headache
oh
better
rush
lt
3
following
anyway
probs
want
followed
lonely
lol
really
want
next
tattoo
got
cash
right
many
gd
ideas
head
cant
get
afford
needle
skin
ugh
head
many
margaritas
monday
wit
arsenal
game
though
omg
recap
sorry
crazy
day
laura
oh
look
snow
outside
please
go
away
amp
eyes
close
tired
sucks
hairy
donkey
balls
knowing
hit
x
dream
finish
rendering
woke
shaking
apple
juice
watching
snow
fall
snow
watching
extras
disk
quot
star
wreck
quot
items
none
menus
yawwwwwwning
office
eight
hours
1500
words
lucy
happily
reparked
brain
composed
largely
mush
beginning
freak
thursday
tuesday
still
hurting
still
eat
chunky
monkey
ice
cream
tired
walk
side
campus
class
9
12
schedule
test
first
hour
would
rolled
twitter
seriously
fucked
last
night
allergies
kicked
already
runny
nose
itchy
eyes
wait
weeks
morning
tweeties
well
cool
windy
snow
ground
day
expected
next
2
day

back
sleep
thing
making
go
school
dumb
precal
quiz
im
afraid
sony
viao
thats
officially
mine
windows
desktop
wanna
uni
work
today
finals
tunes
ceased
working
middle
loading
doubt
singles
collection
pod
worried
sick
santino
fever
need
pick
probably
tackling
cardio
right
like
gonna
happen
sorry
see
twitter
account
personally
follow
another
qt4
community
events
alone
yay
bitch
flaky
broke
zip
trousers
shot
900
photos
today
kyoto
black
dot
dust
sensor
fixed
sorting
nightmare
dog
poor
thing
word
street
quot
face
time
quot
worth
375
individual
pics
rush
rush
rush
9
00
gotta
15
minutes
early
sisters
boyfriends
day
supposed
working
moment
pretty
bored
tho
ugh
im
tired
dont
feel
like
goin
scool
good
morning
amy
snow
going
away
yet
deal
budgets
amp
numbers
early
morning
work
cool
snow
detroit
lately
haha
friday
yet
thankfully
friday
maybe
ask
thursday
yet
answer
unfortunately
still
way
airport
leaving
florida
worst
day
ever
feel
like
death
even
believe
work
right
simba
already
missing
sally
amp


well
told
weeks
ago
downward
spiral
ever
since
even
mention
name
goes
nuts
prodigy
playing
glasgow
tonight
amp
go
gutted
12
years
since
last
saw
bird
keeps
waking
right
wish
would
shut
says
walang
rc
upset
cat
take
medicine
tax
day
started
tedious
task
saying
hello
friend
turbo
tax
fun
day
even
put
words
everything
hurts
uh
wow
missed
lot
twitter
last
night
soo
sleepy
still
high
primer
fumes
joe
said
put
second
coat
wish
1st
period
imy
smile
dunno
atm
iloveyou
xoxo
wearing
nothing
sarong
house
dress
weather
feels
heavy
humid
lovely
avacado
bacon
chicken
baguette
time
work
blow
drying
hair
getting
ready
go
school
believe
cold
outside
april
spring
hot
winter
going
cold
spring
sick
guess
ftsk
show
tonight
unfortunately
allowed
splurge
otherwise
netbook
dsi
sure
choose
one
new
xserve
new
higher
price
surprise
oh
server
died
support
e
g
brother
law
onto
though
feel
fancy
failing
five
times
row
lost
50
though
work
tiiiiiiiiired
oshkosh
wi
work
although
think
home
bed
instead
weather
looking


wish
mesh09
could
bronchitis
allergies
ugh
feel
sick
jakazid
envy
neither
phone
nabaztag
managed
wake
1pm
today
nothing
itunes
australia
country
come
b
c
iraq
mean
sad
day
flack
things
fault
cool
oh
bet
got
lot
people
reason
right
knee
checked
feeling
right
needs
pre
yuck
topless
tired
get
ready
school
hungry
place
eat
right
bakery
goes
workout
great
got
first
tattoo
yesterday
neck
really
sore
mostly
year
11s
someone
somewhere
like
yubotu
2
hour
break
work
twitter
5
hours
boss
put
ban
phones
net
slow
today
many
sites
opening
digging
taste
water
right
baby
woke
quot
hey
mom
dad
time
change
baby
diaper
quot
hmm
mouth
giving
baby
crackers
gingerale
sick
hate
global
warming
hate
snow
april
ffs
way
2
class
hate
art
history
psyc
class
work
rest
day
want
sleep
oh
got
woke
mornin
bad
thng
hella
sick
today
realz
mah
head
hurts
advil
helping
amp
work
go
today
gonna
fun
version
near
live
either
full
2
expensive
space
home
feel
nothing
near
house
val
waiting
wife
youngest
flight
leave
long
drive
c

nights
work
dont
go
noon
go
back
sleep
dunno
oh
tittch
sorry
get
say
goodbye
hugs
still
airport
waiting
ground
20
min
wheres
900
im
poor
uni
student
know
twss
means
snowing
montreal
looking
clock
good
god
still
47
minutes
till
go
home
youu
like
good
wish
could
afford
get
wisdom
teeth
killing
week
says
200
na
ang
dead
sa
italy
bummer
says
page
exist
karelman
thinking
italy
sorry
got
fucking
clue
lmao
wher
wanted
sit
comeeeeee
8
30
pm
still
musica
sigh
still
cant
find
friends
k
pouty
face
shitty
day
boston
ugh
wonder
sick
math
klass
bored
hell
urghhhhh
hate
math
uughhhh
back
work
help
please
hello
everyone
sorry
yesterday
updates
kept
disappearing
hand
hurts
playing
much
last
night
oh
scratch
lost
two
followers
boo
working
home
son
allergies
killing
drop
visit
www
ideastorm
com
already
teel
going
b
rough
day
even
9
30
yet
need
get
ready
work
hi
face
outcome
last
tweet
late
nights
early
monrnings
bad
stuwart
college
opportunity
really
ill
hate
snow
come
back
seeing
monsters
vs
aliens
toni

job
frontpage
win98
exactly
grab
sheets
tonight
tomorrow
forgot
cheesey
ads
impressed
banana
plant
put
nice
weather
see
wilt
babysittin
stupid
lil
sister
wen
actually
shud
friends
enjoyin
weather
think
im
jokin
hi
gabby
sabina
told
use
cocaine
sleep
last
night
terrible
dream
caught
car
zombies
trying
get
eat
bueno
english
bummer
go
class
study
dentist
later
hoping
teeth
plates
nothing
nasty
last
time
want
puppy
anyone
know
anyone
would
like
adopt
trained
lab
bff
moving
find
place
allows
2
dogs
yep
ottawa
lmao
bullshit
nope
forgot
turn
espresso
machine
morning
sigh
guess
breakfast
going
wait
happy
haha
ottawa
effing
april
snow
snowing
april
omfg
im
friggin
bored
cant
jus
something
wait
check
new
splattercast
get
home
aw
oh
well
one
jan
guillou
everyone
might
like
company
blocked
twitter
today
oh
well
still
mobile
way
id
spell
wensday
unfortunatly
im
roman
emperor
viking
god
say
matter
really
need
getting
work
done
twitter
entertaining
right
left
coffee
home
want
awake
right
math
class
h

love
last
day
vacation
hip
hip
hooray
hip
hip
hooray
alarm
go
morning
making
unproductive
busy
day
damn
get
followers
write
got
hardly
sleep
missed
errands
morning
aww
dear
sorry
hear
really
hope
dad
getting
better
phil
stay
strong
play
wii
get
wiispeak
havent
logged
awhile
probably
roaches
oh
god
back
wound
care
center
2
wounds
lower
leg
getting
larger
go
back
tomorrow
chocolate
bad
dogs
lost
follower
thats
upsetting
ha
im
safety
meeting
hope
long
miss
sora
sad
want
cry
stephdau
saw
snowflakes
bus
work
morning
belgian
cable
cnn
euronews
choose
rubbish
either
way
oh
cable
even
works
grrrhhh
im
soo
bored
going
attempt
walk
see
eases
things
miss
bb
oh
good
last
day
chicago
rip
94
7
globe
missed
need
new
radio
station
preset
coming
may
4th
bummin
local
starbucks
doubleshots
cans
sorry
burst
sunny
bubble
pouring
westboro
probs
moving
way
guuuuuuyyyyyyyssssss
dont
wanna
frankie
hellohhhh
mariahdaily
taking
starbucks
break
ugh
sleepy
emotionally
feeling
good
sc
cold
spring
break
hubby
called

tho
home
sick
chicken
noodle
soup
lt
3
briefly
follower
left
feel
alone
vacation
drove
straight
hot
springs
17
amp
1
2
hours
pictures
video
media
break
heart
devastating
think
many
hurt
dead
homeless
need
get
tang
bodega
orange
strawberry
mix
gone
today
duchy
originals
peppermint
tea
gone
last
2
bags
replacements
sight
get
new
camera
thursday
im
excited
could
piss
oops
already
yo
homie
whats
nyc
saying
gonna
miss
weekend
twitter
crackberry
still
go
today
wish
get
australia
tomorrow
wish
looks
good
im
gonna
twitpic
red
im
definitely
sore
today
tyra
show
watch
online
dont
show
uk
dont
think
trying
decipher
german
friend
message
sad
part
speak
english
well
wish
let
us
know
man
missing
lately
template
computer
innit
sorry
unreliable
internet
potholes
phone
dial
properly
text
formatting
stripped
pages
ideas
lol
yea
eeeeew
get
coffee
beforehand
hate
weather
taipei
always
makes
sick
wowzer
u
gonna
come
see
could
bowl
oh
boring
starting
day
nice
quiet
engineering
library
quot
quot
key
stuck
go

yep
yep
certainly
child
friendly
hk
wide
pavements
tricky
maneuvers
strollers
air
gd
hi
tried
meeting
tour
las
year
man
said
youd
gone
u
hadnt
missed
u
wondered
fav
song
x
eyedrops
four
times
day
almost
fortnight
miss
every
single
time
end
wet
face
epic
epic
fail
hard
time
dealing
everything
help
think
alot
wonder
shes
handling
another
day
another
half
dollar
sarah
two
month
check
12
4
lbs
22
5
inches
long
poor
baby
get
shots
sorry
missed
bday
bash
dam
work
wishing
weekend
tuesday
people
hasnt
twitter
days
internet
mums
house
moment
way
school
wearing
retainer
lately
teeth
sore
got
th
longest
trip
back
train
ever
london
tired
last
week
late
dr
week
running
late
amp
forgot
book
hardest
time
getting
outta
bed
sore
throat
doom
ache
nevaa
finished
reading
4
imade
class
gross
desk
wish
ny
misunderstood
bitch
oh
looks
like
going
rain
neither
jacket
umbrella
rain
right
easter
wtf
still
feel
good
snow
really
reallly
sucks
today
keeps
getting
worse
woke
want
school
awww
miss
singing
quot
alabas

griffin
would
stay
one
year
know
better
tiiiired
cruel
girl
make
end
massive
queues
m25
took
wrong
turn
right
near
wembley
gutted
x
thinking
hate
yankees
dont
yankees
fan
losing
orioles
less
work
tho
friday
awful
friday
take
n
income
n
calls
9
hrs
usually
make
outbound
calls
day
5
prank
calls
2
days
completely
different
really
wanna
know
morning
folks
la
traffic
work
listening
mario
break
goes
sooo
hard
2
justin
hard
time
finding
work
hard
time
happy
awesome
voice
today
work
going
impossible
got
home
parcel
meant
delivered
neighbours
house
home
voluneering
focus
uni
stuff
need
write
press
release
hard
wish
practice
saw
video
grown
man
champaign
il
tell
donnie
back
hurting
usual
hip
action
toned
way
still
sitting
class
eating
goldfish
drinking
sprite
lunch
time
robert
englund
quot
pack
quot
duckling
found
safe
webbed
feet
cut
new
one
still
made
trying
find
good
vet
around
think
one
kitties
asthma
write
anymore
papers
five
go
mitchell
james
uncle
kappa
man
passed
4
yrs
ago
kappas
named
s

one
know
tired
shotts
u
know
lol
leave
raw
talent
early
man
well
wounded
gonna
send
v
p
tickets
haa
got
mosquito
bite
morning
hate
big
mama
missing
mommy
always
gone
student
poverty
supposed
haddad
maybe
tweetdeck
like
updates
seen
time
staff
meeting
boss
next
surfing
much
today
coffee
keeps
going
oh
god
work
tomorrowm
good
ol
maccas
ugh
sorry
chica
feel
like
one
understands
issues
like
w
makeup
least
monday
japanese
amp
hiragana
amp
saying
something
since
japanese
man
hate
culture
made
easy
super
overwhelmed
schoolwork
edison
please
shut
power
yet
music
play
day
absolutely
soul
destroying
hope
get
better
soon
make
sure
alot
fluids
wishing
spring
temperatures
break
winter
jacket
today
woken
v
early
big
pair
brown
eyes
unfortunately
belong
puppy
belong
evil
mayan
unfortunately
probably
never
needs
trip
vegas
soon
miss
find
pool
bikini
people
watching
football
long
island
oh
yea
would
better
function
well
work
dies
sobs
cept
still
get
early
sucks
haha
reno
911
always
remember
different
c

KeyboardInterrupt: 

In [10]:
train,test = train_test_split(data, test_size=TEST_SIZE, random_state=SEED)
print("TRAIN size:", len(train))
print("TEST size:", len(test))

TRAIN size: 1280000
TEST size: 320000


In [11]:
train

Unnamed: 0,text,target
1374558,ya quot like palm pre touchstone charger ready...,POSITIVE
1389115,felt earthquake afternoon seems epicenter,POSITIVE
1137831,ruffles shirts like likey,POSITIVE
790714,pretty bad night crappy morning fml buttface d...,NEGATIVE
1117911,yeah clear view,POSITIVE
...,...,...
259178,song middle change want born arghhhh,NEGATIVE
1414414,good luck,POSITIVE
131932,rather average 32370,NEGATIVE
671155,pickin misstinayao waitin sadittysash 2 hurry ...,NEGATIVE


In [43]:
test_tensor = torch.tensor(test.to_numpy())
train_tensor = torch.tensor(train.to_numpy())

TypeError: can't convert np.ndarray of type numpy.object_. The only supported types are: float64, float32, float16, complex64, complex128, int64, int32, int16, int8, uint8, and bool.