## Text Preprocessing

This notebook is to process and clean 5000 lines of blog data.

***

In [None]:
# Initialize NLTK
# import nltk
# nltk.download('popular')

In [None]:
#nltk.__version__

In [1]:
import pandas as pd
import numpy as np
import nltk
import string
import re
import matplotlib.pyplot as plt
import wordcloud
from wordcloud import WordCloud, ImageColorGenerator
from collections import OrderedDict
from ast import literal_eval

from nltk.tokenize import word_tokenize
from nltk.corpus import stopwords, wordnet
from nltk.stem import WordNetLemmatizer, PorterStemmer, SnowballStemmer
from nltk.probability import FreqDist
from nltk.util import bigrams, ngrams, trigrams

pd.set_option('display.width', 1000)
pd.set_option('display.max_colwidth', 1000)
%matplotlib inline

In [2]:
df = pd.read_csv('blogdata_5000.csv')

In [4]:
df.head()

Unnamed: 0,words
0,"We have given our hearts away, a sordid boon !”"
1,1. Start it on the side
2,"Sugar’s sweet, so is she,"
3,"So because the Asian community was so by need tight-knit, the next thing you know I have Asian kids following me around, you know doing more shit for me than the boys that wanted inside of me. Especially the two in particular. They thought I was “so wonderful” which sickened me even further. I was not wonderful, it reminds me of that quote, from WWII era forget it but goes on to say something like, “It was not that I was a hero, it was everyone around me was acting so badly” when someone won a humanitarian award."
4,Nicholas’ brain runs on and is excellent at processing data and concrete facts. He works best with things he can quantify. He runs into an almost insurmountable challenge in trying to rationalize the existence of his exceptional infant daughter and what she represents. He isn’t without a sense of humor and is very loving but he is forced to radically confront his limitations.


In [None]:
df.shape

In [None]:
df.info()

In [None]:
df.describe()

In [None]:
len(df.words)

### Tokenization

In [5]:
df['tokenized'] = df['words'].apply(word_tokenize)

In [6]:
df.head()

Unnamed: 0,words,tokenized
0,"We have given our hearts away, a sordid boon !”","[We, have, given, our, hearts, away, ,, a, sordid, boon, !, ”]"
1,1. Start it on the side,"[1, ., Start, it, on, the, side]"
2,"Sugar’s sweet, so is she,","[Sugar, ’, s, sweet, ,, so, is, she, ,]"
3,"So because the Asian community was so by need tight-knit, the next thing you know I have Asian kids following me around, you know doing more shit for me than the boys that wanted inside of me. Especially the two in particular. They thought I was “so wonderful” which sickened me even further. I was not wonderful, it reminds me of that quote, from WWII era forget it but goes on to say something like, “It was not that I was a hero, it was everyone around me was acting so badly” when someone won a humanitarian award.","[So, because, the, Asian, community, was, so, by, need, tight-knit, ,, the, next, thing, you, know, I, have, Asian, kids, following, me, around, ,, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, ., Especially, the, two, in, particular, ., They, thought, I, was, “, so, wonderful, ”, which, sickened, me, even, further, ., I, was, not, wonderful, ,, it, reminds, me, of, that, quote, ,, from, WWII, era, forget, it, but, goes, on, to, say, something, like, ,, “, It, was, not, that, I, was, a, hero, ,, it, was, everyone, around, me, ...]"
4,Nicholas’ brain runs on and is excellent at processing data and concrete facts. He works best with things he can quantify. He runs into an almost insurmountable challenge in trying to rationalize the existence of his exceptional infant daughter and what she represents. He isn’t without a sense of humor and is very loving but he is forced to radically confront his limitations.,"[Nicholas, ’, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, ., He, works, best, with, things, he, can, quantify, ., He, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, ., He, isn, ’, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations, .]"


### Removing Punctuations

In [7]:
punc = string.punctuation

In [8]:
df['no_punc'] = df['tokenized'].apply(lambda x: [word for word in x if word not in punc])

In [9]:
df.head()

Unnamed: 0,words,tokenized,no_punc
0,"We have given our hearts away, a sordid boon !”","[We, have, given, our, hearts, away, ,, a, sordid, boon, !, ”]","[We, have, given, our, hearts, away, a, sordid, boon, ”]"
1,1. Start it on the side,"[1, ., Start, it, on, the, side]","[1, Start, it, on, the, side]"
2,"Sugar’s sweet, so is she,","[Sugar, ’, s, sweet, ,, so, is, she, ,]","[Sugar, ’, s, sweet, so, is, she]"
3,"So because the Asian community was so by need tight-knit, the next thing you know I have Asian kids following me around, you know doing more shit for me than the boys that wanted inside of me. Especially the two in particular. They thought I was “so wonderful” which sickened me even further. I was not wonderful, it reminds me of that quote, from WWII era forget it but goes on to say something like, “It was not that I was a hero, it was everyone around me was acting so badly” when someone won a humanitarian award.","[So, because, the, Asian, community, was, so, by, need, tight-knit, ,, the, next, thing, you, know, I, have, Asian, kids, following, me, around, ,, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, ., Especially, the, two, in, particular, ., They, thought, I, was, “, so, wonderful, ”, which, sickened, me, even, further, ., I, was, not, wonderful, ,, it, reminds, me, of, that, quote, ,, from, WWII, era, forget, it, but, goes, on, to, say, something, like, ,, “, It, was, not, that, I, was, a, hero, ,, it, was, everyone, around, me, ...]","[So, because, the, Asian, community, was, so, by, need, tight-knit, the, next, thing, you, know, I, have, Asian, kids, following, me, around, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, Especially, the, two, in, particular, They, thought, I, was, “, so, wonderful, ”, which, sickened, me, even, further, I, was, not, wonderful, it, reminds, me, of, that, quote, from, WWII, era, forget, it, but, goes, on, to, say, something, like, “, It, was, not, that, I, was, a, hero, it, was, everyone, around, me, was, acting, so, badly, ”, when, someone, won, a, ...]"
4,Nicholas’ brain runs on and is excellent at processing data and concrete facts. He works best with things he can quantify. He runs into an almost insurmountable challenge in trying to rationalize the existence of his exceptional infant daughter and what she represents. He isn’t without a sense of humor and is very loving but he is forced to radically confront his limitations.,"[Nicholas, ’, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, ., He, works, best, with, things, he, can, quantify, ., He, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, ., He, isn, ’, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations, .]","[Nicholas, ’, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, He, works, best, with, things, he, can, quantify, He, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, He, isn, ’, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations]"


### Removing numbers and remaining punctuation marks

In [10]:
df['no_numbers'] = df['no_punc'].apply(lambda x: [word for word in x if word.isalpha()])

In [11]:
df.head()

Unnamed: 0,words,tokenized,no_punc,no_numbers
0,"We have given our hearts away, a sordid boon !”","[We, have, given, our, hearts, away, ,, a, sordid, boon, !, ”]","[We, have, given, our, hearts, away, a, sordid, boon, ”]","[We, have, given, our, hearts, away, a, sordid, boon]"
1,1. Start it on the side,"[1, ., Start, it, on, the, side]","[1, Start, it, on, the, side]","[Start, it, on, the, side]"
2,"Sugar’s sweet, so is she,","[Sugar, ’, s, sweet, ,, so, is, she, ,]","[Sugar, ’, s, sweet, so, is, she]","[Sugar, s, sweet, so, is, she]"
3,"So because the Asian community was so by need tight-knit, the next thing you know I have Asian kids following me around, you know doing more shit for me than the boys that wanted inside of me. Especially the two in particular. They thought I was “so wonderful” which sickened me even further. I was not wonderful, it reminds me of that quote, from WWII era forget it but goes on to say something like, “It was not that I was a hero, it was everyone around me was acting so badly” when someone won a humanitarian award.","[So, because, the, Asian, community, was, so, by, need, tight-knit, ,, the, next, thing, you, know, I, have, Asian, kids, following, me, around, ,, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, ., Especially, the, two, in, particular, ., They, thought, I, was, “, so, wonderful, ”, which, sickened, me, even, further, ., I, was, not, wonderful, ,, it, reminds, me, of, that, quote, ,, from, WWII, era, forget, it, but, goes, on, to, say, something, like, ,, “, It, was, not, that, I, was, a, hero, ,, it, was, everyone, around, me, ...]","[So, because, the, Asian, community, was, so, by, need, tight-knit, the, next, thing, you, know, I, have, Asian, kids, following, me, around, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, Especially, the, two, in, particular, They, thought, I, was, “, so, wonderful, ”, which, sickened, me, even, further, I, was, not, wonderful, it, reminds, me, of, that, quote, from, WWII, era, forget, it, but, goes, on, to, say, something, like, “, It, was, not, that, I, was, a, hero, it, was, everyone, around, me, was, acting, so, badly, ”, when, someone, won, a, ...]","[So, because, the, Asian, community, was, so, by, need, the, next, thing, you, know, I, have, Asian, kids, following, me, around, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, Especially, the, two, in, particular, They, thought, I, was, so, wonderful, which, sickened, me, even, further, I, was, not, wonderful, it, reminds, me, of, that, quote, from, WWII, era, forget, it, but, goes, on, to, say, something, like, It, was, not, that, I, was, a, hero, it, was, everyone, around, me, was, acting, so, badly, when, someone, won, a, humanitarian, award]"
4,Nicholas’ brain runs on and is excellent at processing data and concrete facts. He works best with things he can quantify. He runs into an almost insurmountable challenge in trying to rationalize the existence of his exceptional infant daughter and what she represents. He isn’t without a sense of humor and is very loving but he is forced to radically confront his limitations.,"[Nicholas, ’, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, ., He, works, best, with, things, he, can, quantify, ., He, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, ., He, isn, ’, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations, .]","[Nicholas, ’, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, He, works, best, with, things, he, can, quantify, He, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, He, isn, ’, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations]","[Nicholas, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, He, works, best, with, things, he, can, quantify, He, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, He, isn, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations]"


### Lower Case Letters Conversion

In [12]:
df['final'] = df['no_numbers'].apply(lambda x: [word.lower() for word in x])

In [13]:
df.head()

Unnamed: 0,words,tokenized,no_punc,no_numbers,final
0,"We have given our hearts away, a sordid boon !”","[We, have, given, our, hearts, away, ,, a, sordid, boon, !, ”]","[We, have, given, our, hearts, away, a, sordid, boon, ”]","[We, have, given, our, hearts, away, a, sordid, boon]","[we, have, given, our, hearts, away, a, sordid, boon]"
1,1. Start it on the side,"[1, ., Start, it, on, the, side]","[1, Start, it, on, the, side]","[Start, it, on, the, side]","[start, it, on, the, side]"
2,"Sugar’s sweet, so is she,","[Sugar, ’, s, sweet, ,, so, is, she, ,]","[Sugar, ’, s, sweet, so, is, she]","[Sugar, s, sweet, so, is, she]","[sugar, s, sweet, so, is, she]"
3,"So because the Asian community was so by need tight-knit, the next thing you know I have Asian kids following me around, you know doing more shit for me than the boys that wanted inside of me. Especially the two in particular. They thought I was “so wonderful” which sickened me even further. I was not wonderful, it reminds me of that quote, from WWII era forget it but goes on to say something like, “It was not that I was a hero, it was everyone around me was acting so badly” when someone won a humanitarian award.","[So, because, the, Asian, community, was, so, by, need, tight-knit, ,, the, next, thing, you, know, I, have, Asian, kids, following, me, around, ,, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, ., Especially, the, two, in, particular, ., They, thought, I, was, “, so, wonderful, ”, which, sickened, me, even, further, ., I, was, not, wonderful, ,, it, reminds, me, of, that, quote, ,, from, WWII, era, forget, it, but, goes, on, to, say, something, like, ,, “, It, was, not, that, I, was, a, hero, ,, it, was, everyone, around, me, ...]","[So, because, the, Asian, community, was, so, by, need, tight-knit, the, next, thing, you, know, I, have, Asian, kids, following, me, around, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, Especially, the, two, in, particular, They, thought, I, was, “, so, wonderful, ”, which, sickened, me, even, further, I, was, not, wonderful, it, reminds, me, of, that, quote, from, WWII, era, forget, it, but, goes, on, to, say, something, like, “, It, was, not, that, I, was, a, hero, it, was, everyone, around, me, was, acting, so, badly, ”, when, someone, won, a, ...]","[So, because, the, Asian, community, was, so, by, need, the, next, thing, you, know, I, have, Asian, kids, following, me, around, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, Especially, the, two, in, particular, They, thought, I, was, so, wonderful, which, sickened, me, even, further, I, was, not, wonderful, it, reminds, me, of, that, quote, from, WWII, era, forget, it, but, goes, on, to, say, something, like, It, was, not, that, I, was, a, hero, it, was, everyone, around, me, was, acting, so, badly, when, someone, won, a, humanitarian, award]","[so, because, the, asian, community, was, so, by, need, the, next, thing, you, know, i, have, asian, kids, following, me, around, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, especially, the, two, in, particular, they, thought, i, was, so, wonderful, which, sickened, me, even, further, i, was, not, wonderful, it, reminds, me, of, that, quote, from, wwii, era, forget, it, but, goes, on, to, say, something, like, it, was, not, that, i, was, a, hero, it, was, everyone, around, me, was, acting, so, badly, when, someone, won, a, humanitarian, award]"
4,Nicholas’ brain runs on and is excellent at processing data and concrete facts. He works best with things he can quantify. He runs into an almost insurmountable challenge in trying to rationalize the existence of his exceptional infant daughter and what she represents. He isn’t without a sense of humor and is very loving but he is forced to radically confront his limitations.,"[Nicholas, ’, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, ., He, works, best, with, things, he, can, quantify, ., He, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, ., He, isn, ’, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations, .]","[Nicholas, ’, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, He, works, best, with, things, he, can, quantify, He, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, He, isn, ’, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations]","[Nicholas, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, He, works, best, with, things, he, can, quantify, He, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, He, isn, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations]","[nicholas, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, he, works, best, with, things, he, can, quantify, he, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, he, isn, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations]"


### Drop columns and save to csv

In [14]:
df.columns

Index(['words', 'tokenized', 'no_punc', 'no_numbers', 'final'], dtype='object')

In [15]:
df.drop(['words', 'tokenized', 'no_punc', 'no_numbers'], axis=1, inplace=True)

In [17]:
df.head()

Unnamed: 0,final
0,"[we, have, given, our, hearts, away, a, sordid, boon]"
1,"[start, it, on, the, side]"
2,"[sugar, s, sweet, so, is, she]"
3,"[so, because, the, asian, community, was, so, by, need, the, next, thing, you, know, i, have, asian, kids, following, me, around, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, especially, the, two, in, particular, they, thought, i, was, so, wonderful, which, sickened, me, even, further, i, was, not, wonderful, it, reminds, me, of, that, quote, from, wwii, era, forget, it, but, goes, on, to, say, something, like, it, was, not, that, i, was, a, hero, it, was, everyone, around, me, was, acting, so, badly, when, someone, won, a, humanitarian, award]"
4,"[nicholas, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, he, works, best, with, things, he, can, quantify, he, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, he, isn, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations]"


In [18]:
#df.to_csv("blogclean5000.csv",index=False)

### Exploratory Data Analysis and Visualization

In [None]:
df = pd.read_csv("blogclean5000.csv")

In [29]:
df.head()

Unnamed: 0,final
0,"[we, have, given, our, hearts, away, a, sordid, boon]"
1,"[start, it, on, the, side]"
2,"[sugar, s, sweet, so, is, she]"
3,"[so, because, the, asian, community, was, so, by, need, the, next, thing, you, know, i, have, asian, kids, following, me, around, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, especially, the, two, in, particular, they, thought, i, was, so, wonderful, which, sickened, me, even, further, i, was, not, wonderful, it, reminds, me, of, that, quote, from, wwii, era, forget, it, but, goes, on, to, say, something, like, it, was, not, that, i, was, a, hero, it, was, everyone, around, me, was, acting, so, badly, when, someone, won, a, humanitarian, award]"
4,"[nicholas, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, he, works, best, with, things, he, can, quantify, he, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, he, isn, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations]"


In [30]:
df['word_count'] = df['final'].apply(lambda x: len(str(x).split()))

In [31]:
df.head()

Unnamed: 0,final,word_count
0,"[we, have, given, our, hearts, away, a, sordid, boon]",9
1,"[start, it, on, the, side]",5
2,"[sugar, s, sweet, so, is, she]",6
3,"[so, because, the, asian, community, was, so, by, need, the, next, thing, you, know, i, have, asian, kids, following, me, around, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, especially, the, two, in, particular, they, thought, i, was, so, wonderful, which, sickened, me, even, further, i, was, not, wonderful, it, reminds, me, of, that, quote, from, wwii, era, forget, it, but, goes, on, to, say, something, like, it, was, not, that, i, was, a, hero, it, was, everyone, around, me, was, acting, so, badly, when, someone, won, a, humanitarian, award]",97
4,"[nicholas, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, he, works, best, with, things, he, can, quantify, he, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, he, isn, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations]",64


In [32]:
df['char_count'] = df["final"].apply(lambda x: len(x))

In [33]:
df.head()

Unnamed: 0,final,word_count,char_count
0,"[we, have, given, our, hearts, away, a, sordid, boon]",9,9
1,"[start, it, on, the, side]",5,5
2,"[sugar, s, sweet, so, is, she]",6,6
3,"[so, because, the, asian, community, was, so, by, need, the, next, thing, you, know, i, have, asian, kids, following, me, around, you, know, doing, more, shit, for, me, than, the, boys, that, wanted, inside, of, me, especially, the, two, in, particular, they, thought, i, was, so, wonderful, which, sickened, me, even, further, i, was, not, wonderful, it, reminds, me, of, that, quote, from, wwii, era, forget, it, but, goes, on, to, say, something, like, it, was, not, that, i, was, a, hero, it, was, everyone, around, me, was, acting, so, badly, when, someone, won, a, humanitarian, award]",97,97
4,"[nicholas, brain, runs, on, and, is, excellent, at, processing, data, and, concrete, facts, he, works, best, with, things, he, can, quantify, he, runs, into, an, almost, insurmountable, challenge, in, trying, to, rationalize, the, existence, of, his, exceptional, infant, daughter, and, what, she, represents, he, isn, t, without, a, sense, of, humor, and, is, very, loving, but, he, is, forced, to, radically, confront, his, limitations]",64,64


In [34]:
df.describe()

Unnamed: 0,word_count,char_count
count,5000.0,5000.0
mean,41.6246,41.6228
std,48.825568,48.827084
min,1.0,0.0
25%,8.0,8.0
50%,27.0,27.0
75%,59.0,59.0
max,1192.0,1192.0


In [35]:
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 5000 entries, 0 to 4999
Data columns (total 3 columns):
 #   Column      Non-Null Count  Dtype 
---  ------      --------------  ----- 
 0   final       5000 non-null   object
 1   word_count  5000 non-null   int64 
 2   char_count  5000 non-null   int64 
dtypes: int64(2), object(1)
memory usage: 117.3+ KB


### Flattening list from tokens of list of lists in python

In [40]:
L1 = ''.join(str(df['final']))

In [41]:
L1

'0                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                 [we, have, given, our, hearts, away, a, sordid, boon]\n1                                                                                                                                                                                                                                                                                                                                                                                                             

In [49]:
literal_eval(L1).sum()

SyntaxError: invalid syntax (<unknown>, line 2)

In [44]:
words = df['final']
allwords = []
for wordlist in words:
    allwords+= wordlist

In [45]:
allwords

['we',
 'have',
 'given',
 'our',
 'hearts',
 'away',
 'a',
 'sordid',
 'boon',
 'start',
 'it',
 'on',
 'the',
 'side',
 'sugar',
 's',
 'sweet',
 'so',
 'is',
 'she',
 'so',
 'because',
 'the',
 'asian',
 'community',
 'was',
 'so',
 'by',
 'need',
 'the',
 'next',
 'thing',
 'you',
 'know',
 'i',
 'have',
 'asian',
 'kids',
 'following',
 'me',
 'around',
 'you',
 'know',
 'doing',
 'more',
 'shit',
 'for',
 'me',
 'than',
 'the',
 'boys',
 'that',
 'wanted',
 'inside',
 'of',
 'me',
 'especially',
 'the',
 'two',
 'in',
 'particular',
 'they',
 'thought',
 'i',
 'was',
 'so',
 'wonderful',
 'which',
 'sickened',
 'me',
 'even',
 'further',
 'i',
 'was',
 'not',
 'wonderful',
 'it',
 'reminds',
 'me',
 'of',
 'that',
 'quote',
 'from',
 'wwii',
 'era',
 'forget',
 'it',
 'but',
 'goes',
 'on',
 'to',
 'say',
 'something',
 'like',
 'it',
 'was',
 'not',
 'that',
 'i',
 'was',
 'a',
 'hero',
 'it',
 'was',
 'everyone',
 'around',
 'me',
 'was',
 'acting',
 'so',
 'badly',
 'when',
 '

In [21]:
type(wordlist)

list

In [28]:
len(wordlist)

14

In [48]:
df2 = pd.DataFrame(

ValueError: DataFrame constructor not properly called!

In [26]:
df2.shape

(14, 1)

In [27]:
df2.to_csv("data2.csv", index=False)

### Save as Textfile

In [None]:
#textformat = ''.join(df["words"])

In [None]:
#textformat

In [None]:
#textfile = open('textfile2.txt','w', encoding="utf-8")

In [None]:
#textfile.write(textformat)

In [None]:
#textfile.close()

***

#### Coded and submitted by Dennis Lam 2021