In [1]:
# Import Dependencies
import pandas as pd
import re
from collections import Counter

In [2]:
# Grabbing stored Reddit Data files
date = '2021-06-10'
subreddit_list = ['askmen', 'askscience', 'askwomen', 'confession', 
                  'fitness', 'food', 'gaming', 'jokes', 'letstalkmusic', 
                  'lifeprotips', 'machinelearning', 'math', 
                  'relationships', 'roastme', 'science', 'sex', 
                  'therapy', 'todayilearned', 'totallynotrobots', 
                  'travel', 'wouldyourather', 'writingprompts', 'zen']

file_name_list = []

for subreddit in subreddit_list:
    file_name = date + '_' + subreddit + '.csv'
    file_name_list.append(file_name)

In [3]:
# Loading stored Reddit Data files
list_df = []
for file_name in file_name_list:
    df = pd.read_csv(file_name, index_col=None, header=0)
    list_df.append(df)

    
raw_reddit_data = pd.concat(list_df, axis=0, ignore_index=True)

In [4]:
raw_reddit_data

Unnamed: 0,Post_ID,Post,Comment,Score
0,4biemc,Basically it goes like this. Somebody posts a...,"[Today, our commenters were pretty cool guys](...",16629
1,4r1sqx,"She claims she thought her stuff was ""too girl...","Read the bottle - if it says ""shower gel"" or ""...",6458
2,5bvh8n,"Thanks, and have a good day.",[The mods' feelings about any posts/comments r...,5744
3,6a0lns,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...,1875
4,6kfzpq,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...,25849
...,...,...,...,...
5503,nj95cc,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...,46
5504,xy322,http://i.imgur.com/jqyhw.jpg It's more about t...,zen is the most simple belief set out there: i...,16
5505,y8325,"We have very few submissions, but quite a lot ...",deleted ^^^^^^^^^^^^^^^^0.6321gone94407),21
5506,y9swt,"Posters to r/Zen, please - terse Zen-like sayi...","Definitely agree with this. A lot of the ""ridd...",31


In [5]:
# Selecting Post and Comment into (comment/reply) pair
reddit_data = raw_reddit_data[['Post', 'Comment']]

In [6]:
# Renaming columns
old_columns = ['Post', 'Comment']
new_columns = ['Comment', 'Reply']
reddit_data = reddit_data.rename(dict(zip(old_columns, new_columns)), 
                                 axis='columns')

In [7]:
reddit_data

Unnamed: 0,Comment,Reply
0,Basically it goes like this. Somebody posts a...,"[Today, our commenters were pretty cool guys](..."
1,"She claims she thought her stuff was ""too girl...","Read the bottle - if it says ""shower gel"" or ""..."
2,"Thanks, and have a good day.",[The mods' feelings about any posts/comments r...
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...
...,...,...
5503,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...
5504,http://i.imgur.com/jqyhw.jpg It's more about t...,zen is the most simple belief set out there: i...
5505,"We have very few submissions, but quite a lot ...",deleted ^^^^^^^^^^^^^^^^0.6321gone94407)
5506,"Posters to r/Zen, please - terse Zen-like sayi...","Definitely agree with this. A lot of the ""ridd..."


In [8]:
# Cleaning text in reddit data
reddit_data['Comment'] = reddit_data['Comment'].apply(lambda x: ' '.join(str(x).split()))
reddit_data['Reply'] = reddit_data['Reply'].apply(lambda x: ' '.join(str(x).split()))

In [9]:
reddit_data

Unnamed: 0,Comment,Reply
0,Basically it goes like this. Somebody posts a ...,"[Today, our commenters were pretty cool guys](..."
1,"She claims she thought her stuff was ""too girl...","Read the bottle - if it says ""shower gel"" or ""..."
2,"Thanks, and have a good day.",[The mods' feelings about any posts/comments r...
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...
...,...,...
5503,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...
5504,http://i.imgur.com/jqyhw.jpg It's more about t...,zen is the most simple belief set out there: i...
5505,"We have very few submissions, but quite a lot ...",deleted ^^^^^^^^^^^^^^^^0.6321gone94407)
5506,"Posters to r/Zen, please - terse Zen-like sayi...","Definitely agree with this. A lot of the ""ridd..."


In [10]:
# Retaining only alphabet, numbers and /.':?!,
reddit_data['Comment'] = reddit_data['Comment'].str.replace("[^a-zA-Z0-9/.':?!,]", ' ')
reddit_data['Reply'] = reddit_data['Reply'].str.replace("[^a-zA-Z0-9/.':?!,]", ' ')

In [11]:
reddit_data

Unnamed: 0,Comment,Reply
0,Basically it goes like this. Somebody posts a ...,"Today, our commenters were pretty cool guys ..."
1,She claims she thought her stuff was too girl...,Read the bottle if it says shower gel or ...
2,"Thanks, and have a good day.",The mods' feelings about any posts/comments r...
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...
...,...,...
5503,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...
5504,http://i.imgur.com/jqyhw.jpg It's more about t...,zen is the most simple belief set out there: i...
5505,"We have very few submissions, but quite a lot ...",deleted 0.6321gone94407
5506,"Posters to r/Zen, please terse Zen like sayi...",Definitely agree with this. A lot of the ridd...


In [12]:
reddit_data['Reply'][0]

' Today, our commenters were pretty cool guys  http://imgur.com/HcR1Opd '

In [13]:
# Recleaning text in reddit data
reddit_data['Comment'] = reddit_data['Comment'].apply(lambda x: ' '.join(str(x).split()))
reddit_data['Reply'] = reddit_data['Reply'].apply(lambda x: ' '.join(str(x).split()))

In [14]:
reddit_data['Reply'][0]

'Today, our commenters were pretty cool guys http://imgur.com/HcR1Opd'

In [15]:
# Removing links
reddit_data['Comment'] = reddit_data['Comment'].str.replace('https:\/\/.*', '')
reddit_data['Comment'] = reddit_data['Comment'].str.replace('https:\/\/*.*/*', '')
reddit_data['Comment'] = reddit_data['Comment'].str.replace('http:\/\/.*', '')
reddit_data['Comment'] = reddit_data['Comment'].str.replace('http:\/\/*.*/*', '')
reddit_data['Reply'] = reddit_data['Reply'].str.replace('https:\/\/.*', '')
reddit_data['Reply'] = reddit_data['Reply'].str.replace('https:\/\/*.*/*', '')
reddit_data['Reply'] = reddit_data['Reply'].str.replace('http:\/\/.*', '')
reddit_data['Reply'] = reddit_data['Reply'].str.replace('http:\/\/*.*/*', '')

In [16]:
reddit_data['Reply'][0]

'Today, our commenters were pretty cool guys '

In [17]:
# Recleaning text in reddit data
reddit_data['Comment'] = reddit_data['Comment'].apply(lambda x: ' '.join(str(x).split()))
reddit_data['Reply'] = reddit_data['Reply'].apply(lambda x: ' '.join(str(x).split()))

In [18]:
reddit_data['Reply'][0]

'Today, our commenters were pretty cool guys'

In [19]:
reddit_data

Unnamed: 0,Comment,Reply
0,Basically it goes like this. Somebody posts a ...,"Today, our commenters were pretty cool guys"
1,She claims she thought her stuff was too girly...,Read the bottle if it says shower gel or body ...
2,"Thanks, and have a good day.",The mods' feelings about any posts/comments re...
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...
...,...,...
5503,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...
5504,,zen is the most simple belief set out there: i...
5505,"We have very few submissions, but quite a lot ...",deleted 0.6321gone94407
5506,"Posters to r/Zen, please terse Zen like saying...",Definitely agree with this. A lot of the riddl...


In [20]:
reddit_data['Reply'][5505]

'deleted 0.6321gone94407'

In [21]:
# Filtering alphanumeric words
reddit_data['Comment'] = reddit_data['Comment'].str.replace("[a-zA-Z]*\d+[a-zA-Z]+|[a-zA-Z]+\d+[a-zA-Z]*", '')
reddit_data['Reply'] = reddit_data['Reply'].str.replace("[a-zA-Z]*\d+[a-zA-Z]+|[a-zA-Z]+\d+[a-zA-Z]*", '')

In [22]:
reddit_data

Unnamed: 0,Comment,Reply
0,Basically it goes like this. Somebody posts a ...,"Today, our commenters were pretty cool guys"
1,She claims she thought her stuff was too girly...,Read the bottle if it says shower gel or body ...
2,"Thanks, and have a good day.",The mods' feelings about any posts/comments re...
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...
...,...,...
5503,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...
5504,,zen is the most simple belief set out there: i...
5505,"We have very few submissions, but quite a lot ...",deleted 0.94407
5506,"Posters to r/Zen, please terse Zen like saying...",Definitely agree with this. A lot of the riddl...


In [23]:
# Removing cleaned empty posts and comments
empty_comments = reddit_data['Comment'] != ""
empty_replies = reddit_data['Reply'] != ""
reddit_data = reddit_data[empty_comments & empty_replies]

In [24]:
reddit_data

Unnamed: 0,Comment,Reply
0,Basically it goes like this. Somebody posts a ...,"Today, our commenters were pretty cool guys"
1,She claims she thought her stuff was too girly...,Read the bottle if it says shower gel or body ...
2,"Thanks, and have a good day.",The mods' feelings about any posts/comments re...
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...
...,...,...
5502,I never posted here and mostly just lurk occas...,This is how the place has always been. There a...
5503,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...
5505,"We have very few submissions, but quite a lot ...",deleted 0.94407
5506,"Posters to r/Zen, please terse Zen like saying...",Definitely agree with this. A lot of the riddl...


In [25]:
reddit_data['Comment'][7]

'This is more for those who built their own wealth instead of those who were born into it. I m wondering as your wealth grew, or you became rich , what changes occurred that you did not expect? EDIT: I m getting a lot of what about wealthy women? questions. I just want to say, I am asking males because I m a male myself so I feel their experiences to be more relatable, this is the r/askmen sub and you are very free to ask women the same question on the r/askwomen sub. No sexist intentions, just find males more relatable in this context.'

In [26]:
reddit_data['Reply'][7]

'Things haven t changed much for me. Neither friends nor family hit me up for money. I dress like a slob. I only work when I want to but that has gotten me complacent. Women don t throw themselves at me nor do I think they re after my money. I travel a lot. I almost never cook for myself. I default to ordering in or picking up fast food. I love fancy restaurants. I still struggle to spend money on some things. And yet on other things, I ll drop thousands of dollars without blinking. The biggest change for me has been motivation. I used to love working and now I m struggling to be excited about anything. The biggest challenge is teaching my kids how to be self sufficient. I had house cleaners and cancelled the service. We do our own house chores. I do my own yard work. I still want them to have pride in ownership and recognize that there isn t a magical money tree.'

In [27]:
len(reddit_data['Comment'][0].split())

34

In [28]:
reddit_data

Unnamed: 0,Comment,Reply
0,Basically it goes like this. Somebody posts a ...,"Today, our commenters were pretty cool guys"
1,She claims she thought her stuff was too girly...,Read the bottle if it says shower gel or body ...
2,"Thanks, and have a good day.",The mods' feelings about any posts/comments re...
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...
...,...,...
5502,I never posted here and mostly just lurk occas...,This is how the place has always been. There a...
5503,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...
5505,"We have very few submissions, but quite a lot ...",deleted 0.94407
5506,"Posters to r/Zen, please terse Zen like saying...",Definitely agree with this. A lot of the riddl...


In [29]:
polls = reddit_data[reddit_data['Comment'] == "View Poll"]

In [30]:
polls

Unnamed: 0,Comment,Reply
4855,View Poll,If you were able to air bend would you just su...
4858,View Poll,"When in doubt, go with C."
4860,View Poll,I would master learning everything faster.
4862,View Poll,What I like about the poll is that you get a r...
4863,View Poll,My 8 hour job everyday would just be walking. ...
...,...,...
5279,View Poll,I'm currently eighteen so... Where's my cash
5280,View Poll,I m someone who is terrible at making quick de...
5282,View Poll,so I can sell and buy a lite switch and a ton...
5284,View Poll,"While mental health is important, it doesn t k..."


In [31]:
reddit_data = reddit_data.drop(list(polls.index))

In [32]:
reddit_data

Unnamed: 0,Comment,Reply
0,Basically it goes like this. Somebody posts a ...,"Today, our commenters were pretty cool guys"
1,She claims she thought her stuff was too girly...,Read the bottle if it says shower gel or body ...
2,"Thanks, and have a good day.",The mods' feelings about any posts/comments re...
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...
...,...,...
5502,I never posted here and mostly just lurk occas...,This is how the place has always been. There a...
5503,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...
5505,"We have very few submissions, but quite a lot ...",deleted 0.94407
5506,"Posters to r/Zen, please terse Zen like saying...",Definitely agree with this. A lot of the riddl...


In [33]:
reddit_data['Comment_Length'] = reddit_data['Comment'].apply(lambda x: len(x.split()))
reddit_data['Reply_Length'] = reddit_data['Reply'].apply(lambda x: len(x.split()))

In [34]:
comment_less_than_2 = reddit_data[reddit_data['Comment_Length'] < 2]

In [35]:
reddit_data = reddit_data.drop(list(comment_less_than_2.index))

In [36]:
reddit_data

Unnamed: 0,Comment,Reply,Comment_Length,Reply_Length
0,Basically it goes like this. Somebody posts a ...,"Today, our commenters were pretty cool guys",34,7
1,She claims she thought her stuff was too girly...,Read the bottle if it says shower gel or body ...,79,81
2,"Thanks, and have a good day.",The mods' feelings about any posts/comments re...,6,9
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...,7,13
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...,384,17
...,...,...,...,...
5502,I never posted here and mostly just lurk occas...,This is how the place has always been. There a...,168,15
5503,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...,272,19
5505,"We have very few submissions, but quite a lot ...",deleted 0.94407,145,2
5506,"Posters to r/Zen, please terse Zen like saying...",Definitely agree with this. A lot of the riddl...,90,218


In [37]:
comment_less_than_3 = reddit_data[reddit_data['Comment_Length'] < 3]

In [38]:
reddit_data = reddit_data.drop(list(comment_less_than_3.index))

In [39]:
reddit_data

Unnamed: 0,Comment,Reply,Comment_Length,Reply_Length
0,Basically it goes like this. Somebody posts a ...,"Today, our commenters were pretty cool guys",34,7
1,She claims she thought her stuff was too girly...,Read the bottle if it says shower gel or body ...,79,81
2,"Thanks, and have a good day.",The mods' feelings about any posts/comments re...,6,9
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...,7,13
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...,384,17
...,...,...,...,...
5502,I never posted here and mostly just lurk occas...,This is how the place has always been. There a...,168,15
5503,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...,272,19
5505,"We have very few submissions, but quite a lot ...",deleted 0.94407,145,2
5506,"Posters to r/Zen, please terse Zen like saying...",Definitely agree with this. A lot of the riddl...,90,218


In [40]:
reddit_data[reddit_data['Reply_Length'] < 2]

Unnamed: 0,Comment,Reply,Comment_Length,Reply_Length
696,Edit: my inbox is mega full. You guys seriousl...,Pho,30,1
772,Edit: Wow! I didn t even think this would blow...,r/wholesomeconfessions,58,1
780,She doesn t have much time to get new ones so ...,r/wholesomeconfessions,57,1
800,"He always left his Locker unlocked, I decided ...",Nice!,15,1
1289,Here's the article:,Picture,3,1
1392,I lost over 200 pounds in about 2 years. Peopl...,deleted,860,1
1421,I run about 5 7 miles once a week for cardio a...,nope,127,1
1519,NYT article: Why Everything We Know About Salt...,.,11,1
1540,"Hello, i was always curious about what are som...",Pullups,31,1
1599,"Started my fitness journey back in June 24, 20...",REGILOUSLY,31,1


In [41]:
reddit_data = reddit_data.drop([1519, 1392, 5505, 431, 3267])

In [42]:
reddit_data

Unnamed: 0,Comment,Reply,Comment_Length,Reply_Length
0,Basically it goes like this. Somebody posts a ...,"Today, our commenters were pretty cool guys",34,7
1,She claims she thought her stuff was too girly...,Read the bottle if it says shower gel or body ...,79,81
2,"Thanks, and have a good day.",The mods' feelings about any posts/comments re...,6,9
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...,7,13
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...,384,17
...,...,...,...,...
5501,Suddenly becoming aware of your true nature wo...,"That's not really what enlightenment is about,...",85,241
5502,I never posted here and mostly just lurk occas...,This is how the place has always been. There a...,168,15
5503,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...,272,19
5506,"Posters to r/Zen, please terse Zen like saying...",Definitely agree with this. A lot of the riddl...,90,218


In [43]:
reddit_data['Comment'].describe()

count                       4895
unique                      4837
top       Link to original post:
freq                           9
Name: Comment, dtype: object

In [44]:
link_to_orig_post = reddit_data[reddit_data['Comment'] == "Link to original post"]
link_to_orig_post_2 = reddit_data[reddit_data['Comment'] == "Link to original post:"]
link_to_orig_post_3 = reddit_data[reddit_data['Comment'] == "Link to original post."]
link_to_orig_post_4 = reddit_data[reddit_data['Comment'] == "Link to original:"]
link_to_orig_post_5 = reddit_data[reddit_data['Comment'] == "Link to original"]
link_to_orig_post_6 = reddit_data[reddit_data['Comment'] == "Link to original."]
link_to_orig_post_7 = reddit_data[reddit_data['Comment'] == "Original Post here"]
link_to_orig_post_8 = reddit_data[reddit_data['Comment'] == "Here is the original post."]
orig_post_here = reddit_data[reddit_data['Comment'] == "Original post here"]
orig_post_here_2 = reddit_data[reddit_data['Comment'] == "Original post here:"]
link_to_prev_post = reddit_data[reddit_data['Comment'] == "Link to previous post:"]
removed_by_reddit = reddit_data[reddit_data['Comment'].str.contains('Removed by reddit')]
duplicates_1 = reddit_data[reddit_data['Comment'].str.contains('previous 101 posts right')]
wrong_sub = reddit_data[reddit_data['Comment'].str.contains('Whoops, wrong sub')]
link_to_article = reddit_data[reddit_data['Comment'].str.contains('Link to article')]
welcome_to_sub = reddit_data[reddit_data['Reply'].str.contains('Hello and welcome to')]
welcome_to_sub_2 = reddit_data[reddit_data['Reply'].str.contains('Welcome to the Prompt')]
this_thread_is_tagged = reddit_data[reddit_data['Reply'].str.contains('This thread has been tagged')]
off_topic = reddit_data[reddit_data['Reply'].str.contains('Off Topic Discussion :')]
repeating_topic = reddit_data[reddit_data['Reply'].str.contains('This topic comes up')]


In [45]:
reddit_data = reddit_data.drop(list(link_to_orig_post.index))
reddit_data = reddit_data.drop(list(link_to_orig_post_2.index))
reddit_data = reddit_data.drop(list(link_to_orig_post_3.index))
reddit_data = reddit_data.drop(list(link_to_orig_post_4.index))
reddit_data = reddit_data.drop(list(link_to_orig_post_5.index))
reddit_data = reddit_data.drop(list(link_to_orig_post_6.index))
reddit_data = reddit_data.drop(list(link_to_orig_post_7.index))
reddit_data = reddit_data.drop(list(link_to_orig_post_8.index))
reddit_data = reddit_data.drop(list(orig_post_here.index))
reddit_data = reddit_data.drop(list(orig_post_here_2.index))
reddit_data = reddit_data.drop(list(link_to_prev_post.index))
reddit_data = reddit_data.drop(list(removed_by_reddit.index))
reddit_data = reddit_data.drop(list(duplicates_1.index))
reddit_data = reddit_data.drop(list(wrong_sub.index))
reddit_data = reddit_data.drop(list(welcome_to_sub.index))
reddit_data = reddit_data.drop(list(welcome_to_sub_2.index))
reddit_data = reddit_data.drop(list(link_to_article.index))
reddit_data = reddit_data.drop(list(this_thread_is_tagged.index))
reddit_data = reddit_data.drop(list(off_topic.index))
reddit_data = reddit_data.drop(list(repeating_topic.index))

In [46]:
reddit_data['Comment'].describe()

count                                                  4740
unique                                                 4729
top       She said, Yes, the others were at least sevens...
freq                                                      2
Name: Comment, dtype: object

In [47]:
reddit_data['Reply'].describe()

count           4740
unique          4738
top       Thank you.
freq               2
Name: Reply, dtype: object

In [48]:
[k for (k,v) in Counter(reddit_data['Comment']).items() if v > 1]

['Before and After',
 'Jane explained to him what it was. Tarzan said, Ohhh...Tarzan use knot hole in trunk of tree. Horrified, Jane said, Tarzan, you have it all wrong, but I will show you how to do it properly. She took off her clothing and lay down on the ground. Here. she said, pointing to her privates. You must put it in here. Tarzan removed his loin cloth, showing Jane his considerable manhood, stepped closer to her and kicked her right in the crotch! Jane rolled around in agony for what seemed like an eternity. Eventually, she managed to gasp for air and screamed, What did you do that for?! Tarzan replied, Check for squirrel.',
 'School is my answer',
 'I told her we use names here.',
 'So I took down his confederate flag.',
 "A few days ago I was talking to some friends, and friends of those friends, at a bar. I decided to break the ice with the new friends with a few jokes, most of which went down very well...until I decided to tell a few more offensive ones...and picked the w

In [52]:
reddit_data = reddit_data.reset_index()

In [55]:
reddit_data = reddit_data.drop(columns='index')

In [56]:
reddit_data

Unnamed: 0,Comment,Reply,Comment_Length,Reply_Length
0,Basically it goes like this. Somebody posts a ...,"Today, our commenters were pretty cool guys",34,7
1,She claims she thought her stuff was too girly...,Read the bottle if it says shower gel or body ...,79,81
2,"Thanks, and have a good day.",The mods' feelings about any posts/comments re...,6,9
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...,7,13
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...,384,17
...,...,...,...,...
4735,Suddenly becoming aware of your true nature wo...,"That's not really what enlightenment is about,...",85,241
4736,I never posted here and mostly just lurk occas...,This is how the place has always been. There a...,168,15
4737,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...,272,19
4738,"Posters to r/Zen, please terse Zen like saying...",Definitely agree with this. A lot of the riddl...,90,218


In [58]:
reddit_data_processed = reddit_data[['Comment', 'Reply']]

In [59]:
reddit_data_processed

Unnamed: 0,Comment,Reply
0,Basically it goes like this. Somebody posts a ...,"Today, our commenters were pretty cool guys"
1,She claims she thought her stuff was too girly...,Read the bottle if it says shower gel or body ...
2,"Thanks, and have a good day.",The mods' feelings about any posts/comments re...
3,"Kidding. Relax. It's next Sunday, don't forget.",HAHAHA PSYCH YOU TOTALLY GOT US ALL OP YOU'RE ...
4,Background story: I've been dating my current ...,The moral of the story is: Work up an appetite...
...,...,...
4735,Suddenly becoming aware of your true nature wo...,"That's not really what enlightenment is about,..."
4736,I never posted here and mostly just lurk occas...,This is how the place has always been. There a...
4737,It feels like a good percentage of this sub is...,right now the only thing i see on this subredd...
4738,"Posters to r/Zen, please terse Zen like saying...",Definitely agree with this. A lot of the riddl...
