In [21]:
import pandas as pd
import os
from glob import glob
from nrclex import NRCLex
import moralstrength as ms
from tqdm import tqdm
from sentistrength import PySentiStr
from time import time

In [17]:
def load_reddit(path):
    """Read a Reddit CSV export and add a combined ``full_text`` column.

    Parameters
    ----------
    path : str or path-like
        Location of a CSV file that has ``title`` and ``text`` columns.

    Returns
    -------
    pandas.DataFrame
        The parsed file plus ``full_text``: the title and the body joined
        with a single space, with surrounding whitespace stripped.
        A missing title or body contributes an empty string.
    """
    df = pd.read_csv(path)
    # Blank out missing values *before* joining. Filling after the join
    # is too late: a missing title makes the whole concatenation NaN (so
    # the body text would be thrown away), and casting a missing body
    # with astype(str) first would inject the literal word "nan".
    title = df["title"].fillna('').astype(str)
    text = df["text"].fillna('').astype(str)
    # strip() removes the dangling separator left when one side is empty.
    df["full_text"] = title.str.cat(text, sep=' ').str.strip()
    return df

In [18]:
def sentiment_ms(df, scorer=None, show_progress=True):
    """Add one moral-foundation score column per trait to ``df``.

    Every value of ``df['full_text']`` is passed to ``scorer`` and the
    returned mapping is spread over the columns ``care``, ``fairness``,
    ``loyalty``, ``authority``, ``purity`` and ``non_moral`` (the last one
    is read from the ``'non-moral'`` key of the mapping).

    Parameters
    ----------
    df : pandas.DataFrame
        Must contain a ``full_text`` column. It is modified in place: its
        index is reset to 0..n-1 and the score columns are added or
        overwritten.
    scorer : callable, optional
        ``scorer(text)`` must return a mapping with the six keys listed
        above. Defaults to ``ms.string_moral_values``.
    show_progress : bool, optional
        Wrap the row iteration in a ``tqdm`` progress bar (default True).

    Returns
    -------
    pandas.DataFrame
        The same ``df`` object that was passed in.
    """
    # Output column name -> key in the mapping returned by the scorer.
    column_keys = {
        'care': 'care',
        'fairness': 'fairness',
        'loyalty': 'loyalty',
        'authority': 'authority',
        'purity': 'purity',
        'non_moral': 'non-moral',
    }
    if scorer is None:
        scorer = ms.string_moral_values

    df.reset_index(drop=True, inplace=True)

    texts = df['full_text']
    if show_progress:
        texts = tqdm(texts)

    # Score each row exactly once and assign whole columns afterwards.
    # Seeding integer columns with 0 and then writing scores cell by cell
    # through .loc depends on implicit dtype upcasting and is slow.
    records = [scorer(text) for text in texts]
    for column, key in column_keys.items():
        df[column] = [record[key] for record in records]
    return df

def sentiment_nrc(df, scorer=None, show_progress=True):
    """Add NRC emotion-lexicon frequency columns to ``df``.

    Missing ``full_text`` values are replaced by ``""``, each text is
    passed to ``scorer`` and the returned frequencies are stored in the
    columns ``fear``, ``anger``, ``anticip``, ``trust``, ``surprise``,
    ``positive``, ``negative``, ``sadness``, ``disgust`` and ``joy``.

    Parameters
    ----------
    df : pandas.DataFrame
        Must contain a ``full_text`` column. It is modified in place: its
        index is reset to 0..n-1 and the emotion columns are added or
        overwritten.
    scorer : callable, optional
        ``scorer(text)`` must return a mapping of emotion name to
        frequency. Defaults to ``NRCLex(text).affect_frequencies``.
    show_progress : bool, optional
        Wrap the row iteration in a ``tqdm`` progress bar (default True).

    Returns
    -------
    pandas.DataFrame
        The same ``df`` object that was passed in.
    """
    emotions = ('fear', 'anger', 'anticip', 'trust', 'surprise',
                'positive', 'negative', 'sadness', 'disgust', 'joy')
    if scorer is None:
        def scorer(text):
            return NRCLex(text).affect_frequencies

    df['full_text'] = df['full_text'].fillna("")
    df.reset_index(drop=True, inplace=True)

    texts = df['full_text']
    if show_progress:
        texts = tqdm(texts)

    def _frequency(freqs, emotion):
        # NOTE(review): NRCLex appears to pre-seed an 'anticip' key with
        # 0.0 but report the measured value under 'anticipation', so
        # reading only 'anticip' would always give 0.0. Prefer the full
        # key and fall back to the short one - confirm against the
        # installed NRCLex version.
        if emotion == 'anticip':
            return freqs.get('anticipation', freqs.get('anticip', 0.0))
        return freqs[emotion]

    # Score each row once, then assign whole columns instead of writing
    # floats cell by cell into integer-initialised columns.
    records = [scorer(text) for text in texts]
    for emotion in emotions:
        df[emotion] = [_frequency(record, emotion) for record in records]
    return df

def sentiment_sentistrength(df,
                            jar_path='/Users/prady/softwares/SentiStrengthCom.jar',
                            language_folder='/Users/prady/softwares/SentStrength_Data_Sept2011/',
                            senti=None):
    """Add SentiStrength trinary scores for ``df['full_text']``.

    Parameters
    ----------
    df : pandas.DataFrame
        Must contain a ``full_text`` column. It is modified in place:
        empty or missing texts are replaced by a single space and the
        columns ``sentistrength_pos``, ``sentistrength_neg`` and
        ``sentistrength_neutral`` are added or overwritten.
    jar_path : str, optional
        Location of the SentiStrength jar. The default is the path that
        used to be hard-coded here; pass your own on other machines.
    language_folder : str, optional
        Location of the SentiStrength language data folder (same remark).
    senti : object, optional
        An already configured client exposing
        ``getSentiment(texts, score=...)``. When given, ``jar_path`` and
        ``language_folder`` are ignored, which lets callers configure one
        client and reuse it for many frames.

    Returns
    -------
    pandas.DataFrame
        The same ``df`` object that was passed in.
    """
    score_columns = ("sentistrength_pos", "sentistrength_neg", "sentistrength_neutral")

    # Nothing to score: add the (empty) columns without starting the tool.
    if len(df) == 0:
        for column in score_columns:
            df[column] = []
        return df

    if senti is None:
        senti = PySentiStr()
        senti.setSentiStrengthPath(jar_path)
        senti.setSentiStrengthLanguageFolderPath(language_folder)

    # Empty strings are swapped for a single space, as before; missing
    # values get the same treatment so that only strings are handed over.
    # NOTE(review): presumably a blank entry would otherwise produce no
    # result row and shift the scores - confirm with the PySentiStr docs.
    df["full_text"] = [" " if pd.isna(t) or t == "" else t for t in df['full_text']]

    result = senti.getSentiment(df["full_text"], score='trinary')
    # Each result is indexed positionally; the third trinary value is
    # stored under the existing "neutral" column name.
    for position, column in enumerate(score_columns):
        df[column] = [r[position] for r in result]
    return df

In [22]:
# Root folder that is searched recursively for CSV files.
reddit_dir = '../../rawdata/'

# Every '*.csv' found in any folder below the root, except paths that
# contain the substring 'comment'.
reddit_list = [
    csv_path
    for folder, _subdirs, _files in os.walk(reddit_dir)
    for csv_path in glob(os.path.join(folder, '*.csv'))
    if 'comment' not in csv_path
]

# Annotate each file with all three scorers and write the result back
# over the file it was read from.
for j, r in enumerate(reddit_list):
    print(f"{j + 1} out of {len(reddit_list)}")
    print(r)
    t0 = time()
    df = load_reddit(r)
    # Order matters only in that sentiment_nrc blanks missing texts first.
    for annotate in (sentiment_nrc, sentiment_ms, sentiment_sentistrength):
        df = annotate(df)
    df.to_csv(r, index=False, index_label=False)
    print(f"completed in {time() - t0}")

  1%|▏         | 13/916 [00:00<00:07, 122.79it/s]

1 out of 50
../../rawdata/Venturecapital/venturecapital_hot.csv


100%|██████████| 916/916 [00:05<00:00, 169.68it/s]
100%|██████████| 916/916 [02:20<00:00,  6.51it/s]
  2%|▏         | 18/991 [00:00<00:05, 176.35it/s]

completed in 147.50815391540527
2 out of 50
../../rawdata/Venturecapital/venturecapital_top.csv


100%|██████████| 991/991 [00:05<00:00, 194.50it/s]
100%|██████████| 991/991 [02:39<00:00,  6.21it/s]
  2%|▏         | 17/988 [00:00<00:06, 158.99it/s]

completed in 165.68257689476013
3 out of 50
../../rawdata/Venturecapital/venturecapital_new.csv


100%|██████████| 988/988 [00:05<00:00, 192.16it/s]
100%|██████████| 988/988 [02:36<00:00,  6.31it/s]
100%|██████████| 24/24 [00:00<00:00, 145.94it/s]
  0%|          | 0/24 [00:00<?, ?it/s]

completed in 162.76311802864075
4 out of 50
../../rawdata/Venturecapital/venturecapital_rising.csv


100%|██████████| 24/24 [00:04<00:00,  5.62it/s]
  2%|▏         | 16/924 [00:00<00:05, 156.71it/s]

completed in 4.77788519859314
5 out of 50
../../rawdata/Venturecapital/venturecapital_controversial.csv


100%|██████████| 924/924 [00:04<00:00, 186.93it/s]
100%|██████████| 924/924 [02:34<00:00,  5.99it/s]
  1%|▏         | 13/992 [00:00<00:07, 126.19it/s]

completed in 160.34686303138733
6 out of 50
../../rawdata/Startups/startups_controversial.csv


100%|██████████| 992/992 [00:07<00:00, 126.42it/s]
  np.exp(prob, prob)
100%|██████████| 992/992 [05:39<00:00,  2.93it/s]
100%|██████████| 16/16 [00:00<00:00, 105.39it/s]
  0%|          | 0/16 [00:00<?, ?it/s]

completed in 348.46965980529785
7 out of 50
../../rawdata/Startups/startups_rising.csv


100%|██████████| 16/16 [00:05<00:00,  2.70it/s]
  1%|▏         | 6/438 [00:00<00:07, 57.05it/s]

completed in 6.4671690464019775
8 out of 50
../../rawdata/Startups/startups_hot.csv


100%|██████████| 438/438 [00:03<00:00, 113.86it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 438/438 [03:33<00:00,  2.05it/s]
  1%|          | 7/872 [00:00<00:14, 61.05it/s]

completed in 218.8126471042633
9 out of 50
../../rawdata/Startups/startups_new.csv


100%|██████████| 872/872 [00:07<00:00, 122.42it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 872/872 [06:58<00:00,  2.08it/s]
  0%|          | 0/999 [00:00<?, ?it/s]

completed in 427.7185649871826
10 out of 50
../../rawdata/Startups/startups_top.csv


100%|██████████| 999/999 [00:14<00:00, 70.74it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 999/999 [17:25<00:00,  1.05s/it]
100%|██████████| 23/23 [00:00<00:00, 182.41it/s]
  0%|          | 0/23 [00:00<?, ?it/s]

completed in 1063.315551996231
11 out of 50
../../rawdata/Entrepreneurship/entrepreneurship_rising.csv


100%|██████████| 23/23 [00:02<00:00,  8.71it/s]
  2%|▏         | 18/934 [00:00<00:05, 175.54it/s]

completed in 3.0897998809814453
12 out of 50
../../rawdata/Entrepreneurship/entrepreneurship_hot.csv


100%|██████████| 934/934 [00:05<00:00, 174.03it/s]
  np.exp(prob, prob)
100%|██████████| 934/934 [03:02<00:00,  5.11it/s]
  2%|▏         | 20/998 [00:00<00:04, 195.67it/s]

completed in 189.23744583129883
13 out of 50
../../rawdata/Entrepreneurship/entrepreneurship_top.csv


100%|██████████| 998/998 [00:09<00:00, 105.45it/s]
  np.exp(prob, prob)
100%|██████████| 998/998 [05:24<00:00,  3.08it/s]
  2%|▏         | 17/1000 [00:00<00:05, 165.27it/s]

completed in 335.22205424308777
14 out of 50
../../rawdata/Entrepreneurship/entrepreneurship_controversial.csv


100%|██████████| 1000/1000 [00:06<00:00, 161.05it/s]
  np.exp(prob, prob)
100%|██████████| 1000/1000 [03:18<00:00,  5.04it/s]
  2%|▏         | 19/855 [00:00<00:04, 179.78it/s]

completed in 205.6031517982483
15 out of 50
../../rawdata/Entrepreneurship/entrepreneurship_new.csv


100%|██████████| 855/855 [00:04<00:00, 188.17it/s]
  np.exp(prob, prob)
100%|██████████| 855/855 [02:56<00:00,  4.84it/s]
  0%|          | 0/982 [00:00<?, ?it/s]

completed in 182.32005190849304
16 out of 50
../../rawdata/EntrepreneurRideAlong/EntrepreneurRideAlong_controversial.csv


100%|██████████| 982/982 [00:12<00:00, 81.13it/s] 
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 982/982 [15:03<00:00,  1.09it/s]
  0%|          | 0/952 [00:00<?, ?it/s

completed in 919.2850480079651
17 out of 50
../../rawdata/EntrepreneurRideAlong/EntrepreneurRideAlong_hot.csv


100%|██████████| 952/952 [00:21<00:00, 44.73it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)


  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 952/952 [20:05<00:00,  1.27s/it]
 33%|███▎      | 7/21 [00:00<00:00, 54.29it/s]

completed in 1230.4275200366974
18 out of 50
../../rawdata/EntrepreneurRideAlong/EntrepreneurRideAlong_rising.csv


100%|██████████| 21/21 [00:00<00:00, 36.16it/s]
  np.exp(prob, prob)
100%|██████████| 21/21 [00:33<00:00,  1.59s/it]
  0%|          | 0/923 [00:00<?, ?it/s]

completed in 34.481842041015625
19 out of 50
../../rawdata/EntrepreneurRideAlong/EntrepreneurRideAlong_new.csv


100%|██████████| 923/923 [00:18<00:00, 50.16it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)


  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 923/923 [20:07<00:00,  1.31s/it]


completed in 1229.312996149063
20 out of 50
../../rawdata/EntrepreneurRideAlong/EntrepreneurRideAlong_top.csv


100%|██████████| 993/993 [00:21<00:00, 46.75it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)


  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)


  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 993/993 [27:43<00:00,  1.68s/it]
  2%|▏         | 21/1000 [00:00<00:04, 205.78it/s]

completed in 1689.6086840629578
21 out of 50
../../rawdata/Business/business_controversial.csv


100%|██████████| 1000/1000 [00:04<00:00, 216.01it/s]
100%|██████████| 1000/1000 [01:28<00:00, 11.30it/s]
100%|██████████| 23/23 [00:00<00:00, 208.10it/s]
  0%|          | 0/23 [00:00<?, ?it/s]

completed in 93.84876799583435
22 out of 50
../../rawdata/Business/business_rising.csv


100%|██████████| 23/23 [00:01<00:00, 12.29it/s]
 11%|█         | 16/149 [00:00<00:00, 154.24it/s]

completed in 2.3542888164520264
23 out of 50
../../rawdata/Business/business_new.csv


100%|██████████| 149/149 [00:00<00:00, 180.19it/s]
100%|██████████| 149/149 [00:23<00:00,  6.29it/s]
  2%|▏         | 20/994 [00:00<00:04, 198.37it/s]

completed in 24.99462127685547
24 out of 50
../../rawdata/Business/business_top.csv


100%|██████████| 994/994 [00:04<00:00, 209.47it/s]
100%|██████████| 994/994 [01:22<00:00, 12.00it/s]
  9%|▊         | 20/234 [00:00<00:01, 188.16it/s]

completed in 88.26550817489624
25 out of 50
../../rawdata/Business/business_hot.csv


100%|██████████| 234/234 [00:01<00:00, 189.48it/s]
100%|██████████| 234/234 [00:37<00:00,  6.18it/s]
 29%|██▉       | 7/24 [00:00<00:00, 68.72it/s]

completed in 39.93836498260498
26 out of 50
../../rawdata/Smallbusiness/smallbusiness_rising.csv


100%|██████████| 24/24 [00:00<00:00, 96.91it/s]
100%|██████████| 24/24 [00:11<00:00,  2.04it/s]
  2%|▏         | 15/1000 [00:00<00:06, 142.30it/s]

completed in 12.465172052383423
27 out of 50
../../rawdata/Smallbusiness/smallbusiness_controversial.csv


100%|██████████| 1000/1000 [00:08<00:00, 115.33it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 1000/1000 [05:42<00:00,  2.92it/s]
  2%|▏         | 16/992 [00:00<00:07, 137.30it/s]

completed in 353.2127161026001
28 out of 50
../../rawdata/Smallbusiness/smallbusiness_hot.csv


100%|██████████| 992/992 [00:06<00:00, 146.39it/s]
100%|██████████| 992/992 [05:20<00:00,  3.10it/s]
  1%|▏         | 14/985 [00:00<00:07, 137.24it/s]

completed in 328.5312428474426
29 out of 50
../../rawdata/Smallbusiness/smallbusiness_new.csv


100%|██████████| 985/985 [00:07<00:00, 137.19it/s]
100%|██████████| 985/985 [05:27<00:00,  3.01it/s]
  0%|          | 0/999 [00:00<?, ?it/s]

completed in 335.81929111480713
30 out of 50
../../rawdata/Smallbusiness/smallbusiness_top.csv


100%|██████████| 999/999 [00:09<00:00, 102.03it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 999/999 [09:40<00:00,  1.72it/s]
  2%|▏         | 14/622 [00:00<00:04, 139.71it/s]

completed in 592.1795530319214
31 out of 50
../../rawdata/Growmybusiness/growmybusiness_hot.csv


100%|██████████| 622/622 [00:04<00:00, 148.63it/s]
100%|██████████| 622/622 [03:36<00:00,  2.87it/s]
  1%|▏         | 12/956 [00:00<00:08, 115.70it/s]

completed in 221.99511194229126
32 out of 50
../../rawdata/Growmybusiness/growmybusiness_new.csv


100%|██████████| 956/956 [00:06<00:00, 147.12it/s]
  np.exp(prob, prob)
100%|██████████| 956/956 [05:27<00:00,  2.92it/s]
  0%|          | 0/999 [00:00<?, ?it/s]

completed in 335.76973009109497
33 out of 50
../../rawdata/Growmybusiness/growmybusiness_top.csv


100%|██████████| 999/999 [00:08<00:00, 122.25it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 999/999 [59:47<00:00,  3.59s/it]
100%|██████████| 16/16 [00:00<00:00, 121.58it/s]
  0%|          | 0/16 [00:00<?, ?it/s]

completed in 3597.3223989009857
34 out of 50
../../rawdata/Growmybusiness/growmybusiness_rising.csv


100%|██████████| 16/16 [00:04<00:00,  3.73it/s]
  0%|          | 0/944 [00:00<?, ?it/s]

completed in 4.791272878646851
35 out of 50
../../rawdata/Growmybusiness/growmybusiness_controversial.csv


100%|██████████| 944/944 [00:06<00:00, 135.57it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 944/944 [05:44<00:00,  2.74it/s]
100%|██████████| 7/7 [00:00<00:00, 149.74it/s]
 14%|█▍        | 1/7 [00:00<00:00,  8.34it/s]

completed in 353.63845014572144
36 out of 50
../../rawdata/Startup_ideas/startup_ideas_rising.csv


100%|██████████| 7/7 [00:01<00:00,  5.81it/s]
  3%|▎         | 14/529 [00:00<00:03, 136.31it/s]

completed in 1.6099369525909424
37 out of 50
../../rawdata/Startup_ideas/startup_ideas_hot.csv


100%|██████████| 529/529 [00:03<00:00, 134.19it/s]
100%|██████████| 529/529 [02:52<00:00,  3.07it/s]
  1%|▏         | 13/940 [00:00<00:07, 124.18it/s]

completed in 177.20469307899475
38 out of 50
../../rawdata/Startup_ideas/startup_ideas_controversial.csv


100%|██████████| 940/940 [00:06<00:00, 134.45it/s]
100%|██████████| 940/940 [05:06<00:00,  3.06it/s]
  1%|▏         | 14/999 [00:00<00:07, 137.92it/s]

completed in 315.551216840744
39 out of 50
../../rawdata/Startup_ideas/startup_ideas_top.csv


100%|██████████| 999/999 [00:06<00:00, 146.47it/s]
100%|██████████| 999/999 [05:11<00:00,  3.21it/s]
  1%|▏         | 14/995 [00:00<00:07, 136.49it/s]

completed in 319.9115068912506
40 out of 50
../../rawdata/Startup_ideas/startup_ideas_new.csv


100%|██████████| 995/995 [00:06<00:00, 153.01it/s]
100%|██████████| 995/995 [05:08<00:00,  3.23it/s]
  2%|▏         | 18/813 [00:00<00:04, 175.42it/s]

completed in 316.3389849662781
41 out of 50
../../rawdata/Ladybusiness/ladybusiness_new.csv


100%|██████████| 813/813 [00:04<00:00, 178.97it/s]
100%|██████████| 813/813 [18:41<00:00,  1.38s/it]   
  1%|▏         | 13/916 [00:00<00:06, 129.96it/s]

completed in 1127.6013178825378
42 out of 50
../../rawdata/Ladybusiness/ladybusiness_top.csv


100%|██████████| 916/916 [00:05<00:00, 158.15it/s]
100%|██████████| 916/916 [03:06<00:00,  4.92it/s]
100%|██████████| 23/23 [00:00<00:00, 134.28it/s]
  0%|          | 0/23 [00:00<?, ?it/s]

completed in 192.9261350631714
43 out of 50
../../rawdata/Ladybusiness/ladybusiness_rising.csv


100%|██████████| 23/23 [00:06<00:00,  3.36it/s]
  2%|▏         | 13/688 [00:00<00:05, 124.23it/s]

completed in 7.407363653182983
44 out of 50
../../rawdata/Ladybusiness/ladybusiness_controversial.csv


100%|██████████| 688/688 [00:03<00:00, 175.20it/s]
100%|██████████| 688/688 [02:21<00:00,  4.87it/s]
  3%|▎         | 17/673 [00:00<00:03, 164.07it/s]

completed in 146.5443480014801
45 out of 50
../../rawdata/Ladybusiness/ladybusiness_hot.csv


100%|██████████| 673/673 [00:04<00:00, 166.89it/s]
100%|██████████| 673/673 [02:16<00:00,  4.92it/s]


completed in 141.85762214660645
46 out of 50
../../rawdata/entrepreneur/entrepreneur_top.csv


100%|██████████| 998/998 [00:19<00:00, 50.80it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)


  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 998/998 [26:50<00:00,  1.61s/it]
  0%|          | 0/996 [00:00<?, ?it/s]

completed in 1634.8995230197906
47 out of 50
../../rawdata/entrepreneur/entrepreneur_controversial.csv


100%|██████████| 996/996 [00:11<00:00, 84.57it/s] 
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 996/996 [11:12<00:00,  1.48it/s]
  2%|▏         | 14/586 [00:00<00:04, 139.74it/s]

completed in 686.3056910037994
48 out of 50
../../rawdata/entrepreneur/entrepreneur_new.csv


100%|██████████| 586/586 [00:04<00:00, 119.21it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 586/586 [25:38<00:00,  2.62s/it]
100%|██████████| 18/18 [00:00<00:00, 109.48it/s]
  0%|          | 0/18 [00:00<?, ?it/s]

completed in 1544.6287701129913
49 out of 50
../../rawdata/entrepreneur/entrepreneur_rising.csv


100%|██████████| 18/18 [00:07<00:00,  2.28it/s]
  2%|▏         | 10/659 [00:00<00:06, 93.84it/s]

completed in 8.475209951400757
50 out of 50
../../rawdata/entrepreneur/entrepreneur_hot.csv


100%|██████████| 659/659 [00:06<00:00, 105.30it/s]
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
  np.exp(prob, prob)
100%|██████████| 659/659 [05:15<00:00,  2.09it/s]


completed in 323.9657289981842
