### notebook purpose

- input csv created via mytomatoes.com pomodoro method
- create list of verbs for wordcloud

In [1]:
import os, sys
import pandas as pd
from nltk.stem.wordnet import WordNetLemmatizer as WNL

In [2]:
# Load the pomodoro log. Column names are supplied explicitly via `names`,
# so pandas treats every row of the file (including the first) as data.
df = pd.read_csv(
    'csv/mytomatoes.csv',
    sep=',',
    names=['start', 'end', 'did'],
)
# df

In [3]:
def get_conjug_verb_list(did):
    ''' given a list of did (activities),
        extract the leading verb of each and reduce it to its base form
        note: assumes verb is first word in did column

        did: list of activity strings, e.g. 'installed numpy'
        returns: list of the same length as did, holding the
                 lemmatized first word of each activity '''

    # build the lemmatizer once instead of once per activity
    lemmatizer = WNL()

    # only the text before the first space is needed, so stop splitting there
    verbs = [s.split(' ', 1)[0] for s in did]

    # 'v' tells the lemmatizer to treat each word as a verb
    verbs_conjug = [lemmatizer.lemmatize(s, 'v') for s in verbs]

    subs = { # substitutes to manually correct nltk error
            'instal': 'install',
            'robustified': 'robustify'
    }
    verbs_conjug = [subs.get(i, i) for i in verbs_conjug]

    # sanity check: exactly one verb per activity
    assert len(did) == len(verbs_conjug)

    return verbs_conjug

def conjug_did_list(did, verbs_conjug):
    ''' rebuild each activity in did with its first word replaced
        by the verb at the same position in verbs_conjug

        did: list of activity strings
        verbs_conjug: list of replacement verbs, indexed like did
        returns: new list of activity strings; did is not modified '''

    def _swap_first_word(position, activity):
        # split on single spaces so the original spacing survives the re-join
        _, *remainder = activity.split(' ')
        return ' '.join([verbs_conjug[position], *remainder])

    return [_swap_first_word(pos, act) for pos, act in enumerate(did)]

In [4]:
# activity descriptions as a plain python list
did = df['did'].tolist()

# leading verb of every activity, reduced to its base form
verbs_conjug = get_conjug_verb_list(did)

# optional: full activity text with the conjugated verb swapped in
# did_conjug = conjug_did_list(did, verbs_conjug)

# one verb per line, no trailing newline
with open('verbs.txt', 'w', encoding='utf-8') as f:
    f.write('\n'.join(verbs_conjug))