In [None]:
# Import regression data set
# using statsmodels, run a regression looking at the impact of treatment on returns

In [4]:
# Combine and Clean CRSP Data
from datetime import datetime
import funcy
import numpy as np
import pandas as pd
import os

from analysis.utilities.dropbox_client import DropboxAPI

# Dropbox-side folder names (the analysis-data one is passed to the download call below).
DROPBOX_ANALYSIS_DATA = '/intermediate_data'
DROPBOX_CRSP = '/data/CRSP'

# Local data folder, anchored at the absolute path of the current working directory.
_WORKING_DIR = os.path.abspath(os.curdir)
DATA = os.path.join(_WORKING_DIR, 'analysis/Data')

# File-name stems; neither is referenced again in the cells visible here.
CRSP_FLAG_FNAME = 'crsp_event_flags'
TT_FNAME = 'treating_treated_ticker'

In [5]:
# Column-name templates. The '{}' placeholder takes a ticker prefix, matching
# the column labels shown further down (e.g. 'ABBV_TREATED_SAMEMKT_SAMETECH').
TREATED_SM_ST = '{}_TREATED_SAMEMKT_SAMETECH'
TREATED_DM_ST = '{}_TREATED_DIFFMKT_SAMETECH'
TREATED_SM_DT = '{}_TREATED_SAMEMKT_DIFFTECH'
OWN_FAILS_FMT = '{}_DISC'

# Templates for the flag columns that FLAG_RECIPES is keyed on.
NO_TREATED_CE_FMT = '{}_OTHER_TREATED'
NO_OWN_NO_TREATED_CE_FMT = '{}_NO_OWN_NO_OTHER_TREATED'
OWN_FAILS_CE_FMT = '{}_NO_OWN'

# (plus, minus) pairs; each pair selects one regression data file below.
PLUS_MINUS_PERIODS = [(3, 3), (3, 5), (5, 5)]

# The three TREATED_* templates shared by two of the recipes.
_TREATED_TEMPLATES = [TREATED_SM_ST, TREATED_DM_ST, TREATED_SM_DT]

# Maps each keyed template to the list of templates associated with it.
# How the listed columns are combined is not shown in this notebook.
FLAG_RECIPES = {
    NO_TREATED_CE_FMT: list(_TREATED_TEMPLATES),
    NO_OWN_NO_TREATED_CE_FMT: _TREATED_TEMPLATES + [OWN_FAILS_FMT],
    OWN_FAILS_CE_FMT: [OWN_FAILS_FMT],
}

In [12]:
# Column suffixes that also appear in the frame's labels (*_PRC, *_VOL, *_RET).
PIVOTS = ['PRC', 'VOL', 'RET']

# The two treatment roles, individually and as a list.
TREATING = 'TREATING'
TREATED = 'TREATED'
TTYPES = [TREATING, TREATED]

# Date column names for each role (by their names; not used in the visible cells).
TREATING_DT = 'TREATING_DISCONTINUED_IKT_DATE'
TREATED_DT = 'DISCONTINUED_IKT_DATE'

# Market/technology flag suffixes.
FLAGS = ['SAMEMKT_SAMETECH', 'SAMEMKT_DIFFTECH', 'DIFFMKT_SAMETECH']

# File-name stem and the per-window file-name template; the template's two
# slots are filled with (plus, minus) by the loading cell.
CRSP_LONG_FNAME = 'PRC_RET_VOL_long'
REG_DATA_FMT = 'crsp_event_plus_{0}_minus_{1}'

# Switches: SEARCH_ONLINE is forwarded to the download call; UPLOAD_DATA is
# not read in the visible cells.
SEARCH_ONLINE = False
UPLOAD_DATA = True

In [13]:
# Client object used by the loading cell below to fetch the regression data
# files (DropboxAPI is imported from analysis.utilities.dropbox_client).
# NOTE(review): how the client authenticates is not visible here - confirm
# that no credentials are embedded in the notebook.
drop = DropboxAPI()

In [18]:
# Load one regression data set per (plus, minus) pair in PLUS_MINUS_PERIODS.
# Keys are '<plus>__<minus>' with a DOUBLE underscore (e.g. '3__3'): the cells
# further down index reg_data_dict['3__3'], so a single-underscore key would
# raise KeyError on a fresh Restart & Run All.
reg_data_dict = {}
for plus, minus in PLUS_MINUS_PERIODS:
    window_key = '{0}__{1}'.format(plus, minus)
    # With SEARCH_ONLINE False the recorded output shows the file being looked
    # up under the local DATA path; ',' is presumably the CSV delimiter.
    reg_data_dict[window_key] = drop.search_and_download(
        REG_DATA_FMT.format(plus, minus), DROPBOX_ANALYSIS_DATA, DATA, ',', SEARCH_ONLINE)


Searching local path
Full path /Users/lrraymond13/MIT/Kreiger_RA_2016/mkt_reaction_drug_failure/analysis/Data/crsp_event_plus_3_minus_3.csv
Searching local path
Full path /Users/lrraymond13/MIT/Kreiger_RA_2016/mkt_reaction_drug_failure/analysis/Data/crsp_event_plus_3_minus_5.csv
Searching local path
Full path /Users/lrraymond13/MIT/Kreiger_RA_2016/mkt_reaction_drug_failure/analysis/Data/crsp_event_plus_5_minus_5.csv


In [None]:
# code that looks at x day return after a treated event
# code to calculate total return over x days
# then look at the dataset of all 'clean events' - subset the data set to those matching the criteria

In [15]:
# setup basic OLS regression
# TODO: define the dependent variable `y`. The assignment was left empty
# (`y = `), which is a SyntaxError and stops the notebook on Run All.
# Until the regression is specified, list the keys of the loaded data sets,
# which is what the recorded output of this cell shows.
list(reg_data_dict.keys())

['3__3', '5__5', '3__5']

In [None]:
# for each of the events

In [23]:
# Show the first 20 column labels of the frame stored under key '3__3'.
columns_3_3 = reg_data_dict['3__3'].columns
columns_3_3[:20]

Index([u'Unnamed: 0', u'ABBV_DISC', u'ABBV_PRC', u'ABBV_RET',
       u'ABBV_TREATED_DIFFMKT_SAMETECH', u'ABBV_TREATED_SAMEMKT_DIFFTECH',
       u'ABBV_TREATED_SAMEMKT_SAMETECH', u'ABBV_TREATING_DIFFMKT_SAMETECH',
       u'ABBV_TREATING_SAMEMKT_DIFFTECH', u'ABBV_TREATING_SAMEMKT_SAMETECH',
       u'ABBV_VOL', u'ABEO_DISC', u'ABEO_PRC', u'ABEO_RET',
       u'ABEO_TREATED_DIFFMKT_SAMETECH', u'ABEO_TREATED_SAMEMKT_DIFFTECH',
       u'ABEO_TREATED_SAMEMKT_SAMETECH', u'ABEO_VOL', u'ABIO_DISC',
       u'ABIO_PRC'],
      dtype='object')

In [19]:
# Preview only the first rows of the '3__3' frame; displaying the whole
# (very wide, daily) frame bloats the saved notebook and hides the narrative.
reg_data_dict['3__3'].head(10)

Unnamed: 0.1,Unnamed: 0,ABBV_DISC,ABBV_PRC,ABBV_RET,ABBV_TREATED_DIFFMKT_SAMETECH,ABBV_TREATED_SAMEMKT_DIFFTECH,ABBV_TREATED_SAMEMKT_SAMETECH,ABBV_TREATING_DIFFMKT_SAMETECH,ABBV_TREATING_SAMEMKT_DIFFTECH,ABBV_TREATING_SAMEMKT_SAMETECH,...,ZFGN_OTHER_TREATED,ZGNX_NO_OWN,ZGNX_NO_OWN_NO_OTHER_TREATED,ZGNX_OTHER_TREATED,ZIOP_NO_OWN,ZIOP_NO_OWN_NO_OTHER_TREATED,ZIOP_OTHER_TREATED,ZSAN_NO_OWN,ZSAN_NO_OWN_NO_OTHER_TREATED,ZSAN_OTHER_TREATED
0,1990-01-02,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,1990-01-03,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,1990-01-04,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
3,1990-01-05,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
4,1990-01-08,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5,1990-01-09,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
6,1990-01-10,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,1990-01-11,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
8,1990-01-12,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,1990-01-15,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
