In [None]:
import os
import pandas as pd

# Working Dir.
# Every later path in this notebook ('trim_data/...', 'test_data/...') is
# relative to this directory. The default is the original author's local
# checkout; set the AI_PROJECT_DIR environment variable to run the notebook
# on another machine without editing this cell.
os.chdir(os.environ.get('AI_PROJECT_DIR', '/Users/fogellmcmuffin/Documents/ra/team_discussions/AI/'))

In [None]:
##########################
## Tests using raw data ##
##########################

# Load the three trimmed data sets from disk
merged, no_noise, noise = (
    pd.read_csv('trim_data/merged.csv'),
    pd.read_csv('trim_data/no_noise.csv'),
    pd.read_csv('trim_data/noise.csv'),
)

# Test configuration
test_windows = ['ucoop']        # windows to export; export_test() checks for 'ucoop' and 'udef'
test_treatment = 'no_noise'     # 'no_noise' selects the no-noise layout, any other value the noise layout

# Restrict `merged` to the columns of the data set that matches test_treatment
merged = merged[(no_noise if test_treatment == 'no_noise' else noise).columns.to_list()]

# Creating test dfs
def create_test_dfs(data=None, treatment_name=None):
    """Build the ucoop and udef test frames for one treatment.

    Rows are first restricted to the requested treatment and then split by
    window flag, so each returned frame contains only rows of that treatment.

    Parameters
    ----------
    data : pandas.DataFrame, optional
        Frame with 'treatment', 'window_ucoop' and 'window_udef' columns.
        Defaults to the module-level ``merged`` frame.
    treatment_name : str, optional
        'no_noise' selects rows with treatment == 0; any other value selects
        rows with treatment == 1. Defaults to the module-level
        ``test_treatment``.

    Returns
    -------
    tuple of (pandas.DataFrame, pandas.DataFrame)
        ``(test_ucoop, test_udef)``: rows where 'window_ucoop' == 1 and rows
        where 'window_udef' == 1 respectively, both with the two window flag
        columns removed.
    """
    # Fall back to the notebook-level settings when called without arguments.
    if data is None:
        data = merged
    if treatment_name is None:
        treatment_name = test_treatment

    treatment = 0 if treatment_name == 'no_noise' else 1
    window_cols = ['window_ucoop', 'window_udef']

    # Select the treatment subset once; both windows must be drawn from it
    # (not from the full frame) so the treatment filter actually applies.
    treated = data.loc[data['treatment'] == treatment]

    test_ucoop = treated.loc[treated['window_ucoop'] == 1].drop(columns=window_cols)
    test_udef = treated.loc[treated['window_udef'] == 1].drop(columns=window_cols)
    return test_ucoop, test_udef


# Build the ucoop / udef test frames; create_test_dfs() reads the `merged`
# frame and the `test_treatment` setting defined earlier in this cell.
test_ucoop, test_udef = create_test_dfs()

# Export
def export_test():
    """Write the selected window test frames to CSV under 'test_data/'.

    Reads the module-level ``test_windows``, ``test_treatment``,
    ``test_ucoop`` and ``test_udef``. A frame is written (without its index)
    only when its window name is listed in ``test_windows``.
    """
    candidates = (
        ('ucoop', test_ucoop, f'test_data/{test_treatment}_ucoop.csv'),
        ('udef', test_udef, f'test_data/{test_treatment}_udef.csv'),
    )
    for window, frame, out_path in candidates:
        if window in test_windows:
            frame.to_csv(out_path, index=False)


# Write the CSV files for every window listed in `test_windows`.
export_test()

In [None]:
##############################
## Tests using summary data ##
##############################

# Load the RA summary tables; `version` is interpolated into every file name
# read here and into every file name written by the export step below.
version = '3'
ra_no_noise, ra_noise, ra_merge = (
    pd.read_csv(f'trim_data/RAsum_no_noise_v{version}.csv'),
    pd.read_csv(f'trim_data/RAsum_noise_v{version}.csv'),
    pd.read_csv(f'trim_data/RAsum_merged_v{version}.csv'),
)

# Creating ucoop and udef test dfs
def ucoop_udef_windows(df): # Function to get ucoop & udef test data sets
    """Split a summary frame into its ucoop and udef test sets.

    Commas are stripped from the 'summary' column, then the rows flagged by
    'unilateral_cooperate' == 1 and 'unilateral_defect' == 1 are selected
    separately. The input frame is left unmodified.

    Parameters
    ----------
    df : pandas.DataFrame
        Must contain the columns 'summary', 'unilateral_cooperate',
        'unilateral_defect' and 'Unnamed: 0'.

    Returns
    -------
    tuple of (pandas.DataFrame, pandas.DataFrame)
        ``(df_ucoop, df_udef)``, each without the two flag columns and
        without 'Unnamed: 0'.
    """
    dropped_cols = ['unilateral_cooperate', 'unilateral_defect', 'Unnamed: 0']

    # assign() returns a new frame, so the caller's 'summary' column keeps
    # its original text instead of being overwritten as a side effect.
    cleaned = df.assign(summary=df['summary'].str.replace(',', '', regex=False))

    df_ucoop = cleaned.loc[cleaned['unilateral_cooperate'] == 1].drop(columns=dropped_cols)
    df_udef = cleaned.loc[cleaned['unilateral_defect'] == 1].drop(columns=dropped_cols)

    return df_ucoop, df_udef

# Creating merged noise and no-noise test dfs
def merged_test_df(df):
    """Return a cleaned copy of a summary frame with both windows kept together.

    Commas are stripped from the 'summary' column and the 'Unnamed: 0'
    column is removed. The input frame is left unmodified.

    Parameters
    ----------
    df : pandas.DataFrame
        Must contain the columns 'summary' and 'Unnamed: 0'.

    Returns
    -------
    pandas.DataFrame
        New frame with the cleaned 'summary' column and no 'Unnamed: 0'.
    """
    # assign() builds a new frame, so the caller's data is not overwritten.
    cleaned = df.assign(summary=df['summary'].str.replace(',', '', regex=False))

    return cleaned.drop(columns=['Unnamed: 0'])


# Per-window (ucoop / udef) test sets for each summary table
ra_no_noise_ucoop, ra_no_noise_udef = ucoop_udef_windows(ra_no_noise)
ra_noise_ucoop, ra_noise_udef = ucoop_udef_windows(ra_noise)
ra_merge_ucoop, ra_merge_udef = ucoop_udef_windows(ra_merge)

# Unsplit test sets; note these are built from ra_noise / ra_no_noise,
# not from ra_merge.
ra_merge_noise = merged_test_df(ra_noise)
ra_merge_no_noise = merged_test_df(ra_no_noise)

# Export: each frame is written without its index to the path next to it
_summary_exports = [
    (ra_no_noise_ucoop, f'test_data/RAsum_no_noise_v{version}_ucoop.csv'),
    (ra_no_noise_udef, f'test_data/RAsum_no_noise_v{version}_udef.csv'),
    (ra_noise_ucoop, f'test_data/RAsum_noise_v{version}_ucoop.csv'),
    (ra_noise_udef, f'test_data/RAsum_noise_v{version}_udef.csv'),
    (ra_merge_ucoop, f'test_data/RAsum_merged_v{version}_ucoop.csv'),
    (ra_merge_udef, f'test_data/RAsum_merged_v{version}_udef.csv'),
    (ra_merge_noise, f'test_data/RAsum_merged_v{version}_noise.csv'),
    (ra_merge_no_noise, f'test_data/RAsum_merged_v{version}_no_noise.csv'),
]
for _frame, _out_path in _summary_exports:
    _frame.to_csv(_out_path, index=False)