In [1]:
import os
import pandas as pd
import gene_cocktail_analyser as gca

In [2]:
# Input locations. Edit the two directories and the file-name tables below
# to point the notebook at your own filter and cocktail files.
filters_path = "input_data/filters/"
cocktail_path = "input_data/cocktails/"

# Filter-set key -> CSV file name inside filters_path.
filters = {"aav-lung-mef": "filters-AAV-LUNG-MEF.csv",
           "no-wt-n-d-pool": "filters_NO-WT-N-D-POOL.csv"}

# Turn the bare file names into paths. os.path.join is used instead of "+"
# so the result is still a valid path if a directory above is written
# without its trailing separator.
filters = {name: os.path.join(filters_path, file_name)
           for name, file_name in filters.items()}

# Cocktail key -> CSV file name inside cocktail_path.
# NOTE(review): "n07" is spelled with a zero while its sibling "no2" uses the
# letter "o". cocktail_to_filter uses the same spelling, so the lookup works;
# if this is a typo, rename the key in both dictionaries together.
cocktails = {
    "aav": "AAVCocktail-01_Unique_Seq.csv",
    "d2": "D2_Unique_Seq.csv",
    "d7": "D7_Unique_Seq.csv",
    "lung1": "LUNG1_Unique_Seq.csv",
    "lung2": "LUNG2_Unique_Seq.csv",
    "lung3": "LUNG3_Unique_Seq.csv",
    "lung4": "LUNG4_Unique_Seq.csv",
    "lungc": "LUNGC_Unique_Seq.csv",
    "mef2": "MEF2_Unique_Seq.csv",
    "mef3": "MEF3_Unique_Seq.csv",
    "n1_2": "N1-2_Unique_Seq.csv",
    "n1_7": "N1-7_Unique_Seq.csv",
    "n2_2": "N2-2_Unique_Seq.csv",
    "n2_7": "N2-7_Unique_Seq.csv",
    "no2": "NO2_Unique_Seq.csv",
    "n07": "NO7_Unique_Seq.csv",
    "pool": "POOL_Unique_Seq.csv",
    "wt2": "WT2_Unique_Seq.csv",
    "wt7": "WT7_Unique_Seq.csv"
}

# Same treatment as for the filters: file name -> path under cocktail_path.
cocktails = {name: os.path.join(cocktail_path, file_name)
             for name, file_name in cocktails.items()}
    
# Assign each cocktail key to the key of the filter set it is analysed with.
# The two filter-set names are spelled out once and reused in the table so
# that every entry refers to exactly the same string.
AAV_LUNG_MEF = "aav-lung-mef"
NO_WT_N_D_POOL = "no-wt-n-d-pool"

# NOTE(review): "n07" (with a zero) matches the spelling used in the
# cocktails dictionary; keep the two in sync if it is ever renamed.
cocktail_to_filter = {
    "aav": AAV_LUNG_MEF,
    "d2": NO_WT_N_D_POOL,
    "d7": NO_WT_N_D_POOL,
    "lung1": AAV_LUNG_MEF,
    "lung2": AAV_LUNG_MEF,
    "lung3": AAV_LUNG_MEF,
    "lung4": AAV_LUNG_MEF,
    "lungc": AAV_LUNG_MEF,
    "mef2": AAV_LUNG_MEF,
    "mef3": AAV_LUNG_MEF,
    "n1_2": NO_WT_N_D_POOL,
    "n1_7": NO_WT_N_D_POOL,
    "n2_2": NO_WT_N_D_POOL,
    "n2_7": NO_WT_N_D_POOL,
    "no2": NO_WT_N_D_POOL,
    "n07": NO_WT_N_D_POOL,
    "pool": NO_WT_N_D_POOL,
    "wt2": NO_WT_N_D_POOL,
    "wt7": NO_WT_N_D_POOL,
}



In [None]:
%%time

# Analyse every cocktail in one pass: each cocktail file is paired with the
# filter file assigned to it in cocktail_to_filter, then processed, displayed
# and plotted. All datasets are handled in this single cell, so it may take
# a while to finish.
for cocktail_key, filter_key in cocktail_to_filter.items():
    cocktail_file = cocktails[cocktail_key]
    filter_file = filters[filter_key]

    cocktail_data = gca.GeneCocktailAnalyser(cocktail_file, filter_file)
    cocktail_data.process_data()
    cocktail_data.display_results()
    cocktail_data.plot_visualisations()

In [None]:
%%time
# Run the analyser on the files under tests/test_data: process the data and
# display the results (no plots are requested here).
test_dataset, test_filters = (
    "tests/test_data/test_sequence_data.csv",
    "tests/test_data/test_filters.csv",
)
test_data = gca.GeneCocktailAnalyser(test_dataset, test_filters)
test_data.process_data()
test_data.display_results()