##### Imports/Settings

In [1]:
# General imports
import pandas as pd
import numpy as np
import csv
import os

# Pandas display settings
pd.set_option("display.max_colwidth",150)
pd.set_option('display.max_columns', None)

# Graph imports
import seaborn as sns
import matplotlib.pyplot as plt

# Graph settings
sns.set(context = "notebook", style = "white", font="verdana") # font_scale = 1.35)

# Function imports
from function_scripts.temp_funcs import read_file, merge_dataframes, \
                                        drop_cols, drop_nans, \
                                        filter_date_range, filter_df, create_cond_df, \
                                        create_container_df, create_user_tube_id, create_user_ivscc

##### Graph details

In [2]:
sub_region_order = ["MB", "PAL", "STRd", "STRv", "TH"]
sub_layer_order = ["SNc", "SNr", "Gpe", "Gpi", "CP", "ACB", "MD", "VAL"]

##### Paths

In [3]:
# IVSCC Data Blitz directory
path_ivscc = "C:/Users/ramr/Documents/Github/analysis_projects/ivscc_data_blitz"

# Ephys features csv
path_ephys = os.path.join(path_ivscc, "ephys_features.csv")

# Main JEM directory
path_main_jem = "//allen/programs/celltypes/workgroups/279/Patch-Seq/compiled-jem-data"

# JEM csv files
path_jem = os.path.join(path_main_jem, "jem_metadata.csv")
path_jem_na = os.path.join(path_main_jem, "jem_metadata_tubeNA.csv")
path_jem_fail = os.path.join(path_main_jem, "jem_metadata_wFAILURE.csv")

# Shiny directory
path_shiny_mouse = "//allen/programs/celltypes/workgroups/rnaseqanalysis/shiny/patch_seq/star/mouse_patchseq_VISp_current/mapping.df.with.bp.40.lastmap.csv"

In [4]:
fields_jem = ["date", "name", "organism_name", "status", "roi_major", "roi_minor", "rigOperator", "container"]
fields_shiny = ["sample_id", "cell_name", "percent_cdna_longer_than_400bp", "rna_amplification_pass_fail",
                "amplified_quantity_ng", "Genes.With.CPM", "marker_sum_norm_label", "Norm_Marker_Sum.0.4_label"]

In [5]:
jem = read_file(path_jem, fields_jem)
shiny_mouse = read_file(path_shiny_mouse, fields_shiny)

jem = create_user_tube_id(jem, "rigOperator")
jem = create_user_ivscc(jem, "rigOperator")

drop_nans_list = ["date", "roi_major", "user_tube_id"]
jem = drop_nans(jem, drop_nans_list)

jem = filter_df(jem, "organism_name", "Mouse")
jem = create_cond_df(jem, "roi_major", sub_region_order)

INFO:function_scripts.temp_funcs:Read file in as a pandas dataframe
INFO:function_scripts.temp_funcs:Read file in as a pandas dataframe
INFO:function_scripts.temp_funcs:Created a user_tube_id column to show(ex.'PA')
INFO:function_scripts.temp_funcs:Created a user_ivscc column to show(ex.'Ram')
INFO:function_scripts.temp_funcs:Dropped NaNs from these columns: ['date', 'roi_major', 'user_tube_id']
INFO:function_scripts.temp_funcs:Filtered dataframe based on organism_name == Mouse
INFO:function_scripts.temp_funcs:Created a conditional dataframe based on roi_major containing ['MB', 'PAL', 'STRd', 'STRv', 'TH']


In [6]:
jem.user_tube_id.unique()

array(['P8', 'PA', 'PJ', 'PE'], dtype=object)

In [12]:
jem = drop_cols(jem, ["container", "status", "organism_name", "rigOperator"])

INFO:function_scripts.temp_funcs:Dropped columns: ['container', 'status', 'organism_name', 'rigOperator']


KeyError: "['container' 'status' 'organism_name'] not found in axis"

In [13]:
jem

Unnamed: 0,name,date,rigOperator,roi_major,roi_minor,user_tube_id,user_ivscc
12350,Vip-IRES-Cre;Ai14-542026.11.09.02,2020-09-02 11:00:04 -0700,lindsayn,PAL,Gpi,P8,Lindsay
12351,Vip-IRES-Cre;Ai14-542026.11.09.01,2020-09-02 11:00:04 -0700,lindsayn,PAL,Gpi,P8,Lindsay
12410,Slc17a8-iCre;Ai14-544246.10.09.01,2020-09-15 15:10:07 -0700,ramr,PAL,Gpi,PA,Ram
12490,Sncg-IRES2-FlpO-neo;Ai65F-546568.07.06.01,2020-10-02 14:09:18 -0700,sarav,PAL,Gpi,PJ,Sara
12491,Sncg-IRES2-FlpO-neo;Ai65F-546568.07.06.02,2020-10-02 14:09:18 -0700,sarav,PAL,Gpi,PJ,Sara
...,...,...,...,...,...,...,...
13008,Slc17a7-IRES2-Cre;Ai14-565032.08.09.01,2021-02-09 10:51:55 -0800,ramr,TH,MD,PA,Ram
13013,Vip-IRES-Cre;Ai14-564742.04.10.02,2021-02-10 14:16:31 -0800,ramr,STRv,ACB,PA,Ram
13014,Vip-IRES-Cre;Ai14-564742.04.10.01,2021-02-10 14:16:31 -0800,ramr,STRv,ACB,PA,Ram
13015,Vip-IRES-Cre;Ai14-564742.04.10.03,2021-02-10 14:16:31 -0800,ramr,STRv,ACB,PA,Ram
