##### Imports

In [1]:
import pandas as pd
import csv
import logging

import seaborn as sns

##### Logging Set-up

In [2]:
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

##### Miscellaneous Settings

In [3]:
sns.set(context = "notebook", style = "ticks", font="verdana", font_scale = 1.35)
pd.set_option("display.max_colwidth",150) #Expands the number of characters shown in the columns
pd.set_option('display.max_columns', None)

##### Logging Comments about this project

In [4]:
logger.info("""Purpose: Personal Tracker for 2020
            
            Checklist:
            1) Counts of RSPd, RSPv, SSp for coronal
            2) Track ORB, CLA, MO for sagittal
            3) Obtains ephys features for all the mouse regions
            4) Plot similarities/differences""")

INFO:__main__:Purpose: Personal Tracker for 2020
            
            Checklist:
            1) Counts of RSPd, RSPv, SSp for coronal
            2) Track ORB, CLA, MO for sagittal
            3) Obtains ephys features for all the mouse regions
            4) Plot similarities/differences


##### Load in JEM form automatically from file path

In [5]:
def read_jem_csv(fields=None):
    """
    Finds and read jem metadata csv.
    
    Args: 
        directory_name: file directory path of jem matadata file
        jem_file: jem metadata file name

    Returns:
        jem: a pandas dataframe with jem metadata
    """
    global jem  # Define as global to return outside of function
    
    csv_path = "Z:/Patch-Seq/compiled-jem-data/"
    csv_file = "jem_metadata.csv"
    jem = pd.read_csv(csv_path + csv_file, usecols=fields, index_col=["date"])
    logger.info("Read jem metadata csv (date: 2/07/2020)")

In [25]:
def read_shiny_csv(fields=None):
    """
    Finds and read jem metadata csv.
    
    Args: 
        directory_name: file directory path of jem matadata file
        jem_file: jem metadata file name

    Returns:
        jem: a pandas dataframe with jem metadata
    """
    global shiny  # Define as global to return outside of function
    
    csv_path = "//allen/programs/celltypes/workgroups/rnaseqanalysis/shiny/patch_seq/star/mouse_patchseq_VISp_current/mapping.df.with.bp.40.lastmap.csv"
    shiny = pd.read_csv(csv_path, usecols=fields)
    logger.info("Read jem metadata csv (date: 2/07/2020)")

In [26]:
read_shiny_csv()

INFO:__main__:Read jem metadata csv (date: 2/07/2020)


In [22]:
shiny

Unnamed: 0.1,Unnamed: 0,sample_id,cluster_detail,cluster_label,score,n_marker,res_index,h_score,marker_genes,res_index_pctile,exp_component_name,ar_id,exp_component_vendor_name,batch,batch_vendor_name,tube,tube_internal_name,tube_contents_nm,tube_contents_nm_from_vendor,tube_avg_size_bp,tube_input_fmol,r1_index,r2_index,index_sequence_pair,organism,facs_container,sample_name,patched_cell_container,cell_name,cell_id,sample_quantity_count,sample_quantity_pg,external_donor_name,gender,control,cell_prep_type,full_genotype,facs_population_plan,cre_line,reporter,injection_roi,injection_method,injection_materials,propagation_type,roi,patchseq_roi,medical_conditions,slice_min_pos,slice_max_pos,rna_amplification_set,rna_amplification,amp_date,pcr_cycles,percent_cdna_longer_than_400bp,rna_amplification_pass_fail,amplified_quantity_ng,library_prep_set,library_prep,lib_date,library_input_ng,avg_size_bp,quantification2_ng,quantification_fmol,quantification2_nm,library_prep_pass_fail,exp_cluster_density_thousands_per_mm2,lane_read_count,alignment_date,vendor_read_count,total_reads,percent_reads_aligned_to_exons,percent_reads_aligned_to_rrna,percent_reads_aligned_to_trna,percent_reads_aligned_to_rrna_rmsk,percent_reads_aligned_to_trna_rmsk,percent_reads_aligned_to_ncrna,percent_reads_aligned_to_mt_exons,percent_reads_aligned_to_introns,percent_reads_aligned_to_intergenic,percent_reads_aligned_unique,percent_reads_aligned_to_ecoli,percent_reads_aligned_to_synthetic_constructs,percent_reads_aligned_total,complexity_aatt,complexity_acgt,complexity_agct,complexity_at,complexity_catg,complexity_ccgg,complexity_cg,complexity_gatc,complexity_gc,complexity_ta,experiment_component_failed,fpkm_published,fpkm_dir,fpkm_filename,transcriptome_bam_filename,fastq_path_list,S4.Lot,Data,MultiPlex,Genes.With.FPKM,Genes.Detected,FPKM.4,FPKM.8,FPKM.16,FPKM.32,FPKM.64,Genes.With.CPM,Genes.Detected.CPM,CPM.4,CPM.8,CPM.16,CPM.32,CPM.64,Exclude.STAR,Region,Well.Row,Well.Column,Type,tubeID,patch.date,rigOperator,rigNumber,Fill.Date,internalFillDate,pilotName,creCell,autoRoi,manualRoi,cell_depth,sliceHealth,timeWholeCellStart,timeExtractionStart,pressureApplied,timeExtractionEnd,retractionPressureApplied,timeRetractionEnd,postPatch,endPipetteR,Total_time,Ephys_time,Retraction_time,Virus,cell_specimen_project,structure,go_no_go_63x,image_series_63x_qc,Class,last_map,last_score,last_res,cluster_same,topLeaf,topLeafValue,broad_class_label,subclass_label,topLeaf_label,quality_score_label,marker_sum_norm_label,Norm_Marker_Sum.0.4_label,contaminationType_label,seurat_cluster_label,seurat_prediction_score_label,Tree_first_cl,Tree_second_cl,Tree_third_cl,Tree_first_bt,Tree_second_bt,Tree_third_bt,Tree_first_KL,Tree_second_KL,Tree_third_KL,Tree_first_cor,Tree_second_cor,Tree_third_cor,Tree_call,Old_call
0,1,P1S4_170807_003_A01,L2/3 IT VISp Rrad,L2/3 IT VISp Rrad,1.0,8,1.0,1.0,"L2/3 IT VISp Rrad:Baz1a Fosb Fosl2 Csrnp1 Rrad Pim1 Met Nos1,n39:Calb1 Meis2 Pdzrn3 Dscaml1 Cux2 Fam19a1 Gpc6 Nov Rgs8 Npnt Igsf11 Kitl Ccbe1 Pcdh...",100,PS0830_E1-50_S91,687624861,,P3S4-170830,BT038,PS0830,BT170830_01,5.000000,,350.0,5,N729,S505,TCGACGTC-GTAAGGAG,Mouse,,,P1S4_170807_003_A01,Vipr2-IRES2-Cre;Slc32a1-T2A-FlpO;Ai65-338915.05.02.03,606790451,1,,338915,M,,,Vipr2-IRES2-Cre/wt;Slc32a1-T2A-FlpO/wt;Ai65(RCFL-tdT)/wt,,Slc32a1-T2A-FlpO_and_Vipr2,Ai65(RCFL-tdT),,,,,,VISp,,3.0,6.0,A3S4_170810b,A3S4_170810_016,,21x,0.669407,Pass,35.670000,L3S4_170824,L3S4_170824_043,8/24/2017 7:00,0.15,378.0,,42.568543,,Pass,,,25:23.1,,1981074,63.790063,0.088538,0.040584,0.268087,0.014739,2.894995,0.0,31.720522,4.489415,53.815759,0.000725,0.006814,59.538008,1.002786,0.909747,1.199936,0.867220,1.252630,1.106709,0.348370,1.067803,0.935120,0.676909,False,,/allen/programs/celltypes/production/mousecelltypes/prod217/Star_Analysis_Run_687624861/687624861/,ar_687624861_STAR_ReadsPerGene.out.tab,ar_618245608.aligned_transcriptome.sorted.bam,/allen/programs/celltypes/production/mousecelltypes/prod101/rseq_tube_set_P3S4-170830/BT038_P3S4-170830/RAW-DATA/PS0830/PS0830_E1-50_TCGACGTC-GTAA...,1608207A,Pre-Production,index96,5221,4699,3877,3492,3046,2499,1777,7275,5833,5084,4751,4455,4027,3413,YES,VISp,L3S4_170824_043,L3S4_170824_043,patch_seq,,8/7/2017,,,,,,tdt-,,,50.0,3.0,,,-50,,,,Nucleated,,,,,,T301x,VISp2/3,63x go,ready_for_dendrite_trace,noclass,L2/3 IT VISp Rrad,1.00,1.0,True,L2/3 IT VISp Rrad,1.00,Glutamatergic,L2/3 IT,L2/3 IT VISp Rrad,0.303021,0.860635,True,Macrophage,L2/3 IT VISp Rrad,0.963955,L2/3 IT VISp Rrad,L2/3 IT VISp Adamts2,L2/3 IT VISp Agmat,1.00,0.00,0.00,0.077244,2.690474,2.356859,0.699350,0.668879,0.655481,Core,Leaf_node
1,2,P1S4_190214_003_A01,L2/3 IT VISp Rrad,L2/3 IT VISp Rrad,1.0,6,1.0,1.0,"L2/3 IT VISp Rrad:Baz1a Fosb Fosl2 Csrnp1 Tnfaip6 Cpne7,n39:Calb1 Meis2 Pdzrn3 Dscaml1 Lypd1 Cux2 Stxbp6 Fam19a1 Gpc6 Nov Gpr88 Otof Rgs8 Syt17 Ma...",100,SM-GE4RC_S053_E1-50,838985624,SM-GE4RC-S053,R8S4-190307,RSC-199,SM-GE4RC,R8S4-19030708,6.309855,3.71,332.0,8,NEXT-i7-IDT-138,NEXT-i5-IDT-247,GTGCTTAC-AGAGCAGA,Mouse,,,P1S4_190214_003_A01,Glt25d2-Cre_NF107;Ai14-442297.04.01.02,823231829,1,,442297,M,,,Glt25d2-Cre_NF107/wt;Ai14(RCL-tdT)/wt,,Glt25d2-Cre_NF107,Ai14(RCL-tdT),,,,,VISp2-3,VISp2-3,,3.0,5.0,A8S4_190221_08,A8S4_190221_08_E07,,20x,0.635000,Pass,16.223226,L8S4_190228_04,L8S4_190228_04_E07,2/28/2019 8:00,0.05,344.0,33.025570,145.461460,8.081192,Pass,952.0,114458099.0,25:53.9,1376745.0,1341754,61.929367,0.719133,0.312576,4.461772,0.091820,4.916475,0.0,32.571684,5.498949,83.269213,0.005314,0.001099,91.982360,1.001292,0.942622,1.253766,0.812799,1.223535,1.041625,0.379886,1.074233,0.948359,0.692316,False,,/allen/programs/celltypes/production/mousecelltypes/prod362/Star_Analysis_Run_838985624/838985624/,ar_838985624_STAR_ReadsPerGene.out.tab,,/allen/programs/celltypes/production/mousecelltypes/prod359/rseq_tube_set_R8S4-190307/RSC-199_R8S4-190307/RAW-DATA/SM-GE4RC/SM-GE4RC_E1-50_GTGCTTA...,1709695A,Production,index192,8769,7997,6502,5508,4230,2654,1401,10458,9248,8394,7796,7015,5724,3836,No,VISp,E,7,patch_seq,P1S4_190214_003_A01,2/14/2019,kristenh,5,1/25/2019,12/5/2018,,Cre+,"None, None",VISp2/3,119.7,3.0,14:03:04-08:00,14:18:17-08:00,-40,14:18:46-08:00,-40.0,14:20:48-08:00,nucleus_present,1500.0,1064.0,29.0,122.0,,mIVSCC-MET,VISp2/3,63x go,deferred,noclass,L2/3 IT VISp Rrad,1.00,1.0,True,L2/3 IT VISp Rrad,1.00,Glutamatergic,L2/3 IT,L2/3 IT VISp Rrad,0.317663,1.008909,True,Macrophage,L2/3 IT VISp Rrad,0.405910,L2/3 IT VISp Rrad,L2/3 IT VISp Adamts2,L2/3 IT VISp Agmat,1.00,0.00,0.00,0.077244,2.690474,2.356859,0.737537,0.726389,0.723405,Core,Leaf_node
2,3,P1S4_190624_004_A01,L2/3 IT VISp Rrad,L2/3 IT VISp Rrad,1.0,7,1.0,1.0,"L2/3 IT VISp Rrad:Baz1a Fosb Fst Pim1 Tnfaip6 Col23a1 Met,n39:Calb1 Meis2 Pdzrn3 Dscaml1 Lypd1 Cux2 Stxbp6 Fam19a1 Gpc6 Nov Gpr88 Otof Syt17 Mas1 ...",100,SM-GE4XY_S036_E1-50,924012662,SM-GE4XY-S036,R8S4-190731,RSC-218,SM-GE4XY,R8S4-19073108,2.315578,1.48,339.0,6,IDT_10nt_NXT_i7_329,IDT_10nt_NXT_i5_329,GCTACAGGTC-TCCTGCATAA,Mouse,,,P1S4_190624_004_A01,Slc17a7-IRES2-Cre;Ai14-470692.04.01.04,893406540,1,,470692,M,,,Slc17a7-IRES2-Cre/wt;Ai14(RCL-tdT)/wt,,Slc17a7,Ai14(RCL-tdT),,,,,VISp2-3,VISp2-3,,4.0,4.0,A8S4_190717_07,A8S4_190717_07_D05,,20x,0.648000,Pass,21.532627,L8S4_190725_02,L8S4_190725_02_D05,7/25/2019 7:00,0.05,332.0,27.552400,125.741145,6.985619,Pass,944.0,117056997.0,28:17.1,1344716.0,1289667,49.458974,0.224399,0.102740,5.294855,0.048695,4.859161,0.0,43.989879,6.551147,83.289950,0.003743,0.004908,90.762577,1.019504,0.941122,1.258137,0.792132,1.209253,1.045120,0.376151,1.080586,0.946976,0.684672,False,,/allen/programs/celltypes/production/mousecelltypes/prod412/Star_Analysis_Run_924012662/924012662/,ar_924012662_STAR_ReadsPerGene.out.tab,,/allen/programs/celltypes/production/mousecelltypes/prod410/rseq_tube_set_R8S4-190731/RSC-218_R8S4-190731/RAW-DATA/SM-GE4XY/SM-GE4XY_E1-50_GCTACAG...,1709695A,Production,index192,8581,7943,6431,5385,4068,2617,1391,10486,9235,8366,7726,6833,5490,3669,No,VISp,D,5,patch_seq,P1S4_190624_004_A01,2019-06-24T10:08:10-07:00,kristenh,6,5/9/2019,5/6/2019,,Cre+,"None, None",VISp2/3,40.0,3.0,11:28:48-07:00,11:39:52-07:00,-35,11:40:40-07:00,-35.0,11:43:02-07:00,nucleus_present,55.0,854.0,48.0,142.0,,mIVSCC-MET,VISp,63x no go,,noclass,L2/3 IT VISp Rrad,1.00,1.0,True,L2/3 IT VISp Rrad,1.00,Glutamatergic,L2/3 IT,L2/3 IT VISp Rrad,0.307486,0.929440,True,Macrophage,L2/3 IT VISp Rrad,0.564633,L2/3 IT VISp Rrad,L2/3 IT VISp Adamts2,L2/3 IT VISp Agmat,1.00,0.00,0.00,0.077244,2.690474,2.356859,0.763153,0.750406,0.735887,Core,Leaf_node
3,4,P1S4_190628_007_A01,L2/3 IT VISp Rrad,L2/3 IT VISp Rrad,1.0,5,1.0,1.0,"L2/3 IT VISp Rrad:Baz1a Fosb Fosl2 Gpr3 Rrad,n39:Calb1 Meis2 Pdzrn3 Dscaml1 Cux2 Fam19a1 Gpc6 Rgs8 Mas1 Npnt Myh7 Igsf11 Kitl BC048546 6330403A02R...",100,SM-GE4XY_S145_E1-50,924012888,SM-GE4XY-S145,R8S4-190731,RSC-218,SM-GE4XY,R8S4-19073108,2.315578,1.48,339.0,6,IDT_10nt_NXT_i7_391,IDT_10nt_NXT_i5_391,TGTCTTCATC-TAGCGTGAAT,Mouse,,,P1S4_190628_007_A01,Slc17a7-IRES2-Cre;Ai14-470694.04.01.02,896877084,1,,470694,M,,,Slc17a7-IRES2-Cre/wt;Ai14(RCL-tdT)/wt,,Slc17a7,Ai14(RCL-tdT),,,,,VISp2-3,VISp2-3,,3.0,4.0,A8S4_190717_08,A8S4_190717_08_A07,,20x,0.681000,Pass,13.323022,L8S4_190725_03,L8S4_190725_03_A07,7/25/2019 7:00,0.05,362.0,29.331131,122.765491,6.820305,Pass,944.0,117056997.0,06:41.8,1297879.0,1253325,89.340494,0.281651,0.140666,8.569844,0.036383,2.901243,0.0,4.970598,5.688908,76.498753,0.005581,0.012477,89.461233,1.020070,0.921824,1.238218,0.800546,1.207471,1.046916,0.463236,1.104368,0.947359,0.629609,False,,/allen/programs/celltypes/production/mousecelltypes/prod413/Star_Analysis_Run_924012888/924012888/,ar_924012888_STAR_ReadsPerGene.out.tab,,/allen/programs/celltypes/production/mousecelltypes/prod410/rseq_tube_set_R8S4-190731/RSC-218_R8S4-190731/RAW-DATA/SM-GE4XY/SM-GE4XY_E1-50_TGTCTTC...,1709695A,Production,index192,7312,6690,5666,5054,4111,2719,1549,8274,8274,6554,6120,5647,5034,3900,No,VISp,A,7,patch_seq,P1S4_190628_007_A01,2019-06-28T12:44:21-07:00,kristenh,6,5/9/2019,5/6/2019,,Cre+,"None, None",VISp2/3,47.7,3.0,13:24:07-07:00,13:32:03-07:00,-40,13:32:49-07:00,-55.0,13:36:57-07:00,nucleus_absent,2000.0,770.0,46.0,248.0,,mIVSCC-MET,VISp2/3,63x go,deferred,noclass,L2/3 IT VISp Rrad,0.99,1.0,True,L2/3 IT VISp Rrad,1.00,Glutamatergic,L2/3 IT,L2/3 IT VISp Rrad,0.240986,0.863722,True,Macrophage,L2/3 IT VISp Agmat,0.382207,L2/3 IT VISp Rrad,L2/3 IT VISp Adamts2,L2/3 IT VISp Agmat,1.00,0.00,0.00,0.077244,2.690474,2.356859,0.533772,0.521344,0.545990,Core,Leaf_node
4,5,P1S4_190725_002_A01,L2/3 IT VISp Rrad,L2/3 IT VISp Rrad,1.0,9,1.0,1.0,"L2/3 IT VISp Rrad:Baz1a Fosb Fosl2 Csrnp1 Shroom3 Fst Rrad Tnfaip6 Col23a1,n39:Calb1 Meis2 Pdzrn3 Dscaml1 Lypd1 Cux2 Stxbp6 Fam19a1 Gpc6 Nov Gpr88...",100,SM-GE4W8_S073_E1-50,937700850,SM-GE4W8-S073,R8S4-190821,RSC-221,SM-GE4W8,R8S4-19082103,2.667801,1.51,330.0,6,IDT_10nt_NXT_i7_490,IDT_10nt_NXT_i5_490,TTGCGCCAAG-GATAGCCGAG,Mouse,,,P1S4_190725_002_A01,Slc32a1-IRES-Cre;Ai14-476712.04.01.02,912008949,1,,476712,M,,,Slc32a1-IRES-Cre/wt;Ai14(RCL-tdT)/wt,,Slc32a1,Ai14(RCL-tdT),,,,,VISp2-3,VISp2-3,,2.0,5.0,A8S4_190802_10,A8S4_190802_10_A10,,20x,0.633000,Pass,13.609205,L8S4_190809_05,L8S4_190809_05_A10,8/9/2019 7:00,0.05,326.0,19.609070,91.137152,5.063175,Pass,1043.0,142235349.0,05:16.7,1433855.0,1379103,47.061596,0.111087,0.035820,1.858599,0.037923,6.524241,0.0,46.109490,6.828913,84.139836,0.004996,0.001585,89.829621,1.015759,0.947892,1.268953,0.785113,1.215130,1.034363,0.359755,1.069798,0.962513,0.694875,False,,/allen/programs/celltypes/production/mousecelltypes/prod418/Star_Analysis_Run_937700850/937700850/,ar_937700850_STAR_ReadsPerGene.out.tab,,/allen/programs/celltypes/production/mousecelltypes/prod418/rseq_tube_set_R8S4-190821/RSC-221_R8S4-190821/RAW-DATA/SM-GE4W8/SM-GE4W8_E1-50_TTGCGCC...,1709695A,Production,index192,7722,7102,5825,4906,3842,2623,1394,10225,8967,8079,7575,6689,5467,3742,No,VISp,A,10,patch_seq,P1S4_190725_002_A01,2019-07-25T10:39:25-07:00,kristenh,6,6/25/2019,6/24/2019,,Cre-,"None, None",VISp2/3,38.6,3.0,11:08:14-07:00,11:15:38-07:00,-60,11:17:37-07:00,-60.0,11:19:10-07:00,nucleus_present,2500.0,656.0,119.0,93.0,,mIVSCC-MET,VISp2/3,63x no go,,noclass,L2/3 IT VISp Rrad,1.00,1.0,True,L2/3 IT VISp Rrad,1.00,Glutamatergic,L2/3 IT,L2/3 IT VISp Rrad,0.434085,0.984183,True,Macrophage,L2/3 IT VISp Rrad,0.828399,L2/3 IT VISp Rrad,L2/3 IT VISp Adamts2,L2/3 IT VISp Agmat,1.00,0.00,0.00,0.077244,2.690474,2.356859,0.782459,0.770916,0.797846,Core,Leaf_node
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
10336,10337,PXS4_190306_402_A01,n3,n3,1.0,1,0.0,0.0,n3:,4,SM-GE4QN_S130_E1-50,846392401,SM-GE4QN-S130,R8S4-190327,RSC-202,SM-GE4QN,R8S4-19032708,2.857375,1.72,323.0,8,NEXT-i7-IDT-80,NEXT-i5-IDT-305,ATGCACGA-AAGGAGAC,Mouse,,,PXS4_190306_402_A01,Nr5a1-Cre;Ai140;Pvalb-T2A-FlpO;Ai65F-449966.07.06.01.05,834013800,1,,449966,M,,,Pvalb-T2A-FlpO/wt;Ai65F/wt,,Pvalb-T2A-FlpO,Ai65F,,,,,VISp5,VISp5,,0.0,0.0,A8S4_190314_06,A8S4_190314_06_B05,,20x,0.289000,Fail,4.891684,L8S4_190321_03,L8S4_190321_03_B05,3/21/2019 7:00,0.05,301.0,18.188599,91.556422,5.086468,Fail,978.0,98560943.0,51:40.5,1108141.0,1052403,69.218320,1.187093,0.260832,50.869296,0.050646,2.006741,0.0,13.447120,17.334560,29.238704,0.024718,0.020471,67.069554,1.123349,0.980875,1.000200,0.937529,0.909552,1.051221,0.941515,1.086885,0.958512,0.805874,False,,/allen/programs/celltypes/production/mousecelltypes/prod370/Star_Analysis_Run_846392401/846392401/,ar_846392401_STAR_ReadsPerGene.out.tab,,/allen/programs/celltypes/production/mousecelltypes/prod367/rseq_tube_set_R8S4-190327/RSC-202_R8S4-190327/RAW-DATA/SM-GE4QN/SM-GE4QN_E1-50_ATGCACG...,1709695A,Production,index192,1168,1066,804,652,521,420,316,2382,2382,1437,1220,1006,786,606,YES,VISp,B,5,patch_seq,PXS4_190306_402_A01,3/6/2019,lisak,MP2,2/5/2019,2/8/2019,,Cre+,"None, None",VISp5,60.0,3.0,12:55:03-08:00,12:55:07-08:00,-34,12:55:07-08:00,-34.0,12:55:08-08:00,nucleus_present,0.0,5.0,0.0,1.0,,mMPATCH,VISp,,,noclass,n3,1.00,0.0,True,L6 CT VISp Nxph2 Wls,0.38,Glutamatergic,L6 CT,L6 CT VISp Nxph2 Wls,0.213413,0.230697,False,Oligo,ZZ_Missing,0.000000,L6 CT VISp Nxph2 Wls,Lamp5 Ntn1 Npy2r,L6 CT VISp Gpr139,0.38,0.27,0.06,7.896514,9.054855,10.329515,0.410978,0.388367,0.392829,PoorQ,PoorQ
10337,10338,PXS4_190306_403_A01,n3,n3,1.0,1,0.0,0.0,n3:,4,SM-GE4QN_S131_E1-50,846392403,SM-GE4QN-S131,R8S4-190327,RSC-202,SM-GE4QN,R8S4-19032708,2.857375,1.72,323.0,8,NEXT-i7-IDT-68,NEXT-i5-IDT-317,ACGTTCAG-CACAGACT,Mouse,,,PXS4_190306_403_A01,Nr5a1-Cre;Ai140;Pvalb-T2A-FlpO;Ai65F-449966.07.06.01.06,834013807,1,,449966,M,,,Pvalb-T2A-FlpO/wt;Ai65F/wt,,Pvalb-T2A-FlpO,Ai65F,,,,,VISp4,VISp4,,0.0,0.0,A8S4_190314_06,A8S4_190314_06_C05,,20x,0.279000,Fail,3.775876,L8S4_190321_03,L8S4_190321_03_C05,3/21/2019 7:00,0.05,298.0,20.202185,102.716013,5.706445,Fail,978.0,98560943.0,51:41.2,1044127.0,990308,69.539666,0.864479,0.107643,40.545467,0.032717,1.698058,0.0,13.603374,16.856960,29.760539,0.027896,0.018946,58.350735,1.118273,0.986071,1.039064,0.885142,0.952165,1.047564,0.897287,1.079069,0.991996,0.777734,False,,/allen/programs/celltypes/production/mousecelltypes/prod370/Star_Analysis_Run_846392403/846392403/,ar_846392403_STAR_ReadsPerGene.out.tab,,/allen/programs/celltypes/production/mousecelltypes/prod367/rseq_tube_set_R8S4-190327/RSC-202_R8S4-190327/RAW-DATA/SM-GE4QN/SM-GE4QN_E1-50_ACGTTCA...,1709695A,Production,index192,1408,1302,1083,922,738,584,439,2552,2552,2552,1728,1345,1057,819,YES,VISp,C,5,patch_seq,PXS4_190306_403_A01,3/6/2019,lisak,MP2,2/5/2019,2/8/2019,,Cre+,"None, None",VISp4,60.0,3.0,12:55:39-08:00,12:55:43-08:00,-34,12:55:44-08:00,-34.0,12:55:44-08:00,nucleus_present,1000.0,5.0,1.0,0.0,,mMPATCH,VISp,,,noclass,n3,1.00,0.0,True,Pvalb Reln Itm2a,0.18,GABAergic,Pvalb,Pvalb Reln Itm2a,0.142597,0.148171,False,Peri,ZZ_Missing,0.000000,Pvalb Reln Itm2a,L5 PT VISp Lgr5,L5 PT VISp Krt80,0.18,0.12,0.09,10.253034,10.117435,10.349889,0.435000,0.412395,0.420699,PoorQ,PoorQ
10338,10339,PXS4_190307_302_A01,n3,n3,1.0,1,0.0,0.0,n3:,4,SM-GE4Q8_S019_E1-50,856697833,SM-GE4Q8-S019,R8S4-190417,RSC-205,SM-GE4Q8,R8S4-19041701,3.293740,1.89,323.0,6,NEXT-i7-IDT-166,NEXT-i5-IDT-219,CATCGTGA-GATGTCGA,Mouse,,,PXS4_190307_302_A01,Sst-IRES-Cre;Chrna6-IRES2-FlpO-WPRE-neo-445889-Ai193-hyg.04.01,839878441,1,,445889,M,,,Sst-IRES-Cre/wt;Chrna6-IRES2-FlpO-WPRE-neo/wt;Ai193(TICL-EGFP-ICF-tdT)-hyg/wt,,Chrna6,Ai193(TICL-EGFP-ICF-tdT)-hyg,,,,,FCx5,FCx5,,,,A8S4_190327_06,A8S4_190327_06_C03,,20x,0.344000,Fail,34.619231,L8S4_190405_02,L8S4_190405_02_C03,4/5/2019 7:00,0.05,327.0,13.620255,63.109327,3.506074,Fail,853.0,214100000.0,42:19.1,851734.0,802545,34.677443,0.064669,0.000125,3.538992,0.000125,0.091708,0.0,27.388573,37.933984,4.224187,0.046220,0.010046,11.356746,1.743318,0.429857,1.597950,0.232063,0.342938,1.424154,0.571730,1.584399,0.623079,0.244256,False,,/allen/programs/celltypes/production/mousecelltypes/prod375/Star_Analysis_Run_856697833/856697833/,ar_856697833_STAR_ReadsPerGene.out.tab,,/allen/programs/celltypes/production/mousecelltypes/prod372/rseq_tube_set_R8S4-190417/RSC-205_R8S4-190417/RAW-DATA/SM-GE4Q8/SM-GE4Q8_E1-50_CATCGTG...,1709695A,Production,index192,713,708,699,680,613,510,399,3229,3229,3229,3229,3229,3229,1448,YES,FCx,C,3,patch_seq,PXS4_190307_302_A01,2019-03-07 12:33:51 -08:00,briank,HCT2,3/4/2019,2/5/2019,,Cre+,"None, None",FCx5,60.0,2.0,12:35:31 -07:00,12:35:38 -07:00,-60,12:35:39 -07:00,-80.0,12:35:39 -07:00,nucleus_present,1000.0,8.0,1.0,0.0,,mIVSCC-METx,,,,noclass,n3,1.00,0.0,True,L4 IT VISp Rspo1,0.15,Glutamatergic,L4,L4 IT VISp Rspo1,0.064791,0.201339,False,Oligo,ZZ_Missing,0.000000,L4 IT VISp Rspo1,Pvalb Reln Itm2a,Pvalb Th Sst,0.15,0.15,0.12,9.414784,10.127995,9.914666,0.208256,0.197606,0.178528,PoorQ,PoorQ
10339,10340,PXS4_190313_404_A01,n3,n3,1.0,1,0.0,0.0,n3:,4,SM-GE4SJ_S095_E1-50,855238658,SM-GE4SJ-S095,R8S4-190410,RSC-204,SM-GE4SJ,R8S4-19041002,2.881613,1.32,327.0,6,NEXT-i7-IDT-109,NEXT-i5-IDT-276,CTTACCTG-ACAGTTCG,Mouse,,,PXS4_190313_404_A01,Sst-IRES-Cre;Ai140;Pvalb-T2A-FlpO;Ai65F-451706.08.06.01.06,837035702,1,,451706,F,,,Pvalb-T2A-FlpO/wt;Ai65F/wt,,Pvalb-T2A-FlpO,Ai65F,,,,,VISp5,VISp5,,0.0,0.0,A8S4_190320_09,A8S4_190320_09_G12,,20x,0.253000,Fail,4.921167,L8S4_190328_01,L8S4_190328_01_G12,3/28/2019 7:00,0.05,258.0,13.709148,80.509444,4.472747,Fail,999.0,132928463.0,44:20.4,1086009.0,1007349,72.389188,0.792675,0.112076,20.423706,0.027399,0.817393,0.0,11.169496,16.441316,15.623582,0.043251,0.036240,34.926724,1.102528,0.997927,1.065123,0.824957,0.984441,1.065198,0.890705,1.000402,1.109455,0.797551,False,,/allen/programs/celltypes/production/mousecelltypes/prod373/Star_Analysis_Run_855238658/855238658/,ar_855238658_STAR_ReadsPerGene.out.tab,,/allen/programs/celltypes/production/mousecelltypes/prod372/rseq_tube_set_R8S4-190410/RSC-204_R8S4-190410/RAW-DATA/SM-GE4SJ/SM-GE4SJ_E1-50_CTTACCT...,1709695A,Production,index192,685,656,552,478,387,301,245,1844,1844,1844,1057,851,653,485,YES,VISp,G,12,patch_seq,PXS4_190313_404_A01,2019-03-13T09:50:33-07:00,lisak,MP2,2/5/2019,2/8/2019,,Cre+,"None, None",VISp5,60.0,2.0,09:53:43-07:00,09:53:47-07:00,-60,09:53:47-07:00,-60.0,09:53:48-07:00,nucleus_present,1000.0,5.0,0.0,1.0,,mMPATCH,VISp,,,noclass,n3,1.00,0.0,True,Pvalb Vipr2,0.19,GABAergic,Pvalb,Pvalb Vipr2,0.105246,0.182289,False,Macrophage,ZZ_Missing,0.000000,Pvalb Vipr2,Sst Tac1 Tacr3,Pvalb Calb1 Sst,0.19,0.10,0.09,10.331568,8.721058,9.116839,0.293777,0.314389,0.286599,PoorQ,PoorQ


In [8]:
#If you want to filter on the columns immediately
all_jem_fields=["date", "organism_name", "name", "container", "rigOperator",
                "status", "roi_major", "roi_minor",
                "extraction.postPatch", "extraction.endPipetteR",
                "extraction.pressureApplied", "extraction.retractionPressureApplied",
                "recording.timeStart", "recording.timeWholeCellStart",
                "extraction.timeExtractionStart", "extraction.timeExtractionEnd", "extraction.timeRetractionEnd",
                "cell_depth",
                "approach.creCell",
                "approach.sliceHealth"]

jem_fields = ["date", "organism_name", "container", "rigOperator",
              "status", "roi_major", "roi_minor",
              "extraction.postPatch", "extraction.endPipetteR"]

read_jem_csv(jem_fields)
#jem.tail(1490) # first recording 2020-01-03 10:40:30 -0800 and last recording of 2019: 2019-12-23 15:51:07 -0800

INFO:__main__:Read jem metadata csv (date: 2/07/2020)


In [9]:
jem_2020 = jem.loc["2020-01-03 10:40:30 -0800":,:]
logger.info("Date Range: 2020-01-03 to Present 2020")

#jem_2020["p_container"] = jem_2020.container.str[0:4]
#logger.info("Creating column to check p_container")
#jem_2020.p_container.unique()

r_users = ["ramr"] 
m_users = ["PA", "PC"]

jem_2020 = jem_2020[jem_2020.index.notnull()]
logger.info("Dropped NaNs from index date column")
jem_2020.dropna(subset=["rigOperator", "container"], inplace=True)
logger.info("Dropped NaNs from rigOperator and container column")

jem_2020 = jem_2020[jem_2020["status"] == "SUCCESS"]
jem_2020 = jem_2020[jem_2020.rigOperator.str.contains("|".join(r_users))]
jem_2020 = jem_2020[jem_2020.container.str.contains("|".join(m_users))]
logger.info("Created dataframe with selected users in container column")

INFO:__main__:Date Range: 2020-01-03 to Present 2020
INFO:__main__:Dropped NaNs from index date column
INFO:__main__:Dropped NaNs from rigOperator and container column
INFO:__main__:Created dataframe with selected users in container column


In [10]:
mjem_2020 = jem_2020[jem_2020.organism_name == "Mouse"]
logger.info("Mouse count: %s", mjem_2020.organism_name.count())
hjem_2020 = jem_2020[jem_2020.organism_name == "Human"]
logger.info("Human count: %s", hjem_2020.organism_name.count())

INFO:__main__:Mouse count: 55
INFO:__main__:Human count: 30


In [11]:
jem_2020

Unnamed: 0_level_0,organism_name,extraction.endPipetteR,extraction.postPatch,rigOperator,status,roi_major,roi_minor,container
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
2020-01-07 10:11:39 -0800,Mouse,2000.0,nucleus_present,ramr,SUCCESS,MOp,layer 2/3,PAS4_200107_451_A01
2020-01-07 15:19:20 -0800,Mouse,2000.0,nucleus_present,ramr,SUCCESS,RSPd,layer 5,PAS4_200107_452_A01
2020-01-10 13:15:48 -0800,Mouse,500.0,nucleus_present,ramr,SUCCESS,MOp,layer 5,PAS4_200110_451_A01
2020-01-10 13:15:48 -0800,Mouse,2.5,nucleus_present,ramr,SUCCESS,SSp,layer 5,PAS4_200110_454_A01
2020-01-10 13:15:48 -0800,Mouse,6.0,nucleus_present,ramr,SUCCESS,RSPd,layer 5,PAS4_200110_452_A01
...,...,...,...,...,...,...,...,...
2020-02-04 14:13:07 -0800,Human,1900.0,nucleus_present,ramr,SUCCESS,TCx,layer 1,PAS4_200204_457_A01
2020-02-04 14:13:07 -0800,Human,110.0,nucleus_present,ramr,SUCCESS,TCx,layer 4,PAS4_200204_459_A01
2020-02-04 14:13:07 -0800,Human,2000.0,nucleus_present,ramr,SUCCESS,TCx,layer 1,PAS4_200204_455_A01
2020-02-04 14:13:07 -0800,Human,1400.0,nucleus_present,ramr,SUCCESS,TCx,layer 1,PAS4_200204_454_A01


In [12]:
mjem_2020["new_region"] = "default_value"
logger.info("Created a new column(new_region) with default_value")

c_region = ["RSPd", "RSPv", "SSp"] 
s_region = ["MOs", "MOp", "ORB", "CTXsp"]
o_region = ["TCx", "HY"]
v_region = ["VISp"]

mjem_2020["new_region"][mjem_2020.roi_major.str.contains("|".join(c_region))] = "coronal_region"
mjem_2020["new_region"][mjem_2020.roi_major.str.contains("|".join(s_region))] = "sagittal_region"
mjem_2020["new_region"][mjem_2020.roi_major.str.contains("|".join(o_region))] = "other_region"
mjem_2020["new_region"][mjem_2020.roi_major.str.contains("|".join(v_region))] = "v1_region"
logger.info("Filled in new_region with corresponding region")

cor = mjem_2020[mjem_2020["new_region"] == "coronal_region"] 
sag = mjem_2020[mjem_2020["new_region"] == "sagittal_region"]
other = mjem_2020[mjem_2020["new_region"] == "other_region"]
v1 = mjem_2020[mjem_2020["new_region"] == "v1_region"]
logger.info("Created region pandas dataframes")

logger.info("Coronal Region count: %s", cor.organism_name.count())
logger.info("Sagittal Region count: %s", sag.organism_name.count())
logger.info("Other Region count: %s", other.organism_name.count())
logger.info("V1 Region count: %s", v1.organism_name.count())

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  """Entry point for launching an IPython kernel.
INFO:__main__:Created a new column(new_region) with default_value
A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  if __name__ == '__main__':
A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self._update_inplace(new_data)
A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/u

In [13]:
mjem_2020

Unnamed: 0_level_0,organism_name,extraction.endPipetteR,extraction.postPatch,rigOperator,status,roi_major,roi_minor,container,new_region
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
2020-01-07 10:11:39 -0800,Mouse,2000.0,nucleus_present,ramr,SUCCESS,MOp,layer 2/3,PAS4_200107_451_A01,sagittal_region
2020-01-07 15:19:20 -0800,Mouse,2000.0,nucleus_present,ramr,SUCCESS,RSPd,layer 5,PAS4_200107_452_A01,coronal_region
2020-01-10 13:15:48 -0800,Mouse,500.0,nucleus_present,ramr,SUCCESS,MOp,layer 5,PAS4_200110_451_A01,sagittal_region
2020-01-10 13:15:48 -0800,Mouse,2.5,nucleus_present,ramr,SUCCESS,SSp,layer 5,PAS4_200110_454_A01,coronal_region
2020-01-10 13:15:48 -0800,Mouse,6.0,nucleus_present,ramr,SUCCESS,RSPd,layer 5,PAS4_200110_452_A01,coronal_region
2020-01-10 13:15:48 -0800,Mouse,2000.0,nucleus_present,ramr,SUCCESS,SSp,layer 2/3,PAS4_200110_453_A01,coronal_region
2020-01-10 15:29:02 -0800,Mouse,2900.0,nucleus_present,ramr,SUCCESS,RSPv,layer 2/3,PAS4_200110_455_A01,coronal_region
2020-01-10 15:29:02 -0800,Mouse,2300.0,nucleus_present,ramr,SUCCESS,RSPv,layer 2/3,PAS4_200110_456_A01,coronal_region
2020-01-13 11:14:15 -0800,Mouse,6.1,nucleus_present,ramr,SUCCESS,ORB,layer 5,PAS4_200113_451_A01,sagittal_region
2020-01-13 11:14:15 -0800,Mouse,8.7,nucleus_present,ramr,SUCCESS,ORB,layer 5,PAS4_200113_452_A01,sagittal_region


##### File Paths

In [14]:
csv_path = "C:/Users/ramr/Documents/Github/analysis_projects/csv/"
excel_path = "C:/Users/ramr/Documents/Github/analysis_projects/excel/"

##### Writing to csv_file

In [27]:
shiny.to_csv(csv_path + "shiny.csv")

##### Writing to excel_file

In [15]:
writer = pd.ExcelWriter(excel_path + "personal_tracker.xlsx")
mjem_2020.to_excel(writer, "mouse_2020", freeze_panes=(1,0))
hjem_2020.to_excel(writer, "human_2020", freeze_panes=(1,0))
cor.to_excel(writer, "coronal_region", freeze_panes=(1,0))
sag.to_excel(writer, "sagittal_region", freeze_panes=(1,0))
v1.to_excel(writer, "v1_region", freeze_panes=(1,0))
writer.save()