# Set-up
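For each annotation metadata table, add a `barcode` column (a copy of `gex_barcode_cellranger`) and save the result as `annotate_metadata_pycistopic.tsv` for use with pycisTopic.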

In [1]:
import os
import glob
import pandas as pd

In [2]:
# Inputs
# Root directory that every metadata path in this notebook is joined onto.
indir_path = "/cellar/users/aklie/data/datasets/igvf_sc-islet_10X-Multiome/annotation/2023_11_15/cellcommander/"

# Sub-directory names iterated over by the time-course loop.
timecourses = ["A2_3-cyt", "A2_IFNg", "A2_control", "A2_dex", "A2_ext4", "H1_control", "H1_palmitate"]

# Sub-directory names iterated over by the condition loop.
conditions = ["3-cyt", "IFNg", "dex", "ext4", "palmitate"]

# Name of the manual cell-identity annotation column (not referenced by the cells shown here).
cellid_column = "integrated_manual_cellid_annotation"

# All

In [5]:
# Read the integrated annotation metadata table (tab-separated);
# the first column of the file becomes the DataFrame index.
integrated_metadata_path = os.path.join(indir_path, "integrated/rna/annotate/annotate_metadata.tsv")
cell_metadata = pd.read_csv(integrated_metadata_path, sep="\t", index_col=0)

# Display the first rows as the cell output
cell_metadata.head()

Unnamed: 0,gex_barcode_cellranger,atac_barcode_cellranger,is_cell_cellranger,excluded_reason_cellranger,gex_raw_reads_cellranger,gex_mapped_reads_cellranger,gex_conf_intergenic_reads_cellranger,gex_conf_exonic_reads_cellranger,gex_conf_intronic_reads_cellranger,gex_conf_exonic_unique_reads_cellranger,...,scrublet_predicted_doublet,scDblFinder_doublet_score,scDblFinder_doublet_class,scDblFinder_predicted_doublet,cellranger_predicted_doublet,doublet_filter,pre_doublet_filter_leiden_1,leiden_1,sample,integrated_manual_cellid_annotation
dm25a#AAACAGCCATTGTGCA-1,AAACAGCCATTGTGCA-1,ACAGCGGGTTAGCCAT-1,1,0,32953,31944,2047,5245,23572,4774,...,False,0.438505,singlet,False,False,False,4,6,dm25a,SC.EC
dm25a#AAACATGCAATTGAGA-1,AAACATGCAATTGAGA-1,CATTTAGGTCCTGCAA-1,1,0,9061,8535,690,2301,4918,2192,...,False,5.6e-05,singlet,False,False,False,6,1,dm25a,SC.EC
dm25a#AAACCAACAGCCTTGG-1,AAACCAACAGCCTTGG-1,CTTTATCGTTAAGGAT-1,1,0,48199,46896,3183,6107,36231,5283,...,False,0.014432,singlet,False,False,False,4,6,dm25a,SC.EC
dm25a#AAACCAACAGTAGCCT-1,AAACCAACAGTAGCCT-1,CTTTATCGTTGCTCAG-1,1,0,18510,18064,1201,2826,13532,2250,...,False,0.000295,singlet,False,False,False,1,13,dm25a,SC.alpha
dm25a#AAACCAACAGTCTAAT-1,AAACCAACAGTCTAAT-1,CTTTATCGTTAGTACC-1,1,0,16760,16319,1654,2663,11482,2158,...,False,1.2e-05,singlet,False,False,False,2,4,dm25a,SC.beta


In [6]:
# Show the first two index entries to check the barcode format
first_barcodes = list(cell_metadata.index[:2])
print(f"First few barcodes in cell metadata: {first_barcodes}")

First few barcodes in cell metadata: ['dm25a#AAACAGCCATTGTGCA-1', 'dm25a#AAACATGCAATTGAGA-1']


In [7]:
# pycistopic needs a "barcode" column: copy it from the Cell Ranger GEX barcode column
cell_metadata = cell_metadata.assign(barcode=cell_metadata["gex_barcode_cellranger"])

# Save the augmented table alongside the original metadata file
pycistopic_metadata_path = os.path.join(indir_path, "integrated/rna/annotate/annotate_metadata_pycistopic.tsv")
cell_metadata.to_csv(pycistopic_metadata_path, sep="\t")

# Time course

In [10]:
for timecourse in timecourses:
    # Read this time course's annotation metadata table (tab-separated);
    # the first column of the file becomes the DataFrame index.
    cell_metadata = pd.read_csv(
        os.path.join(indir_path, timecourse, "integrated/rna/annotate/annotate_metadata.tsv"),
        sep="\t",
        index_col=0,
    )

    # Show the first two index entries to check the barcode format
    print(f"First few barcodes in {timecourse} cell metadata: {list(cell_metadata.index[:2])}")

    # Add "barcode" column for pycistopic (copy of the Cell Ranger GEX barcode column)
    cell_metadata["barcode"] = cell_metadata["gex_barcode_cellranger"]

    # Write the augmented table next to its input. Without this write the column
    # added above is discarded at the next iteration and no pycistopic metadata
    # file exists for the time course.
    cell_metadata.to_csv(
        os.path.join(indir_path, timecourse, "integrated/rna/annotate/annotate_metadata_pycistopic.tsv"),
        sep="\t",
    )

First few barcodes in A2_3-cyt cell metadata: ['dm31a#AAACAGCCAGCACGTT-1', 'dm31a#AAACAGCCATAAACCT-1']
First few barcodes in A2_IFNg cell metadata: ['dm42b#AAACAGCCAATGCGCT-1', 'dm42b#AAACATGCAGTCTAGC-1']
First few barcodes in A2_control cell metadata: ['dm25a#AAACAGCCATTGTGCA-1', 'dm25a#AAACATGCAATTGAGA-1']
First few barcodes in A2_dex cell metadata: ['dm43b#AAACAGCCAAGGTGCA-1', 'dm43b#AAACAGCCAGGAATCG-1']
First few barcodes in A2_ext4 cell metadata: ['dm14b#AAACAGCCAATAATCC-1', 'dm14b#AAACAGCCACCTCAGG-1']
First few barcodes in H1_control cell metadata: ['mo1#AAACAGCCAAAGGTAC-1', 'mo1#AAACAGCCACCTACTT-1']
First few barcodes in H1_palmitate cell metadata: ['mo33#AAACAGCCAAATGCCC-1', 'mo33#AAACAGCCAGGCGAGT-1']


# Condition

In [4]:
for condition in conditions:
    # Locations of this condition's input table and of the pycistopic copy to write
    metadata_in = os.path.join(indir_path, condition, "rna/annotate/annotate_metadata.tsv")
    metadata_out = os.path.join(indir_path, condition, "rna/annotate/annotate_metadata_pycistopic.tsv")

    # Read the annotation metadata table (tab-separated); the first column becomes the index
    cell_metadata = pd.read_csv(metadata_in, sep="\t", index_col=0)

    # Show the first two index entries to check the barcode format
    first_barcodes = list(cell_metadata.index[:2])
    print(f"First few barcodes in {condition} cell metadata: {first_barcodes}")

    # pycistopic needs a "barcode" column: copy it from the Cell Ranger GEX barcode column
    cell_metadata = cell_metadata.assign(barcode=cell_metadata["gex_barcode_cellranger"])
    cell_metadata.to_csv(metadata_out, sep="\t")

First few barcodes in 3-cyt cell metadata: ['dm31a#AAACAGCCAGCACGTT-1', 'dm31a#AAACAGCCATAAACCT-1']
First few barcodes in IFNg cell metadata: ['dm42b#AAACAGCCAATGCGCT-1', 'dm42b#AAACATGCAGTCTAGC-1']
First few barcodes in dex cell metadata: ['dm43b#AAACAGCCAAGGTGCA-1', 'dm43b#AAACAGCCAGGAATCG-1']
First few barcodes in ext4 cell metadata: ['dm14b#AAACAGCCAATAATCC-1', 'dm14b#AAACAGCCACCTCAGG-1']
First few barcodes in palmitate cell metadata: ['mo33#AAACAGCCAAATGCCC-1', 'mo33#AAACAGCCAGGCGAGT-1']


# DONE!

---