In [1]:
import pandas as pd
import numpy as np
import scanpy as sc
import os
import seaborn as sns
import matplotlib.pyplot as plt
from sklearn.utils import shuffle

In [2]:
# Global scanpy/matplotlib figure settings: 200 dpi for rendered figures,
# 300 dpi for figures written to disk.
sc.set_figure_params(
    dpi=200,
    dpi_save=300,
)

In [3]:
# Load the AnnData file (per its name, the annotated scRNA-seq object).
annotated_h5ad = '../../Data/adata_scRNA_Annotated.h5ad'
adata = sc.read(annotated_h5ad)

# Scale every cell to a total of 10,000, then apply log(1 + x), both in place.
# NOTE(review): assumes adata.X holds raw counts at load time - confirm the
# saved file was not already normalised / log-transformed.
sc.pp.normalize_total(adata, target_sum=1e4)
sc.pp.log1p(adata)

In [4]:
# 'Annotation' labels of the muscle clusters analysed below; the order here
# becomes the column order of the exported tables.
muscle_subset = [
    'muscle DV',
    'muscle body 1',
    'muscle body 2',
    'muscle genital',
    'muscle pharynx',
]

In [5]:
# Keep only the cells whose 'Annotation' label is one of the muscle clusters.
is_muscle_cell = adata.obs['Annotation'].isin(muscle_subset)
adata_muscle = adata[is_muscle_cell]

In [6]:
# Marker gene IDs grouped by the panel they belong to.
# NOTE(review): the last key is 'pharynx' while the annotation label in
# muscle_subset is 'muscle pharynx', and there is no 'muscle genital' entry -
# confirm this is intentional.
marker_list_dict = {
    'known markers': [
        'SMED30023573', 'SMED30008639', 'SMED30025723',
        'SMED30016686', 'SMED30019740', 'SMED30002349',
        'SMED30002616', 'SMED30022812', 'SMED30017714',
    ],
    'muscle body 1': [
        'SMED30019102', 'SMED30018614', 'SMED30026932', 'SMED30018309',
    ],
    'muscle body 2': [
        'SMED30017664', 'SMED30018205', 'SMED30015232', 'SMED30024125',
    ],
    'muscle DV': [
        'SMED30024778', 'SMED30028312', 'SMED30028043', 'SMED30015191',
    ],
    'pharynx': [
        'SMED30015345', 'SMED30004154', 'SMED30025680', 'SMED30004868',
    ],
}

In [7]:
# Gene ID -> display symbol. Insertion order matters: it defines the row
# order of the expression tables built from this dict's keys.
symbol_trans_dict = {
    # known markers
    'SMED30023573': 'snail',
    'SMED30008639': 'myod',
    'SMED30025723': 'lbx1',
    'SMED30016686': 'nkx6-2',
    'SMED30019740': 'nkx1-1',
    'SMED30002349': 'gata4/5/6-2',
    'SMED30002616': 'nk4',
    'SMED30022812': 'ptprd',
    'SMED30017714': 'hspg2',

    # muscle body 1
    'SMED30019102': "SMED19102",  # 'dd_15058'
    'SMED30018614': "SMED18614",  # 'dd_5372'
    'SMED30026932': 'nog',
    'SMED30018309': 'irx4',

    # muscle body 2
    'SMED30017664': 'anos1',
    'SMED30018205': 'jag1',
    'SMED30015232': 'ntn1',
    'SMED30024125': 'otop2',

    # muscle DV
    'SMED30024778': 'sbspon',
    'SMED30028312': 'ptprs',
    'SMED30028043': 'atx1l',
    'SMED30015191': 'six6',

    # pharynx
    'SMED30015345': 'tpm1',
    'SMED30004154': 'rorb',
    'SMED30025680': 'kalm',
    'SMED30004868': 'neurod-2',
}

In [8]:
# Mean expression of every marker gene within each muscle cell type.
# Rows: gene IDs in symbol_trans_dict order; columns: labels in muscle_subset.
marker_ids = list(symbol_trans_dict.keys())
heatmap_df = pd.DataFrame(index=marker_ids)
for it in muscle_subset:
    subadata = adata_muscle[adata_muscle.obs['Annotation'] == it]
    # Slice to the marker genes *before* densifying, so only an
    # (n_cells x n_markers) array is materialised rather than the full matrix.
    marker_expr = subadata[:, marker_ids].X
    if hasattr(marker_expr, 'toarray'):  # sparse matrix -> dense ndarray
        marker_expr = marker_expr.toarray()
    sub_df = pd.DataFrame(np.asarray(marker_expr), columns=marker_ids)
    # Explicit axis=0 gives one mean per gene. np.mean(DataFrame) forwards
    # axis=None, which pandas >= 2.0 reduces over BOTH axes to one scalar;
    # that scalar would then be broadcast silently to every gene row.
    heatmap_df[it] = sub_df.mean(axis=0)

In [9]:
# Copy of the expression table with gene IDs replaced by display symbols.
# Plain dict lookup, so an ID missing from symbol_trans_dict raises KeyError.
gene_symbols = list(map(symbol_trans_dict.__getitem__, heatmap_df.index))
heatmap_df_symbol = heatmap_df.copy()
heatmap_df_symbol.index = gene_symbols

In [10]:
# Write the gene-ID-indexed table (not yet min-max scaled at this point)
# as a tab-separated file in the working directory.
heatmap_df.to_csv(
    'muscle_Markers_Expression.txt',
    sep='\t',
)

In [11]:
# Write the symbol-indexed table (not yet min-max scaled at this point)
# as a tab-separated file in the working directory.
heatmap_df_symbol.to_csv(
    'muscle_Markers_Expression_symbol.txt',
    sep='\t',
)

In [12]:
# Min-max scale each gene (row) across cell types so every row spans [0, 1].
# The axis is spelled out on purpose: np.min(df) / np.max(df) forward
# axis=None, which pandas >= 2.0 reduces to a single global scalar, so the
# scaling would run over the whole table instead of per gene.
gene_min = heatmap_df.min(axis=1)
gene_range = heatmap_df.max(axis=1) - gene_min
# A gene with the same value in every cell type has zero range and comes out
# as NaN (0/0).
heatmap_df = heatmap_df.sub(gene_min, axis=0).div(gene_range, axis=0)

In [13]:
# Rebuild the symbol-indexed copy from the current heatmap_df.
# Plain dict lookup, so an ID missing from symbol_trans_dict raises KeyError.
gene_symbols = list(map(symbol_trans_dict.__getitem__, heatmap_df.index))
heatmap_df_symbol = heatmap_df.copy()
heatmap_df_symbol.index = gene_symbols

In [14]:
# Write the scaled, gene-ID-indexed table as a tab-separated file.
heatmap_df.to_csv(
    'muscle_Markers_Expression_scaled.txt',
    sep='\t',
)

In [15]:
# Write the scaled, symbol-indexed table as a tab-separated file.
heatmap_df_symbol.to_csv(
    'muscle_Markers_Expression_symbol_scaled.txt',
    sep='\t',
)