In [1]:
# Integration of biopsies and organ donors from 2 studies
import anndata, numpy as np, pandas as pd, imp, lpy, scanpy as sc
# Print the versions of scanpy and its main dependencies; the result is kept in
# this cell's output as a record of the environment.
sc.logging.print_header()
# Load the rpy2 IPython extension, then select matplotlib's inline backend.
%load_ext rpy2.ipython
%matplotlib inline



scanpy==1.6.0 anndata==0.7.5 umap==0.3.10 numpy==1.18.1 scipy==1.5.4 pandas==1.0.1 scikit-learn==0.22.2 statsmodels==0.11.1 python-igraph==0.8.0 louvain==0.6.1 leidenalg==0.8.3


In [2]:
# Load the AnnData object stored in N3-integrated_organoids.h5ad; the cells
# below modify it in place.
adata = anndata.read_h5ad(filename="N3-integrated_organoids.h5ad")

In [3]:
# Prepare the object for cellxgene hosting. First copy the annotations that are
# kept to their final names; the temporary working entries they are copied from
# are deleted further down in this cell.

# Embeddings: (final obsm key, working obsm key).
for final_key, working_key in [
    ("X_umap", "X_umap_bulkorg"),
    ("X_umap_without_inhibitors", "X_umap_bulkorg_noinhib"),
]:
    adata.obsm[final_key] = adata.obsm[working_key]

# Per-cell annotations: (final obs column, working obs column).
obs_renames = [
    ("Celltype_without_inhibitors", "bulkorg_noinhib"),
    ("Celltype", "bulkorg"),
    ("CellCycle Phase", "phase"),
]
for final_key, working_key in obs_renames:
    adata.obs[final_key] = adata.obs[working_key]

# Each column's palette is stored in uns under "<column>_colors"; copy it to the
# matching final name as well.
for final_key, working_key in obs_renames:
    adata.uns[final_key + "_colors"] = adata.uns[working_key + "_colors"]

# Keys of adata.uns that are deleted by the removal loop later in this cell.
uns_toremove = [
    "Binary Stage_colors",
    "bulkorg",
    "bulkorg_colors",
    "bulkorg_hormnoinhib_colors",
    "bulkorg_hormnoinhib_res2_colors",
    "bulkorg_hormones_colors",
    "bulkorg_noinhib_colors",
    "bulkorg_strhormnoinhib_colors",
    "cosine_logXformedproj_Binary Stage_colors",
    "cosine_logXformedproj_subcluster_epithelial_balanced_broad_colors",
    "cosine_logXformedproj_subcluster_epithelial_balanced_colors",
    "cosine_proj_Binary Stage_colors",
    "cosine_proj_subcluster_epithelial_balanced_broad_colors",
    "cosine_proj_subcluster_epithelial_balanced_colors",
    "demultiplexed_colors",
    "logist_proj_subcluster_epithelial_balanced_colors",
    "phase_colors",
    "primary_epithelial_colors",
    "projection_primary_epithelial_broad_colors",
    "projection_primary_epithelial_colors",
    "sample_names_colors",
]

# Columns of adata.obs that are deleted by the removal loop later in this cell.
obs_toremove = [
    "souporcell",
    "batch",
    "Lane",
    "scrublet_pred",
    "scrublet_local_pred",
    "phase",
    "scrublet_score",
    "scrublet_cluster_score",
    "filtered_cells",
    "S_score",
    "G2M_score",
    "leiden_noinhib",
    "leidenres2_noinhib",
    "leiden_bulkorg_noinhib",
    "leidenres2_bulkorg_noinhib",
    "leiden_bulkorg_hormones",
    "leidenres2_bulkorg_hormones",
    "leiden_bulkorg",
    "leidenres2_bulkorg",
    "leiden_samplecorr_bulkorg_hormones",
    "leidenres2_samplecorr_bulkorg_hormones",
    "leiden_samplecorr_bulkorg",
    "leidenres2_samplecorr_bulkorg",
    "bulkorg_hormones",
    "cosine_proj_subcluster_epithelial_balanced",
    "cosine_proj_subcluster_epithelial_balanced_distance",
    "cosine_logXformedproj_subcluster_epithelial_balanced",
    "cosine_logXformedproj_subcluster_epithelial_balanced_distance",
    "primary_epithelial_probability",
    "tmpindex",
    "projection_primary_epithelial",
    "projection_primary_epithelial_probability",
    "leiden_bulksmpl",
    "leiden_bulksmpl_hormones",
    "leiden_bulksmpl_noinhib",
    "leidenres2_bulksmpl",
    "leidenres2_bulksmpl_hormones",
    "leidenres2_bulksmpl_noinhib",
    "cosine_proj_subcluster_epithelial_balanced_broad",
    "cosine_proj_subcluster_epithelial_balanced_broad_distance",
    "cosine_logXformedproj_subcluster_epithelial_balanced_broad",
    "cosine_logXformedproj_subcluster_epithelial_balanced_broad_distance",
    "projection_primary_epithelial_broad",
    "projection_primary_epithelial_broad_probability",
    "cosine_proj_subcluster_epithelial_balanced_broader",
    "cosine_proj_subcluster_epithelial_balanced_broader_distance",
    "cosine_logXformedproj_subcluster_epithelial_balanced_broader",
    "cosine_logXformedproj_subcluster_epithelial_balanced_broader_distance",
    "subcluster_epithelial_balanced_broader",
    "subcluster_epithelial_balanced_broader_probability",
    "cosine_proj_Binary Stage",
    "cosine_proj_Binary Stage_distance",
    "cosine_logXformedproj_Binary Stage",
    "cosine_logXformedproj_Binary Stage_distance",
    "Binary Stage",
    "Binary Stage_probability",
    "leiden_bulkorg_hormnoinhib",
    "leidenres2_bulkorg_hormnoinhib",
    "bulkorg_hormnoinhib",
    "bulkorg_hormnoinhib_res2",
    "leiden_bulkorg_strhormnoinhib",
    "leidenres2_bulkorg_strhormnoinhib",
    "bulkorg_strhormnoinhib",
    "logist_proj_subcluster_epithelial_balanced_0.01",
    "logist_proj_subcluster_epithelial_balanced_probability_0.01",
    "bulkorg_noinhib",
    "bulkorg",
]
                                           
# Keys of adata.obsm that are deleted by the removal loop later in this cell.
obsm_toremove = [
    "X_cosproj_subcluster_epithelial_balanced",
    "X_cosproj_subcluster_epithelial_balanced_broad",
    "X_logistproj_subcluster_epithelial_balanced",
    "X_logistproj_subcluster_epithelial_balanced_0.01",
    "X_logistproj_subcluster_epithelial_balanced_broad",
    "X_lxfcosproj_subcluster_epithelial_balanced",
    "X_lxfcosproj_subcluster_epithelial_balanced_broad",
    "X_umap_bulkorg_hormnoinhib",
    "X_umap_bulkorg_hormones",
    "X_umap_bulkorg",
    "X_umap_bulkorg_noinhib",
    "X_umap_bulkorg_strhormnoinhib",
    "X_umap_bulksmpl",
    "X_umap_bulksmpl_hormones",
    "X_umap_bulksmpl_noinhib",
    "X_umap_noinhib",
    "X_umap_samplecorr_bulkorg",
    "X_umap_samplecorr_bulkorg_hormones",
    "cosproj_subcluster_epithelial_balanced",
    "lxfcosproj_subcluster_epithelial_balanced",
    "scvi_bulkorg",
    "scvi_bulkorg_hormones",
    "scvi_bulkorg_noinhib",
    "scvi_noinhib",
    "scvi_samplecorr_bulkorg",
    "scvi_samplecorr_bulkorg_hormones",
    "subcluster_epithelial_balanced_logist_0.01",
]

# TODO: rename fibroblast (placeholder only -- no renaming is performed in this cell)

# Delete every listed working entry from its container (uns, then obs, then
# obsm). Deletion is strict: a name that is not present raises KeyError rather
# than being skipped. The container is looked up again for each deletion.
for attr_name, stale_keys in (
    ("uns", uns_toremove),
    ("obs", obs_toremove),
    ("obsm", obsm_toremove),
):
    for stale_key in stale_keys:
        del getattr(adata, attr_name)[stale_key]

In [4]:
# Drop the cells whose final "Celltype" label is "filtered", then save the
# cleaned object. isin() builds the boolean mask in one vectorised call instead
# of a per-row Python loop and, like the `not in` test it replaces, keeps cells
# whose label is missing.
keep_cell = ~adata.obs["Celltype"].isin(["filtered"]).to_numpy()
adata = adata[keep_cell]
adata.write_h5ad("Integrated_organoids.h5ad")