# Sample File on Renaming Leiden Clusters

In [1]:
import scanpy

Load the data into an AnnData object

In [3]:
# Directory containing the input file (keep the trailing slash: the file name is appended directly)
path = "/my/path/"
# Read the stored AnnData object and print its summary
adata = scanpy.read_h5ad(f"{path}adata_w_leiden_groups.h5ad")
print(adata)

AnnData object with n_obs × n_vars = 81501 × 8619
    obs: 'sample_id', 'condition', 'batch', 'doublet', 'n_genes_by_counts', 'total_counts', 'total_counts_mt', 'pct_counts_mt', 'total_counts_ribo', 'pct_counts_ribo', 'n_genes', 'leiden', 'merged leiden'
    var: 'mean', 'std', 'highly_variable', 'means', 'dispersions', 'dispersions_norm'
    uns: 'batch_colors', 'hvg', 'leiden', 'leiden_colors', 'log1p', 'neighbors', 'pca', 'sample_id_colors', 'umap'
    obsm: 'X_pca', 'X_umap'
    varm: 'PCs'
    layers: 'counts'
    obsp: 'connectivities', 'distances'


  utils.warn_names_duplicates("obs")


Create a dictionary with the old and new names

In [10]:
# Distinct cell-type labels currently stored in the "merged leiden" column.
# NOTE: the labels pass through a set, so the order of this list is arbitrary and
# can differ between Python sessions; do not rely on the position of an entry.
current_cell_types = [*set(adata.obs["merged leiden"].tolist())]
print(current_cell_types)

['Plasma cells', 'Erythrocytes', 'B cells', 'Platelets', 'Undefined lymphocytes', 'CD4 T cells', 'Proliferating lymphocytes', 'Monocytes', 'CD8 T cells']


In [13]:
# Renames to apply, keyed by the existing label.
# Old and new names are paired explicitly rather than by list position, because
# `current_cell_types` is built from a set and its order is not stable between sessions;
# a positional pairing could silently assign the wrong new name to a cluster.
renamed_cell_types = {"CD8 T cells": "CD8 T cells / NK cells"}

# Fail early if a rename targets a label that is not present in the data
unknown_cell_types = set(renamed_cell_types) - set(current_cell_types)
assert not unknown_cell_types, f"labels to rename not found in data: {sorted(unknown_cell_types)}"

# Create mapping from the old to the new cell types (labels without a rename map to themselves)
cell_map = {old_name: renamed_cell_types.get(old_name, old_name) for old_name in current_cell_types}

# New cell types, listed in the same order as `current_cell_types`
new_cell_types = [cell_map[old_name] for old_name in current_cell_types]

print(cell_map)

{'Plasma cells': 'Plasma cells', 'Erythrocytes': 'Erythrocytes', 'B cells': 'B cells', 'Platelets': 'Platelets', 'Undefined lymphocytes': 'Undefined lymphocytes', 'CD4 T cells': 'CD4 T cells', 'Proliferating lymphocytes': 'Proliferating lymphocytes', 'Monocytes': 'Monocytes', 'CD8 T cells': 'CD8 T cells / NK cells'}


Add the new names to the AnnData object

In [14]:
# Replace every label with its new name.
# Labels without an entry in `cell_map` are kept as they are instead of turning into NaN;
# this also makes the cell safe to re-run, since already-renamed labels are no longer keys
# of `cell_map`.
adata.obs["merged leiden"] = (
    adata.obs["merged leiden"]
    .map(lambda label: cell_map.get(label, label))
    .astype("category")
)
print(adata.obs["merged leiden"])

AAACCTGAGTTCCACA-1               CD4 T cells
AAACCTGCAGGGATTG-1    CD8 T cells / NK cells
AAACCTGGTATAGGGC-1               CD4 T cells
AAACCTGGTGGTCTCG-1                 Monocytes
AAACCTGTCCAAACAC-1                 Monocytes
                               ...          
TTTGTTGGTTCTCCTG-1    CD8 T cells / NK cells
TTTGTTGTCCCGTGAG-1               CD4 T cells
TTTGTTGTCCGTGACG-1               CD4 T cells
TTTGTTGTCTGAGGCC-1                   B cells
TTTGTTGTCTGCTGAA-1                   B cells
Name: merged leiden, Length: 81501, dtype: category
Categories (9, object): ['B cells', 'CD4 T cells', 'CD8 T cells / NK cells', 'Erythrocytes', ..., 'Plasma cells', 'Platelets', 'Proliferating lymphocytes', 'Undefined lymphocytes']
