### Loading the AnnData object in Python using scanpy

In [1]:
import scanpy as sc

# Location of the .h5ad file, relative to the notebook's working directory.
h5ad_path = 'local.h5ad'

# Read the file into an AnnData object.
# NOTE(review): the variable name `anndata` is also the name of the AnnData
# Python package; a later `import anndata` in this kernel would rebind it —
# consider a name such as `adata`.
anndata = sc.read_h5ad(h5ad_path)

In [2]:
# Show the object's summary: its n_obs × n_vars dimensions and the names of the obs / var / uns fields.
anndata

AnnData object with n_obs × n_vars = 483152 × 58559
    obs: 'tissue_in_publication', 'assay_ontology_term_id', 'donor', 'anatomical_information', 'n_counts_UMIs', 'n_genes', 'cell_ontology_class', 'free_annotation', 'manually_annotated', 'compartment', 'sex_ontology_term_id', 'is_primary_data', 'organism_ontology_term_id', 'disease_ontology_term_id', 'ethnicity_ontology_term_id', 'development_stage_ontology_term_id', 'cell_type_ontology_term_id', 'tissue_ontology_term_id', 'cell_type', 'assay', 'disease', 'organism', 'sex', 'tissue', 'ethnicity', 'development_stage'
    var: 'feature_type', 'ensemblid', 'highly_variable', 'means', 'dispersions', 'dispersions_norm', 'mean', 'std', 'feature_biotype', 'feature_is_filtered', 'feature_name', 'feature_reference'
    uns: 'X_normalization', '_scvi', '_training_mode', 'compartment_colors', 'default_embedding', 'dendrogram_cell_type_tissue', 'dendrogram_computational_compartment_assignment', 'dendrogram_consensus_prediction', 'dendrogram_tissu

### Extracting information about genes

In [5]:
# `.var` is the per-gene annotation table (one row per gene, indexed by gene_id).
genes_data = anndata.var
# Preview the first rows to see which gene-level columns are available.
genes_data.head()


Unnamed: 0_level_0,feature_type,ensemblid,highly_variable,means,dispersions,dispersions_norm,mean,std,feature_biotype,feature_is_filtered,feature_name,feature_reference
gene_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
ENSG00000223972,Gene Expression,ENSG00000223972.5,False,6.398244e-05,0.835044,-0.573947,3.9e-05,0.005574,gene,False,DDX11L1,NCBITaxon:9606
ENSG00000227232,Gene Expression,ENSG00000227232.5,False,0.002274395,2.44228,0.533203,0.00108,0.031731,gene,False,WASH7P,NCBITaxon:9606
ENSG00000278267,Gene Expression,ENSG00000278267.1,False,6.175251e-05,1.295335,-0.256874,3.3e-05,0.005634,gene,False,MIR6859-1,NCBITaxon:9606
ENSG00000243485,Gene Expression,ENSG00000243485.5,False,0.0001372886,2.656352,0.680668,4.8e-05,0.008041,gene,False,MIR1302-2HG,NCBITaxon:9606
ENSG00000284332,Gene Expression,ENSG00000284332.1,False,1e-12,,0.0,0.0,1.0,gene,False,MIR1302-2,NCBITaxon:9606


In [10]:
# Keep only the gene-name column; the gene_id values stay on as the index.
gene_columns = ['feature_name']
genes_data = genes_data[gene_columns]
genes_data.head()

Unnamed: 0_level_0,feature_name
gene_id,Unnamed: 1_level_1
ENSG00000223972,DDX11L1
ENSG00000227232,WASH7P
ENSG00000278267,MIR6859-1
ENSG00000243485,MIR1302-2HG
ENSG00000284332,MIR1302-2


In [11]:
# Write the gene table (index included) to a CSV file in the working directory.
genes_csv_path = 'allgenes_tabulasapiens.csv'
genes_data.to_csv(genes_csv_path)

### Extracting information about all the cells in the Tabula Sapiens dataset

In [14]:
# `.obs` is the per-cell annotation table (one row per cell, indexed by cell_id).
cell_data = anndata.obs
# List the available annotation columns before choosing which ones to keep.
cell_data.columns

Index(['tissue_in_publication', 'assay_ontology_term_id', 'donor',
       'anatomical_information', 'n_counts_UMIs', 'n_genes',
       'cell_ontology_class', 'free_annotation', 'manually_annotated',
       'compartment', 'sex_ontology_term_id', 'is_primary_data',
       'organism_ontology_term_id', 'disease_ontology_term_id',
       'ethnicity_ontology_term_id', 'development_stage_ontology_term_id',
       'cell_type_ontology_term_id', 'tissue_ontology_term_id', 'cell_type',
       'assay', 'disease', 'organism', 'sex', 'tissue', 'ethnicity',
       'development_stage'],
      dtype='object')

In [15]:
# Preview the first rows of the per-cell annotations.
cell_data.head()

Unnamed: 0_level_0,tissue_in_publication,assay_ontology_term_id,donor,anatomical_information,n_counts_UMIs,n_genes,cell_ontology_class,free_annotation,manually_annotated,compartment,...,cell_type_ontology_term_id,tissue_ontology_term_id,cell_type,assay,disease,organism,sex,tissue,ethnicity,development_stage
cell_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
AAACCCACACTCCTGT_TSP6_Liver_NA_10X_1_1,Liver,EFO:0009922,TSP6,,7633.0,2259,macrophage,Monocyte/Macrophage,True,immune,...,CL:0000235,UBERON:0002107,macrophage,10x 3' v3,normal,Homo sapiens,male,liver,European,67-year-old human stage
AAACGAAGTACCAGAG_TSP6_Liver_NA_10X_1_1,Liver,EFO:0009922,TSP6,,2858.0,1152,monocyte,Monocyte,True,immune,...,CL:0000576,UBERON:0002107,monocyte,10x 3' v3,normal,Homo sapiens,male,liver,European,67-year-old human stage
AAACGCTCAACGGCTC_TSP6_Liver_NA_10X_1_1,Liver,EFO:0009922,TSP6,,7787.0,2983,endothelial cell of hepatic sinusoid,Endothelial,True,endothelial,...,CL:1000398,UBERON:0002107,endothelial cell of hepatic sinusoid,10x 3' v3,normal,Homo sapiens,male,liver,European,67-year-old human stage
AAAGAACAGCCTCTTC_TSP6_Liver_NA_10X_1_1,Liver,EFO:0009922,TSP6,,10395.0,2598,macrophage,Monocyte/Macrophage,True,immune,...,CL:0000235,UBERON:0002107,macrophage,10x 3' v3,normal,Homo sapiens,male,liver,European,67-year-old human stage
AAAGAACGTAGCACAG_TSP6_Liver_NA_10X_1_1,Liver,EFO:0009922,TSP6,,6610.0,2125,liver dendritic cell,Dendritic cell,True,immune,...,CL:2000055,UBERON:0002107,liver dendritic cell,10x 3' v3,normal,Homo sapiens,male,liver,European,67-year-old human stage


In [19]:
# Keep only the tissue, cell-type, gene-count and donor-demographic columns;
# the cell_id values stay on as the index.
cell_columns = [
    'tissue_in_publication',
    'anatomical_information',
    'tissue',
    'tissue_ontology_term_id',
    'cell_type',
    'cell_type_ontology_term_id',
    'n_genes',
    'sex',
    'ethnicity',
    'development_stage',
]
cell_data = cell_data[cell_columns]
cell_data.head()

Unnamed: 0_level_0,tissue_in_publication,anatomical_information,tissue,tissue_ontology_term_id,cell_type,cell_type_ontology_term_id,n_genes,sex,ethnicity,development_stage
cell_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
AAACCCACACTCCTGT_TSP6_Liver_NA_10X_1_1,Liver,,liver,UBERON:0002107,macrophage,CL:0000235,2259,male,European,67-year-old human stage
AAACGAAGTACCAGAG_TSP6_Liver_NA_10X_1_1,Liver,,liver,UBERON:0002107,monocyte,CL:0000576,1152,male,European,67-year-old human stage
AAACGCTCAACGGCTC_TSP6_Liver_NA_10X_1_1,Liver,,liver,UBERON:0002107,endothelial cell of hepatic sinusoid,CL:1000398,2983,male,European,67-year-old human stage
AAAGAACAGCCTCTTC_TSP6_Liver_NA_10X_1_1,Liver,,liver,UBERON:0002107,macrophage,CL:0000235,2598,male,European,67-year-old human stage
AAAGAACGTAGCACAG_TSP6_Liver_NA_10X_1_1,Liver,,liver,UBERON:0002107,liver dendritic cell,CL:2000055,2125,male,European,67-year-old human stage


In [20]:
# Write the per-cell annotation table (index included) to a CSV file in the working directory.
# NOTE(review): the file name says "genecountdata", but the table written here is
# cell-level metadata — confirm the name is intended before relying on it downstream.
cells_csv_path = 'genecountdata_tabulasapiens.csv'
cell_data.to_csv(cells_csv_path)