In [1]:
! pip install scHDeepInsight

Looking in indexes: https://pypi.org/simple, https://pypi.ngc.nvidia.com


In [2]:
import os

from scHDeepInsight import Immune

# Initialize the Immune class
# (the recorded output of this cell reports pretrained efficientnet-b5 weights
# being loaded at this point).
immune = Immune()

Loaded pretrained weights for efficientnet-b5


In [3]:
# Step 1: Preprocess the .h5ad file
# Make sure the output directory exists before anything is written into it, so
# this cell also works from a fresh working directory (whether preprocess()
# creates missing directories itself is not visible from this notebook).
os.makedirs("./output_immune", exist_ok=True)
# Keep the call as the last expression so its return value is still rendered
# as the cell output.
immune.preprocess(query_path="sample_immune.h5ad", output_path="./output_immune/preprocessed_query.h5ad")

AnnData object with n_obs × n_vars = 10229 × 36571
    obs: 'orig.ident', 'nCount_RNA', 'nFeature_RNA', 'percent.mt', 'donor_id', 'pool_number', 'predicted.celltype.l2', 'predicted.celltype.l2.score', 'age', 'organism_ontology_term_id', 'tissue_ontology_term_id', 'assay_ontology_term_id', 'disease_ontology_term_id', 'cell_type_ontology_term_id', 'self_reported_ethnicity_ontology_term_id', 'development_stage_ontology_term_id', 'sex_ontology_term_id', 'is_primary_data', 'suspension_type', 'cell_type', 'assay', 'disease', 'organism', 'sex', 'tissue', 'self_reported_ethnicity', 'development_stage', 'n_counts'
    var: 'vst.mean', 'vst.variance', 'vst.variance.expected', 'vst.variance.standardized', 'vst.variable', 'feature_is_filtered', 'feature_name', 'feature_reference', 'feature_biotype'
    uns: 'log1p'

In [4]:
# Step 2: Transform the preprocessed data into images
# The query file is the one Step 1 was asked to write; the barcode and image
# paths are the same ones later handed to immune.predict().
preprocessed_h5ad = "./output_immune/preprocessed_query.h5ad"
barcode_csv = "./output_immune/barcode.csv"
images_npy = "./output_immune/query_images.npy"
immune.image_transform(
    query_path=preprocessed_h5ad,
    barcode_path=barcode_csv,
    image_path=images_npy,
)

In [5]:
# Step 3: Predict cell types and identify potential rare cells
# The two paths are the barcode/image locations given to image_transform() in
# Step 2; the result is kept in `pred_label` for inspection and export.
predict_inputs = {
    "barcode_path": "./output_immune/barcode.csv",
    "image_path": "./output_immune/query_images.npy",
}
pred_label = immune.predict(**predict_inputs, batch_size=128)

In [6]:
# Show the prediction table (a bare last expression is rendered by the notebook).
# NOTE: in the recorded output the column names are spelled `prediceted_*`
# (e.g. `prediceted_base_type`); use that exact spelling when selecting columns.
pred_label

Unnamed: 0,barcode,prediceted_base_type,prediceted_detailed_type,prediceted_base_type_prob,prediceted_detailed_type_prob,is_potential_rare
0,TGCGCAGCATCAGTAC-19,B,B_gc,0.998971,0.998186,False
1,AAGGTTCCAACCGCCA-28,B,B_gc,0.995672,0.978519,False
2,CTACCCACAGATGGGT-15,DC,DC_cDC2,0.999748,0.998150,False
3,ATAAGAGCACTAGTAC-26,B,B_gc,0.995536,0.981670,False
4,TTATGCTCAATGCCAT-2,NK,NK_CD16+,0.990403,0.990325,False
...,...,...,...,...,...,...
10224,TCTTTCCAGTGAAGAG-10,B,B_gc,0.992760,0.976728,False
10225,AGTCTTTCAGCTGTTA-28,NK,NK_CD16+,0.998799,0.998777,False
10226,TTCTTAGTCTGCCCTA-17,NK,NK_CD16+,0.999963,0.999962,False
10227,GGACATTAGACGCTTT-16,CD4+T,CD4+T_fh,0.999857,0.999816,False


In [7]:
# Write the prediction table to CSV next to the other pipeline outputs.
# index=False keeps the row index out of the file.
predicted_labels_csv = "./output_immune/predicted_labels.csv"
pred_label.to_csv(predicted_labels_csv, index=False)