In [1]:
import os
import sys

import numpy as np
import matplotlib.pyplot as plt

import scanpy as sc
import scvi
import torch

from pytorch_lightning.loggers import WandbLogger
import wandb
from dotenv import load_dotenv

import session_info
import warnings
from pyprojroot.here import here

# Suppress every warning for the rest of the session.
warnings.filterwarnings("ignore")

# Make the project's `bin` directory (located through `here`) importable.
bin_dir = str(here('bin'))
sys.path.insert(1, bin_dir)

torch.set_float32_matmul_precision('high')

# Figure defaults: 100 dpi on screen, `dpi_fig_save` dpi when saving to disk.
#plt.style.use(['science','nature','no-latex'])
dpi_fig_save = 300
sc.set_figure_params(
    dpi=100,
    dpi_save=dpi_fig_save,
    vector_friendly=True,
)

# Load variables from the `.env` file resolved through `here`. This is the
# cell's last expression, so its return value is displayed.
# NOTE(review): presumably this supplies the wandb credentials -- confirm.
load_dotenv(here('.env'))

  from .autonotebook import tqdm as notebook_tqdm


True

In [2]:
class CustomWandbLogger(WandbLogger):
    """WandbLogger variant whose ``save_dir`` is taken from the experiment object."""

    @property
    def save_dir(self):
        """Return the ``dir`` attribute of ``self.experiment``."""
        experiment = self.experiment
        return experiment.dir

In [3]:
# Set the scvi-tools seed setting to 0 and print the scvi-tools version used
# for this run.
scvi.settings.seed = 0
print("Last run with scvi-tools version:", scvi.__version__)

Seed set to 0


Last run with scvi-tools version: 1.1.2


**Setting parameters** 

In [4]:
# Overwrite switches. `overwriteData` gates the save step at the end of the
# notebook; `overwriteFigures` is not read by any cell visible in this notebook.
overwriteFigures, overwriteData = True, True

In [5]:
# Current working directory of the kernel; the data and model paths used later
# are built from it, so the notebook must be started from the step folder.
workDir = os.getcwd()
# Cell group processed here; it appears in file names and in the wandb run name.
cellGroup = 'T_NonNaive'

In [6]:
# Annotation level = last path component of the normalized working directory.
normalized_workdir = os.path.normpath(workDir)
annotationLevel = os.path.split(normalized_workdir)[1]

In [7]:
# Display the working directory that the data and model paths are derived from.
workDir

'/scratch_isilon/groups/singlecell/shared/projects/Inflammation-PBMCs-Atlas/02_cell_annotation/SCGT00_CentralizedDataset/02_fromCellLineages_to_CellTypes/Step2'

**Load data**

In [8]:
# Load the `01_<cellGroup>_normalized_HVGsubset.h5ad` file for this cell group
# and display the AnnData summary.
input_h5ad = here(f"{workDir}/{cellGroup}/results/01_{cellGroup}_normalized_HVGsubset.h5ad")
adata = sc.read_h5ad(input_h5ad)
adata

AnnData object with n_obs × n_vars = 241341 × 4257
    obs: 'studyID', 'libraryID', 'sampleID', 'chemistry', 'technology', 'patientID', 'disease', 'timepoint_replicate', 'treatmentStatus', 'therapyResponse', 'sex', 'age', 'BMI', 'binned_age', 'diseaseStatus', 'smokingStatus', 'ethnicity', 'institute', 'diseaseGroup', 'batches', 'n_genes_by_counts', 'log1p_n_genes_by_counts', 'total_counts', 'log1p_total_counts', 'pct_counts_in_top_20_genes', 'total_counts_mt', 'log1p_total_counts_mt', 'pct_counts_mt', 'total_counts_ribo', 'log1p_total_counts_ribo', 'pct_counts_ribo', 'total_counts_hb', 'log1p_total_counts_hb', 'pct_counts_hb', 'total_counts_plt', 'log1p_total_counts_plt', 'pct_counts_plt', 'S_score', 'G2M_score', 'phase'
    var: 'hgnc_id', 'symbol', 'locus_group', 'HUGO_status', 'mt', 'ribo', 'hb', 'plt', 'n_cells_by_counts', 'mean_counts', 'log1p_mean_counts', 'pct_dropout_by_counts', 'total_counts', 'log1p_total_counts', 'highly_variable', 'means', 'dispersions', 'dispersions_norm',

## scVI integration

**scVI parameters**

In [9]:
# Arguments unpacked into scvi.model.SCVI.setup_anndata: counts layer, batch
# key and categorical covariates.
setup_kwargs = {
    "layer": "counts",
    "batch_key": "libraryID",
    "categorical_covariate_keys": ["disease", "sampleID"],
}

# Arguments unpacked into the scvi.model.SCVI constructor.
scvi_kwargs = {
    "n_hidden": 512,
    "n_latent": 10,  # reduced to 20 after step 00 (main) and to 10 after step 03
    "n_layers": 2,
    "gene_likelihood": "nb",
}

# Trainer options unpacked into model.train():
# https://docs.scvi-tools.org/en/stable/api/reference/scvi.train.Trainer.html#scvi.train.Trainer
# NOTE(review): `checkpointing_monitor` presumably has no effect unless
# `enable_checkpointing=True` is also passed -- confirm against the Trainer docs.
trainer_kwargs = {
    "checkpointing_monitor": "elbo_validation",
    "early_stopping_monitor": "reconstruction_loss_validation",
    "early_stopping_patience": 10,
    "early_stopping_min_delta": 0.1,
    "early_stopping": True,
    "max_epochs": 1000,
    #"logger": # wandb
}

# Training-plan options passed to model.train() as `plan_kwargs`:
# https://docs.scvi-tools.org/en/stable/api/reference/scvi.train.TrainingPlan.html#scvi.train.TrainingPlan
plan_kwargs = {
    "lr": 5e-4,
    #"reduce_lr_on_plateau": True
}

# Currently unused VAE module options, kept for reference:
# https://docs.scvi-tools.org/en/stable/api/reference/scvi.module.VAE.html#scvi.module.VAE
#vae = dict(
#    use_layer_norm='both',
#    use_batch_norm='none',
#    encode_covariates=True,
#    deeply_inject_covariates=False
#)

# Flat merge of every setting above; handed to the wandb logger as the run config.
parameter_dict = {
    **setup_kwargs,
    **scvi_kwargs,
    **trainer_kwargs,
    **plan_kwargs,
}

**wandb parameter**

In [10]:
# wandb run name, built as "<annotationLevel>_<cellGroup>"; displayed as the
# cell output for a quick check.
run_name = f"{annotationLevel}_{cellGroup}"
run_name

'Step2_T_NonNaive'

In [11]:
# wandb logger for this run; every parameter in `parameter_dict` is recorded
# as the run config.
logger = CustomWandbLogger(
    name=run_name,
    project='inflammation_atlas_R1',
    config=parameter_dict,
)

**Running integration**

In [12]:
# Register `adata` with scVI using the layer / batch / covariate keys in `setup_kwargs`.
scvi.model.SCVI.setup_anndata(adata, **setup_kwargs)

CUDA backend failed to initialize: Unable to use CUDA because of the following issues with CUDA components:
Outdated cuSPARSE installation found.
Version JAX was built against: 12200
Minimum supported: 12100
Installed version: 12002
The local installation version must be no lower than 12100. (Set TF_CPP_MIN_LOG_LEVEL=0 and rerun for more info.)


In [13]:
# Build the scVI model on the registered AnnData with the settings in `scvi_kwargs`.
model = scvi.model.SCVI(adata=adata, **scvi_kwargs)

In [14]:
# Train with the wandb logger; early stopping and the epoch cap come from
# `trainer_kwargs`, the learning rate from `plan_kwargs`.
model.train(
    logger=logger,
    plan_kwargs=plan_kwargs,
    **trainer_kwargs,
)

GPU available: True (cuda), used: True


TPU available: False, using: 0 TPU cores


IPU available: False, using: 0 IPUs


HPU available: False, using: 0 HPUs


[34m[1mwandb[0m: Currently logged in as: [33mdav1989[0m ([33minflammation[0m). Use [1m`wandb login --relogin`[0m to force relogin


[34m[1mwandb[0m: - Waiting for wandb.init()...

[34m[1mwandb[0m: \ Waiting for wandb.init()...

[34m[1mwandb[0m: wandb version 0.18.5 is available!  To upgrade, please run:
[34m[1mwandb[0m:  $ pip install wandb --upgrade


[34m[1mwandb[0m: Tracking run with wandb version 0.16.5


[34m[1mwandb[0m: Run data is saved locally in [35m[1m./wandb/run-20241021_094646-s58o4yez[0m
[34m[1mwandb[0m: Run [1m`wandb offline`[0m to turn off syncing.


[34m[1mwandb[0m: Syncing run [33mStep2_T_NonNaive[0m


[34m[1mwandb[0m: ⭐️ View project at [34m[4mhttps://wandb.ai/inflammation/inflammation_atlas_R1[0m


[34m[1mwandb[0m: 🚀 View run at [34m[4mhttps://wandb.ai/inflammation/inflammation_atlas_R1/runs/s58o4yez/workspace[0m


LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]


Training:   0%|          | 0/1000 [00:00<?, ?it/s]

Epoch 1/1000:   0%|          | 0/1000 [00:00<?, ?it/s]

Epoch 1/1000:   0%|          | 1/1000 [00:14<4:01:34, 14.51s/it]

Epoch 1/1000:   0%|          | 1/1000 [00:14<4:01:34, 14.51s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.09e+3]

Epoch 2/1000:   0%|          | 1/1000 [00:14<4:01:34, 14.51s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.09e+3]

Epoch 2/1000:   0%|          | 2/1000 [00:37<5:27:34, 19.69s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.09e+3]

Epoch 2/1000:   0%|          | 2/1000 [00:37<5:27:34, 19.69s/it, v_num=4yez, train_loss_step=1.08e+3, train_loss_epoch=1.07e+3]

Epoch 3/1000:   0%|          | 2/1000 [00:37<5:27:34, 19.69s/it, v_num=4yez, train_loss_step=1.08e+3, train_loss_epoch=1.07e+3]

Epoch 3/1000:   0%|          | 3/1000 [00:54<5:04:51, 18.35s/it, v_num=4yez, train_loss_step=1.08e+3, train_loss_epoch=1.07e+3]

Epoch 3/1000:   0%|          | 3/1000 [00:54<5:04:51, 18.35s/it, v_num=4yez, train_loss_step=1.1e+3, train_loss_epoch=1.07e+3] 

Epoch 4/1000:   0%|          | 3/1000 [00:54<5:04:51, 18.35s/it, v_num=4yez, train_loss_step=1.1e+3, train_loss_epoch=1.07e+3]

Epoch 4/1000:   0%|          | 4/1000 [01:15<5:23:22, 19.48s/it, v_num=4yez, train_loss_step=1.1e+3, train_loss_epoch=1.07e+3]

Epoch 4/1000:   0%|          | 4/1000 [01:15<5:23:22, 19.48s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 5/1000:   0%|          | 4/1000 [01:15<5:23:22, 19.48s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 5/1000:   0%|          | 5/1000 [01:33<5:11:26, 18.78s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 5/1000:   0%|          | 5/1000 [01:33<5:11:26, 18.78s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 6/1000:   0%|          | 5/1000 [01:33<5:11:26, 18.78s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 6/1000:   1%|          | 6/1000 [01:49<4:57:20, 17.95s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 6/1000:   1%|          | 6/1000 [01:49<4:57:20, 17.95s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 7/1000:   1%|          | 6/1000 [01:49<4:57:20, 17.95s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 7/1000:   1%|          | 7/1000 [02:10<5:12:57, 18.91s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 7/1000:   1%|          | 7/1000 [02:10<5:12:57, 18.91s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 8/1000:   1%|          | 7/1000 [02:10<5:12:57, 18.91s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 8/1000:   1%|          | 8/1000 [02:29<5:10:47, 18.80s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 8/1000:   1%|          | 8/1000 [02:29<5:10:47, 18.80s/it, v_num=4yez, train_loss_step=1.01e+3, train_loss_epoch=1.06e+3]

Epoch 9/1000:   1%|          | 8/1000 [02:29<5:10:47, 18.80s/it, v_num=4yez, train_loss_step=1.01e+3, train_loss_epoch=1.06e+3]

Epoch 9/1000:   1%|          | 9/1000 [02:43<4:46:40, 17.36s/it, v_num=4yez, train_loss_step=1.01e+3, train_loss_epoch=1.06e+3]

Epoch 9/1000:   1%|          | 9/1000 [02:43<4:46:40, 17.36s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 10/1000:   1%|          | 9/1000 [02:43<4:46:40, 17.36s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 10/1000:   1%|          | 10/1000 [03:05<5:10:41, 18.83s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 10/1000:   1%|          | 10/1000 [03:05<5:10:41, 18.83s/it, v_num=4yez, train_loss_step=1.05e+3, train_loss_epoch=1.06e+3]

Epoch 11/1000:   1%|          | 10/1000 [03:05<5:10:41, 18.83s/it, v_num=4yez, train_loss_step=1.05e+3, train_loss_epoch=1.06e+3]

Epoch 11/1000:   1%|          | 11/1000 [03:23<5:05:52, 18.56s/it, v_num=4yez, train_loss_step=1.05e+3, train_loss_epoch=1.06e+3]

Epoch 11/1000:   1%|          | 11/1000 [03:23<5:05:52, 18.56s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 12/1000:   1%|          | 11/1000 [03:23<5:05:52, 18.56s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 12/1000:   1%|          | 12/1000 [03:43<5:14:27, 19.10s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 12/1000:   1%|          | 12/1000 [03:43<5:14:27, 19.10s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.06e+3]

Epoch 13/1000:   1%|          | 12/1000 [03:43<5:14:27, 19.10s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.06e+3]

Epoch 13/1000:   1%|▏         | 13/1000 [04:04<5:23:32, 19.67s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.06e+3]

Epoch 13/1000:   1%|▏         | 13/1000 [04:04<5:23:32, 19.67s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 14/1000:   1%|▏         | 13/1000 [04:04<5:23:32, 19.67s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 14/1000:   1%|▏         | 14/1000 [04:23<5:21:14, 19.55s/it, v_num=4yez, train_loss_step=1.03e+3, train_loss_epoch=1.06e+3]

Epoch 14/1000:   1%|▏         | 14/1000 [04:23<5:21:14, 19.55s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.06e+3]

Epoch 15/1000:   1%|▏         | 14/1000 [04:23<5:21:14, 19.55s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.06e+3]

Epoch 15/1000:   2%|▏         | 15/1000 [04:38<4:54:57, 17.97s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.06e+3]

Epoch 15/1000:   2%|▏         | 15/1000 [04:38<4:54:57, 17.97s/it, v_num=4yez, train_loss_step=1.04e+3, train_loss_epoch=1.06e+3]

Epoch 16/1000:   2%|▏         | 15/1000 [04:38<4:54:57, 17.97s/it, v_num=4yez, train_loss_step=1.04e+3, train_loss_epoch=1.06e+3]

Epoch 16/1000:   2%|▏         | 16/1000 [04:57<5:03:17, 18.49s/it, v_num=4yez, train_loss_step=1.04e+3, train_loss_epoch=1.06e+3]

Epoch 16/1000:   2%|▏         | 16/1000 [04:57<5:03:17, 18.49s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 17/1000:   2%|▏         | 16/1000 [04:57<5:03:17, 18.49s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 17/1000:   2%|▏         | 17/1000 [05:12<4:41:49, 17.20s/it, v_num=4yez, train_loss_step=1.06e+3, train_loss_epoch=1.06e+3]

Epoch 17/1000:   2%|▏         | 17/1000 [05:12<4:41:49, 17.20s/it, v_num=4yez, train_loss_step=1.01e+3, train_loss_epoch=1.06e+3]

Epoch 18/1000:   2%|▏         | 17/1000 [05:12<4:41:49, 17.20s/it, v_num=4yez, train_loss_step=1.01e+3, train_loss_epoch=1.06e+3]

Epoch 18/1000:   2%|▏         | 18/1000 [05:26<4:28:05, 16.38s/it, v_num=4yez, train_loss_step=1.01e+3, train_loss_epoch=1.06e+3]

Epoch 18/1000:   2%|▏         | 18/1000 [05:26<4:28:05, 16.38s/it, v_num=4yez, train_loss_step=1.02e+3, train_loss_epoch=1.06e+3]

Epoch 19/1000:   2%|▏         | 18/1000 [05:26<4:28:05, 16.38s/it, v_num=4yez, train_loss_step=1.02e+3, train_loss_epoch=1.06e+3]

Epoch 19/1000:   2%|▏         | 19/1000 [05:40<4:17:03, 15.72s/it, v_num=4yez, train_loss_step=1.02e+3, train_loss_epoch=1.06e+3]

Epoch 19/1000:   2%|▏         | 19/1000 [05:40<4:17:03, 15.72s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.06e+3]

Epoch 20/1000:   2%|▏         | 19/1000 [05:40<4:17:03, 15.72s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.06e+3]

Epoch 20/1000:   2%|▏         | 20/1000 [05:55<4:09:15, 15.26s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.06e+3]

Epoch 20/1000:   2%|▏         | 20/1000 [05:55<4:09:15, 15.26s/it, v_num=4yez, train_loss_step=1.04e+3, train_loss_epoch=1.06e+3]

Epoch 21/1000:   2%|▏         | 20/1000 [05:55<4:09:15, 15.26s/it, v_num=4yez, train_loss_step=1.04e+3, train_loss_epoch=1.06e+3]

Epoch 21/1000:   2%|▏         | 21/1000 [06:09<4:03:48, 14.94s/it, v_num=4yez, train_loss_step=1.04e+3, train_loss_epoch=1.06e+3]

Epoch 21/1000:   2%|▏         | 21/1000 [06:09<4:03:48, 14.94s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.06e+3]

Epoch 21/1000:   2%|▏         | 21/1000 [06:09<4:46:52, 17.58s/it, v_num=4yez, train_loss_step=1.07e+3, train_loss_epoch=1.06e+3]


Monitored metric reconstruction_loss_validation did not improve in the last 10 records. Best score: 1054.821. Signaling Trainer to stop.


In [15]:
# Finish the active wandb run now that training is done.
wandb.finish()

[34m[1mwandb[0m: - 0.005 MB of 0.005 MB uploaded

[34m[1mwandb[0m: \ 0.019 MB of 0.025 MB uploaded

[34m[1mwandb[0m: | 0.019 MB of 0.025 MB uploaded

[34m[1mwandb[0m: / 0.025 MB of 0.025 MB uploaded

[34m[1mwandb[0m:                                                                                


[34m[1mwandb[0m: 
[34m[1mwandb[0m: Run history:
[34m[1mwandb[0m:                     elbo_train █▆▄▃▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁
[34m[1mwandb[0m:                elbo_validation █▅▄▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁
[34m[1mwandb[0m:                          epoch ▁▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
[34m[1mwandb[0m:                kl_global_train ▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
[34m[1mwandb[0m:           kl_global_validation ▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
[34m[1mwandb[0m:                 kl_local_train ██▅▄▃▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁
[34m[1mwandb[0m:            kl_local_validation █▆▄▃▃▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁
[34m[1mwandb[0m:                      kl_weight ▁▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
[34m[1mwandb[0m:      reconstruction_loss_train █▄▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁
[34m[1mwandb[0m: reconstruction_loss_validation █▅▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
[34m[1mwandb[0m:               train_loss_epoch █▄▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁
[34m[1mwandb[0m:                train_loss_step ▆▅▇▄▅▃▅▇▃▂▆▅▃▄▅▅█▁▃▆▃▆▅▃▁▁▃▄▅▄▇▃▄▅▄▅▂▆▅▂
[34m[1mwand

[34m[1mwandb[0m: 🚀 View run [33mStep2_T_NonNaive[0m at: [34m[4mhttps://wandb.ai/inflammation/inflammation_atlas_R1/runs/s58o4yez/workspace[0m
[34m[1mwandb[0m: Synced 6 W&B file(s), 0 media file(s), 0 artifact file(s) and 0 other file(s)


[34m[1mwandb[0m: Find logs at: [35m[1m./wandb/run-20241021_094646-s58o4yez/logs[0m


### Extracting embedding space

In [16]:
# Store the model's latent representation on the AnnData under `X_scVI`.
latent_representation = model.get_latent_representation()
adata.obsm['X_scVI'] = latent_representation

## Save the results

In [17]:
# Write the AnnData (now carrying `X_scVI`) and the trained model, but only
# when `overwriteData` is set. The model is saved without a copy of the AnnData.
if overwriteData:
    adata_out_path = here(f"{workDir}/{cellGroup}/results/02_{annotationLevel}_{cellGroup}_HVGsubset_scVI.h5ad")
    model_out_dir = here(f"{workDir}/{cellGroup}/results/02_{annotationLevel}_{cellGroup}_HVGsubset_scVI_MODEL/")

    adata.write(adata_out_path, compression="gzip")
    model.save(model_out_dir, overwrite=True, save_anndata=False)

In [18]:
# To reload the model later (after loading the corresponding adata), point at
# the directory written by the save cell above:
# model = scvi.model.SCVI.load(here(f"{workDir}/{cellGroup}/results/02_{annotationLevel}_{cellGroup}_HVGsubset_scVI_MODEL/"),
#                              adata=adata,
#                              accelerator="gpu")