In [None]:
import scvi

import scanpy as sc
import scipy as sp
import pandas as pd
import matplotlib.pyplot as plt
import random
import numpy as np
import os
import torch
import sys
from datetime import datetime

sc.set_figure_params(figsize=(4,4))
sc.set_figure_params(dpi=200)
sc.settings.n_jobs = 1 #nCores/CPUs for scanpy
scvi.settings.progress_bar_style = "tqdm"

# for white background of figures (only for docs rendering)
%config InlineBackend.print_figure_kwargs={'facecolor' : "w"}
%config InlineBackend.figure_format='retina'

#hpc figures
%matplotlib inline

from IPython.core.interactiveshell import InteractiveShell
InteractiveShell.ast_node_interactivity = "all" # print multiple outputs per code cell (not just last)

In [None]:
def set_seed(seed):
    """Seed every random number generator used in this notebook.

    Seeds Python's ``random`` module, NumPy's global generator, PyTorch and
    scvi-tools, and exports ``PYTHONHASHSEED``. When CUDA is available, the
    CUDA generators are seeded as well and cuDNN is switched to deterministic
    mode with benchmarking turned off.

    Parameters
    ----------
    seed : int
        Seed value handed to every generator.

    Returns
    -------
    None
    """
    for seed_fn in (random.seed, np.random.seed, torch.manual_seed):
        seed_fn(seed)
    scvi.settings.seed = seed  # scvi-tools seed
    # NOTE(review): Python reads PYTHONHASHSEED at interpreter start-up, so this
    # presumably only reaches child processes, not the running kernel - confirm.
    os.environ["PYTHONHASHSEED"] = str(seed)

    if not torch.cuda.is_available():
        return

    for cuda_seed_fn in (torch.cuda.manual_seed, torch.cuda.manual_seed_all):
        cuda_seed_fn(seed)
    cudnn = torch.backends.cudnn
    cudnn.deterministic = True
    cudnn.benchmark = False

set_seed(123)

In [None]:
# `!cd` runs in a throw-away subshell and leaves the kernel's working directory
# untouched. os.chdir changes it for the kernel itself, so the relative paths in
# the following cells resolve against the project directory (and a missing
# directory fails loudly here instead of further down).
os.chdir('/scratch/gent/vo/000/gvo00027/projects/Single_Cell_Neuroblastoma/NBAtlas')
os.getcwd()

In [None]:
# Folder (relative to the working directory) that holds this notebook's outputs.
output_dir = '02_Create_AnndataObj_NBAtlas'
# exist_ok=True keeps the cell re-runnable when the folder is already there.
os.makedirs(name=output_dir, exist_ok=True)

# Original

In [None]:
# Read the 10x-formatted HDF5 count matrix into an AnnData object.
matrix_h5_path = "01_Import_Preprocessing_NBAtlas/h5objects/nb_matrix_NBAtlas.h5"
adata = sc.read_10x_h5(matrix_h5_path)

In [None]:
# Show the summary of the freshly loaded object as the cell output.
adata

In [None]:
# De-duplicate the variable names of `adata` in place (the return value is not used).
adata.var_names_make_unique()
# Show the object again after the change.
adata

In [None]:
# metadata
# Load the metadata table; the first CSV column becomes the DataFrame index.
metadata_csv_path = '01_Import_Preprocessing_NBAtlas/Tables/nb_matrix_metadata_ext.csv'
metadata = pd.read_csv(metadata_csv_path, index_col=0)
metadata

In [None]:
# Copy the listed metadata columns into adata.obs under the same names.
# `.values` drops the pandas index, so rows are matched by position, not by label.
# NOTE(review): assumes the metadata rows are in the same order as adata.obs - confirm.
obs_columns = (
    'nCount_RNA',
    'nFeature_RNA',
    'percent_mito',
    'Study',
    'Assay',
    'Platform',
    'Sample',
    'Author_Annot',
)
for obs_column in obs_columns:
    adata.obs[obs_column] = metadata[obs_column].values


adata

In [None]:
# Write the object into output_dir (the folder created earlier in this notebook)
# instead of repeating the folder name as a second string literal, so the
# created folder and the write target cannot drift apart.
sc.write(adata=adata,
         filename=os.path.join(output_dir, 'nb_adata_NBAtlas.h5ad'))

In [None]:
# metadata ext
# Reads the same CSV path as the earlier metadata cell and rebinds `metadata`;
# the first CSV column becomes the DataFrame index.
metadata_ext_csv_path = '01_Import_Preprocessing_NBAtlas/Tables/nb_matrix_metadata_ext.csv'
metadata = pd.read_csv(metadata_ext_csv_path, index_col=0)
metadata

In [None]:
# Add the unified author annotation column to adata.obs; `.values` matches rows
# by position, not by index label.
# NOTE(review): this column is added after the sc.write call earlier in the
# notebook, so the file written there does not contain it unless the object is
# saved again later - confirm.
adata.obs['Author_annot_unified'] = metadata['Author_annot_unified'].values