In [1]:
import anndata as ad
import scanpy as sc
import sckade
from matplotlib import rcParams

In [2]:
# Apply sckade's publication plotting defaults. The helper has to be *called*:
# a bare attribute reference on a non-final line of a cell does nothing.
sckade.plot.set_publication_params()
# Override the figure size afterwards so the helper above cannot overwrite it.
rcParams["figure.figsize"] = (4, 4)

In [None]:
# Load the RNA modality from its h5ad file (10x Multiome PBMC10k, going by the filename).
rna = ad.read_h5ad("./data/dataset/10x-Multiome-Pbmc10k-RNA.h5ad")
# Bare trailing expression so the notebook displays the loaded object's repr.
rna

In [None]:
# Load the ATAC modality from its h5ad file (10x Multiome PBMC10k, going by the filename).
atac = ad.read_h5ad("./data/dataset/10x-Multiome-Pbmc10k-ATAC.h5ad")
# Bare trailing expression so the notebook displays the loaded object's repr.
atac

In [None]:
# Display the RNA matrix and its `.data` attribute before any transformation.
# NOTE(review): `.data` suggests X is a scipy sparse matrix and that this is a
# sanity check that X still holds raw counts — confirm.
rna.X, rna.X.data

In [6]:
# Keep an independent copy of the current `rna.X` under the "counts" layer;
# later cells modify `rna` in place.
rna.layers["counts"] = rna.X.copy()

In [7]:
# Flag the top 2000 highly variable genes using the "seurat_v3" flavor.
# NOTE(review): scanpy documents `seurat_v3` as expecting raw count data, which
# is presumably why this cell runs before normalization — keep that order.
sc.pp.highly_variable_genes(rna, n_top_genes=2000, flavor="seurat_v3")

In [8]:
# RNA preprocessing pipeline. Return values are discarded, so every step relies
# on modifying `rna` in place; the order of these calls must not change.
# 1) library-size normalization with scanpy's default target.
sc.pp.normalize_total(rna)
# 2) log1p transform of the normalized values.
sc.pp.log1p(rna)
# 3) per-gene scaling with scanpy's defaults.
sc.pp.scale(rna)
# 4) PCA with 100 components; later cells read the result from `rna.obsm["X_pca"]`.
sc.tl.pca(rna, n_comps=100, svd_solver="auto")

In [None]:
# Build the neighbor graph with cosine distance. No `use_rep` is passed, so
# scanpy chooses the representation itself.
# NOTE(review): presumably this is the X_pca computed in the previous cell — confirm.
sc.pp.neighbors(rna, metric="cosine")
# Compute the UMAP layout, then plot it colored by the `cell_type` key
# (assumed to be a column of `rna.obs`).
sc.tl.umap(rna)
sc.pl.umap(rna, color="cell_type")

In [None]:
# Display the ATAC matrix and its `.data` attribute before computing LSI.
# NOTE(review): `.data` suggests X is a scipy sparse matrix — confirm.
atac.X, atac.X.data

In [11]:
# Compute an LSI embedding of the ATAC data with 100 components; `n_iter=15`
# is passed through to sckade's implementation.
# NOTE(review): later cells read `atac.obsm["X_lsi"]`, so this call is
# presumably what writes that key — confirm against sckade.data.lsi.
sckade.data.lsi(atac, n_components=100, n_iter=15)

In [None]:
# Build the neighbor graph on the "X_lsi" representation with cosine distance.
sc.pp.neighbors(atac, use_rep="X_lsi", metric="cosine")
# Compute the UMAP layout, then plot it colored by the `cell_type` key
# (assumed to be a column of `atac.obs`).
sc.tl.umap(atac)
sc.pl.umap(atac, color="cell_type")

In [None]:
# Display both objects together to review what preprocessing has added before saving.
rna, atac

In [14]:
# Persist the full preprocessed objects as gzip-compressed h5ad files.
# NOTE(review): nothing here creates `./data/preprocess/` — confirm the
# directory exists before running.
rna.write("./data/preprocess/10x-rna-pp.h5ad", compression="gzip")
atac.write("./data/preprocess/10x-atac-pp.h5ad", compression="gzip")

In [15]:
# Export a slim AnnData whose X is the RNA PCA embedding, keeping only the
# per-cell annotations, as a gzip-compressed h5ad file.
ad.AnnData(X=rna.obsm["X_pca"], obs=rna.obs).write(
    "./data/preprocess/10x_rna_uni.h5ad", compression="gzip"
)

In [16]:
# Export a slim AnnData whose X is the ATAC LSI embedding, keeping only the
# per-cell annotations, as a gzip-compressed h5ad file.
ad.AnnData(X=atac.obsm["X_lsi"], obs=atac.obs).write(
    "./data/preprocess/10x_atac_uni.h5ad", compression="gzip"
)