This notebook performs a statistical analysis of the readcounts matrix and the RAS (Reaction Activity Scores) matrix.

In [None]:
import pandas as pd
import scanpy as sc
import matplotlib.pyplot as plt

In [None]:
from utils import plot_correlations
from utils import plot_distributions
from utils import plot_two_reaction_correlation
from utils import table_sparsity,table_sparsity_denoised

## Load datasets

In [None]:
# Dataset identifiers, in the same order in which the per-dataset AnnData
# objects are loaded below; the same list labels the sparsity tables.
names_datasets = [
    "datasetGSE110949",
    "datasetE-GEOD-86618",
    "datasetGSE118056",
]

Load readcounts and RAS without any denoising

In [None]:
# Read-count matrices without denoising, one AnnData per dataset.
# Paths are derived from `names_datasets` so list positions always line up
# with the dataset names, and no scratch adata1/adata2/adata3 globals are
# left behind for a later cell to pick up by accident.
adatasets_counts = [
    sc.read_h5ad(f"outputs/readcounts/{name}_nodenoise")
    for name in names_datasets
]

In [None]:
# RAS matrices without denoising, one AnnData per dataset.
# Paths are derived from `names_datasets` so list positions always line up
# with the dataset names, and no scratch adata1/adata2/adata3 globals are
# left behind for a later cell to pick up by accident.
adatasets_ras = [
    sc.read_h5ad(f"outputs/ras/{name}_nodenoise")
    for name in names_datasets
]

RAS values with denoising applied on the readcounts matrix

In [None]:
# RAS matrices from the "magic_counts" outputs (denoising applied on the
# readcounts matrix), one AnnData per dataset in `names_datasets` order.
# Only the list is bound; no scratch adata1/adata2/adata3 globals.
adatasets_ras_magic_counts = [
    sc.read_h5ad(f"outputs/ras/{name}_magic_counts")
    for name in names_datasets
]

In [None]:
# RAS matrices from the "enhance_counts" outputs (denoising applied on the
# readcounts matrix), one AnnData per dataset in `names_datasets` order.
# Only the list is bound; no scratch adata1/adata2/adata3 globals.
adatasets_ras_enhance_counts = [
    sc.read_h5ad(f"outputs/ras/{name}_enhance_counts")
    for name in names_datasets
]

In [None]:
# RAS matrices from the "saver_counts" outputs (denoising applied on the
# readcounts matrix), one AnnData per dataset in `names_datasets` order.
# Only the list is bound; no scratch adata1/adata2/adata3 globals.
adatasets_ras_saver_counts = [
    sc.read_h5ad(f"outputs/ras/{name}_saver_counts")
    for name in names_datasets
]

RAS values with denoising applied on the RAS matrix

In [None]:
# RAS matrices from the "magic_ras" outputs (denoising applied on the RAS
# matrix), one AnnData per dataset in `names_datasets` order.
# Only the list is bound; no scratch adata1/adata2/adata3 globals.
adatasets_ras_magic_ras = [
    sc.read_h5ad(f"outputs/ras/{name}_magic_ras")
    for name in names_datasets
]

In [None]:
# RAS matrices from the "enhance_ras" outputs (denoising applied on the RAS
# matrix), one AnnData per dataset in `names_datasets` order.
# Only the list is bound; no scratch adata1/adata2/adata3 globals.
adatasets_ras_enhance_ras = [
    sc.read_h5ad(f"outputs/ras/{name}_enhance_ras")
    for name in names_datasets
]

In [None]:
# RAS matrices from the "saver_ras" outputs (denoising applied on the RAS
# matrix), read in dataset order.
adatasets_ras_saver_ras = list(
    map(
        sc.read_h5ad,
        (
            "outputs/ras/datasetGSE110949_saver_ras",
            "outputs/ras/datasetE-GEOD-86618_saver_ras",
            "outputs/ras/datasetGSE118056_saver_ras",
        ),
    )
)
# Keep the per-dataset names bound to the same three objects held in the list.
adata1, adata2, adata3 = adatasets_ras_saver_ras

In [None]:
# Inspect the first dataset's RAS matrix (loaded from the "saver_counts"
# output for datasetGSE110949) as a pandas DataFrame.
adatasets_ras_saver_counts[0].to_df()

## Level of sparsity of readcounts and RAS matrix

Table summarizing the sparsity level of the readcounts matrix and of the RAS matrix, without any denoising

In [None]:
# Sparsity summary for the non-denoised read counts and RAS matrices,
# labelled with the dataset names.
table_sparsity(
    adatasets_counts,
    adatasets_ras,
    names_datasets,
)

Table summarizing the sparsity level of the RAS matrix when each denoising method (MAGIC, ENHANCE, SAVER) is applied to the readcounts matrix

In [None]:
# Sparsity summary of the RAS matrices obtained after denoising the read
# counts; arguments are passed in magic, enhance, saver order.
table_sparsity_denoised(
    adatasets_ras_magic_counts,
    adatasets_ras_enhance_counts,
    adatasets_ras_saver_counts,
    names_datasets,
)

Table summarizing the sparsity level of the RAS matrix when each denoising method (MAGIC, ENHANCE, SAVER) is applied directly to the RAS matrix

In [None]:
# Sparsity summary of the RAS matrices that were denoised directly;
# arguments are passed in magic, enhance, saver order.
table_sparsity_denoised(
    adatasets_ras_magic_ras,
    adatasets_ras_enhance_ras,
    adatasets_ras_saver_ras,
    names_datasets,
)

In [None]:
# Inspect the third dataset's RAS matrix (loaded from the "saver_counts"
# output for datasetGSE118056) as a pandas DataFrame.
adatasets_ras_saver_counts[2].to_df()

## Distribution of zero RAS values

First, analyze the zero RAS values without any denoising

Show percentage of zero RAS values

In [None]:
# Plot for the non-denoised RAS matrices (one AnnData per dataset).
# NOTE(review): per the surrounding text this shows the percentage of zero
# RAS values; the helper lives in utils and is not visible here.
plot_distributions(adatasets_ras)

Analyze correlation between RAS values, without denoising

In [None]:
# Correlation plots for the non-denoised RAS matrices (one AnnData per dataset).
plot_correlations(adatasets_ras)

Analyze correlation between a pair of reactions

In [None]:
# Correlation between the two named reactions on the non-denoised RAS matrices.
plot_two_reaction_correlation(
    adatasets_ras,
    ["LDH_L", "DmLact"],
)

## Analysis on denoised RAS matrix

Analyze correlation between denoised RAS values

In [None]:
# Correlation plots for the RAS matrices loaded from the "magic_counts" outputs.
plot_correlations(adatasets_ras_magic_counts)

In [None]:
# Correlation plots for the RAS matrices loaded from the "enhance_counts" outputs.
plot_correlations(adatasets_ras_enhance_counts)

In [None]:
# Correlation plots for the RAS matrices loaded from the "saver_counts" outputs.
plot_correlations(adatasets_ras_saver_counts)

In [None]:
# Same reaction pair as in the non-denoised analysis, now on the RAS matrices
# loaded from the "magic_counts" outputs.
plot_two_reaction_correlation(
    adatasets_ras_magic_counts,
    ["LDH_L", "DmLact"],
)