In [8]:
import json
import pandas as pd

In [18]:
# Load the Doxorubicin singscore results. The context manager closes the file
# handle, which a bare json.load(open(...)) leaves open until garbage collection.
with open("../singscore_new_code/Doxorubicin/Doxorubicin_singscore_results.json") as results_file:
    data = json.load(results_file)

# Each top-level JSON key becomes one row (hence the transpose); the two values
# pulled from every entry are its total singscore and its p-value.
df = pd.DataFrame({
    k: [v["scores"]["total_singscore"], v["statistics"]["p_value"]]
    for k, v in data.items()
}).T
df.columns = ["total_singscore", "p_value"]

# Persist the full, unfiltered table next to the source JSON.
df.to_csv("../singscore_new_code/Doxorubicin/Doxorubicin_singscore_df.csv")
df

Unnamed: 0,total_singscore,p_value
Mitotic Spindle,0.230768,0.000100
G2-M Checkpoint,0.176974,0.000100
Estrogen Response Late,0.144631,0.000100
Interferon Alpha Response,0.132289,0.000100
Interferon Gamma Response,0.108035,0.000100
...,...,...
Vascular Transport (GO:0010232),0.018016,0.290971
Vitamin Transport (GO:0051180),-0.045955,0.817818
Wound Healing (GO:0042060),0.128020,0.000100
Xenobiotic Transport (GO:0042908),-0.112599,0.956604


In [21]:
# Keep only the rows whose p-value is at or below the 0.05 cutoff (inclusive).
pvalue_filtered = df.loc[df["p_value"] <= 0.05]
pvalue_filtered

Unnamed: 0,total_singscore,p_value
Mitotic Spindle,0.230768,0.0001
G2-M Checkpoint,0.176974,0.0001
Estrogen Response Late,0.144631,0.0001
Interferon Alpha Response,0.132289,0.0001
Interferon Gamma Response,0.108035,0.0001
...,...,...
Telomere Maintenance via Telomerase (GO:0007004),0.188710,0.0013
Telomere Maintenance via Telomere Lengthening (GO:0010833),0.170135,0.0016
Telomere Organization (GO:0032200),0.190736,0.0001
Vascular Endothelial Growth Factor Receptor Signaling Pathway (GO:0048010),0.204348,0.0001


In [24]:
# Rank the p-value-filtered pathways from highest to lowest total singscore,
# save the complete ranking, then display it.
upregualted_pathways = pvalue_filtered.sort_values("total_singscore", ascending=False)
upregualted_pathways.to_csv(
    "../singscore_new_code/Doxorubicin/Doxorubicin_upregulated_pathway_all.csv"
)
upregualted_pathways

Unnamed: 0,total_singscore,p_value
Negative Regulation of Oxidative Stress-Induced Intrinsic Apoptotic Signaling Pathway (GO:1902176),0.334174,0.000100
Constitutive Signaling by Overexpressed ERBB2,0.326175,0.000100
Regulation of Fibroblast Migration (GO:0010762),0.323667,0.000100
SARS-CoV-1-host Interactions,0.316427,0.000100
Negative Regulation of Fibroblast Migration (GO:0010764),0.306521,0.007499
...,...,...
"PI5P, PP2A and IER3 Regulate PI3K AKT Signaling",0.048572,0.049395
Response to Lipopolysaccharide (GO:0032496),0.046805,0.029997
Fatty Acid Metabolism,0.046574,0.019198
Regulation of ERK1 and ERK2 Cascade (GO:0070372),0.043453,0.016098


In [32]:
# Index labels of the first 30 rows of the descending ranking, written one per
# line (no trailing newline).
top30_pathways_up = upregualted_pathways.index[:30].tolist()
with open(
    "../singscore_new_code/Doxorubicin/Doxorubicin_upregulated_pathway_top30.txt", "w"
) as top30_file:
    top30_file.write("\n".join(top30_pathways_up))

In [25]:
# Rank the same p-value-filtered pathways from lowest to highest total singscore,
# save the complete ranking, then display it.
# NOTE(review): this is only the ascending ordering of the filtered set; there is
# no check that total_singscore is negative, so the rows at the top may still have
# positive scores. Confirm this is the intended definition of "down-regulated".
downregualted_pathways = pvalue_filtered.sort_values("total_singscore", ascending=True)
downregualted_pathways.to_csv(
    "../singscore_new_code/Doxorubicin/Doxorubicin_downregulated_pathway_all.csv"
)
downregualted_pathways

Unnamed: 0,total_singscore,p_value
Lipid Metabolic Process (GO:0006629),0.041754,0.015998
Regulation of ERK1 and ERK2 Cascade (GO:0070372),0.043453,0.016098
Fatty Acid Metabolism,0.046574,0.019198
Response to Lipopolysaccharide (GO:0032496),0.046805,0.029997
"PI5P, PP2A and IER3 Regulate PI3K AKT Signaling",0.048572,0.049395
...,...,...
Negative Regulation of Fibroblast Migration (GO:0010764),0.306521,0.007499
SARS-CoV-1-host Interactions,0.316427,0.000100
Regulation of Fibroblast Migration (GO:0010762),0.323667,0.000100
Constitutive Signaling by Overexpressed ERBB2,0.326175,0.000100


In [34]:
# Preview the first 30 rows of the ascending ranking.
downregualted_pathways.iloc[:30]

Unnamed: 0,total_singscore,p_value
Lipid Metabolic Process (GO:0006629),0.041754,0.015998
Regulation of ERK1 and ERK2 Cascade (GO:0070372),0.043453,0.016098
Fatty Acid Metabolism,0.046574,0.019198
Response to Lipopolysaccharide (GO:0032496),0.046805,0.029997
"PI5P, PP2A and IER3 Regulate PI3K AKT Signaling",0.048572,0.049395
Positive Regulation of Cytokine Production (GO:0001819),0.049068,0.0026
Positive Regulation of Epithelial Cell Proliferation (GO:0050679),0.049251,0.041496
Positive Regulation of Multicellular Organismal Process (GO:0051240),0.049729,0.0005
Nervous System Development (GO:0007399),0.050218,0.0002
Natural killer cell mediated cytotoxicity,0.052181,0.042096


In [33]:
# Index labels of the first 30 rows of the ascending ranking, written one per
# line (no trailing newline).
top30_pathways_down = downregualted_pathways.index[:30].tolist()
with open(
    "../singscore_new_code/Doxorubicin/Doxorubicin_downregulated_pathway_top30.txt", "w"
) as top30_file:
    top30_file.write("\n".join(top30_pathways_down))

In [35]:
def Isolation_drug_up_down_pathways(drug, base_dir="../singscore_new_code", p_cutoff=0.05, top_n=30):
    """Export the p-value-filtered singscore pathways of one drug, ranked both ways.

    Reads ``{base_dir}/{drug}/{drug}_singscore_results.json`` and writes, into the
    same directory:

    * ``{drug}_singscore_df.csv`` - every entry with its total singscore and p-value;
    * ``{drug}_upregulated_pathway_all.csv`` - entries with ``p_value <= p_cutoff``,
      sorted by total singscore in descending order;
    * ``{drug}_upregulated_pathway_top{top_n}.txt`` - index labels of the first
      ``top_n`` rows of that ranking, one per line;
    * ``{drug}_downregulated_pathway_all.csv`` and
      ``{drug}_downregulated_pathway_top{top_n}.txt`` - the same for the ascending
      ordering.

    With the default arguments the file names and contents match the previous
    hard-coded behaviour (``top30`` files, inclusive 0.05 cutoff).

    Parameters
    ----------
    drug : str
        Name of the drug; used both as the sub-directory and as the file prefix.
    base_dir : str, optional
        Directory that contains one sub-directory per drug.
    p_cutoff : float, optional
        Inclusive upper bound on ``p_value`` for an entry to be kept.
    top_n : int, optional
        Number of leading rows whose labels are written to each ``top{top_n}`` file.

    Returns
    -------
    None
        A "Done for <drug>" message is printed once all files are written.

    Raises
    ------
    FileNotFoundError
        If the results JSON (or the drug directory) does not exist.
    KeyError
        If an entry lacks ``scores.total_singscore`` or ``statistics.p_value``.
    """
    # Single place where the path is built, so every file uses the same layout
    # (the old code mixed "//" and "/" separators).
    prefix = f"{base_dir}/{drug}/{drug}"

    # Context manager closes the handle; json.load(open(...)) left it dangling.
    with open(f"{prefix}_singscore_results.json") as results_file:
        data = json.load(results_file)

    # One row per top-level JSON key (hence the transpose).
    df = pd.DataFrame({
        k: [v["scores"]["total_singscore"], v["statistics"]["p_value"]]
        for k, v in data.items()
    }).T
    df.columns = ["total_singscore", "p_value"]
    df.to_csv(f"{prefix}_singscore_df.csv")

    pvalue_filtered = df[df["p_value"] <= p_cutoff]

    # NOTE(review): the "downregulated" outputs are just the ascending ordering of
    # the same filtered set; no sign check is applied to total_singscore. Confirm
    # that this matches the intended definition of down-regulation.
    for direction, ascending in (("upregulated", False), ("downregulated", True)):
        ranked = pvalue_filtered.sort_values(by="total_singscore", ascending=ascending)
        ranked.to_csv(f"{prefix}_{direction}_pathway_all.csv")

        top_labels = ranked.head(top_n).index.tolist()
        with open(f"{prefix}_{direction}_pathway_top{top_n}.txt", "w") as out_file:
            out_file.write("\n".join(top_labels))

    print(f"Done for {drug}")