In [1]:
import os
# Switch to the study directory so the relative *.tsv file names read later in
# this notebook resolve.
# NOTE(review): absolute, machine-specific path — adjust before running elsewhere.
os.chdir("/hdd_14T/data/PXD031322_oxaliplatin_dia_study/ftp.pride.ebi.ac.uk/pride/data/archive/2022/07/PXD031322/2022-09-22_ctrl_vs_ST_vs_LT_study")

In [2]:
import pandas as pd 

In [3]:
# Read one tab-separated table per pathway from the current working directory,
# using the first column of each file as the index. Names on the left are bound
# in the same order as the file names on the right.
(
    apoptosis,
    cell_cycle,
    erbB_signaling_pathway,
    mismatch_repair,
    nucleotide_excision_repair,
    p53_signaling_pathway,
) = (
    pd.read_csv(tsv_name, sep="\t", index_col=0)
    for tsv_name in (
        "apoptosis.tsv",
        "cell_cycle.tsv",
        "erbB_signaling_pathway.tsv",
        "mismatch_repair.tsv",
        "nucleotide_excision_repair.tsv",
        "p53_signaling_pathway.tsv",
    )
)

In [4]:
def print_significant_proteins(df, fdr_threshold):
    """Print how many rows of ``df`` fall below an FDR cutoff, per comparison and method.

    Parameters
    ----------
    df : pandas.DataFrame
        Pathway table; each row is reported as one protein. Must contain the
        ``triqler_FDR_*`` and ``reported_FDR_*`` columns for the ``CTRL_ST``,
        ``CTRL_LT`` and ``LT_ST`` comparisons.
    fdr_threshold : float
        Exclusive cutoff: a row is counted when its FDR value is strictly
        below this number. Missing values are never counted.

    Returns
    -------
    None
        Results are written to stdout only.
    """
    # (label shown in the output, column holding the FDR values), grouped per comparison.
    comparison_groups = (
        (("ctrl_ST_triqler", "triqler_FDR_CTRL_ST"), ("ctrl_ST_reported", "reported_FDR_CTRL_ST")),
        (("ctrl_LT_triqler", "triqler_FDR_CTRL_LT"), ("ctrl_LT_reported", "reported_FDR_CTRL_LT")),
        (("LT_ST_triqler", "triqler_FDR_LT_ST"), ("LT_ST_reported", "reported_FDR_LT_ST")),
    )

    # Count everything up front so a missing column raises before anything is printed.
    tallied_groups = [
        [(label, int((df[column] < fdr_threshold).sum())) for label, column in group]
        for group in comparison_groups
    ]

    print(f"{len(df)} proteins are in pathway.")
    for group in tallied_groups:
        print()  # blank line ahead of each comparison
        for label, n_significant in group:
            print(f"{label} {n_significant} proteins significantly differentially abundant at fdr: {fdr_threshold}")

In [5]:
def print_identified_proteins(df):
    """Print how many rows of ``df`` have a non-missing log2 fold change, per comparison and method.

    Parameters
    ----------
    df : pandas.DataFrame
        Pathway table containing the ``triqler_log2FC_*`` and
        ``reported_log2FC_*`` columns for the ``CTRL_ST``, ``CTRL_LT`` and
        ``LT_ST`` comparisons.

    Returns
    -------
    None
        Results are written to stdout only.
    """
    # (label shown in the output, column holding the log2 fold changes), grouped per comparison.
    comparison_groups = (
        (("ctrl_ST_triqler", "triqler_log2FC_CTRL_ST"), ("ctrl_ST_reported", "reported_log2FC_CTRL_ST")),
        (("ctrl_LT_triqler", "triqler_log2FC_CTRL_LT"), ("ctrl_LT_reported", "reported_log2FC_CTRL_LT")),
        (("LT_ST_triqler", "triqler_log2FC_LT_ST"), ("LT_ST_reported", "reported_log2FC_LT_ST")),
    )

    # Count everything up front so a missing column raises before anything is printed.
    # Series.count() is the number of non-missing entries.
    tallied_groups = [
        [(label, int(df[column].count())) for label, column in group]
        for group in comparison_groups
    ]

    for group in tallied_groups:
        print()  # blank line ahead of each comparison
        for label, n_quantified in group:
            print(f"{label} {n_quantified} proteins quantified in both samples")



# NOTE: Triqler is used with fold_change_eval = 0.1

# Apoptosis

In [6]:
# Apoptosis: counts below the 0.05 FDR cutoff, then counts with a log2 fold change.
print_significant_proteins(apoptosis, fdr_threshold=0.05)
print("-------")
print_identified_proteins(apoptosis)

136 proteins are in pathway.

ctrl_ST_triqler 12 proteins significantly differentially abundant at fdr: 0.05
ctrl_ST_reported 8 proteins significantly differentially abundant at fdr: 0.05

ctrl_LT_triqler 21 proteins significantly differentially abundant at fdr: 0.05
ctrl_LT_reported 13 proteins significantly differentially abundant at fdr: 0.05

LT_ST_triqler 14 proteins significantly differentially abundant at fdr: 0.05
LT_ST_reported 9 proteins significantly differentially abundant at fdr: 0.05
-------

ctrl_ST_triqler 57 proteins quantified in both samples
ctrl_ST_reported 40 proteins quantified in both samples

ctrl_LT_triqler 57 proteins quantified in both samples
ctrl_LT_reported 40 proteins quantified in both samples

LT_ST_triqler 57 proteins quantified in both samples
LT_ST_reported 40 proteins quantified in both samples


# Cell cycle

In [7]:
# Cell cycle: counts below the 0.05 FDR cutoff, then counts with a log2 fold change.
print_significant_proteins(cell_cycle, fdr_threshold=0.05)
print("-------")
print_identified_proteins(cell_cycle)

125 proteins are in pathway.

ctrl_ST_triqler 9 proteins significantly differentially abundant at fdr: 0.05
ctrl_ST_reported 3 proteins significantly differentially abundant at fdr: 0.05

ctrl_LT_triqler 18 proteins significantly differentially abundant at fdr: 0.05
ctrl_LT_reported 9 proteins significantly differentially abundant at fdr: 0.05

LT_ST_triqler 5 proteins significantly differentially abundant at fdr: 0.05
LT_ST_reported 5 proteins significantly differentially abundant at fdr: 0.05
-------

ctrl_ST_triqler 34 proteins quantified in both samples
ctrl_ST_reported 23 proteins quantified in both samples

ctrl_LT_triqler 34 proteins quantified in both samples
ctrl_LT_reported 23 proteins quantified in both samples

LT_ST_triqler 34 proteins quantified in both samples
LT_ST_reported 23 proteins quantified in both samples


Triqler has more significant proteins in ctrl_ST and ctrl_LT; the two methods tie in LT_ST (5 each).

# erbB Signaling pathway

In [8]:
# ErbB signaling: counts below the 0.05 FDR cutoff, then counts with a log2 fold change.
print_significant_proteins(erbB_signaling_pathway, fdr_threshold=0.05)
print("-------")
print_identified_proteins(erbB_signaling_pathway)

84 proteins are in pathway.

ctrl_ST_triqler 7 proteins significantly differentially abundant at fdr: 0.05
ctrl_ST_reported 2 proteins significantly differentially abundant at fdr: 0.05

ctrl_LT_triqler 15 proteins significantly differentially abundant at fdr: 0.05
ctrl_LT_reported 6 proteins significantly differentially abundant at fdr: 0.05

LT_ST_triqler 7 proteins significantly differentially abundant at fdr: 0.05
LT_ST_reported 3 proteins significantly differentially abundant at fdr: 0.05
-------

ctrl_ST_triqler 46 proteins quantified in both samples
ctrl_ST_reported 35 proteins quantified in both samples

ctrl_LT_triqler 46 proteins quantified in both samples
ctrl_LT_reported 35 proteins quantified in both samples

LT_ST_triqler 46 proteins quantified in both samples
LT_ST_reported 35 proteins quantified in both samples


Triqler has more significant proteins in every group

# Mismatch Repair

In [9]:
# Mismatch repair: counts below the 0.05 FDR cutoff, then counts with a log2 fold change.
print_significant_proteins(mismatch_repair, fdr_threshold=0.05)
print("-------")
print_identified_proteins(mismatch_repair)

22 proteins are in pathway.

ctrl_ST_triqler 3 proteins significantly differentially abundant at fdr: 0.05
ctrl_ST_reported 2 proteins significantly differentially abundant at fdr: 0.05

ctrl_LT_triqler 3 proteins significantly differentially abundant at fdr: 0.05
ctrl_LT_reported 2 proteins significantly differentially abundant at fdr: 0.05

LT_ST_triqler 1 proteins significantly differentially abundant at fdr: 0.05
LT_ST_reported 2 proteins significantly differentially abundant at fdr: 0.05
-------

ctrl_ST_triqler 6 proteins quantified in both samples
ctrl_ST_reported 3 proteins quantified in both samples

ctrl_LT_triqler 6 proteins quantified in both samples
ctrl_LT_reported 3 proteins quantified in both samples

LT_ST_triqler 6 proteins quantified in both samples
LT_ST_reported 3 proteins quantified in both samples


Triqler has more significant proteins in ctrl_ST and ctrl_LT; reported has more in LT_ST.

# Nucleotide Excision Repair

In [10]:
# Nucleotide excision repair: counts below the 0.05 FDR cutoff, then counts with a log2 fold change.
print_significant_proteins(nucleotide_excision_repair, fdr_threshold=0.05)
print("-------")
print_identified_proteins(nucleotide_excision_repair)

43 proteins are in pathway.

ctrl_ST_triqler 4 proteins significantly differentially abundant at fdr: 0.05
ctrl_ST_reported 3 proteins significantly differentially abundant at fdr: 0.05

ctrl_LT_triqler 5 proteins significantly differentially abundant at fdr: 0.05
ctrl_LT_reported 2 proteins significantly differentially abundant at fdr: 0.05

LT_ST_triqler 3 proteins significantly differentially abundant at fdr: 0.05
LT_ST_reported 2 proteins significantly differentially abundant at fdr: 0.05
-------

ctrl_ST_triqler 10 proteins quantified in both samples
ctrl_ST_reported 7 proteins quantified in both samples

ctrl_LT_triqler 10 proteins quantified in both samples
ctrl_LT_reported 7 proteins quantified in both samples

LT_ST_triqler 10 proteins quantified in both samples
LT_ST_reported 7 proteins quantified in both samples


Triqler has more significant proteins in every group

# p53 Signaling Pathway

In [11]:
# p53 signaling: counts below the 0.05 FDR cutoff, then counts with a log2 fold change.
print_significant_proteins(p53_signaling_pathway, fdr_threshold=0.05)
print("-------")
print_identified_proteins(p53_signaling_pathway)

72 proteins are in pathway.

ctrl_ST_triqler 3 proteins significantly differentially abundant at fdr: 0.05
ctrl_ST_reported 1 proteins significantly differentially abundant at fdr: 0.05

ctrl_LT_triqler 4 proteins significantly differentially abundant at fdr: 0.05
ctrl_LT_reported 4 proteins significantly differentially abundant at fdr: 0.05

LT_ST_triqler 3 proteins significantly differentially abundant at fdr: 0.05
LT_ST_reported 2 proteins significantly differentially abundant at fdr: 0.05
-------

ctrl_ST_triqler 15 proteins quantified in both samples
ctrl_ST_reported 7 proteins quantified in both samples

ctrl_LT_triqler 15 proteins quantified in both samples
ctrl_LT_reported 7 proteins quantified in both samples

LT_ST_triqler 15 proteins quantified in both samples
LT_ST_reported 7 proteins quantified in both samples


Triqler has more significant proteins in ctrl_ST and LT_ST; the two methods tie in ctrl_LT (4 each).