# Number of proteins that differ between tumor and normal in samples with an event versus samples without it

In [1]:
import altair as alt
import cnvutils
import numpy as np

In [2]:
# Events to analyse, keyed by chromosome and then by arm:
# loss on the p arm and gain on the q arm of chromosome 8.
chr8_events = {
    8: {
        "p": ["loss"],
        "q": ["gain"],
    },
}

# Run the has-event vs. no-event tumor/normal comparison for both CNV sources.
# The helper logs one "Running _get_ttest_sig_counts ..." line per combination it runs.
all_pvals = cnvutils.get_has_vs_not_has_tumor_normal_diff_props(
    chromosomes_events=chr8_events,
    sources=["cptac", "gistic"],
    levels=["gene"],
)

Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'p', 'gain_or_loss': 'loss', 'cis_or_trans': 'cis', 'proteomics_or_transcriptomics': 'proteomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov'], 'source': 'cptac', 'has_event': True, 'level': None, 'data_dir': '/home/caleb/github/PayneLab/pancancerCNV/00_functions/chr08/../data'}...
Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'p', 'gain_or_loss': 'loss', 'cis_or_trans': 'trans', 'proteomics_or_transcriptomics': 'proteomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov'], 'source': 'cptac', 'has_event': True, 'level': None, 'data_dir': '/home/caleb/github/PayneLab/pancancerCNV/00_functions/chr08/../data'}...
Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'p', 'gain_or_loss': 'loss', 'cis_or_trans': 'cis', 'proteomics_or_transcriptomics': 'proteomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov'], 'source': 'cptac', 'has_event': False, 'level': 


Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'p', 'gain_or_loss': 'loss', 'cis_or_trans': 'cis', 'proteomics_or_transcriptomics': 'transcriptomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov', 'pdac'], 'source': 'gistic', 'has_event': False, 'level': 'gene', 'data_dir': '/home/caleb/github/PayneLab/pancancerCNV/00_functions/chr08/../data'}...
Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'q', 'gain_or_loss': 'gain', 'cis_or_trans': 'cis', 'proteomics_or_transcriptomics': 'proteomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov', 'pdac'], 'source': 'gistic', 'has_event': True, 'level': 'gene', 'data_dir': '/home/caleb/github/PayneLab/pancancerCNV/00_functions/chr08/../data'}...


Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'q', 'gain_or_loss': 'gain', 'cis_or_trans': 'trans', 'proteomics_or_transcriptomics': 'proteomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov', 'pdac'], 'source':

In [3]:
# Significance threshold shown as the horizontal reference rule.
ALPHA = 0.05

# Both layers share one y-axis. Giving them the same explicit title keeps the
# axis label from being derived from the two different field names
# ("neg_log_p" and "line").
Y_AXIS_TITLE = "-log10(p)"

# Reshape the wide table from the previous cell into long form:
# one row per (name, group) with the -log10-transformed value.
#
# NOTE: this rebinds `all_pvals` to the long table, so the "*_props" columns no
# longer exist afterwards. Re-run the previous cell before re-running this one.
all_pvals = (
    all_pvals
    .infer_objects()
    .assign(
        # Constant column so the threshold can be drawn from the same data source.
        line=-np.log10(ALPHA),
        neg_log_sig_props=lambda df: -np.log10(df["sig_props"]),
        neg_log_not_sig_props=lambda df: -np.log10(df["not_sig_props"]),
        neg_log_na_props=lambda df: -np.log10(df["na_props"]),
    )
    # melt keeps only id_vars and value_vars, so the untransformed "*_props"
    # columns do not need to be dropped first.
    .melt(
        id_vars=["name", "line"],
        value_vars=["neg_log_sig_props", "neg_log_not_sig_props", "neg_log_na_props"],
        var_name="group",
        value_name="neg_log_p",
    )
)

base = alt.Chart(all_pvals)

# One point per (name, group), coloured by group.
dots = base.mark_point().encode(
    x=alt.X("name:N"),
    y=alt.Y("neg_log_p:Q", title=Y_AXIS_TITLE),
    color=alt.Color("group:N"),
)

# Horizontal rule at -log10(ALPHA); points above it fall below the threshold.
line = base.mark_rule(color="crimson").encode(
    y=alt.Y("line:Q", title=Y_AXIS_TITLE),
)

dots + line

Unnamed: 0,name,line,group,neg_log_p
0,p_all,1.30103,neg_log_sig_props,10.471005
1,p_cptac,1.30103,neg_log_sig_props,9.569432
2,p_cptac_proteomics,1.30103,neg_log_sig_props,7.469667
3,p_cptac_proteomics_cis,1.30103,neg_log_sig_props,3.151706
4,p_cptac_proteomics_cis_loss,1.30103,neg_log_sig_props,1.269244
5,p_cptac_proteomics_cis_gain,1.30103,neg_log_sig_props,2.002133
6,p_cptac_proteomics_trans,1.30103,neg_log_sig_props,4.713781
7,p_cptac_proteomics_trans_loss,1.30103,neg_log_sig_props,2.247902
8,p_cptac_proteomics_trans_gain,1.30103,neg_log_sig_props,2.646476
9,p_cptac_transcriptomics,1.30103,neg_log_sig_props,2.728121
