# Number of proteins that differ between tumor and normal, in samples with an event versus samples without it

In [1]:
import altair as alt
import cnvutils
import numpy as np

In [2]:
# Events to test, keyed by chromosome and then by arm: loss on 8p, gain on 8q.
chr8_events = {8: {"p": ["loss"], "q": ["gain"]}}

# Run the comparison for both CNV sources; the per-run parameters are echoed
# to stdout by cnvutils as each combination is processed.
all_pvals = cnvutils.get_has_vs_not_has_tumor_normal_diff_props(
    chromosomes_events=chr8_events,
    sources=["cptac", "gistic"],
    levels=["gene"],
)

Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'p', 'gain_or_loss': 'loss', 'cis_or_trans': 'cis', 'proteomics_or_transcriptomics': 'proteomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov'], 'source': 'cptac', 'has_event': True, 'level': None, 'data_dir': '/home/caleb/github/PayneLab/pancancerCNV/00_functions/chr08/../data'}...
Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'p', 'gain_or_loss': 'loss', 'cis_or_trans': 'cis', 'proteomics_or_transcriptomics': 'transcriptomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov'], 'source': 'cptac', 'has_event': True, 'level': None, 'data_dir': '/home/caleb/github/PayneLab/pancancerCNV/00_functions/chr08/../data'}...
Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'p', 'gain_or_loss': 'loss', 'cis_or_trans': 'trans', 'proteomics_or_transcriptomics': 'transcriptomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov'], 'source': 'cptac', 'has_event': True, 




Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'p', 'gain_or_loss': 'loss', 'cis_or_trans': 'trans', 'proteomics_or_transcriptomics': 'transcriptomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov', 'pdac'], 'source': 'gistic', 'has_event': False, 'level': 'gene', 'data_dir': '/home/caleb/github/PayneLab/pancancerCNV/00_functions/chr08/../data'}...

Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'q', 'gain_or_loss': 'gain', 'cis_or_trans': 'cis', 'proteomics_or_transcriptomics': 'proteomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov', 'pdac'], 'source': 'gistic', 'has_event': True, 'level': 'gene', 'data_dir': '/home/caleb/github/PayneLab/pancancerCNV/00_functions/chr08/../data'}...

Running _get_ttest_sig_counts with {'chromosome': 8, 'arm': 'q', 'gain_or_loss': 'gain', 'cis_or_trans': 'trans', 'proteomics_or_transcriptomics': 'proteomics', 'cancer_types': ['brca', 'coad', 'hnscc', 'lscc', 'luad', 'ov', 'pdac'], 'sour

In [3]:
# Show the frame returned by cnvutils.get_has_vs_not_has_tumor_normal_diff_props
# so the raw values can be inspected before they are transformed for plotting.
all_pvals

Unnamed: 0,name,sig_props,not_sig_props,na_props
0,p_all,0.0,0.07979,0.013382
1,p_cptac,0.0,0.677334,0.010166
2,p_cptac_proteomics,0.0,0.25101,0.010693
3,p_cptac_proteomics_cis,0.000705,0.384116,0.084441
4,p_cptac_proteomics_cis_loss,0.053797,0.634489,0.261586
5,p_cptac_proteomics_cis_gain,0.009951,0.520527,0.263331
6,p_cptac_proteomics_trans,1.9e-05,0.490871,0.081461
7,p_cptac_proteomics_trans_loss,0.005651,0.580663,0.26475
8,p_cptac_proteomics_trans_gain,0.002257,0.741134,0.257374
9,p_cptac_transcriptomics,0.00187,0.004282,0.008568


In [4]:
# Plot -log10 of every p-value column, one point per (name, column) pair, with
# a horizontal reference rule at -log10(0.05).
#
# This cell overwrites `all_pvals` with the long-format frame, so it needs the
# earlier cells to be re-run before it can be executed a second time.

# Let pandas pick concrete dtypes for any object-typed columns before the
# numeric transform.
all_pvals = all_pvals.infer_objects()

# Columns to transform, mapped to their "neg_log_"-prefixed counterparts.
# NOTE(review): values displayed as 0.0 in `sig_props` become +inf under
# -log10 -- confirm how the chart is expected to render those rows.
prop_cols = ["sig_props", "not_sig_props", "na_props"]
neg_log_cols = {f"neg_log_{col}": -np.log10(all_pvals[col]) for col in prop_cols}

# `line` is a constant column carrying the threshold for the rule mark.
all_pvals = all_pvals.assign(line=-np.log10(0.05), **neg_log_cols)

# Reshape to long format: one row per (name, transformed column).
all_pvals = all_pvals.drop(columns=prop_cols).melt(
    id_vars=["name", "line"],
    value_vars=list(neg_log_cols),
    var_name="group",
    value_name="neg_log_p",
)

base = alt.Chart(all_pvals)

# One point per row, coloured by which column the value came from.
dots = base.mark_point().encode(
    alt.X("name"),
    alt.Y("neg_log_p"),
    alt.Color("group"),
)

# Reference rule drawn at the value stored in the `line` column.
line = base.mark_rule(color="crimson").encode(alt.Y("line"))

alt.layer(dots, line)