# Get preliminary results

In [7]:
import subprocess

In [10]:
# Cancer types handed to each workflow through its --cancerType argument.
cancerTypes = [
    'brca',
    'ccrcc',
    'endometrial',
    'colon',
    'ovarian',
    'luad',
]

# Algorithm names; each selects the workflow file 'eval-<algo>-with-correlation.cwl'.
algorithms = [
    'cibersort',
    'epic',
    'xcell',
    'mcpcounter',
]

# Signature matrix names; each resolves to '../signature_matrices/<name>.txt'.
sigMatrices = [
    'LM22',
    'LM7c',
    'LM9',
    'PBMC',
]

In [11]:
# Run the evaluation workflow for every (cancer type, algorithm, signature
# matrix) combination and store each run's 'corr.tsv' under a unique name.
for cancer in cancerTypes:
    for algo in algorithms:
        for sig in sigMatrices:
            workflow = 'eval-' + algo + '-with-correlation.cwl'
            signaturePath = '../signature_matrices/' + sig + '.txt'
            outFile = cancer + '-' + algo + '-' + sig + '-corr.tsv'

            run = subprocess.run(['cwltool', workflow,
                                  '--cancerType', cancer, '--signature', signaturePath])
            if run.returncode != 0:
                # Do not rename after a failed run: 'corr.tsv' (presumably
                # written by the workflow) is either missing or left over from
                # something else, and would be filed under the wrong name.
                print('cwltool failed for ' + outFile
                      + ' (exit code ' + str(run.returncode) + ')')
                continue

            # Still best-effort, but a failed rename is now reported.
            moved = subprocess.run(['mv', 'corr.tsv', outFile])
            if moved.returncode != 0:
                print('could not rename corr.tsv to ' + outFile)

In [13]:
# Re-run only the ovarian / xcell combination against every signature matrix.
cancer = 'ovarian'
algo = 'xcell'
for sig in sigMatrices:
    workflow = 'eval-' + algo + '-with-correlation.cwl'
    signaturePath = '../signature_matrices/' + sig + '.txt'
    outFile = cancer + '-' + algo + '-' + sig + '-corr.tsv'

    run = subprocess.run(['cwltool', workflow,
                          '--cancerType', cancer, '--signature', signaturePath])
    if run.returncode != 0:
        # Do not rename after a failed run: 'corr.tsv' (presumably written by
        # the workflow) is either missing or left over from something else,
        # and would be filed under the wrong name.
        print('cwltool failed for ' + outFile
              + ' (exit code ' + str(run.returncode) + ')')
        continue

    # Still best-effort, but a failed rename is now reported.
    moved = subprocess.run(['mv', 'corr.tsv', outFile])
    if moved.returncode != 0:
        print('could not rename corr.tsv to ' + outFile)

In [82]:
# Re-run every algorithm / signature matrix combination for the luad cancer type.
cancer = 'luad'
for algo in algorithms:
    for sig in sigMatrices:
        workflow = 'eval-' + algo + '-with-correlation.cwl'
        signaturePath = '../signature_matrices/' + sig + '.txt'
        outFile = cancer + '-' + algo + '-' + sig + '-corr.tsv'

        run = subprocess.run(['cwltool', workflow,
                              '--cancerType', cancer, '--signature', signaturePath])
        if run.returncode != 0:
            # Do not rename after a failed run: 'corr.tsv' (presumably written
            # by the workflow) is either missing or left over from something
            # else, and would be filed under the wrong name.
            print('cwltool failed for ' + outFile
                  + ' (exit code ' + str(run.returncode) + ')')
            continue

        # Still best-effort, but a failed rename is now reported.
        moved = subprocess.run(['mv', 'corr.tsv', outFile])
        if moved.returncode != 0:
            print('could not rename corr.tsv to ' + outFile)

In [18]:
# Rebind cancerTypes to a four-entry list for the cells that follow;
# 'ovarian' and 'luad' are left out here.
cancerTypes = [
    'ccrcc',
    'endometrial',
    'colon',
    'brca',
]

In [16]:
import pandas as pd

In [80]:
# Collect the per-sample correlation tables written by the evaluation runs.
#
# Result layout: allCorr[i][j] is the table for cancerTypes[i] and
# sigMatrices[j], with one column per algorithm whose result file could be
# read. A combination with no readable file gets an empty DataFrame so the
# positions stay aligned with cancerTypes / sigMatrices.
allCorr = []
for cancer in cancerTypes:
    cancerTable = []
    for sig in sigMatrices:
        algoTable = []
        colNames = []
        for algo in algorithms:
            corrPath = cancer + '-' + algo + '-' + sig + '-corr.tsv'
            try:
                corr = pd.read_csv(corrPath, delimiter='\t', header=None, index_col=0)
            except (OSError, pd.errors.EmptyDataError, pd.errors.ParserError):
                # Only missing/unreadable/malformed result files are treated as
                # "this combination did not run"; any other error still surfaces.
                print(algo + " does not work with " + cancer + " using " + sig)
                continue
            # Normalise sample identifiers: '-' becomes '.' so the row labels
            # from different algorithms line up when concatenated.
            corr.index = [str(i).replace('-', '.') for i in corr.index]
            algoTable.append(corr)
            colNames.append(algo)

        if algoTable:
            algoPd = pd.concat(algoTable, axis=1)
            algoPd.columns = colNames
        else:
            # pd.concat raises on an empty list; keep a placeholder instead.
            algoPd = pd.DataFrame()

        # One table per signature matrix (previously appended only once per
        # cancer type, which dropped all but the last signature matrix).
        cancerTable.append(algoPd)

    # One list of tables per cancer type (previously appended only once after
    # the whole loop, which dropped all but the last cancer type).
    allCorr.append(cancerTable)

cibersort does not work with brca using LM9


In [21]:
# Pick the first entry of each list for interactive inspection.
cancer = cancerTypes[0]
sig = sigMatrices[0]
# Was misspelled 'alo'; every other cell uses the name 'algo'.
algo = algorithms[0]

In [81]:
# Display the table currently bound to algoPd, i.e. the one built by the most
# recent pass of the correlation-loading loop (one column per algorithm).
algoPd

Unnamed: 0,cibersort,epic,xcell,mcpcounter
X09BR001,0.550563,0.993296,0.017180,0.687763
X05BR016,0.405403,0.986661,0.232551,-0.212848
X15BR003,0.279831,0.998849,-0.158154,-0.397997
X05BR026,-0.245351,0.998782,0.444962,0.518147
X11BR038,0.169694,0.999120,0.378362,0.293081
...,...,...,...,...
X11BR014,0.774114,0.999532,0.464865,0.866520
X20BR001,0.178642,0.688812,0.560944,0.798899
X01BR020,-0.461919,0.982867,-0.509128,-0.867694
X06BR014,0.813179,0.969465,0.449226,0.830412


In [83]:
import cptac

In [84]:
# Show the datasets cptac offers; the resulting table lists each dataset's
# description, data reuse status and publication link.
cptac.list_datasets()

Unnamed: 0_level_0,Description,Data reuse status,Publication link
Dataset name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
Brca,breast cancer,no restrictions,https://pubmed.ncbi.nlm.nih.gov/33212010/
Ccrcc,clear cell renal cell carcinoma (kidney),no restrictions,https://pubmed.ncbi.nlm.nih.gov/31675502/
Colon,colorectal cancer,no restrictions,https://pubmed.ncbi.nlm.nih.gov/31031003/
Endometrial,endometrial carcinoma (uterine),no restrictions,https://pubmed.ncbi.nlm.nih.gov/32059776/
Gbm,glioblastoma,password access only,unpublished
Hnscc,head and neck,password access only,unpublished
Lscc,lung squamous cell carcinoma,password access only,unpublished
Luad,lung adenocarcinoma,no restrictions,https://pubmed.ncbi.nlm.nih.gov/32649874/
Ovarian,high grade serous ovarian cancer,no restrictions,https://pubmed.ncbi.nlm.nih.gov/27372738/


In [85]:
# Create the cptac dataset object for Luad (listed by cptac.list_datasets()
# as lung adenocarcinoma, no data-reuse restrictions).
luad = cptac.Luad()

                                         

In [86]:
# Fetch the Luad transcriptomics table. As displayed further down, rows are
# labelled by Patient_ID and columns by gene name.
df = luad.get_transcriptomics()

In [88]:
# Display the Luad proteomics table. Its columns carry a two-level header
# (Name, Database_ID), rows are labelled by Patient_ID, and some cells are empty.
luad.get_proteomics()

Name,A1BG,A2M,AAAS,AACS,AADAC,AADAT,AAED1,AAGAB,AAMDC,AAMP,...,ZSCAN31,ZSWIM9,ZW10,ZWILCH,ZWINT,ZXDC,ZYG11B,ZYX,ZZEF1,ZZZ3
Database_ID,NP_570602.2,NP_000005.2|NP_001334353.1|NP_001334354.1|K4JDR8|K4JBA2|K4JB97,NP_056480.1|NP_001166937.1,NP_076417.2|NP_001306769.1|NP_001306768.1,NP_001077.2,NP_001273611.1|NP_001273612.1,NP_714542.1,NP_078942.3|NP_001258814.1,NP_001303889.1|NP_001350493.1|NP_001303886.1|NP_001303887.1,NP_001289474.1|NP_001078.2,...,NP_001128687.1|NP_001230171.1,NP_955373.3,NP_004715.1,NP_060445.3|NP_001274750.1,NP_008988.2|NP_001005413.1,NP_079388.3|NP_001035743.1,NP_078922.1,NP_001010972.1|NP_001349712.1,NP_055928.3,NP_056349.1|NP_001295166.1
Patient_ID,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2
C3L-00001,-2.5347,-3.4057,0.1572,-1.1998,-1.6826,,,-0.8179,-0.8053,-0.1899,...,,,0.2992,-1.3607,,,0.6527,-0.9694,-1.1840,-2.5284
C3L-00009,-0.5627,-1.7945,1.0054,-0.3624,-4.4887,0.0079,0.2157,1.3342,0.0645,0.6427,...,11.6158,-0.5098,-0.1622,0.9828,0.5633,-1.4620,-1.0690,0.7674,0.5066,0.4311
C3L-00080,-1.9422,-2.3782,0.1940,0.1920,-2.2655,,-1.6626,0.2149,-0.7593,0.6113,...,,,-0.2795,0.6613,,0.9659,-0.3442,-1.6480,1.2872,-0.7301
C3L-00083,2.1636,3.1227,-0.3044,-1.7183,-3.2851,-1.8216,3.6147,-0.4863,-1.2387,-0.4946,...,-3.0742,-1.6769,-0.5897,-0.8129,,0.9399,-0.2465,0.3157,0.6547,
C3L-00093,-1.0022,-0.9632,0.8190,0.2556,-11.1252,,-0.1696,0.2911,-0.4459,-0.1518,...,,,0.6950,-0.1625,1.8536,-2.2990,0.4293,-0.5876,-0.4991,-0.3077
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
C3N-02582.N,1.8277,3.6204,0.1783,-1.6842,0.6852,,1.5338,-0.6666,2.3787,-0.0458,...,-0.2001,,-0.0826,-1.6769,-0.0017,-0.1266,0.2995,2.3934,0.7770,0.9497
C3N-02586.N,0.8035,1.6403,0.2300,-1.8837,1.4085,,1.3378,-0.8544,0.1946,-0.0726,...,-0.8229,0.1750,-0.0804,-1.6401,,2.4025,1.2161,1.6443,1.1886,1.1807
C3N-02587.N,1.7637,2.2513,-0.0532,-1.4159,4.8264,0.8151,0.4511,-0.8181,2.6187,-0.3304,...,-0.1301,,-0.0800,-2.4146,-2.8354,,1.2861,2.1244,0.7083,1.1825
C3N-02588.N,1.0875,1.7414,-0.2270,-1.7000,4.5153,0.4875,,-0.2169,0.5044,-0.3012,...,-0.9652,-0.1293,-0.4764,-1.4775,-2.2999,2.1054,0.4943,1.5459,0.6358,1.2729


In [89]:
# Display the transcriptomics table stored in df by luad.get_transcriptomics().
df

Name,A1BG,A1CF,A2M,A2ML1,A3GALT2,A4GALT,A4GNT,AAAS,AACS,AADAC,...,ZWILCH,ZWINT,ZXDA,ZXDB,ZXDC,ZYG11A,ZYG11B,ZYX,ZZEF1,ZZZ3
Patient_ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
C3L-00001,2.2545,-2.7845,8.0488,-3.6051,-1.3305,0.8208,-1.0519,3.4780,2.6953,-3.3578,...,1.5053,2.0838,1.9289,2.1042,3.5256,2.4670,4.6299,3.8840,3.3197,4.1800
C3L-00009,1.4770,-1.9278,8.9855,0.4851,-2.4401,1.7417,-1.5157,4.1043,2.8091,0.0472,...,2.5437,3.2720,1.2569,1.9248,3.0739,0.4493,3.5318,4.5534,3.1330,4.8156
C3L-00080,1.5103,-4.9913,7.4303,-4.3766,-2.1868,-0.3121,-2.3936,4.6577,3.0394,1.2233,...,2.8300,3.9594,1.3346,2.2292,3.9886,-0.7604,3.5882,3.4509,5.3047,4.2428
C3L-00083,3.0398,-3.5440,9.4109,-3.1840,-3.2313,4.3862,-3.0231,3.9942,3.4665,-1.7667,...,0.8903,2.8336,1.7613,1.6259,3.8024,-2.0370,2.8603,5.5446,4.2023,2.9238
C3L-00093,1.7528,-5.2883,9.1136,-2.9449,-1.9313,1.5985,-3.3751,3.8190,3.1688,-2.3956,...,2.1361,3.6211,0.8451,1.4448,3.0815,0.4336,3.6617,4.1700,3.1526,4.3213
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
C3N-02582.N,1.5637,-5.1776,10.4127,-3.4526,-2.3206,2.5782,-2.2193,3.7097,2.3403,2.1092,...,1.2731,1.4223,1.7685,1.7865,3.8293,-2.6821,3.8706,5.1671,3.9047,4.2045
C3N-02586.N,1.9951,-6.2611,10.8147,-1.9942,-2.2342,2.3013,-0.7040,4.0228,3.0234,1.0860,...,1.1465,1.2952,1.4785,1.4900,4.1973,-2.6546,3.7431,5.5086,4.2314,4.2214
C3N-02587.N,1.8867,-5.3774,10.1176,-3.0960,-2.3278,2.2897,-1.9496,3.9663,2.8085,3.3245,...,0.9093,-1.0543,1.7941,1.8703,4.2036,-3.5258,3.6290,5.0396,4.0698,4.0836
C3N-02588.N,1.3870,-4.3241,10.3257,-2.9000,-1.6895,2.4918,-1.9959,3.7245,2.6161,3.5570,...,1.1154,0.6631,1.7917,2.0186,3.9527,-3.3026,3.9594,4.7113,3.9625,4.3164
