In [25]:
import pandas as pd
import numpy as np

In [26]:
# Load the merged extracted-feature tables: one per RNA-Seq-based tool
# (IMREP, TRUST4, MIXCR) plus the TCR-Seq table they are compared against.
# Downstream cells rely on each table having Sample, CDR3 and nReads columns.
IMREP_df = pd.read_csv(
    "../summary_data/original/IMREP/IMREP_TRB_merged_extracted_features.csv"
)
TRUST4_df = pd.read_csv(
    "../summary_data/original/TRUST4/TRUST4_TRB_merged_extracted_features.csv"
)
MIXCR_df = pd.read_csv(
    "../summary_data/original/MIXCR/MIXCR_TRB_merged_extracted_features.csv"
)
TCR_df = pd.read_csv(
    "../summary_data/original/TCR_Seq/TCR_merged_extracted_features.csv"
)

In [27]:
# One-to-one lookup between sample identifiers: keys are the names used by the
# RNA-Seq tool tables, values are the names used in the TCR-Seq table.
Sample_name_matchup_RNA_TCR_dict = {
    "ESO1-sorted-T-cells_S13_L007" : "RearrangementDetails_ESO1_sorted_infusion",
    "INY1-sorted-T-cells_S14_L007" : "RearrangementDetails_INY1_sorted_infusion",
    "INY2-sorted-T-cells_S15_L007" : "RearrangementDetails_INY2_sorted_infusion",
    "TR2-PBMC_S12" : "RearrangementDetails_TR-PBMC",
    "SAR-11-14-12RNA_S1" : "SAR_11-14_PBMC",
    "MP-11-28-12RNA_S2" : "MP_11-28_PBMC",
    "CMT-baseline1C_CAGATC" : "Pt204_Baseline_TCR_seq",
    "HM-baseline1C_CGATGT" : "Pt310_baseline_TCRseq",
    "PT0310_S9" : "Pt310_on-tx_TCR_seq",
    "LEK-baseline_CGATGT" : "Pt294_baseline_TCR_seq",
    "LEK-OT110712A_CCGTCC" : "Pt294_on-tx_TCR_seq",
    "JSSBaseline-RNA_GTGAAA" : "Pt_308_baseline_TCR_seq",
    "RAS-baseline_TGACCA" : "Pt_325_baseline_TCR_seq",
    "PT0112-B_S3" : "Pt_112_baseline_TCR_seq",
    "PT0285-B_S5" : "Pt_285_baseline_TCR_seq"
}

# Invert the lookup (TCR-Seq name -> RNA-Seq name) and relabel the TCR-Seq
# samples in a single pass so that they share keys with the tool tables.
# Names that are not in the lookup are left unchanged.
tcr_to_rna_sample_name = {
    tcr_name: rna_name
    for rna_name, tcr_name in Sample_name_matchup_RNA_TCR_dict.items()
}
TCR_df['Sample'] = TCR_df['Sample'].map(
    lambda sample_name: tcr_to_rna_sample_name.get(sample_name, sample_name)
)

In [28]:
# Suffix each table's nReads column with its source (tool or TCR-Seq) so the
# four read-count columns remain distinct once the tables are merged.
IMREP_df = IMREP_df.rename({"nReads": "nReads_IMREP"}, axis="columns")
TRUST4_df = TRUST4_df.rename({"nReads": "nReads_TRUST4"}, axis="columns")
MIXCR_df = MIXCR_df.rename({"nReads": "nReads_MIXCR"}, axis="columns")
TCR_df = TCR_df.rename({"nReads": "nReads_TCR"}, axis="columns")

Complete dataframe across all samples and tools

In [29]:
# Combine all four tables on the composite key (Sample, CDR3).
# Outer joins keep every clonotype seen by at least one source; a source that
# did not report a given (Sample, CDR3) pair gets 0 in its read-count column.
merge_IMREP_TRUST4 = pd.merge(
    left=IMREP_df,
    right=TRUST4_df,
    on=['Sample', 'CDR3'],
    how='outer',
).fillna(0)

merge_IMREP_TRUST4_MIXCR = pd.merge(
    left=MIXCR_df,
    right=merge_IMREP_TRUST4,
    on=['Sample', 'CDR3'],
    how='outer',
).fillna(0)

merge_complete = pd.merge(
    left=TCR_df,
    right=merge_IMREP_TRUST4_MIXCR,
    on=['Sample', 'CDR3'],
    how='outer',
).fillna(0)

merge_complete

Unnamed: 0,Sample,CDR3,nReads_TCR,nReads_MIXCR,nReads_IMREP,nReads_TRUST4
0,MP-11-28-12RNA_S2,CSASSLGSYGNTIYF,1.0,0.0,0.0,0.0
1,MP-11-28-12RNA_S2,CASSVNPGGYNEQFF,6.0,0.0,0.0,0.0
2,MP-11-28-12RNA_S2,CASSFSTSAQETQYF,1.0,0.0,0.0,0.0
3,MP-11-28-12RNA_S2,CASNVPPGAGTGELFF,1.0,0.0,0.0,0.0
4,MP-11-28-12RNA_S2,CSARDQGGQGGTF,1.0,0.0,0.0,0.0
...,...,...,...,...,...,...
686750,TR2-PBMC_S12,CASSLTQEPYNEQFF,0.0,0.0,0.0,1.0
686751,TR2-PBMC_S12,CASSKTRVQGIYEPYF,0.0,0.0,0.0,1.0
686752,TR2-PBMC_S12,CATSRGGPEQYF,0.0,0.0,0.0,1.0
686753,TR2-PBMC_S12,CSARFQGDTGELFF,0.0,0.0,0.0,2.0


In [30]:
# Add the tissue type.
# A single lookup table plus one vectorised map replaces twenty separate
# boolean-mask assignments (each of which scanned the whole frame).
# Samples missing from the table receive NaN in the 'tissue' column.
SAMPLE_TISSUE = {
    'CMT-baseline1C_CAGATC': 'melanoma',
    'ESO1-sorted-T-cells_S13_L007': 'PBMC',
    'HM-baseline1C_CGATGT': 'melanoma',
    'INY1-sorted-T-cells_S14_L007': 'PBMC',
    'INY2-sorted-T-cells_S15_L007': 'PBMC',
    'JSSBaseline-RNA_GTGAAA': 'melanoma',
    'LEK-OT110712A_CCGTCC': 'melanoma',
    'LEK-baseline_CGATGT': 'melanoma',
    'MP-11-28-12RNA_S2': 'PBMC',
    'PT0112-B_S3': 'melanoma',
    'PT0285-B_S5': 'melanoma',
    'PT0310_S9': 'melanoma',
    'RAS-baseline_TGACCA': 'melanoma',
    'SAR-11-14-12RNA_S1': 'PBMC',
    'TR2-PBMC_S12': 'PBMC',
    'SRR5233639': 'lymph_node',
    'SRR5233637': 'small_intestine',
    'TCGA-CZ-4862': 'kidney',
    'TCGA-CZ-5463': 'kidney',
    'TCGA-CZ-5985': 'kidney',
}

merge_complete['tissue'] = merge_complete['Sample'].map(SAMPLE_TISSUE)

In [31]:
# Add T cell rich or poor tissue type.
# A single lookup table plus one vectorised map replaces twenty separate
# boolean-mask assignments (each of which scanned the whole frame).
# Samples missing from the table receive NaN in the 'tissue_type' column.
SAMPLE_TISSUE_TYPE = {
    'CMT-baseline1C_CAGATC': 'T_cell_poor',
    'ESO1-sorted-T-cells_S13_L007': 'T_cell_rich',
    'HM-baseline1C_CGATGT': 'T_cell_poor',
    'INY1-sorted-T-cells_S14_L007': 'T_cell_rich',
    'INY2-sorted-T-cells_S15_L007': 'T_cell_rich',
    'JSSBaseline-RNA_GTGAAA': 'T_cell_poor',
    'LEK-OT110712A_CCGTCC': 'T_cell_poor',
    'LEK-baseline_CGATGT': 'T_cell_poor',
    'MP-11-28-12RNA_S2': 'T_cell_rich',
    'PT0112-B_S3': 'T_cell_poor',
    'PT0285-B_S5': 'T_cell_poor',
    'PT0310_S9': 'T_cell_poor',
    'RAS-baseline_TGACCA': 'T_cell_poor',
    'SAR-11-14-12RNA_S1': 'T_cell_rich',
    'TR2-PBMC_S12': 'T_cell_rich',
    'SRR5233639': 'T_cell_rich',
    'SRR5233637': 'T_cell_poor',
    'TCGA-CZ-4862': 'T_cell_poor',
    'TCGA-CZ-5463': 'T_cell_poor',
    'TCGA-CZ-5985': 'T_cell_poor',
}

merge_complete['tissue_type'] = merge_complete['Sample'].map(SAMPLE_TISSUE_TYPE)

In [33]:
# Add repertoire type (T cell rich/poor combined with mono-/polyclonal).
# A single lookup table plus one vectorised map replaces twenty separate
# boolean-mask assignments (each of which scanned the whole frame).
# Samples missing from the table receive NaN in the 'class' column.
SAMPLE_REPERTOIRE_CLASS = {
    'CMT-baseline1C_CAGATC': 'T_cell_poor_polyclonal',
    'ESO1-sorted-T-cells_S13_L007': 'T_cell_rich_monoclonal',
    'HM-baseline1C_CGATGT': 'T_cell_poor_polyclonal',
    'INY1-sorted-T-cells_S14_L007': 'T_cell_rich_monoclonal',
    'INY2-sorted-T-cells_S15_L007': 'T_cell_rich_monoclonal',
    'JSSBaseline-RNA_GTGAAA': 'T_cell_poor_polyclonal',
    'LEK-OT110712A_CCGTCC': 'T_cell_poor_polyclonal',
    'LEK-baseline_CGATGT': 'T_cell_poor_polyclonal',
    'MP-11-28-12RNA_S2': 'T_cell_rich_polyclonal',
    'PT0112-B_S3': 'T_cell_poor_polyclonal',
    'PT0285-B_S5': 'T_cell_poor_polyclonal',
    'PT0310_S9': 'T_cell_poor_polyclonal',
    'RAS-baseline_TGACCA': 'T_cell_poor_polyclonal',
    'SAR-11-14-12RNA_S1': 'T_cell_rich_polyclonal',
    'TR2-PBMC_S12': 'T_cell_rich_polyclonal',
    'SRR5233639': 'T_cell_rich_polyclonal',
    'SRR5233637': 'T_cell_poor_polyclonal',
    'TCGA-CZ-4862': 'T_cell_poor_polyclonal',
    'TCGA-CZ-5463': 'T_cell_poor_polyclonal',
    'TCGA-CZ-5985': 'T_cell_poor_polyclonal',
}

merge_complete['class'] = merge_complete['Sample'].map(SAMPLE_REPERTOIRE_CLASS)

In [34]:
# Per-sample read totals: sum each source's read counts over all CDR3 rows of
# a sample, then relabel the summed columns from nReads_* to total_reads_*.
# The result is indexed by Sample.
total_reads = (
    merge_complete
    .groupby('Sample')[['nReads_TCR', 'nReads_MIXCR', 'nReads_IMREP', 'nReads_TRUST4']]
    .sum()
    .rename(
        columns={
            'nReads_TCR': 'total_reads_TCR',
            'nReads_MIXCR': 'total_reads_MIXCR',
            'nReads_IMREP': 'total_reads_IMREP',
            'nReads_TRUST4': 'total_reads_TRUST4',
        }
    )
)
total_reads

Unnamed: 0_level_0,total_reads_TCR,total_reads_MIXCR,total_reads_IMREP,total_reads_TRUST4
Sample,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
CMT-baseline1C_CAGATC,906121.0,232.0,231.0,832.0
ESO1-sorted-T-cells_S13_L007,98553.0,133324.0,219185.0,265867.0
HM-baseline1C_CGATGT,1257571.0,2.0,2.0,20.0
INY1-sorted-T-cells_S14_L007,100499.0,44974.0,57700.0,93182.0
INY2-sorted-T-cells_S15_L007,329969.0,55296.0,64914.0,103137.0
JSSBaseline-RNA_GTGAAA,1408590.0,173.0,259.0,683.0
LEK-OT110712A_CCGTCC,1157845.0,380.0,334.0,1064.0
LEK-baseline_CGATGT,1769522.0,95.0,71.0,346.0
MP-11-28-12RNA_S2,42152.0,79.0,111.0,205.0
PT0112-B_S3,1006220.0,15.0,31.0,68.0


In [35]:
# Attach the per-sample totals to every (Sample, CDR3) row.
merge = pd.merge(
    left=merge_complete,
    right=total_reads,
    on=['Sample'],
    how='outer',
).fillna(0)

# Relative frequency of each CDR3 within its sample, per source:
# the clonotype's read count divided by that source's total reads in the sample.
# A source with zero total reads in a sample yields 0/0 = NaN, which the
# trailing fillna turns into 0.
merge = merge.assign(
    frequency_TCR=lambda df: df['nReads_TCR'] / df['total_reads_TCR'],
    frequency_MIXCR=lambda df: df['nReads_MIXCR'] / df['total_reads_MIXCR'],
    frequency_IMREP=lambda df: df['nReads_IMREP'] / df['total_reads_IMREP'],
    frequency_TRUST4=lambda df: df['nReads_TRUST4'] / df['total_reads_TRUST4'],
).fillna(0)
merge

Unnamed: 0,Sample,CDR3,nReads_TCR,nReads_MIXCR,nReads_IMREP,nReads_TRUST4,tissue,tissue_type,class,total_reads_TCR,total_reads_MIXCR,total_reads_IMREP,total_reads_TRUST4,frequency_TCR,frequency_MIXCR,frequency_IMREP,frequency_TRUST4
0,MP-11-28-12RNA_S2,CSASSLGSYGNTIYF,1.0,0.0,0.0,0.0,PBMC,T_cell_rich,T_cell_rich_polyclonal,42152.0,79.0,111.0,205.0,0.000024,0.0,0.0,0.000000
1,MP-11-28-12RNA_S2,CASSVNPGGYNEQFF,6.0,0.0,0.0,0.0,PBMC,T_cell_rich,T_cell_rich_polyclonal,42152.0,79.0,111.0,205.0,0.000142,0.0,0.0,0.000000
2,MP-11-28-12RNA_S2,CASSFSTSAQETQYF,1.0,0.0,0.0,0.0,PBMC,T_cell_rich,T_cell_rich_polyclonal,42152.0,79.0,111.0,205.0,0.000024,0.0,0.0,0.000000
3,MP-11-28-12RNA_S2,CASNVPPGAGTGELFF,1.0,0.0,0.0,0.0,PBMC,T_cell_rich,T_cell_rich_polyclonal,42152.0,79.0,111.0,205.0,0.000024,0.0,0.0,0.000000
4,MP-11-28-12RNA_S2,CSARDQGGQGGTF,1.0,0.0,0.0,0.0,PBMC,T_cell_rich,T_cell_rich_polyclonal,42152.0,79.0,111.0,205.0,0.000024,0.0,0.0,0.000000
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
686750,TCGA-CZ-5985,CAISERQGPGELFF,0.0,0.0,0.0,1.0,kidney,T_cell_poor,T_cell_poor_polyclonal,17542.0,0.0,23.0,345.0,0.000000,0.0,0.0,0.002899
686751,TCGA-CZ-5985,CASSLGQGGFNTF,0.0,0.0,0.0,1.0,kidney,T_cell_poor,T_cell_poor_polyclonal,17542.0,0.0,23.0,345.0,0.000000,0.0,0.0,0.002899
686752,TCGA-CZ-5985,CASSLYSASNSPLHF,0.0,0.0,0.0,1.0,kidney,T_cell_poor,T_cell_poor_polyclonal,17542.0,0.0,23.0,345.0,0.000000,0.0,0.0,0.002899
686753,TCGA-CZ-5985,CSAREAGPSPEKLFF,0.0,0.0,0.0,1.0,kidney,T_cell_poor,T_cell_poor_polyclonal,17542.0,0.0,23.0,345.0,0.000000,0.0,0.0,0.002899


In [36]:
# Per-sample RNA-Seq read counts (columns: Sample, total_reads_RNA_seq),
# used later to normalise tool-derived read counts.
RNA_seq_reads = pd.read_csv(
    "../summary_data/original/RNA_seq_reads.csv"
)
RNA_seq_reads

Unnamed: 0,Sample,total_reads_RNA_seq
0,CMT-baseline1C_CAGATC,82476159
1,ESO1-sorted-T-cells_S13_L007,104984482
2,HM-baseline1C_CGATGT,72397468
3,INY1-sorted-T-cells_S14_L007,73892845
4,INY2-sorted-T-cells_S15_L007,71654976
5,JSSBaseline-RNA_GTGAAA,85492431
6,LEK-OT110712A_CCGTCC,68584414
7,LEK-baseline_CGATGT,63320771
8,MP-11-28-12RNA_S2,40524817
9,PT0112-B_S3,55727841


In [37]:
# One row per sample: its annotations and the total reads from each source.
# NOTE: this rebinds `total_reads`, which an earlier cell used for the
# Sample-indexed sums.
total_reads = merge[
    ['Sample', 'tissue', 'tissue_type', 'class',
     'total_reads_TCR', 'total_reads_MIXCR', 'total_reads_IMREP', 'total_reads_TRUST4']
].drop_duplicates(keep='first')

# Add the column of RNA-Seq reads
total_reads = pd.merge(total_reads, RNA_seq_reads, how='left', on=['Sample'])


def _tool_read_summary(per_sample_totals, tool):
    """Build the per-sample read summary for one tool.

    Parameters
    ----------
    per_sample_totals : pandas.DataFrame
        One row per sample, containing the sample annotations,
        'total_reads_TCR', 'total_reads_<tool>' and 'total_reads_RNA_seq'.
    tool : str
        Tool name as used in the column suffix, e.g. 'MIXCR'.

    Returns
    -------
    pandas.DataFrame
        A new frame (the input is not modified) in which the tool's total is
        renamed to 'total_reads_tool', a 'tool' label column is added, and
        'TCR_derived_by_RNA_seq_tool' holds the tool's reads per one million
        RNA-Seq reads.
    """
    tool_total_column = f'total_reads_{tool}'
    selected_columns = ['Sample', 'tissue', 'tissue_type', 'class',
                        'total_reads_TCR', tool_total_column, 'total_reads_RNA_seq']
    # rename/assign return new frames, which avoids the SettingWithCopyWarning
    # raised by in-place edits on a frame sliced out of `per_sample_totals`.
    return (
        per_sample_totals[selected_columns]
        .rename(columns={tool_total_column: 'total_reads_tool'})
        .assign(
            tool=tool,
            TCR_derived_by_RNA_seq_tool=lambda df: (
                df['total_reads_tool'] / df['total_reads_RNA_seq'] * 1000000
            ),
        )
    )


# Calculate number of TCR derived reads per one million RNA-Seq reads
MIXCR = _tool_read_summary(total_reads, 'MIXCR')
IMREP = _tool_read_summary(total_reads, 'IMREP')
TRUST4 = _tool_read_summary(total_reads, 'TRUST4')

# Long format: each sample appears once per tool.
reads_count = pd.concat([MIXCR, IMREP, TRUST4])

reads_count

Unnamed: 0,Sample,tissue,tissue_type,class,total_reads_TCR,total_reads_tool,total_reads_RNA_seq,tool,TCR_derived_by_RNA_seq_tool
0,MP-11-28-12RNA_S2,PBMC,T_cell_rich,T_cell_rich_polyclonal,42152.0,79.0,40524817,MIXCR,1.949423
1,CMT-baseline1C_CAGATC,melanoma,T_cell_poor,T_cell_poor_polyclonal,906121.0,232.0,82476159,MIXCR,2.812934
2,LEK-baseline_CGATGT,melanoma,T_cell_poor,T_cell_poor_polyclonal,1769522.0,95.0,63320771,MIXCR,1.500298
3,LEK-OT110712A_CCGTCC,melanoma,T_cell_poor,T_cell_poor_polyclonal,1157845.0,380.0,68584414,MIXCR,5.540617
4,HM-baseline1C_CGATGT,melanoma,T_cell_poor,T_cell_poor_polyclonal,1257571.0,2.0,72397468,MIXCR,0.027625
5,PT0310_S9,melanoma,T_cell_poor,T_cell_poor_polyclonal,12954.0,1113.0,80622502,MIXCR,13.805079
6,PT0112-B_S3,melanoma,T_cell_poor,T_cell_poor_polyclonal,1006220.0,15.0,55727841,MIXCR,0.269165
7,PT0285-B_S5,melanoma,T_cell_poor,T_cell_poor_polyclonal,292828.0,11.0,107919183,MIXCR,0.101928
8,JSSBaseline-RNA_GTGAAA,melanoma,T_cell_poor,T_cell_poor_polyclonal,1408590.0,173.0,85492431,MIXCR,2.023571
9,RAS-baseline_TGACCA,melanoma,T_cell_poor,T_cell_poor_polyclonal,749686.0,136.0,55931661,MIXCR,2.431539


In [38]:
# Mean and standard deviation of the read statistics per repertoire class.
# The columns are selected with a list: selecting several groupby columns with
# a bare tuple (["a", "b", ...]) is deprecated in pandas 1.x and raises in
# pandas 2.0 and later.
summary_columns = [
    "total_reads_TCR",
    "total_reads_tool",
    "total_reads_RNA_seq",
    "TCR_derived_by_RNA_seq_tool",
]

# Pooled over all tools. reads_count holds each sample once per tool, so the
# sample-level columns (total_reads_TCR, total_reads_RNA_seq) are counted
# three times here; their means are unaffected but their std values differ
# from the per-tool tables below.
mean_repertoire_reads = reads_count.groupby("class")[summary_columns].agg(["mean", "std"])
display(mean_repertoire_reads)

# Same summary, one table per tool.
tools = ['MIXCR','IMREP','TRUST4']
for tool in tools:
    print(tool)
    df_tool = reads_count.loc[reads_count['tool'] == tool]
    mean_repertoire_reads = df_tool.groupby("class")[summary_columns].agg(["mean", "std"])
    display(mean_repertoire_reads)

Unnamed: 0_level_0,total_reads_TCR,total_reads_TCR,total_reads_tool,total_reads_tool,total_reads_RNA_seq,total_reads_RNA_seq,TCR_derived_by_RNA_seq_tool,TCR_derived_by_RNA_seq_tool
Unnamed: 0_level_1,mean,std,mean,std,mean,std,mean,std
class,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
T_cell_poor_polyclonal,897320.615385,859229.7,337.282051,525.079641,77709050.0,19322210.0,4.496333,6.715241
T_cell_rich_monoclonal,176340.333333,115224.6,115286.555556,78124.305952,83510770.0,16134410.0,1295.298308,646.436725
T_cell_rich_polyclonal,910220.75,1445980.0,4580.083333,5048.500812,57269060.0,16870990.0,65.976852,64.342211


MIXCR


Unnamed: 0_level_0,total_reads_TCR,total_reads_TCR,total_reads_tool,total_reads_tool,total_reads_RNA_seq,total_reads_RNA_seq,TCR_derived_by_RNA_seq_tool,TCR_derived_by_RNA_seq_tool
Unnamed: 0_level_1,mean,std,mean,std,mean,std,mean,std
class,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
T_cell_poor_polyclonal,897320.615385,882774.6,176.384615,303.979039,77709050.0,19851680.0,2.337149,3.808117
T_cell_rich_monoclonal,176340.333333,133049.9,77864.666667,48305.684565,83510770.0,18630410.0,883.425377,344.51754
T_cell_rich_polyclonal,910220.75,1598591.0,2278.0,2556.279327,57269060.0,18651580.0,32.446734,30.810615


IMREP


Unnamed: 0_level_0,total_reads_TCR,total_reads_TCR,total_reads_tool,total_reads_tool,total_reads_RNA_seq,total_reads_RNA_seq,TCR_derived_by_RNA_seq_tool,TCR_derived_by_RNA_seq_tool
Unnamed: 0_level_1,mean,std,mean,std,mean,std,mean,std
class,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
T_cell_poor_polyclonal,897320.615385,882774.6,179.846154,233.733055,77709050.0,19851680.0,2.405759,2.938761
T_cell_rich_monoclonal,176340.333333,133049.9,113933.0,91222.245516,83510770.0,18630410.0,1258.189905,721.166385
T_cell_rich_polyclonal,910220.75,1598591.0,4374.0,4502.855612,57269060.0,18651580.0,62.937652,55.76446


TRUST4


Unnamed: 0_level_0,total_reads_TCR,total_reads_TCR,total_reads_tool,total_reads_tool,total_reads_RNA_seq,total_reads_RNA_seq,TCR_derived_by_RNA_seq_tool,TCR_derived_by_RNA_seq_tool
Unnamed: 0_level_1,mean,std,mean,std,mean,std,mean,std
class,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
T_cell_poor_polyclonal,897320.615385,882774.6,655.615385,749.243122,77709050.0,19851680.0,8.746092,9.503172
T_cell_rich_monoclonal,176340.333333,133049.9,154062.0,96953.82419,83510770.0,18630410.0,1744.27964,688.365888
T_cell_rich_polyclonal,910220.75,1598591.0,7088.25,7150.718256,57269060.0,18651580.0,102.546171,88.466437
