# Download RNA and DNA methylation data from TCGA

Reference of the TCGA portal:

https://docs.gdc.cancer.gov/Data/Bioinformatics_Pipelines/Expression_mRNA_Pipeline/

```
Introduction 
The GDC mRNA quantification analysis pipeline measures gene level expression with   STAR as raw read counts. Subsequently the counts are augmented with several transformations including Fragments per Kilobase of transcript per Million mapped reads (FPKM), upper quartile normalized FPKM (FPKM-UQ), and Transcripts per Million (TPM). These values are additionally annotated with the gene symbol and gene bio-type. These data are generated through this pipeline by first aligning reads to the GRCh38   reference genome and then by quantifying the mapped reads. To facilitate harmonization across samples, all RNA-Seq reads are treated as unstranded during analyses.
```


In [2]:
# Read in the clinical files
import os

# Now we need to download the data from TCGA for the RNAseq
from scidat.api import API, APIException
from sciutil import SciUtil
import pandas as pd

u = SciUtil()
save_fig = False

annotation_file = f'hsapiens_gene_ensembl-GRCh38.p13.csv'

gene_name = 'external_gene_name'
gdc_client = f'./gdc-client'
sample_file = f'gdc_sample_sheet.2023-07-17.tsv'
manifest_file = f'gdc_manifest_20230717_100907.txt'
clinical_file = f'clinical.tsv' # Copied out from the clinical file

api = API(manifest_file, gdc_client, clinical_file, sample_file, 'downloads/', 'downloads/', annotation_file,
                            max_cnt=500, clin_cols=['primary_diagnosis', 'age_at_diagnosis', 'gender', 'race', 'vital_status',
                         'ajcc_pathologic_stage', 'days_to_death'],
          requires_lst=['counts', 'methylation_array'])

"""
If you haven't downloaded the data already you'll need to do this step!
""" 

download_rnaseq = True
if download_rnaseq:
    api.download_data_from_manifest()

  self.annotation_df = pd.read_csv(self.annotation_file)


100% [############################################] Time:  0:00:12   1.8 MiB/s 
100% [############################################] Time:  0:00:12 329.2 KiB/s 
100% [############################################] Time:  0:00:12 320.6 KiB/s 
100% [############################################] Time:  0:00:12   1.7 MiB/s 
100% [############################################] Time:  0:00:12   1.7 MiB/s 
100% [############################################] Time:  0:00:13 317.2 KiB/s 
100% [############################################] Time:  0:00:12 323.4 KiB/s 
100% [############################################] Time:  0:00:12 326.2 KiB/s 
100% [############################################] Time:  0:00:05 689.3 KiB/s 
100% [############################################] Time:  0:00:06   3.3 MiB/s 
100% [############################################] Time:  0:00:05 740.3 KiB/s 
100% [############################################] Time:  0:00:06 673.7 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:04   5.1 MiB/s 
100% [############################################] Time:  0:00:04   1.0 MiB/s 
100% [############################################] Time:  0:00:03   5.5 MiB/s 
100% [###########################################] Time:  0:00:04 1006.3 KiB/s 
100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:04 969.0 KiB/s 
100% [###########################################] Time:  0:00:04 1019.0 KiB/s 
100% [############################################] Time:  0:00:03   3.7 MiB/s 
100% [############################################] Time:  0:00:06   3.3 MiB/s 
100% [############################################] Time:  0:00:07   3.0 MiB/s 
100% [############################################] Time:  0:00:07   3.0 MiB/s 
100% [############################################] Time:  0:00:07   2.9 MiB/s 
100% [##################################

100% [############################################] Time:  0:00:05   3.2 MiB/s 
100% [############################################] Time:  0:00:06 653.2 KiB/s 
100% [############################################] Time:  0:00:06 627.3 KiB/s 
100% [############################################] Time:  0:00:05   2.5 MiB/s 
100% [############################################] Time:  0:00:08   2.7 MiB/s 
100% [############################################] Time:  0:00:09 422.9 KiB/s 
100% [############################################] Time:  0:00:09   2.3 MiB/s 
100% [############################################] Time:  0:00:07   3.0 MiB/s 
100% [############################################] Time:  0:00:14   1.5 MiB/s 
100% [############################################] Time:  0:00:05 697.4 KiB/s 
100% [############################################] Time:  0:00:05 750.0 KiB/s 
100% [############################################] Time:  0:00:11 376.0 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:06   3.3 MiB/s 
100% [############################################] Time:  0:00:06   3.3 MiB/s 
100% [############################################] Time:  0:00:05 720.1 KiB/s 
100% [############################################] Time:  0:00:05 716.8 KiB/s 
100% [############################################] Time:  0:00:04   1.0 MiB/s 
100% [############################################] Time:  0:00:04 980.1 KiB/s 
100% [############################################] Time:  0:00:04   5.4 MiB/s 
100% [############################################] Time:  0:00:04   5.0 MiB/s 
100% [############################################] Time:  0:00:05   4.0 MiB/s 
100% [############################################] Time:  0:00:05   4.0 MiB/s 
100% [############################################] Time:  0:00:06   3.5 MiB/s 
100% [############################################] Time:  0:00:04 882.7 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:04 899.6 KiB/s 
100% [############################################] Time:  0:00:04   4.7 MiB/s 
100% [############################################] Time:  0:00:04 940.5 KiB/s 
100% [############################################] Time:  0:00:15   1.4 MiB/s 
100% [############################################] Time:  0:00:15   1.4 MiB/s 
100% [############################################] Time:  0:00:18   1.1 MiB/s 
100% [############################################] Time:  0:00:15 267.4 KiB/s 
100% [############################################] Time:  0:00:15   1.4 MiB/s 
100% [############################################] Time:  0:00:14 911.3 KiB/s 
100% [############################################] Time:  0:00:15   1.5 MiB/s 
100% [############################################] Time:  0:00:14 281.2 KiB/s 
100% [############################################] Time:  0:00:05 812.9 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:04   5.3 MiB/s 
100% [############################################] Time:  0:00:05 825.9 KiB/s 
100% [############################################] Time:  0:00:05 757.0 KiB/s 
100% [############################################] Time:  0:00:05 786.5 KiB/s 
100% [############################################] Time:  0:00:05   4.0 MiB/s 
100% [############################################] Time:  0:00:05 756.4 KiB/s 
100% [############################################] Time:  0:00:05 723.0 KiB/s 
100% [############################################] Time:  0:00:06   3.5 MiB/s 
100% [############################################] Time:  0:00:03   1.2 MiB/s 
100% [############################################] Time:  0:00:03   1.2 MiB/s 
100% [############################################] Time:  0:00:03   1.2 MiB/s 
100% [############################################] Time:  0:00:03   6.7 MiB/s 
100% [##################################

100% [############################################] Time:  0:00:05 729.1 KiB/s 
100% [############################################] Time:  0:00:05 725.0 KiB/s 
100% [############################################] Time:  0:00:05   4.0 MiB/s 
100% [############################################] Time:  0:00:05 780.7 KiB/s 
100% [############################################] Time:  0:00:06 686.4 KiB/s 
100% [############################################] Time:  0:00:05   4.1 MiB/s 
100% [############################################] Time:  0:00:05   4.4 MiB/s 
100% [############################################] Time:  0:00:05   4.2 MiB/s 
100% [############################################] Time:  0:00:05 807.3 KiB/s 
100% [############################################] Time:  0:00:05 788.4 KiB/s 
100% [############################################] Time:  0:00:05   4.0 MiB/s 
100% [############################################] Time:  0:00:04   3.9 MiB/s 
100% [##################################

100% [############################################] Time:  0:00:05 753.1 KiB/s 
100% [############################################] Time:  0:00:06 629.5 KiB/s 
100% [############################################] Time:  0:00:04 898.7 KiB/s 
100% [############################################] Time:  0:00:04 981.1 KiB/s 
100% [############################################] Time:  0:00:04   5.4 MiB/s 
100% [############################################] Time:  0:00:04   5.0 MiB/s 
100% [############################################] Time:  0:00:04   4.6 MiB/s 
100% [############################################] Time:  0:00:04   4.8 MiB/s 
100% [############################################] Time:  0:00:03   1.0 MiB/s 
100% [############################################] Time:  0:00:04 839.7 KiB/s 
100% [############################################] Time:  0:00:06   3.5 MiB/s 
100% [############################################] Time:  0:00:06 635.1 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:05   4.3 MiB/s 
100% [############################################] Time:  0:00:04   4.6 MiB/s 
100% [############################################] Time:  0:00:04   4.9 MiB/s 
100% [############################################] Time:  0:00:04 908.7 KiB/s 
100% [############################################] Time:  0:00:04   4.8 MiB/s 
100% [############################################] Time:  0:00:04 975.9 KiB/s 
100% [###########################################] Time:  0:00:04 1018.5 KiB/s 
100% [############################################] Time:  0:00:03   5.6 MiB/s 
100% [############################################] Time:  0:00:04 855.5 KiB/s 
100% [############################################] Time:  0:00:03   5.9 MiB/s 
100% [############################################] Time:  0:00:04   5.4 MiB/s 
100% [############################################] Time:  0:00:04 873.7 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:05 774.4 KiB/s 
100% [############################################] Time:  0:00:03   1.0 MiB/s 
100% [############################################] Time:  0:00:04 993.1 KiB/s 
100% [############################################] Time:  0:00:04   5.0 MiB/s 
100% [############################################] Time:  0:00:04 872.3 KiB/s 
100% [############################################] Time:  0:00:05   4.0 MiB/s 
100% [############################################] Time:  0:00:05 793.9 KiB/s 
100% [############################################] Time:  0:00:05 810.4 KiB/s 
100% [############################################] Time:  0:00:05   4.0 MiB/s 
100% [############################################] Time:  0:00:04 885.5 KiB/s 
100% [############################################] Time:  0:00:05 776.1 KiB/s 
100% [############################################] Time:  0:00:04 853.8 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:05 741.5 KiB/s 
100% [############################################] Time:  0:00:08   2.7 MiB/s 
100% [############################################] Time:  0:00:03   1.0 MiB/s 
100% [############################################] Time:  0:00:03   5.8 MiB/s 
100% [############################################] Time:  0:00:03   1.0 MiB/s 
100% [############################################] Time:  0:00:03   1.0 MiB/s 
100% [############################################] Time:  0:00:04   5.3 MiB/s 
100% [############################################] Time:  0:00:04   5.1 MiB/s 
100% [############################################] Time:  0:00:04 849.5 KiB/s 
100% [############################################] Time:  0:00:04 860.0 KiB/s 
100% [############################################] Time:  0:00:03   5.8 MiB/s 
100% [############################################] Time:  0:00:04 983.9 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:04 967.9 KiB/s 
100% [############################################] Time:  0:00:06   3.4 MiB/s 
100% [############################################] Time:  0:00:06   3.5 MiB/s 
100% [############################################] Time:  0:00:06   2.1 MiB/s 
100% [############################################] Time:  0:00:06 638.1 KiB/s 
100% [############################################] Time:  0:00:06 598.4 KiB/s 
100% [############################################] Time:  0:00:07   3.0 MiB/s 
100% [############################################] Time:  0:00:05   3.7 MiB/s 
100% [############################################] Time:  0:00:04 958.4 KiB/s 
100% [############################################] Time:  0:00:05   3.4 MiB/s 
100% [############################################] Time:  0:00:06   3.5 MiB/s 
100% [##################################

100% [############################################] Time:  0:00:04   5.4 MiB/s 
100% [############################################] Time:  0:00:03   5.6 MiB/s 
100% [############################################] Time:  0:00:04   5.5 MiB/s 
100% [############################################] Time:  0:00:04 970.9 KiB/s 
100% [############################################] Time:  0:00:05 739.2 KiB/s 
100% [############################################] Time:  0:00:05 738.6 KiB/s 
100% [############################################] Time:  0:00:05 730.5 KiB/s 
100% [############################################] Time:  0:00:05 811.3 KiB/s 
100% [############################################] Time:  0:00:05   4.3 MiB/s 
100% [############################################] Time:  0:00:04   4.8 MiB/s 
100% [###########################################] Time:  0:00:04 1010.0 KiB/s 
100% [############################################] Time:  0:00:04 950.9 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:04 855.6 KiB/s 
100% [############################################] Time:  0:00:05 805.6 KiB/s 
100% [############################################] Time:  0:00:03   5.9 MiB/s 
100% [############################################] Time:  0:00:04 831.4 KiB/s 
100% [############################################] Time:  0:00:05   4.0 MiB/s 
100% [############################################] Time:  0:00:04 935.4 KiB/s 
100% [############################################] Time:  0:00:05 781.1 KiB/s 
100% [############################################] Time:  0:00:04   5.1 MiB/s 
100% [############################################] Time:  0:00:03   5.6 MiB/s 
100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:03   5.7 MiB/s 
100% [##################################

100% [############################################] Time:  0:00:04   3.0 MiB/s 
100% [############################################] Time:  0:00:05 717.6 KiB/s 
100% [############################################] Time:  0:00:05 713.3 KiB/s 
100% [############################################] Time:  0:00:05 808.0 KiB/s 
100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:04   5.2 MiB/s 
100% [############################################] Time:  0:00:04   5.0 MiB/s 
100% [############################################] Time:  0:00:04   4.9 MiB/s 
100% [############################################] Time:  0:00:04   4.5 MiB/s 
100% [############################################] Time:  0:00:04 871.4 KiB/s 
100% [############################################] Time:  0:00:04   5.1 MiB/s 
100% [##################################

100% [############################################] Time:  0:00:04   4.5 MiB/s 
100% [############################################] Time:  0:00:04   5.1 MiB/s 
100% [############################################] Time:  0:00:04   5.2 MiB/s 
100% [############################################] Time:  0:00:04   5.4 MiB/s 
100% [############################################] Time:  0:00:04 872.9 KiB/s 
100% [############################################] Time:  0:00:03   1.0 MiB/s 
100% [############################################] Time:  0:00:04   5.3 MiB/s 
100% [############################################] Time:  0:00:04 895.3 KiB/s 
100% [############################################] Time:  0:00:04   4.7 MiB/s 
100% [############################################] Time:  0:00:05 793.7 KiB/s 
100% [############################################] Time:  0:00:04 984.6 KiB/s 
100% [############################################] Time:  0:00:04   4.6 MiB/s 
100% [##################################

100% [############################################] Time:  0:00:03   5.9 MiB/s 
100% [############################################] Time:  0:00:03   1.2 MiB/s 
100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:03   6.4 MiB/s 
100% [###########################################] Time:  0:00:04 1001.1 KiB/s 
100% [############################################] Time:  0:00:04   5.3 MiB/s 
100% [############################################] Time:  0:00:04 989.4 KiB/s 
100% [############################################] Time:  0:00:04   4.7 MiB/s 
100% [############################################] Time:  0:00:05 819.1 KiB/s 
100% [############################################] Time:  0:00:04 876.5 KiB/s 
100% [############################################] Time:  0:00:03   5.1 MiB/s 
100% [############################################] Time:  0:00:06 629.9 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:04 918.8 KiB/s 
100% [############################################] Time:  0:00:04   5.1 MiB/s 
100% [############################################] Time:  0:00:04 946.0 KiB/s 
100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:04   4.5 MiB/s 
100% [############################################] Time:  0:00:04 851.2 KiB/s 
100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:04 939.6 KiB/s 
100% [###########################################] Time:  0:00:04 1021.6 KiB/s 
100% [############################################] Time:  0:00:04   5.2 MiB/s 
100% [############################################] Time:  0:00:04   4.7 MiB/s 
100% [############################################] Time:  0:00:05   3.9 MiB/s 
100% [##################################

100% [############################################] Time:  0:00:04 990.7 KiB/s 
100% [############################################] Time:  0:00:04 948.2 KiB/s 
100% [############################################] Time:  0:00:04   5.4 MiB/s 
100% [############################################] Time:  0:00:04   4.9 MiB/s 
100% [############################################] Time:  0:00:04   1.0 MiB/s 
100% [############################################] Time:  0:00:04   5.2 MiB/s 
100% [############################################] Time:  0:00:03   1.0 MiB/s 
100% [############################################] Time:  0:00:05 740.9 KiB/s 
100% [############################################] Time:  0:00:05   4.1 MiB/s 
100% [############################################] Time:  0:00:04 834.5 KiB/s 
100% [############################################] Time:  0:00:04   4.3 MiB/s 
100% [###########################################] Time:  0:00:04 1012.5 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:03   1.2 MiB/s 
100% [############################################] Time:  0:00:04   5.4 MiB/s 
100% [############################################] Time:  0:00:03   5.6 MiB/s 
100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:04 927.9 KiB/s 
100% [############################################] Time:  0:00:04   5.3 MiB/s 
100% [############################################] Time:  0:00:04   5.2 MiB/s 
100% [###########################################] Time:  0:00:04 1018.1 KiB/s 
100% [############################################] Time:  0:00:04 895.2 KiB/s 
100% [############################################] Time:  0:00:05   3.7 MiB/s 
100% [############################################] Time:  0:00:04   4.1 MiB/s 
100% [############################################] Time:  0:00:04 861.8 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:03   5.3 MiB/s 
100% [############################################] Time:  0:00:03   3.5 MiB/s 
100% [############################################] Time:  0:00:04 969.9 KiB/s 
100% [############################################] Time:  0:00:04 893.8 KiB/s 
100% [############################################] Time:  0:00:05 711.2 KiB/s 
100% [############################################] Time:  0:00:05   4.0 MiB/s 
100% [############################################] Time:  0:00:05 732.8 KiB/s 
100% [############################################] Time:  0:00:05   4.2 MiB/s 
100% [############################################] Time:  0:00:05 772.8 KiB/s 
100% [############################################] Time:  0:00:05 767.5 KiB/s 
100% [############################################] Time:  0:00:05 801.5 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:55  74.6 KiB/s 
100% [############################################] Time:  0:00:04   5.1 MiB/s 
100% [############################################] Time:  0:00:03   3.4 MiB/s 
100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:04   5.4 MiB/s 
100% [############################################] Time:  0:00:04   5.3 MiB/s 
100% [############################################] Time:  0:00:03   5.7 MiB/s 
100% [############################################] Time:  0:00:03   1.0 MiB/s 
100% [############################################] Time:  0:00:04 848.9 KiB/s 
100% [############################################] Time:  0:00:04   4.4 MiB/s 
100% [############################################] Time:  0:00:05   4.2 MiB/s 
100% [############################################] Time:  0:00:05   4.2 MiB/s 
100% [##################################

100% [############################################] Time:  0:00:05   4.1 MiB/s 
100% [############################################] Time:  0:00:05 699.0 KiB/s 
100% [############################################] Time:  0:00:05   3.6 MiB/s 
100% [############################################] Time:  0:00:06 688.3 KiB/s 
100% [############################################] Time:  0:00:06 639.8 KiB/s 
100% [############################################] Time:  0:00:05   4.1 MiB/s 
100% [############################################] Time:  0:00:04 976.3 KiB/s 
100% [############################################] Time:  0:00:04   4.7 MiB/s 
100% [############################################] Time:  0:00:05 791.6 KiB/s 
100% [############################################] Time:  0:00:05 786.7 KiB/s 
100% [############################################] Time:  0:00:05 791.1 KiB/s 
100% [############################################] Time:  0:00:05   4.2 MiB/s 
100% [##################################

100% [############################################] Time:  0:00:05 804.8 KiB/s 
100% [############################################] Time:  0:00:04   5.3 MiB/s 
100% [############################################] Time:  0:00:04 837.5 KiB/s 
100% [############################################] Time:  0:00:05 727.5 KiB/s 
100% [############################################] Time:  0:00:05 815.3 KiB/s 
100% [############################################] Time:  0:00:05 787.6 KiB/s 
100% [############################################] Time:  0:00:05   4.3 MiB/s 
100% [############################################] Time:  0:00:04 856.4 KiB/s 
100% [############################################] Time:  0:00:05   4.0 MiB/s 
100% [############################################] Time:  0:00:05   3.8 MiB/s 
100% [############################################] Time:  0:00:05   3.7 MiB/s 
100% [############################################] Time:  0:00:06 648.3 KiB/s 
100% [##################################

100% [############################################] Time:  0:00:04   5.0 MiB/s 
100% [############################################] Time:  0:00:03   1.1 MiB/s 
100% [############################################] Time:  0:00:05   3.8 MiB/s 
100% [############################################] Time:  0:00:04 934.9 KiB/s 
100% [############################################] Time:  0:00:06   3.6 MiB/s 
100% [############################################] Time:  0:00:03   1.0 MiB/s 
[32mSuccessfully downloaded[0m: 500
100% [############################################] Time:  0:00:04 924.3 KiB/s 
[32mSuccessfully downloaded[0m: 500
100% [############################################] Time:  0:00:04   5.3 MiB/s 
100% [############################################] Time:  0:00:05   4.2 MiB/s 
100% [############################################] Time:  0:00:04   5.2 MiB/s 
100% [############################################] Time:  0:00:04   4.6 MiB/s 
100% [######################################

# Build datasets

In [3]:
api.build_annotation()

[93m--------------------------------------------------------------------------------[0m
 Run: annotate.set_case_submitter_id() to setup. 
Continuing with automatic selection.	[0m
[93m--------------------------------------------------------------------------------[0m
[94m--------------------------------------------------------------------------------[0m
[94m                    Submitter ID set as: 	case_submitter_id	                    [0m
[94m--------------------------------------------------------------------------------[0m
[94m--------------------------------------------------------------------------------[0m
[94m                              Clinical dataframe	                               [0m
[94m--------------------------------------------------------------------------------[0m
[94m--------------------------------------------------------------------------------[0m
[94m  case_submitter_id project_id age_at_index  gender   race vital_status  \
0         C3N-0117

In [4]:
data_dir = 'downloads/'
rna_df = api.build_star_rna_df(data_dir)
meth_df = api.build_sesame_meth_df(data_dir)
api.rna_df.to_csv(f'RNA_all.csv', index=False)
api.meth_df.to_csv(f'Methylation_all.csv', index=False)

In [8]:
rna_df = api.rna_df

In [9]:
rna_df.shape

(60664, 2137)

In [10]:
meth_df.shape

(865918, 1767)

# Now we want to save out each of the cancers based on our clinical info for the different patients

In [22]:
clin_tcga_df = pd.read_csv(clinical_file, sep='\t')
clin_tcga_df

Unnamed: 0,case_id,case_submitter_id,project_id,age_at_index,age_is_obfuscated,cause_of_death,cause_of_death_source,country_of_residence_at_enrollment,days_to_birth,days_to_death,...,treatment_arm,treatment_dose,treatment_dose_units,treatment_effect,treatment_effect_indicator,treatment_frequency,treatment_intent_type,treatment_or_therapy,treatment_outcome,treatment_type
0,000ead0d-abf5-4606-be04-1ea31b999840,C3N-01179,CPTAC-3,'--,'--,'--,'--,'--,-26483,'--,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
1,003f4f85-3244-4132-8c9d-c29f09382269,C3N-02672,CPTAC-3,'--,'--,'--,'--,'--,-22056,'--,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
2,005d0639-c923-470f-a179-02a4dbb5cdf2,C3L-01929,CPTAC-3,'--,'--,'--,'--,'--,-19698,'--,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
3,006931bb-f5b1-4aa4-b0a8-af517a912db0,C3L-01838,CPTAC-3,'--,'--,'--,'--,'--,-25663,'--,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
4,0103db96-3e58-485c-bb9f-37b8a1f966e1,C3L-01146,CPTAC-3,'--,'--,Cancer Related,'--,'--,-21566,509,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1145,fdd6c700-c04d-4857-a522-8f83f67f5f95,C3N-00297,CPTAC-3,'--,'--,'--,'--,'--,-25254,'--,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
1146,fed33fff-0310-42ad-a7dc-d563792f18cc,C3N-03853,CPTAC-3,'--,'--,Unknown,'--,'--,-17976,393,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
1147,fed70927-708c-479e-942c-139414370672,C3L-02856,CPTAC-3,'--,'--,'--,'--,'--,-32731,'--,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
1148,ff527151-6797-414e-8760-edcb73306a28,C3L-03984,CPTAC-3,'--,'--,'--,'--,'--,-21834,'--,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--


In [23]:
clin_tcga_df['primary_diagnosis'].value_counts()

primary_diagnosis
Endometrioid adenocarcinoma, NOS    239
Adenocarcinoma, NOS                 223
Renal cell carcinoma, NOS           218
Squamous cell carcinoma, NOS        215
Infiltrating duct carcinoma, NOS    156
Glioblastoma                         99
Name: count, dtype: int64

In [19]:
# This basically means that alot of the datasets need more annoations so we'll have to use those from CPTAC files
import os
# Step through the files getting out all the clinical info
clin_df = pd.DataFrame()
bio_df = pd.DataFrame()
clin_dir = 'CPTAC_clinical'
clin_files = os.listdir(clin_dir)
for f in clin_files:
    if 'clinical' in f:
        clin_df = pd.concat([clin_df, pd.read_csv(os.path.join(clin_dir, f), sep='\t')])
    elif 'biospeci' in f:
        bio_df = pd.concat([bio_df, pd.read_csv(os.path.join(clin_dir, f), sep='\t')])
bio_df

Unnamed: 0,Aliquot ID,Aliquot Submitter ID,Sample ID,Sample Submitter ID,Case ID,Case Submitter ID,Project Name,Sample Type,Primary Site,Disease Type,...,Sample Ordinal,Shortest Dimension,Time Between Clamping And Freezing,Time Between Excision and Freezing,Tissue Collection Type,Tissue Type,Tumor Code,Tumor Code ID,Tumor Descriptor,Program Name
0,db299c0d-8891-4392-a4c9-85b1f51972b6,NCI7-1.0_pro,0d5e281f-4f2e-4567-9c66-b866f6b89a0a,NCI7-1.0_pro,54559a36-d9bc-4373-86f5-98d50a203d76,NCI-7,CPTAC3-Other,Cell Lines,Not Reported,Other,...,,,,,,,,,,Clinical Proteomic Tumor Analysis Consortium
1,20f536b7-a3be-4ae9-ac2f-706702208c19,NCI7-0.1_pro,c3176869-7ee5-484f-b816-7af6d8b98e3d,NCI7-0.1_pro,54559a36-d9bc-4373-86f5-98d50a203d76,NCI-7,CPTAC3-Other,Cell Lines,Not Reported,Other,...,,,,,,,,,,Clinical Proteomic Tumor Analysis Consortium
2,209334d7-a63d-4dba-9d2a-0ed158594c08,NCI7-1.0_pep,e798c551-1164-4690-b646-837b05b97029,NCI7-1.0_pep,54559a36-d9bc-4373-86f5-98d50a203d76,NCI-7,CPTAC3-Other,Cell Lines,Not Reported,Other,...,,,,,,,,,,Clinical Proteomic Tumor Analysis Consortium
3,a42d5403-25f1-4868-b56e-a4a5d8dc2c76,NCI7-0.5_pep,4aed607e-110d-448b-8527-6ed2816c438b,NCI7-0.5_pep,54559a36-d9bc-4373-86f5-98d50a203d76,NCI-7,CPTAC3-Other,Cell Lines,Not Reported,Other,...,,,,,,,,,,Clinical Proteomic Tumor Analysis Consortium
4,3f04b11c-ff67-476f-9ba8-1fe7b1df010f,NCI7-0.2_pro,c55a87d2-05c6-44a6-8078-4bffa1497a43,NCI7-0.2_pro,54559a36-d9bc-4373-86f5-98d50a203d76,NCI-7,CPTAC3-Other,Cell Lines,Not Reported,Other,...,,,,,,,,,,Clinical Proteomic Tumor Analysis Consortium
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
245,1cfd38e5-0295-4ca4-9bd4-e1e96edeffde,CPT0236360004,778f5ab4-651a-4f9b-83a7-96f9243b236b,C3N-03069-03,d21fa2fa-9a2d-4baa-b7d8-601b906a16c7,C3N-03069,CPTAC3 Discovery and Confirmatory,Solid Tissue Normal,Pancreas,Pancreatic Ductal Adenocarcinoma,...,,,19.0,14.0,,Normal,,,,Clinical Proteomic Tumor Analysis Consortium
246,7328da7b-0f55-49c3-8e74-5114fcb4fc18,CPT0218220004,d962522e-e61d-446a-9393-784867a459b5,C3L-01124-04,5a3fd9f7-cd11-4ed9-b122-3096ba0e93a5,C3L-01124,CPTAC3 Discovery and Confirmatory,Solid Tissue Normal,Pancreas,Pancreatic Ductal Adenocarcinoma,...,,,,19.0,,Normal,,,,Clinical Proteomic Tumor Analysis Consortium
247,c59055c9-e724-49cb-bfc3-9f0d072eea48,CPT0094940004,dc68bdaf-21b9-43e7-9dc0-31fbaddd164c,"C3L-01703-02, C3L-01703-03",344f4536-d2cf-4162-99d8-dcc40972c80b,C3L-01703,CPTAC3 Discovery and Confirmatory,Primary Tumor,Pancreas,Pancreatic Ductal Adenocarcinoma,...,,,,,,Tumor,,,,Clinical Proteomic Tumor Analysis Consortium
248,b0efe015-7be2-4faf-a3f6-a5962316dc83,CPT0078000003,a2913672-6c34-44df-ad13-f3cf5144b481,C3N-00518-01,0f06151e-53a2-4573-84c3-76e1b5c0ce34,C3N-00518,CPTAC3 Discovery and Confirmatory,Primary Tumor,Pancreas,Pancreatic Ductal Adenocarcinoma,...,,,,6.0,,Tumor,,,,Clinical Proteomic Tumor Analysis Consortium


In [21]:
clin_df['Cases Submitter ID'].values

array(['15-00464', '13-00166', '14-00034', 'Cell based ref', '13-00515',
       '14-00537', 'Standard ref', '14-00083', '13-00034', '14-00045',
       '14-00240', '13-00602', '12-00211', '14-00359', '14-00488',
       '14-00495', '15-00051', '14-00127', '15-00701', '15-00276',
       'Universal Ref', '16-00886', '16-01225', 'WHIM74', 'WHIM30',
       'HCI027', 'WHIM75', 'WHIM12', 'Core CR', 'WHIM14', 'WHIM68',
       'HCI030', 'PDX  CR', 'HCI009', 'C3N-01946', 'C3N-01754',
       'C3L-01138', 'C3N-03888', 'C3N-04280', 'C3N-01945', 'C3N-03011',
       'C3L-04791', 'C3N-00822', 'C3L-00994', 'C3N-03008', 'C3N-00299',
       'C3N-01756', 'C3N-00297', 'C3N-01947', 'C3N-03612', 'C3N-02693',
       'C3N-01948', 'C3N-01340', 'C3N-03013', 'C3N-03620', 'C3N-03781',
       'C3N-03928', 'C3N-04276', 'C3N-01858', 'C3N-02714', 'C3N-03028',
       'C3N-01943', 'C3N-02695', 'C3N-04152', 'QC1', 'QC3', 'C3L-00999',
       'C3N-03664', 'C3L-01237', 'QC2', 'C3N-04277', 'QC5', 'QC4', 'QC7',
       'QC6', '

# Combine the two on case_submitter_id and 'Cases Submitter ID' so that we can actually find out what each patient has!


In [26]:
df = pd.merge(clin_df, clin_tcga_df, left_on='Cases Submitter ID', right_on='case_submitter_id', how='outer')

In [34]:
df['Disease Type'].value_counts()

Disease Type
Pancreatic Ductal Adenocarcinoma         140
Lung Adenocarcinoma                      111
Head and Neck Squamous Cell Carcinoma    110
Lung Squamous Cell Carcinoma             110
Uterine Corpus Endometrial Carcinoma     104
Clear Cell Renal Cell Carcinoma          103
Other                                     91
Breast Invasive Carcinoma                 65
Acute Myeloid Leukemia                    39
Non-Clear Cell Renal Cell Carcinoma        7
Name: count, dtype: int64

In [35]:
df['Race'].value_counts()

Race
White                               488
Other                               129
Asian                               126
Not Reported                         95
Black or African American            25
Unknown                              16
American Indian or Alaska Native      1
Name: count, dtype: int64

In [36]:
df['Gender'].value_counts()

Gender
Male            441
Female          354
Not Reported     85
Name: count, dtype: int64

In [37]:
df['AJCC Pathologic Stage'].value_counts()

AJCC Pathologic Stage
Stage I         140
                134
Stage III       128
Stage IIB        92
Stage IB         72
Not Reported     58
Stage IIA        51
Stage II         48
Stage IA         41
Stage IIIA       38
Stage IVA        37
Stage IV         27
Stage IVB         6
Unknown           3
Stage IIIB        2
Stage IA3         1
Name: count, dtype: int64

# For each of the Disease Types for each case in that disease type see if it exists in the RNA file and if so add that case

1. Basically go through and filter out each of the files for the cases that exist in the RNA and methylation datasets to create a dataset for each cancer.

In [38]:
rna_df

Unnamed: 0,gene_id,gene_name,CPTAC-3_SolidTissueNormal_male_other_None_RNA_None_None_CPTAC-3_C3N-02727_9a32b693-bea7-470f-9aaf-1cb738e3981f,CPTAC-3_SolidTissueNormal_male_white_None_RNA_None_None_CPTAC-3_C3L-00907_ff35024d-0cfa-4cd0-b835-eb2bd7430390,CPTAC-3_PrimaryTumor_male_other_None_RNA_None_None_CPTAC-3_C3N-01524_8edd2ab4-377e-4d07-879b-b6bac439a29d,CPTAC-3_PrimaryTumor_male_white_None_RNA_None_None_CPTAC-3_C3L-00603_e1494839-503b-4601-97c2-9dff2c6b7632,CPTAC-3_SolidTissueNormal_male_white_None_RNA_None_None_CPTAC-3_C3L-00080_e94ee4c0-43bb-4fee-aced-1fe6e9b1408f,CPTAC-3_SolidTissueNormal_male_asian_None_RNA_None_None_CPTAC-3_C3N-02424_7ab3854b-f05e-4741-81c4-7a5df8dcc6c5,CPTAC-3_PrimaryTumor_female_white_None_RNA_None_None_CPTAC-3_C3L-01729_dc562117-37a9-47b3-9209-b97d75234197,CPTAC-3_SolidTissueNormal_male_white_None_RNA_68_None_CPTAC-3_C3L-02809_e3d16a9e-974c-4fca-a4a2-6837493e33e9,...,CPTAC-3_SolidTissueNormal_male_white_None_RNA_766_None_CPTAC-3_C3L-02964_fab994d4-ade4-40e4-87b4-321e3cc5fada,CPTAC-3_SolidTissueNormal_male_asian_None_RNA_None_None_CPTAC-3_C3N-02375_1ce96b1b-e8cc-4cbb-a1eb-bd84b10b143f,CPTAC-3_PrimaryTumor_male_white_None_RNA_632_None_CPTAC-3_C3N-02695_534d5eaf-5bfd-48cc-b5e2-abd2f8bb285e,CPTAC-3_PrimaryTumor_female_notreported_None_RNA_None_None_CPTAC-3_C3N-02244_58ca7c12-6bfc-4ea4-a2b9-68c46e9b49f8,CPTAC-3_PrimaryTumor_male_white_None_RNA_None_None_CPTAC-3_C3N-02015_f5efcbb2-a1fd-4318-9677-1cc7da4a46de,CPTAC-3_PrimaryTumor_female_white_None_RNA_None_None_CPTAC-3_C3L-01304_7e6f35d3-4d48-43fb-8e15-4609d62e925d,CPTAC-3_PrimaryTumor_male_other_None_RNA_None_None_CPTAC-3_C3N-01842_dbee7893-9842-4819-b49b-8204b459a238,CPTAC-3_PrimaryTumor_male_white_None_RNA_None_None_CPTAC-3_C3N-00154_872bad3a-5f4a-48fb-9310-ffbc7927972a,CPTAC-3_PrimaryTumor_female_white_None_RNA_1209_None_CPTAC-3_C3N-01192_e0a69a83-c3ee-430c-9769-816d68d8b746,CPTAC-3_PrimaryTumor_male_white_None_RNA_91_None_CPTAC-3_C3L-00369_11bb1416-a269-4efe-bb46-65e6c6335260
0,N_unmapped,,1046140,762581,1788602,631410,755932,1142923,1544830,772869,...,1464300,942688,19088312,54895528,878787,19880486,1523470,913130,1410345,1367303
1,N_multimapping,,9693205,7052602,7367473,7239181,8682025,9713766,9720755,7083415,...,12344709,9964967,25985699,23130942,9350571,11862174,7219746,7391750,11527468,11067273
2,N_noFeature,,19904658,45170611,40319206,36695592,38455289,36274738,42972589,34329138,...,36469550,38867154,6121913,72483072,37521292,83489512,39549768,40625974,39587327,35320321
3,N_ambiguous,,6472994,7313691,6524768,7130867,5799858,5875767,8230528,5697312,...,8170534,6908082,523409,4168500,8849467,2912724,4103201,5982045,8683939,9739153
4,ENSG00000000003.15,TSPAN6,4182,3166,1748,2083,1055,676,3632,1228,...,652,966,55,3053,1222,1354,3066,1591,2856,1943
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
60659,ENSG00000288669.1,AC008763.4,0,0,0,0,0,0,0,1,...,1,0,0,0,0,0,0,0,0,0
60660,ENSG00000288670.1,AL592295.6,129,534,434,205,177,162,215,184,...,164,266,15,229,502,279,189,246,214,361
60661,ENSG00000288671.1,AC006486.3,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
60662,ENSG00000288674.1,AL391628.1,4,14,4,12,25,16,6,10,...,22,14,0,0,9,19,9,19,16,14


In [46]:
set(df['Disease Type'].values)

{'Acute Myeloid Leukemia',
 'Breast Invasive Carcinoma',
 'Clear Cell Renal Cell Carcinoma',
 'Head and Neck Squamous Cell Carcinoma',
 'Lung Adenocarcinoma',
 'Lung Squamous Cell Carcinoma',
 'Non-Clear Cell Renal Cell Carcinoma',
 'Other',
 'Pancreatic Ductal Adenocarcinoma',
 'Uterine Corpus Endometrial Carcinoma',
 nan}

In [50]:
output_dir = '../../output_data/'
diseases = ['Acute Myeloid Leukemia',
 'Breast Invasive Carcinoma',
 'Clear Cell Renal Cell Carcinoma',
 'Head and Neck Squamous Cell Carcinoma',
 'Lung Adenocarcinoma',
 'Lung Squamous Cell Carcinoma',
 'Pancreatic Ductal Adenocarcinoma',
 'Uterine Corpus Endometrial Carcinoma']

case_to_column = []
for disease in diseases:
    cases = list(df[df['Disease Type'] == disease]['case_submitter_id'].values)
    d_rna_df = rna_df[['gene_id', 'gene_name']]
    d_meth_df = meth_df[['id']]
    # Now go through the RNA file
    for col in rna_df.columns:
        c = col.split('_')
        if len(c) > 3:
            if c[-2] in cases:
                case_id = c[-2].replace('-', '.') # Make safe for R
                sample_type = 'Tumor' if 'SolidTissueNormal' not in c else 'Normal' 
                label = f'{case_id}_{sample_type}_RNA_{c[-1].replace("-", ".")}'
                d_rna_df[label] = rna_df[col].values
                case_to_column.append([col, label])
    for col in meth_df.columns:
        c = col.split('_')
        if len(c) > 3:
            if c[-2] in cases:
                sample_type = 'Tumor' if 'SolidTissueNormal' not in c else 'Normal' 
                label = f'{case_id}_{sample_type}_CpG_{c[-1].replace("-", ".")}'
                d_meth_df[label] = meth_df[col].values
                case_to_column.append([col, label])
    # Save both to files
    disease = disease.replace(' ', '')
    d_meth_df.to_csv(f'{output_dir}{disease}/{disease}_DNAMethylation.csv', index=False)
    d_rna_df.to_csv(f'{output_dir}{disease}/{disease}_RNA.csv', index=False)
    print("DONE", disease)

DONE AcuteMyeloidLeukemia
DONE BreastInvasiveCarcinoma


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

DONE ClearCellRenalCellCarcinoma


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,

  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values


DONE HeadandNeckSquamousCellCarcinoma


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,

  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

DONE LungAdenocarcinoma


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

DONE LungSquamousCellCarcinoma


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

DONE PancreaticDuctalAdenocarcinoma


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,

  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

DONE UterineCorpusEndometrialCarcinoma


In [94]:
output_dir = '../../output_data/'
diseases = ['Acute Myeloid Leukemia',
 'Breast Invasive Carcinoma',
 'Clear Cell Renal Cell Carcinoma',
 'Head and Neck Squamous Cell Carcinoma',
 'Lung Adenocarcinoma',
 'Lung Squamous Cell Carcinoma',
 'Pancreatic Ductal Adenocarcinoma',
 'Uterine Corpus Endometrial Carcinoma']

case_to_column = []
d_rna_df = rna_df[['gene_id', 'gene_name']]
d_meth_df = meth_df[['id']]
for disease in diseases:
    cases = list(df[df['Disease Type'] == disease]['case_submitter_id'].values)
    # Save both to files
    disease = disease.replace(' ', '')
    # Now go through the RNA file
    for col in rna_df.columns:
        c = col.split('_')
        if len(c) > 3:
            if c[-2] in cases:
                case_id = c[-2].replace('-', '.') # Make safe for R
                sample_type = 'Tumor' if 'SolidTissueNormal' not in c else 'Normal' 
                label = f'{case_id}_{sample_type}_RNA_{disease}_{c[-1].replace("-", ".")}'
                d_rna_df[label] = rna_df[col].values
                case_to_column.append([col, label])
    for col in meth_df.columns:
        c = col.split('_')
        if len(c) > 3:
            if c[-2] in cases:
                case_id = c[-2].replace('-', '.') # Make safe for R
                sample_type = 'Tumor' if 'SolidTissueNormal' not in c else 'Normal' 
                label = f'{case_id}_{sample_type}_CpG_{disease}_{c[-1].replace("-", ".")}'
                d_meth_df[label] = meth_df[col].values
                case_to_column.append([col, label])

    print("DONE", disease)
    
d_meth_df.to_csv(f'{output_dir}DNAMethylation.csv', index=False)
d_rna_df.to_csv(f'{output_dir}RNA.csv', index=False)

DONE AcuteMyeloidLeukemia
DONE BreastInvasiveCarcinoma


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,

  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_in

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

DONE ClearCellRenalCellCarcinoma


  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

DONE HeadandNeckSquamousCellCarcinoma


  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_

DONE LungAdenocarcinoma


  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

DONE LungSquamousCellCarcinoma


  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

DONE PancreaticDuctalAdenocarcinoma


  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label] = rna_df[col].values
  d_rna_df[label] = rna_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_rna_df[label

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_meth_df[label] = meth_df[col].values
  d_meth_df[label] = meth_df[col].values
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  d_me

DONE UterineCorpusEndometrialCarcinoma


# Make a clean patient sample dataset for each of the cancers 

In [95]:
# Get all the cases that were included
cases = [c[1].split('_')[0].replace('.', '-') for c in case_to_column]
case_df = df[df['case_submitter_id'].isin(cases)]
case_df

Unnamed: 0,Case ID,Cases Submitter ID,Related Entities,Annotation,Genomic and Imaging Data Resource,Ethnicity,Gender,Race,Morphology,Primary Diagnosis,...,treatment_arm,treatment_dose,treatment_dose_units,treatment_effect,treatment_effect_indicator,treatment_frequency,treatment_intent_type,treatment_or_therapy,treatment_outcome,treatment_type
36,df4ed85e-8f98-11ea-b1fd-0aad30af8a83,C3N-01946,,,GDC: https://portal.gdc.cancer.gov/cases/14b0b...,Not Reported,Male,White,8070/3,"Squamous cell carcinoma, NOS",...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
37,df4ecd30-8f98-11ea-b1fd-0aad30af8a83,C3N-01754,,,GDC: https://portal.gdc.cancer.gov/cases/a18e0...,Not Reported,Male,White,8070/3,"Squamous cell carcinoma, NOS",...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
38,df4e9d3d-8f98-11ea-b1fd-0aad30af8a83,C3L-01138,,,GDC: https://portal.gdc.cancer.gov/cases/93160...,Not Reported,Male,Other,8070/3,"Squamous cell carcinoma, NOS",...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
39,df4f1689-8f98-11ea-b1fd-0aad30af8a83,C3N-03888,,,GDC: https://portal.gdc.cancer.gov/cases/0a1de...,Not Reported,Male,Other,8070/3,"Squamous cell carcinoma, NOS",...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
40,df4f238b-8f98-11ea-b1fd-0aad30af8a83,C3N-04280,,,GDC: https://portal.gdc.cancer.gov/cases/1f370...,Not Reported,Male,White,8070/3,"Squamous cell carcinoma, NOS",...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
870,f1ee4435-cf1e-11e9-9a07-0a80fada099c,C3N-02582,,,GDC: https://portal.gdc.cancer.gov/cases/dd186...,Not Reported,Male,Asian,8140/3,"Adenocarcinoma, NOS",...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
871,f1ee455a-cf1e-11e9-9a07-0a80fada099c,C3N-02586,,,GDC: https://portal.gdc.cancer.gov/cases/89190...,Not Reported,Male,Asian,8140/3,"Adenocarcinoma, NOS",...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
872,f1ee4684-cf1e-11e9-9a07-0a80fada099c,C3N-02587,,,GDC: https://portal.gdc.cancer.gov/cases/cd6ed...,Not Reported,Female,Asian,8140/3,"Adenocarcinoma, NOS",...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--
873,f1ee47a8-cf1e-11e9-9a07-0a80fada099c,C3N-02588,,,GDC: https://portal.gdc.cancer.gov/cases/86058...,Not Reported,Male,Asian,8140/3,"Adenocarcinoma, NOS",...,'--,'--,'--,'--,'--,'--,'--,'--,'--,'--


In [96]:
print('\n'.join(list(case_df.columns)))

Case ID
Cases Submitter ID
Related Entities
Annotation
Genomic and Imaging Data Resource
Ethnicity
Gender
Race
Morphology
Primary Diagnosis
Site of Resection or Biopsy
Tissue or Organ of Origin
Tumor Grade
Tumor Stage
Age at Diagnosis
Classification of Tumor
Days to Recurrence
Disease Type
Primary Site
Program Name
Project Name
Status
Cause of Death
Days to Birth
Days to Death
Vital Status
Year of Birth
Year of Death
Days to Last Follow Up
Days to Last Known Disease Status
Last Known Disease Status
Progression or Recurrence
Prior Malignancy
AJCC Clinical M
AJCC Clinical N
AJCC Clinical Stage
AJCC Clinical T
AJCC Pathologic M
AJCC Pathologic N
AJCC Pathologic Stage
AJCC Pathologic T
AJCC Staging System Edition
Ann Arbor B Symptoms
Ann Arbor Clinical Stage
Ann Arbor Extranodal Involvement
Ann Arbor Pathologic Stage
Best Overall Response
Burkitt Lymphoma Clinical Variant
Circumferential Resection Margin
Colon Polups History
Days to Best Overall
Days to Diagnosis
Days to HIV Diagnosis
Days

## Let's add some demographics we want to keep 

1. Case ID: `Cases Submitter ID` i.e. patient ID
2. Gender: `Gender`
3. Race: `Race`
4. Ethnicity: `Ethnicity`
5. Dead/alive: `Days to Death`
6. Tumour stage: `Tumor Stage`
7. Disease type: `Disease Type`
8. Primary Site: `Primary Site`
9. Age: `Days to Birth` --> convert to years

In [97]:
features = ['Cases Submitter ID', 'Gender', 'Race', 'Ethnicity', 'Primary Site', 'Disease Type', 
            'AJCC Pathologic Stage', 'Days to Death', 'Days to Birth']
for f in features:
    u.dp([f])
    print(case_df[f].value_counts())

[94m--------------------------------------------------------------------------------[0m
[94m                              Cases Submitter ID	                               [0m
[94m--------------------------------------------------------------------------------[0m
Cases Submitter ID
C3N-01946    1
C3L-01637    1
C3L-00928    1
C3N-03069    1
C3N-01719    1
            ..
C3N-03877    1
C3N-03424    1
C3L-00904    1
C3L-00993    1
C3N-02729    1
Name: count, Length: 605, dtype: int64
[94m--------------------------------------------------------------------------------[0m
[94m                                    Gender	                                     [0m
[94m--------------------------------------------------------------------------------[0m
Gender
Male      371
Female    234
Name: count, dtype: int64
[94m--------------------------------------------------------------------------------[0m
[94m                                     Race	                                      

In [98]:
# Convert stage (i.e. AJCC Pathologic Stage to Stage I, Stage II, Stage III, Stage IV) and also early & late
# Convert age to years
stage_simple = []
stage_early_late = []
age_born_yrs = []
ages = case_df['Days to Birth'].values
stages = case_df['AJCC Pathologic Stage'].values
for i, stage in enumerate(stages):
    if stage == 'Stage I' or stage == 'Stage IA3' or stage == 'Stage IA' or stage == 'Stage IB':
        stage_simple.append('Stage I')
        stage_early_late.append('Early')
    elif stage == 'Stage IIB' or stage == 'Stage II' or stage == 'Stage IIA':
        stage_simple.append('Stage II')
        stage_early_late.append('Early')
    elif stage == 'Stage III' or stage == 'Stage IIIA' or stage == 'Stage IIIB':
        stage_simple.append('Stage III')
        stage_early_late.append('Late')
    elif stage == 'Stage IV' or stage == 'Stage IVA' or stage == 'Stage IVB':
        stage_simple.append('Stage IV')
        stage_early_late.append('Late')
    else:
        print(stage)
        stage_early_late.append(None)
        stage_simple.append(None)
    try:
        age_born_yrs.append(int(int(ages[i])/365))
    except:
        age_born_yrs.append(None)

Unknown
Unknown
Not Reported
Not Reported
Not Reported
Not Reported
Not Reported


In [99]:
case_df['TumorStage'] = stage_simple
case_df['Stage'] = stage_early_late
case_df['AgeYears'] = age_born_yrs

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  case_df['TumorStage'] = stage_simple
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  case_df['Stage'] = stage_early_late
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  case_df['AgeYears'] = age_born_yrs


In [100]:
features = ['Cases Submitter ID', 'Gender', 'Race', 'Ethnicity', 'Primary Site', 'Disease Type', 
            'AgeYears', 'Stage', 'TumorStage',
            'AJCC Pathologic Stage', 'Days to Death', 'Days to Birth']
for f in features:
    u.dp([f])
    print(case_df[f].value_counts())

[94m--------------------------------------------------------------------------------[0m
[94m                              Cases Submitter ID	                               [0m
[94m--------------------------------------------------------------------------------[0m
Cases Submitter ID
C3N-01946    1
C3L-01637    1
C3L-00928    1
C3N-03069    1
C3N-01719    1
            ..
C3N-03877    1
C3N-03424    1
C3L-00904    1
C3L-00993    1
C3N-02729    1
Name: count, Length: 605, dtype: int64
[94m--------------------------------------------------------------------------------[0m
[94m                                    Gender	                                     [0m
[94m--------------------------------------------------------------------------------[0m
Gender
Male      371
Female    234
Name: count, dtype: int64
[94m--------------------------------------------------------------------------------[0m
[94m                                     Race	                                      

In [157]:
len(case_df)

605

In [101]:
# Fix the ordering to make it easier and save to CSV and also add in the files that were associated with each case
case_to_files = {}
for case_value in case_to_column:
    case = case_value[1].split('_')[0]
    if case_to_files.get(case):
        case_to_files[case].append(case_value[1])
    else:
        case_to_files[case] = []
        case_to_files[case].append(case_value[1])

In [102]:
case_to_files

{'C3L.00907': ['C3L.00907_Normal_RNA_ClearCellRenalCellCarcinoma_ff35024d.0cfa.4cd0.b835.eb2bd7430390',
  'C3L.00907_Tumor_RNA_ClearCellRenalCellCarcinoma_4e894ea9.875e.46fe.80b1.1a605636a848',
  'C3L.00907_Tumor_RNA_ClearCellRenalCellCarcinoma_ffa253ae.7402.4c50.9f5f.d8cb39e46057',
  'C3L.00907_Tumor_RNA_ClearCellRenalCellCarcinoma_154017fa.8ca7.43b6.b417.86b9890083f0',
  'C3L.00907_Tumor_CpG_ClearCellRenalCellCarcinoma_2aedf2e4.ad19.4d0e.b1d6.a0cf38f08ea0',
  'C3L.00907_Tumor_CpG_ClearCellRenalCellCarcinoma_1bef3c9a.d931.4f88.a5e9.ff18bc1b594c',
  'C3L.00907_Tumor_CpG_ClearCellRenalCellCarcinoma_774dafb6.ad12.401e.afd0.ed53ff1179fa',
  'C3L.00907_Normal_CpG_ClearCellRenalCellCarcinoma_dddd3ed8.2b12.4c04.b730.3e6b542eed9d'],
 'C3N.01524': ['C3N.01524_Tumor_RNA_ClearCellRenalCellCarcinoma_8edd2ab4.377e.4d07.879b.b6bac439a29d',
  'C3N.01524_Normal_RNA_ClearCellRenalCellCarcinoma_b27245c6.412c.45c3.b4e5.f7464580097b',
  'C3N.01524_Tumor_RNA_ClearCellRenalCellCarcinoma_aa366c5f.98b2.4a47.

In [103]:
case_files = []
case_file_count = []
safe_cases = []
for case in case_df['Cases Submitter ID'].values:
    try:
        case = case.replace('-', '.')
        safe_cases.append(case)
        if not case_to_files.get(case):
            case_file_count.append(None)
            case_files.append(None)
            print(case)
        else:
            case_file_count.append(len(case_to_files.get(case)))
            case_files.append('|'.join(case_to_files.get(case)))
    except:
        print(case)

In [104]:
case_df['SafeCases'] = safe_cases
case_df['CaseFiles'] = case_files
case_df['CaseFileCounts'] = case_file_count
case_df

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  case_df['SafeCases'] = safe_cases
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  case_df['CaseFiles'] = case_files
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  case_df['CaseFileCounts'] = case_file_count


Unnamed: 0,Case ID,Cases Submitter ID,Related Entities,Annotation,Genomic and Imaging Data Resource,Ethnicity,Gender,Race,Morphology,Primary Diagnosis,...,treatment_intent_type,treatment_or_therapy,treatment_outcome,treatment_type,TumorStage,Stage,AgeYears,SafeCases,CaseFiles,CaseFileCounts
36,df4ed85e-8f98-11ea-b1fd-0aad30af8a83,C3N-01946,,,GDC: https://portal.gdc.cancer.gov/cases/14b0b...,Not Reported,Male,White,8070/3,"Squamous cell carcinoma, NOS",...,'--,'--,'--,'--,Stage II,Early,-64.0,C3N.01946,C3N.01946_Normal_RNA_HeadandNeckSquamousCellCa...,3
37,df4ecd30-8f98-11ea-b1fd-0aad30af8a83,C3N-01754,,,GDC: https://portal.gdc.cancer.gov/cases/a18e0...,Not Reported,Male,White,8070/3,"Squamous cell carcinoma, NOS",...,'--,'--,'--,'--,Stage III,Late,-64.0,C3N.01754,C3N.01754_Normal_RNA_HeadandNeckSquamousCellCa...,3
38,df4e9d3d-8f98-11ea-b1fd-0aad30af8a83,C3L-01138,,,GDC: https://portal.gdc.cancer.gov/cases/93160...,Not Reported,Male,Other,8070/3,"Squamous cell carcinoma, NOS",...,'--,'--,'--,'--,Stage IV,Late,-62.0,C3L.01138,C3L.01138_Tumor_RNA_HeadandNeckSquamousCellCar...,5
39,df4f1689-8f98-11ea-b1fd-0aad30af8a83,C3N-03888,,,GDC: https://portal.gdc.cancer.gov/cases/0a1de...,Not Reported,Male,Other,8070/3,"Squamous cell carcinoma, NOS",...,'--,'--,'--,'--,Stage III,Late,-58.0,C3N.03888,C3N.03888_Tumor_RNA_HeadandNeckSquamousCellCar...,5
40,df4f238b-8f98-11ea-b1fd-0aad30af8a83,C3N-04280,,,GDC: https://portal.gdc.cancer.gov/cases/1f370...,Not Reported,Male,White,8070/3,"Squamous cell carcinoma, NOS",...,'--,'--,'--,'--,Stage II,Early,-66.0,C3N.04280,C3N.04280_Tumor_RNA_HeadandNeckSquamousCellCar...,3
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
870,f1ee4435-cf1e-11e9-9a07-0a80fada099c,C3N-02582,,,GDC: https://portal.gdc.cancer.gov/cases/dd186...,Not Reported,Male,Asian,8140/3,"Adenocarcinoma, NOS",...,'--,'--,'--,'--,Stage II,Early,-77.0,C3N.02582,C3N.02582_Normal_RNA_LungAdenocarcinoma_affd75...,2
871,f1ee455a-cf1e-11e9-9a07-0a80fada099c,C3N-02586,,,GDC: https://portal.gdc.cancer.gov/cases/89190...,Not Reported,Male,Asian,8140/3,"Adenocarcinoma, NOS",...,'--,'--,'--,'--,Stage II,Early,-74.0,C3N.02586,C3N.02586_Normal_RNA_LungAdenocarcinoma_eeea13...,2
872,f1ee4684-cf1e-11e9-9a07-0a80fada099c,C3N-02587,,,GDC: https://portal.gdc.cancer.gov/cases/cd6ed...,Not Reported,Female,Asian,8140/3,"Adenocarcinoma, NOS",...,'--,'--,'--,'--,Stage I,Early,-59.0,C3N.02587,C3N.02587_Normal_RNA_LungAdenocarcinoma_8b59c6...,2
873,f1ee47a8-cf1e-11e9-9a07-0a80fada099c,C3N-02588,,,GDC: https://portal.gdc.cancer.gov/cases/86058...,Not Reported,Male,Asian,8140/3,"Adenocarcinoma, NOS",...,'--,'--,'--,'--,Stage II,Early,-69.0,C3N.02588,C3N.02588_Normal_RNA_LungAdenocarcinoma_b835c7...,2


In [111]:
case_df['CaseFileCounts'].value_counts()

CaseFileCounts
4     197
2     184
3     122
1      31
5      29
8      22
10      9
6       5
7       3
9       2
12      1
Name: count, dtype: int64

In [112]:
case_df[case_df['CaseFileCounts'] > 8]

Unnamed: 0,Case ID,Cases Submitter ID,Related Entities,Annotation,Genomic and Imaging Data Resource,Ethnicity,Gender,Race,Morphology,Primary Diagnosis,...,treatment_intent_type,treatment_or_therapy,treatment_outcome,treatment_type,TumorStage,Stage,AgeYears,SafeCases,CaseFiles,CaseFileCounts
519,6386852c-1fb9-11e9-b7f8-0a80fada099c,C3N-00150,,,GDC: https://portal.gdc.cancer.gov/cases/6ff70...,Not Reported,Female,White,8312/3,"Renal cell carcinoma, NOS",...,'--,'--,'--,'--,Stage IV,Late,-55.0,C3N.00150,C3N.00150_Tumor_RNA_ClearCellRenalCellCarcinom...,10
536,675d0c38-1fb9-11e9-b7f8-0a80fada099c,C3N-00168,,,GDC: https://portal.gdc.cancer.gov/cases/2d1ff...,Not Reported,Male,Asian,8312/3,"Renal cell carcinoma, NOS",...,'--,'--,'--,'--,Stage I,Early,-47.0,C3N.00168,C3N.00168_Normal_RNA_ClearCellRenalCellCarcino...,10
545,8cbd7a01-1fb9-11e9-b7f8-0a80fada099c,C3N-00573,,,GDC: https://portal.gdc.cancer.gov/cases/a0d5a...,Not Reported,Male,Asian,8312/3,"Renal cell carcinoma, NOS",...,'--,'--,'--,'--,Stage II,Early,-61.0,C3N.00573,C3N.00573_Normal_RNA_ClearCellRenalCellCarcino...,10
553,8e59b323-1fb9-11e9-b7f8-0a80fada099c,C3N-00577,,,GDC: https://portal.gdc.cancer.gov/cases/262b9...,Not Reported,Male,Asian,8312/3,"Renal cell carcinoma, NOS",...,'--,'--,'--,'--,Stage IV,Late,-72.0,C3N.00577,C3N.00577_Normal_RNA_ClearCellRenalCellCarcino...,10
555,901a5db5-1fb9-11e9-b7f8-0a80fada099c,C3N-00646,,,GDC: https://portal.gdc.cancer.gov/cases/68daa...,Not Reported,Female,White,8312/3,"Renal cell carcinoma, NOS",...,'--,'--,'--,'--,Stage I,Early,-57.0,C3N.00646,C3N.00646_Tumor_RNA_ClearCellRenalCellCarcinom...,10
560,78a71616-1fb9-11e9-b7f8-0a80fada099c,C3N-00314,,,GDC: https://portal.gdc.cancer.gov/cases/3fe41...,Not Reported,Male,White,8312/3,"Renal cell carcinoma, NOS",...,'--,'--,'--,'--,Stage I,Early,-79.0,C3N.00314,C3N.00314_Normal_RNA_ClearCellRenalCellCarcino...,10
561,73b649eb-1fb9-11e9-b7f8-0a80fada099c,C3N-00310,,,GDC: https://portal.gdc.cancer.gov/cases/2f344...,Not Reported,Male,White,8312/3,"Renal cell carcinoma, NOS",...,'--,'--,'--,'--,Stage III,Late,-84.0,C3N.00310,C3N.00310_Tumor_RNA_ClearCellRenalCellCarcinom...,10
571,6039aa8e-1fb9-11e9-b7f8-0a80fada099c,C3N-00148,,,GDC: https://portal.gdc.cancer.gov/cases/0625c...,Not Reported,Male,White,8312/3,"Renal cell carcinoma, NOS",...,'--,'--,'--,'--,Stage I,Early,-52.0,C3N.00148,C3N.00148_Tumor_RNA_ClearCellRenalCellCarcinom...,10
576,810c2c81-1fb9-11e9-b7f8-0a80fada099c,C3N-00390,,,GDC: https://portal.gdc.cancer.gov/cases/a7b5e...,Not Reported,Male,Other,8312/3,"Renal cell carcinoma, NOS",...,'--,'--,'--,'--,Stage IV,Late,-58.0,C3N.00390,C3N.00390_Tumor_RNA_ClearCellRenalCellCarcinom...,10
593,7d95243f-1fb9-11e9-b7f8-0a80fada099c,C3N-00320,,,GDC: https://portal.gdc.cancer.gov/cases/ceae0...,Not Reported,Male,White,8312/3,"Renal cell carcinoma, NOS",...,'--,'--,'--,'--,Stage III,Late,-67.0,C3N.00320,C3N.00320_Tumor_RNA_ClearCellRenalCellCarcinom...,9


In [115]:
col_order = ['SafeCases', 'TumorStage', 'Stage', 'AgeYears', 'CaseFiles', 'CaseFileCounts']
case_df = case_df[col_order + [c for c in case_df.columns if c not in col_order]]

In [117]:
case_df.to_csv('PatientInfo.csv', index=False)

# Filter the cases and make sure for each cancer we don't have patient outliers!

Given in my previous experience there are often outliers in the patients let's remove those from both datasets.

It's also important to check teh biospecimen data - make sure patients don't have multiple submissions (since it seems like there are sometimes multiple RNAseq files for the same patient. i.e. if there are multiple submissions let's try and picl the one which is Solid Tissue not Peripheral Blood Componenets.

In [123]:
bio_df = pd.read_csv('biospecimen.cart.2023-07-17/sample.tsv', sep='\t')
bio_df['composition'].value_counts()

composition
Solid Tissue                       3219
Peripheral Blood Components NOS    1687
Buffy Coat                          102
'--                                 100
Name: count, dtype: int64

# Build a RNA and a CpG sample DF

In [158]:
len(set(cpg_sample_df['SafeCases']))

582

In [162]:
len(set(bio_df['sample_id'].values))
bio_sample_map = dict(zip(bio_df['sample_submitter_id'], bio_df['composition']))
sample_df = pd.read_csv(sample_file, sep='\t')
sample_map = dict(zip(sample_df['File ID'], sample_df['Sample ID']))

rna_sample_df = pd.DataFrame()
cpg_sample_df = pd.DataFrame()

rna_tumour_count = []
rna_normal_count = []
cpg_tumour_count = []
cpg_normal_count = []

rna_case_ids = []
rna_samples = []

cpg_case_ids = []
cpg_samples = []

for i, case_id in enumerate(case_df['SafeCases'].values):
    files = case_to_files.get(case_id)
    rna_files = [c for c in files if 'RNA' in c]
    cpg_files = [c for c in files if 'CpG' in c]
    rna_tumour_count.append(len([c for c in rna_files if 'Tumor' in c]))
    rna_normal_count.append(len([c for c in rna_files if 'Normal' in c]))
    cpg_tumour_count.append(len([c for c in cpg_files if 'Tumor' in c]))
    cpg_normal_count.append(len([c for c in cpg_files if 'Normal' in c]))
    # For each of these let's have a add the case to the case Ids
    for r in rna_files:
        s = sample_map.get(r.split('_')[-1].replace('.', '-'))
        if bio_sample_map.get(s) == 'Solid Tissue':
            rna_case_ids.append(case_id)
            rna_samples.append(r)
    for r in cpg_files:
        s = sample_map.get(r.split('_')[-1].replace('.', '-'))
        if bio_sample_map.get(s) == 'Solid Tissue':
            cpg_case_ids.append(case_id)
            cpg_samples.append(r)
rna_sample_df['SafeCases'] = rna_case_ids
rna_sample_df['Sample'] = rna_samples
cpg_sample_df['SafeCases'] = cpg_case_ids
cpg_sample_df['Sample'] = cpg_samples
cpg_sample_df

Unnamed: 0,SafeCases,Sample
0,C3N.01946,C3N.01946_Tumor_CpG_HeadandNeckSquamousCellCar...
1,C3N.01754,C3N.01754_Normal_CpG_HeadandNeckSquamousCellCa...
2,C3L.01138,C3L.01138_Tumor_CpG_HeadandNeckSquamousCellCar...
3,C3L.01138,C3L.01138_Normal_CpG_HeadandNeckSquamousCellCa...
4,C3N.03888,C3N.03888_Tumor_CpG_HeadandNeckSquamousCellCar...
...,...,...
942,C3N.02582,C3N.02582_Normal_CpG_LungAdenocarcinoma_02b912...
943,C3N.02586,C3N.02586_Normal_CpG_LungAdenocarcinoma_d4ed07...
944,C3N.02587,C3N.02587_Normal_CpG_LungAdenocarcinoma_36dec5...
945,C3N.02588,C3N.02588_Normal_CpG_LungAdenocarcinoma_496143...


In [170]:
# Now we also want to get the different sample things like sample type, disease, stage & age
cpg_sample_df = pd.merge(cpg_sample_df, case_df, how='left', on='SafeCases')
cpg_sample_df['CondID'] = [1 if 'Tumor' in c else 0 for c in cpg_sample_df['Sample'].values]
cpg_sample_df['Disease'] = [c.split('_')[3] for c in cpg_sample_df['Sample'].values]


rna_sample_df = pd.merge(rna_sample_df, case_df, how='left', on='SafeCases')
rna_sample_df['CondID'] = [1 if 'Tumor' in c else 0 for c in rna_sample_df['Sample'].values]
rna_sample_df['Disease'] = [c.split('_')[3] for c in rna_sample_df['Sample'].values]

rna_sample_df.to_csv('rna_sample_df.csv', index=False)
cpg_sample_df.to_csv('cpg_sample_df.csv', index=False)


In [171]:
cpg_sample_df['Disease'].value_counts()

Disease
ClearCellRenalCellCarcinoma          257
LungSquamousCellCarcinoma            173
LungAdenocarcinoma                   171
PancreaticDuctalAdenocarcinoma       135
HeadandNeckSquamousCellCarcinoma     120
UterineCorpusEndometrialCarcinoma     91
Name: count, dtype: int64

In [175]:
cpg_sample_df

Unnamed: 0,SafeCases,Sample,TumorStage_x,Stage_x,AgeYears_x,CaseFiles_x,CaseFileCounts_x,Case ID_x,Cases Submitter ID_x,Related Entities_x,...,treatment_dose_y,treatment_dose_units_y,treatment_effect_y,treatment_effect_indicator_y,treatment_frequency_y,treatment_intent_type_y,treatment_or_therapy_y,treatment_outcome_y,treatment_type_y,Disease
0,C3N.01946,C3N.01946_Tumor_CpG_HeadandNeckSquamousCellCar...,Stage II,Early,-64.0,C3N.01946_Normal_RNA_HeadandNeckSquamousCellCa...,3,df4ed85e-8f98-11ea-b1fd-0aad30af8a83,C3N-01946,,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,HeadandNeckSquamousCellCarcinoma
1,C3N.01754,C3N.01754_Normal_CpG_HeadandNeckSquamousCellCa...,Stage III,Late,-64.0,C3N.01754_Normal_RNA_HeadandNeckSquamousCellCa...,3,df4ecd30-8f98-11ea-b1fd-0aad30af8a83,C3N-01754,,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,HeadandNeckSquamousCellCarcinoma
2,C3L.01138,C3L.01138_Tumor_CpG_HeadandNeckSquamousCellCar...,Stage IV,Late,-62.0,C3L.01138_Tumor_RNA_HeadandNeckSquamousCellCar...,5,df4e9d3d-8f98-11ea-b1fd-0aad30af8a83,C3L-01138,,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,HeadandNeckSquamousCellCarcinoma
3,C3L.01138,C3L.01138_Normal_CpG_HeadandNeckSquamousCellCa...,Stage IV,Late,-62.0,C3L.01138_Tumor_RNA_HeadandNeckSquamousCellCar...,5,df4e9d3d-8f98-11ea-b1fd-0aad30af8a83,C3L-01138,,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,HeadandNeckSquamousCellCarcinoma
4,C3N.03888,C3N.03888_Tumor_CpG_HeadandNeckSquamousCellCar...,Stage III,Late,-58.0,C3N.03888_Tumor_RNA_HeadandNeckSquamousCellCar...,5,df4f1689-8f98-11ea-b1fd-0aad30af8a83,C3N-03888,,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,HeadandNeckSquamousCellCarcinoma
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
942,C3N.02582,C3N.02582_Normal_CpG_LungAdenocarcinoma_02b912...,Stage II,Early,-77.0,C3N.02582_Normal_RNA_LungAdenocarcinoma_affd75...,2,f1ee4435-cf1e-11e9-9a07-0a80fada099c,C3N-02582,,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,LungAdenocarcinoma
943,C3N.02586,C3N.02586_Normal_CpG_LungAdenocarcinoma_d4ed07...,Stage II,Early,-74.0,C3N.02586_Normal_RNA_LungAdenocarcinoma_eeea13...,2,f1ee455a-cf1e-11e9-9a07-0a80fada099c,C3N-02586,,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,LungAdenocarcinoma
944,C3N.02587,C3N.02587_Normal_CpG_LungAdenocarcinoma_36dec5...,Stage I,Early,-59.0,C3N.02587_Normal_RNA_LungAdenocarcinoma_8b59c6...,2,f1ee4684-cf1e-11e9-9a07-0a80fada099c,C3N-02587,,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,LungAdenocarcinoma
945,C3N.02588,C3N.02588_Normal_CpG_LungAdenocarcinoma_496143...,Stage II,Early,-69.0,C3N.02588_Normal_RNA_LungAdenocarcinoma_b835c7...,2,f1ee47a8-cf1e-11e9-9a07-0a80fada099c,C3N-02588,,...,'--,'--,'--,'--,'--,'--,'--,'--,'--,LungAdenocarcinoma
