# Flair Transcript Quantification Results Counts to TPM Conversion

This notebook tests the conversion algorithm from raw transcript counts to TPM. The dataset used in this notebook is from the GTEx V9 database.

## Part 1: Import Data and Configure Python Libraries

In [1]:
import os
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import matplotlib.gridspec
%matplotlib inline
import seaborn as sns
import re
from IPython.display import display
from matplotlib.pyplot import gcf
from sklearn.decomposition import PCA 
from sklearn.preprocessing import StandardScaler
from PIL import ImageColor
from matplotlib.patches import Patch #for custom legend making
import scipy.spatial as sp, scipy.cluster.hierarchy as hc #for faster computing of hierarchial clusters

In [2]:
import warnings
warnings.filterwarnings('ignore')

### Import Data

In [3]:
os.getcwd()

'C:\\Users\\15082\\OneDrive\\Desktop\\thesis_research\\gtex_v9_data_analysis\\FLAIR\\work_in_progress'

In [4]:
data_dir = 'gtex_v9_data\\data_for_analysis\\gtex_database_data'

In [5]:
flair_raw_quant_results_file_path = os.path.join(data_dir, 'gtexdb_flair_filter_transcript_raw_counts.txt')

#### Flair Transcript Quantification Data (in raw counts)

In [6]:
# change working directory
os.chdir('C:\\Users\\15082\\OneDrive\\Desktop\\thesis_research')

In [7]:
flair_quant_data = pd.read_csv(flair_raw_quant_results_file_path,sep='\t')

In [8]:
flair_quant_data.head(5)

Unnamed: 0,transcript,GTEX-1192X-0011-R10a-SM-4RXXZ,GTEX-11H98-0011-R11b-SM-4SFLZ,GTEX-11TTK-0011-R7b-SM-4TVFS,GTEX-1211K-0826-SM-7LDFQ,GTEX-1313W-0011-R7b-SM-4ZL3U,GTEX-13QBU-0426-SM-5A4VT,GTEX-13QJ3-0726-SM-7LDHS,GTEX-13QJ3-0726-SM-7LDHS_rep,GTEX-13RTJ-0011-R7b-SM-5CTCB,...,GTEX-QV44-0008-SM-3QNG7_ctrl2,GTEX-QV44-0008-SM-3QNG7_exp,GTEX-S4Z8-0008-SM-2Y983_ctrl,GTEX-S4Z8-0008-SM-2Y983_exp1,GTEX-S4Z8-0008-SM-2Y983_exp2,GTEX-S95S-0008-SM-3RQ8B_ctrl,GTEX-S95S-0008-SM-3RQ8B_exp1,GTEX-S95S-0008-SM-3RQ8B_exp2,GTEX-WY7C-0008-SM-3NZB5_ctrl,GTEX-WY7C-0008-SM-3NZB5_exp
0,000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000...,0,0,0,0,0,0,0,0,0,...,1,1,1,2,0,0,0,1,0,1
1,00026598-3078-4e2f-8ac9-dd8f523396b9_ENSG00000...,0,0,0,0,0,0,0,0,0,...,0,1,0,0,1,1,0,1,0,1
2,0002a5e2-f01a-4690-a7db-7af726712a5e_ENSG00000...,1,18,2,9,1,11,11,5,1,...,26,34,17,26,36,48,32,53,8,29
3,000339f1-1769-4608-b369-59aa222cd7b7_ENSG00000...,0,1,0,2,0,0,0,0,3,...,2,1,1,2,4,1,2,2,2,3
4,0003706a-94a7-4419-a61d-6310d7a9c10c_ENSG00000...,39,62,18,8,6,20,27,24,17,...,17,20,15,22,23,25,16,35,42,18


In [9]:
flair_quant_data.shape

(93630, 93)

#### Transcript Length Table

In [10]:
transcript_length_file_path = os.path.join(data_dir, 'transcript_length_df.csv')

In [11]:
transcript_length_df = pd.read_csv(transcript_length_file_path)

In [12]:
transcript_length_df.head(3)

Unnamed: 0.1,Unnamed: 0,isoform,gene,length,composite_id
0,0,dfe30c5c-ddd7-4ee8-a9ba-74556bd9dd87_chr10:628000,chr10:628000,2618,dfe30c5c-ddd7-4ee8-a9ba-74556bd9dd87_chr10:628...
1,1,01252fde-2aa4-4b0d-99f6-c95a4efcc758_chr10:650000,chr10:649000,2709,01252fde-2aa4-4b0d-99f6-c95a4efcc758_chr10:650...
2,2,5d705740-efaf-4cd9-9b68-71d6b775a3be_chr10:306...,chr10:3069000,1026,5d705740-efaf-4cd9-9b68-71d6b775a3be_chr10:306...


In [13]:
transcript_length_df.shape

(93709, 5)

In [14]:
transcript_length_df.composite_id

0        dfe30c5c-ddd7-4ee8-a9ba-74556bd9dd87_chr10:628...
1        01252fde-2aa4-4b0d-99f6-c95a4efcc758_chr10:650...
2        5d705740-efaf-4cd9-9b68-71d6b775a3be_chr10:306...
3        115765b8-4233-49bb-a2bf-93683ac4e094_chr10:313...
4        6d54e9f3-0815-4ea6-a878-1ef2947c1cd0_chr10:482...
                               ...                        
93704    4a6b98d8-7f76-425f-a663-a7d3e4826c05_ENSG00000...
93705                ENST00000250784.12_ENSG00000129824.15
93706    bea576a7-6c87-43f3-8a92-1bbf2af9df4f_ENSG00000...
93707    82867362-1175-4171-9e9d-620fb01ad65d_ENSG00000...
93708    141285fb-d028-4740-a9d9-f04a28fbaef1_ENSG00000...
Name: composite_id, Length: 93709, dtype: object

In [15]:
transcript_length_clean_df = transcript_length_df[['composite_id','length']]

In [16]:
transcript_length_clean_df.head(3)

Unnamed: 0,composite_id,length
0,dfe30c5c-ddd7-4ee8-a9ba-74556bd9dd87_chr10:628...,2618
1,01252fde-2aa4-4b0d-99f6-c95a4efcc758_chr10:650...,2709
2,5d705740-efaf-4cd9-9b68-71d6b775a3be_chr10:306...,1026


## Part 2: Data Cleaning and Manipulation

### Merge transcript quantification raw counts dataframe with the transcript length table

In [17]:
transcript_counts_with_length_df = flair_quant_data.merge(transcript_length_clean_df,how='inner',
                                                                         left_on='transcript',right_on='composite_id')

In [18]:
transcript_counts_with_length_df.head(5)

Unnamed: 0,transcript,GTEX-1192X-0011-R10a-SM-4RXXZ,GTEX-11H98-0011-R11b-SM-4SFLZ,GTEX-11TTK-0011-R7b-SM-4TVFS,GTEX-1211K-0826-SM-7LDFQ,GTEX-1313W-0011-R7b-SM-4ZL3U,GTEX-13QBU-0426-SM-5A4VT,GTEX-13QJ3-0726-SM-7LDHS,GTEX-13QJ3-0726-SM-7LDHS_rep,GTEX-13RTJ-0011-R7b-SM-5CTCB,...,GTEX-S4Z8-0008-SM-2Y983_ctrl,GTEX-S4Z8-0008-SM-2Y983_exp1,GTEX-S4Z8-0008-SM-2Y983_exp2,GTEX-S95S-0008-SM-3RQ8B_ctrl,GTEX-S95S-0008-SM-3RQ8B_exp1,GTEX-S95S-0008-SM-3RQ8B_exp2,GTEX-WY7C-0008-SM-3NZB5_ctrl,GTEX-WY7C-0008-SM-3NZB5_exp,composite_id,length
0,000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000...,0,0,0,0,0,0,0,0,0,...,1,2,0,0,0,1,0,1,000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000...,3811
1,00026598-3078-4e2f-8ac9-dd8f523396b9_ENSG00000...,0,0,0,0,0,0,0,0,0,...,0,0,1,1,0,1,0,1,00026598-3078-4e2f-8ac9-dd8f523396b9_ENSG00000...,1706
2,0002a5e2-f01a-4690-a7db-7af726712a5e_ENSG00000...,1,18,2,9,1,11,11,5,1,...,17,26,36,48,32,53,8,29,0002a5e2-f01a-4690-a7db-7af726712a5e_ENSG00000...,1917
3,000339f1-1769-4608-b369-59aa222cd7b7_ENSG00000...,0,1,0,2,0,0,0,0,3,...,1,2,4,1,2,2,2,3,000339f1-1769-4608-b369-59aa222cd7b7_ENSG00000...,3413
4,0003706a-94a7-4419-a61d-6310d7a9c10c_ENSG00000...,39,62,18,8,6,20,27,24,17,...,15,22,23,25,16,35,42,18,0003706a-94a7-4419-a61d-6310d7a9c10c_ENSG00000...,1095


In [19]:
transcript_counts_with_length_df.shape

(93621, 95)

In [20]:
if transcript_counts_with_length_df.isna().values.any():
    print("There are NaN values in the DataFrame.")
else:
    print("There are no NaN values in the DataFrame.")

There are no NaN values in the DataFrame.


In [21]:
# shift column 'length' to second position
length_column = transcript_counts_with_length_df.pop('length')
transcript_counts_with_length_df.insert(1, 'transcript_length', length_column)

In [22]:
transcript_counts_with_length_df.head(3)

Unnamed: 0,transcript,transcript_length,GTEX-1192X-0011-R10a-SM-4RXXZ,GTEX-11H98-0011-R11b-SM-4SFLZ,GTEX-11TTK-0011-R7b-SM-4TVFS,GTEX-1211K-0826-SM-7LDFQ,GTEX-1313W-0011-R7b-SM-4ZL3U,GTEX-13QBU-0426-SM-5A4VT,GTEX-13QJ3-0726-SM-7LDHS,GTEX-13QJ3-0726-SM-7LDHS_rep,...,GTEX-QV44-0008-SM-3QNG7_exp,GTEX-S4Z8-0008-SM-2Y983_ctrl,GTEX-S4Z8-0008-SM-2Y983_exp1,GTEX-S4Z8-0008-SM-2Y983_exp2,GTEX-S95S-0008-SM-3RQ8B_ctrl,GTEX-S95S-0008-SM-3RQ8B_exp1,GTEX-S95S-0008-SM-3RQ8B_exp2,GTEX-WY7C-0008-SM-3NZB5_ctrl,GTEX-WY7C-0008-SM-3NZB5_exp,composite_id
0,000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000...,3811,0,0,0,0,0,0,0,0,...,1,1,2,0,0,0,1,0,1,000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000...
1,00026598-3078-4e2f-8ac9-dd8f523396b9_ENSG00000...,1706,0,0,0,0,0,0,0,0,...,1,0,0,1,1,0,1,0,1,00026598-3078-4e2f-8ac9-dd8f523396b9_ENSG00000...
2,0002a5e2-f01a-4690-a7db-7af726712a5e_ENSG00000...,1917,1,18,2,9,1,11,11,5,...,34,17,26,36,48,32,53,8,29,0002a5e2-f01a-4690-a7db-7af726712a5e_ENSG00000...


In [23]:
# Delete the last column
transcript_counts_with_length_df = transcript_counts_with_length_df.drop(transcript_counts_with_length_df.columns[-1], axis=1)

In [24]:
transcript_counts_with_length_df.head(3)

Unnamed: 0,transcript,transcript_length,GTEX-1192X-0011-R10a-SM-4RXXZ,GTEX-11H98-0011-R11b-SM-4SFLZ,GTEX-11TTK-0011-R7b-SM-4TVFS,GTEX-1211K-0826-SM-7LDFQ,GTEX-1313W-0011-R7b-SM-4ZL3U,GTEX-13QBU-0426-SM-5A4VT,GTEX-13QJ3-0726-SM-7LDHS,GTEX-13QJ3-0726-SM-7LDHS_rep,...,GTEX-QV44-0008-SM-3QNG7_ctrl2,GTEX-QV44-0008-SM-3QNG7_exp,GTEX-S4Z8-0008-SM-2Y983_ctrl,GTEX-S4Z8-0008-SM-2Y983_exp1,GTEX-S4Z8-0008-SM-2Y983_exp2,GTEX-S95S-0008-SM-3RQ8B_ctrl,GTEX-S95S-0008-SM-3RQ8B_exp1,GTEX-S95S-0008-SM-3RQ8B_exp2,GTEX-WY7C-0008-SM-3NZB5_ctrl,GTEX-WY7C-0008-SM-3NZB5_exp
0,000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000...,3811,0,0,0,0,0,0,0,0,...,1,1,1,2,0,0,0,1,0,1
1,00026598-3078-4e2f-8ac9-dd8f523396b9_ENSG00000...,1706,0,0,0,0,0,0,0,0,...,0,1,0,0,1,1,0,1,0,1
2,0002a5e2-f01a-4690-a7db-7af726712a5e_ENSG00000...,1917,1,18,2,9,1,11,11,5,...,26,34,17,26,36,48,32,53,8,29


In [25]:
transcript_counts_with_length_df.shape

(93621, 94)

## Part 3: Counts to TPM Conversion

In [26]:
# Define the function to calculate TPM
def calculate_tpm(counts, length):
    return (counts / length) / ((counts.sum()/length)/1000000)

# Apply the function to each cell of the dataframe
transcript_TPM_df = transcript_counts_with_length_df[transcript_counts_with_length_df.\
                    columns[2:]].apply(lambda x: calculate_tpm(x, transcript_counts_with_length_df['transcript_length']))

In [27]:
transcript_TPM_df.head(5)

Unnamed: 0,GTEX-1192X-0011-R10a-SM-4RXXZ,GTEX-11H98-0011-R11b-SM-4SFLZ,GTEX-11TTK-0011-R7b-SM-4TVFS,GTEX-1211K-0826-SM-7LDFQ,GTEX-1313W-0011-R7b-SM-4ZL3U,GTEX-13QBU-0426-SM-5A4VT,GTEX-13QJ3-0726-SM-7LDHS,GTEX-13QJ3-0726-SM-7LDHS_rep,GTEX-13RTJ-0011-R7b-SM-5CTCB,GTEX-13VXU-0011-R11b-SM-5BFQZ,...,GTEX-QV44-0008-SM-3QNG7_ctrl2,GTEX-QV44-0008-SM-3QNG7_exp,GTEX-S4Z8-0008-SM-2Y983_ctrl,GTEX-S4Z8-0008-SM-2Y983_exp1,GTEX-S4Z8-0008-SM-2Y983_exp2,GTEX-S95S-0008-SM-3RQ8B_ctrl,GTEX-S95S-0008-SM-3RQ8B_exp1,GTEX-S95S-0008-SM-3RQ8B_exp2,GTEX-WY7C-0008-SM-3NZB5_ctrl,GTEX-WY7C-0008-SM-3NZB5_exp
0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.275591,...,0.335124,0.359675,0.421937,0.974555,0.0,0.0,0.0,0.263975,0.0,0.39919
1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.359675,0.0,0.0,0.278891,0.295382,0.0,0.263975,0.0,0.39919
2,0.385601,5.439593,2.056247,4.607019,1.904958,7.441563,6.472077,2.423809,0.678189,1.377953,...,8.713227,12.228962,7.172935,12.669219,10.040063,14.178322,13.925607,13.990673,1.732832,11.576504
3,0.0,0.3022,0.0,1.023782,0.0,0.0,0.0,0.0,2.034566,0.551181,...,0.670248,0.359675,0.421937,0.974555,1.115563,0.295382,0.87035,0.52795,0.433208,1.197569
4,15.038446,18.736376,18.506219,4.095128,11.429747,13.530115,15.886007,11.634282,11.529207,20.944879,...,5.69711,7.193507,6.329061,10.720109,6.414484,7.384543,6.962803,9.239124,9.097366,7.185416


In [28]:
transcript_TPM_with_ID_df = pd.concat([transcript_TPM_df, transcript_counts_with_length_df['transcript']], axis=1)

In [29]:
transcript_TPM_with_ID_df.head(5)

Unnamed: 0,GTEX-1192X-0011-R10a-SM-4RXXZ,GTEX-11H98-0011-R11b-SM-4SFLZ,GTEX-11TTK-0011-R7b-SM-4TVFS,GTEX-1211K-0826-SM-7LDFQ,GTEX-1313W-0011-R7b-SM-4ZL3U,GTEX-13QBU-0426-SM-5A4VT,GTEX-13QJ3-0726-SM-7LDHS,GTEX-13QJ3-0726-SM-7LDHS_rep,GTEX-13RTJ-0011-R7b-SM-5CTCB,GTEX-13VXU-0011-R11b-SM-5BFQZ,...,GTEX-QV44-0008-SM-3QNG7_exp,GTEX-S4Z8-0008-SM-2Y983_ctrl,GTEX-S4Z8-0008-SM-2Y983_exp1,GTEX-S4Z8-0008-SM-2Y983_exp2,GTEX-S95S-0008-SM-3RQ8B_ctrl,GTEX-S95S-0008-SM-3RQ8B_exp1,GTEX-S95S-0008-SM-3RQ8B_exp2,GTEX-WY7C-0008-SM-3NZB5_ctrl,GTEX-WY7C-0008-SM-3NZB5_exp,transcript
0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.275591,...,0.359675,0.421937,0.974555,0.0,0.0,0.0,0.263975,0.0,0.39919,000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000...
1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.359675,0.0,0.0,0.278891,0.295382,0.0,0.263975,0.0,0.39919,00026598-3078-4e2f-8ac9-dd8f523396b9_ENSG00000...
2,0.385601,5.439593,2.056247,4.607019,1.904958,7.441563,6.472077,2.423809,0.678189,1.377953,...,12.228962,7.172935,12.669219,10.040063,14.178322,13.925607,13.990673,1.732832,11.576504,0002a5e2-f01a-4690-a7db-7af726712a5e_ENSG00000...
3,0.0,0.3022,0.0,1.023782,0.0,0.0,0.0,0.0,2.034566,0.551181,...,0.359675,0.421937,0.974555,1.115563,0.295382,0.87035,0.52795,0.433208,1.197569,000339f1-1769-4608-b369-59aa222cd7b7_ENSG00000...
4,15.038446,18.736376,18.506219,4.095128,11.429747,13.530115,15.886007,11.634282,11.529207,20.944879,...,7.193507,6.329061,10.720109,6.414484,7.384543,6.962803,9.239124,9.097366,7.185416,0003706a-94a7-4419-a61d-6310d7a9c10c_ENSG00000...


In [30]:
# shift column 'transcript' to first position
transcript_id_column = transcript_TPM_with_ID_df.pop('transcript')
transcript_TPM_with_ID_df.insert(0, 'transcript', transcript_id_column)

In [31]:
transcript_TPM_with_ID_df.head(3)

Unnamed: 0,transcript,GTEX-1192X-0011-R10a-SM-4RXXZ,GTEX-11H98-0011-R11b-SM-4SFLZ,GTEX-11TTK-0011-R7b-SM-4TVFS,GTEX-1211K-0826-SM-7LDFQ,GTEX-1313W-0011-R7b-SM-4ZL3U,GTEX-13QBU-0426-SM-5A4VT,GTEX-13QJ3-0726-SM-7LDHS,GTEX-13QJ3-0726-SM-7LDHS_rep,GTEX-13RTJ-0011-R7b-SM-5CTCB,...,GTEX-QV44-0008-SM-3QNG7_ctrl2,GTEX-QV44-0008-SM-3QNG7_exp,GTEX-S4Z8-0008-SM-2Y983_ctrl,GTEX-S4Z8-0008-SM-2Y983_exp1,GTEX-S4Z8-0008-SM-2Y983_exp2,GTEX-S95S-0008-SM-3RQ8B_ctrl,GTEX-S95S-0008-SM-3RQ8B_exp1,GTEX-S95S-0008-SM-3RQ8B_exp2,GTEX-WY7C-0008-SM-3NZB5_ctrl,GTEX-WY7C-0008-SM-3NZB5_exp
0,000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.335124,0.359675,0.421937,0.974555,0.0,0.0,0.0,0.263975,0.0,0.39919
1,00026598-3078-4e2f-8ac9-dd8f523396b9_ENSG00000...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.359675,0.0,0.0,0.278891,0.295382,0.0,0.263975,0.0,0.39919
2,0002a5e2-f01a-4690-a7db-7af726712a5e_ENSG00000...,0.385601,5.439593,2.056247,4.607019,1.904958,7.441563,6.472077,2.423809,0.678189,...,8.713227,12.228962,7.172935,12.669219,10.040063,14.178322,13.925607,13.990673,1.732832,11.576504


## Part 4: Results Check

#### For each column (sample), the TPM values should add up to 1,000,000

In [32]:
pd.options.display.max_columns = None
pd.options.display.max_rows = None
pd.options.display.max_colwidth = 100

In [51]:
tpm_sum =transcript_TPM_with_ID_df[transcript_TPM_with_ID_df.columns[1:]].apply(lambda x: x.sum()).tolist()

In [53]:
check_tpm_sum_by_column_result = sum(abs(value-1000000)<0.01 for value in tpm_sum_by_column)

In [54]:
check_tpm_sum_by_column_result

92

#### Check with GTEx V9 database TPM quant results

In [37]:
flair_tpm_quant_results_file_path = os.path.join(data_dir, 'glinos_flair_quant_tpm_results.csv')

In [38]:
flair_tpm_quant_data = pd.read_csv(flair_tpm_quant_results_file_path)

In [39]:
flair_tpm_quant_data.head(3)

Unnamed: 0,transcript,GTEX-1192X-0011-R10a-SM-4RXXZ,GTEX-11H98-0011-R11b-SM-4SFLZ,GTEX-11TTK-0011-R7b-SM-4TVFS,GTEX-1211K-0826-SM-7LDFQ,GTEX-1313W-0011-R7b-SM-4ZL3U,GTEX-13QBU-0426-SM-5A4VT,GTEX-13QJ3-0726-SM-7LDHS,GTEX-13QJ3-0726-SM-7LDHS_rep,GTEX-13RTJ-0011-R7b-SM-5CTCB,GTEX-13VXU-0011-R11b-SM-5BFQZ,GTEX-13X6J-0011-R10b-SM-5CEKT,GTEX-145MH-0011-R3b-SM-5CTCM,GTEX-14BIL-0011-R10a-SM-5EQV4,GTEX-14BMU-0526-SM-5CA2F,GTEX-14BMU-0526-SM-5CA2F_rep,GTEX-14BMU-0526-SM-5CA2F_rep2,GTEX-14C5O-0011-R7b-SM-5GUPO,GTEX-14XAO-0926-SM-5YQWC,GTEX-15DCD-0011-R10b-SM-5S51M,GTEX-15ER7-0011-R5b-SM-5S51V,GTEX-15ER7-0011-R7a-SM-5QYP2,GTEX-15RIE-1726-SM-5V7WB,GTEX-17F97-0011-R11b-SM-63KY2,GTEX-17MFQ-1926-SM-6659L,GTEX-1C64N-0326-SM-6ZHT1,GTEX-1GN1W-0226-SM-7AGLJ,GTEX-1GN1W-0226-SM-7AGLJ_rep,GTEX-1H11D-1226-SM-9P6XJ,GTEX-1H3NZ-0011-R11b-SM-AUNOV,GTEX-1HBPH-0226-SM-7LLUW,GTEX-1I6K7-0626-SM-AAEQW,GTEX-1I6K7-1226-SM-AAEQX,GTEX-1IDJD-1226-SM-AXRWG,GTEX-1IDJD-0226-SM-AML89,GTEX-1IDJF-0826-SM-ABADH,GTEX-1IDJU-0726-SM-BXZK2,GTEX-1KXAM-0426-SM-CYKMP,GTEX-1KXAM-2426-SM-CYKMT,GTEX-1LVA9-0326-SM-CYRXA,GTEX-OHPL-0326-SM-DPSB8,GTEX-OIZI-0008-SM-2FR3P,GTEX-OXRL-0008-SM-2FR3T,GTEX-PSDG-0008-SM-3NZBI,GTEX-Q2AG-0011-R11A-SM-2EBL2,GTEX-Q2AG-0011-R11A-SM-2EBL2_rep,GTEX-Q2AG-0011-R11A-SM-2EBL2_rep2,GTEX-QDT8-0011-R10A-SM-2FKJB,GTEX-R53T-0326-SM-2K8S4,GTEX-S4P3-1326-SM-2QRBQ,GTEX-R55E-0008-SM-3QNG3,GTEX-RWS6-0008-SM-3QHWG_direct,GTEX-RWS6-0008-SM-3QHWG,GTEX-R55E-0008-SM-3QNG3_direct,GTEX-RWS6-0008-SM-3QHWG_rep,GTEX-T5JC-0011-R11A-SM-2TT24,GTEX-T5JC-0011-R10A-SM-2TT23,GTEX-T5JC-0011-R7A-SM-2TT1Z,GTEX-UTHO-2426-SM-38ZXF,GTEX-WFG7-0008-SM-3ML7A,GTEX-WY7C-1126-SM-3GS2X,GTEX-WY7C-1126-SM-3GS2X_rep,GTEX-WY7C-1126-SM-3GS2X_rep2,GTEX-WY7C-0726-SM-3GLGQ,GTEX-WYJK-2426-SM-3H5V1,GTEX-WYVS-0526-SM-3H5V7,GTEX-Y5LM-0426-SM-3YX99,GTEX-Y5LM-0426-SM-3YX99_rep,GTEX-Y5LM-0426-SM-3YX99_rep2,GTEX-ZF29-2026-SM-4TVXH,GTEX-ZPU1-0826-SM-4UJSC,GTEX-ZT9X-0326-SM-4U9QG,GTEX-ZT9X-1826-SM-4V2KV,GTEX-ZT9X-1826-SM-4V2KV_rep,GTEX-ZT9X-1826-SM-4V2KV_rep2,GTEX-ZVZP-0226-SM-4VEIO,K562_ampure,K562_ampure_70ng,K562_extrawash,K562_extrawashwarm,GTEX-QEG5-0008-SM-3QHW2_ctrl,GTEX-QEG5-0008-SM-3QHW2_exp,GTEX-QV44-0008-SM-3QNG7_ctrl1,GTEX-QV44-0008-SM-3QNG7_ctrl2,GTEX-QV44-0008-SM-3QNG7_exp,GTEX-S4Z8-0008-SM-2Y983_ctrl,GTEX-S4Z8-0008-SM-2Y983_exp1,GTEX-S4Z8-0008-SM-2Y983_exp2,GTEX-S95S-0008-SM-3RQ8B_ctrl,GTEX-S95S-0008-SM-3RQ8B_exp1,GTEX-S95S-0008-SM-3RQ8B_exp2,GTEX-WY7C-0008-SM-3NZB5_ctrl,GTEX-WY7C-0008-SM-3NZB5_exp
0,000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000173848.18,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.271232,0.0,0.0,0.0,0.0,0.0,0.0,0.401559,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.855814,0.0,0.0,0.0,0.34776,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.247011,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.172998,0.0,0.0,0.0,3.568258,4.2275,4.134056,0.0,0.0,0.0,0.334328,0.358385,0.420881,0.97198,0.0,0.0,0.0,0.262969,0.0,0.397173
1,00026598-3078-4e2f-8ac9-dd8f523396b9_ENSG00000102893.15_ENSG00000102893.15,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.357341,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.345291,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.292644,0.452385,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.140389,0.0,0.0,0.322937,0.0,0.0,0.0,0.0,0.0,0.0,0.282519,0.0,0.342038,0.0,0.0,0.0,0.0,0.920954,0.0,0.0,0.826811,0.0,0.377575,0.0,0.0,0.358385,0.0,0.0,0.278141,0.294667,0.0,0.262969,0.0,0.397173
2,0002a5e2-f01a-4690-a7db-7af726712a5e_ENSG00000071575.11_ENSG00000071575.11,0.380702,5.359084,1.961873,4.590649,1.793796,7.308494,6.346269,2.378808,0.653233,1.356161,0.0,1.711933,2.473291,2.706481,3.394736,3.11726,2.007797,2.406889,1.40879,0.0,0.921998,3.176194,1.621951,2.031087,2.182747,3.019761,4.142551,1.864178,1.716797,11.361996,11.657984,0.345291,5.990699,2.730105,2.955553,7.782465,0.69552,0.491895,0.459837,1.684399,3.227072,5.267594,1.809538,1.499532,1.387856,1.208018,1.271994,0.22215,2.927223,3.098819,4.965564,2.286598,2.068881,1.898499,2.055162,0.0,0.0,8.116883,4.773238,1.741776,1.450395,1.614686,0.26049,1.235055,1.721758,1.079359,0.446525,0.32937,0.282519,0.343607,3.762416,1.506611,0.518995,1.606998,3.876758,4.604768,7.850167,2.5365,4.960867,16.087012,23.409654,4.534268,8.692515,12.185087,7.154979,12.635743,10.013078,14.144038,13.873059,13.937337,1.727199,11.518015


In [40]:
flair_tpm_quant_data.transcript[0]

'000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000173848.18'

In [41]:
flair_tpm_quant_data[flair_tpm_quant_data.transcript=='000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000173848.18']

Unnamed: 0,transcript,GTEX-1192X-0011-R10a-SM-4RXXZ,GTEX-11H98-0011-R11b-SM-4SFLZ,GTEX-11TTK-0011-R7b-SM-4TVFS,GTEX-1211K-0826-SM-7LDFQ,GTEX-1313W-0011-R7b-SM-4ZL3U,GTEX-13QBU-0426-SM-5A4VT,GTEX-13QJ3-0726-SM-7LDHS,GTEX-13QJ3-0726-SM-7LDHS_rep,GTEX-13RTJ-0011-R7b-SM-5CTCB,GTEX-13VXU-0011-R11b-SM-5BFQZ,GTEX-13X6J-0011-R10b-SM-5CEKT,GTEX-145MH-0011-R3b-SM-5CTCM,GTEX-14BIL-0011-R10a-SM-5EQV4,GTEX-14BMU-0526-SM-5CA2F,GTEX-14BMU-0526-SM-5CA2F_rep,GTEX-14BMU-0526-SM-5CA2F_rep2,GTEX-14C5O-0011-R7b-SM-5GUPO,GTEX-14XAO-0926-SM-5YQWC,GTEX-15DCD-0011-R10b-SM-5S51M,GTEX-15ER7-0011-R5b-SM-5S51V,GTEX-15ER7-0011-R7a-SM-5QYP2,GTEX-15RIE-1726-SM-5V7WB,GTEX-17F97-0011-R11b-SM-63KY2,GTEX-17MFQ-1926-SM-6659L,GTEX-1C64N-0326-SM-6ZHT1,GTEX-1GN1W-0226-SM-7AGLJ,GTEX-1GN1W-0226-SM-7AGLJ_rep,GTEX-1H11D-1226-SM-9P6XJ,GTEX-1H3NZ-0011-R11b-SM-AUNOV,GTEX-1HBPH-0226-SM-7LLUW,GTEX-1I6K7-0626-SM-AAEQW,GTEX-1I6K7-1226-SM-AAEQX,GTEX-1IDJD-1226-SM-AXRWG,GTEX-1IDJD-0226-SM-AML89,GTEX-1IDJF-0826-SM-ABADH,GTEX-1IDJU-0726-SM-BXZK2,GTEX-1KXAM-0426-SM-CYKMP,GTEX-1KXAM-2426-SM-CYKMT,GTEX-1LVA9-0326-SM-CYRXA,GTEX-OHPL-0326-SM-DPSB8,GTEX-OIZI-0008-SM-2FR3P,GTEX-OXRL-0008-SM-2FR3T,GTEX-PSDG-0008-SM-3NZBI,GTEX-Q2AG-0011-R11A-SM-2EBL2,GTEX-Q2AG-0011-R11A-SM-2EBL2_rep,GTEX-Q2AG-0011-R11A-SM-2EBL2_rep2,GTEX-QDT8-0011-R10A-SM-2FKJB,GTEX-R53T-0326-SM-2K8S4,GTEX-S4P3-1326-SM-2QRBQ,GTEX-R55E-0008-SM-3QNG3,GTEX-RWS6-0008-SM-3QHWG_direct,GTEX-RWS6-0008-SM-3QHWG,GTEX-R55E-0008-SM-3QNG3_direct,GTEX-RWS6-0008-SM-3QHWG_rep,GTEX-T5JC-0011-R11A-SM-2TT24,GTEX-T5JC-0011-R10A-SM-2TT23,GTEX-T5JC-0011-R7A-SM-2TT1Z,GTEX-UTHO-2426-SM-38ZXF,GTEX-WFG7-0008-SM-3ML7A,GTEX-WY7C-1126-SM-3GS2X,GTEX-WY7C-1126-SM-3GS2X_rep,GTEX-WY7C-1126-SM-3GS2X_rep2,GTEX-WY7C-0726-SM-3GLGQ,GTEX-WYJK-2426-SM-3H5V1,GTEX-WYVS-0526-SM-3H5V7,GTEX-Y5LM-0426-SM-3YX99,GTEX-Y5LM-0426-SM-3YX99_rep,GTEX-Y5LM-0426-SM-3YX99_rep2,GTEX-ZF29-2026-SM-4TVXH,GTEX-ZPU1-0826-SM-4UJSC,GTEX-ZT9X-0326-SM-4U9QG,GTEX-ZT9X-1826-SM-4V2KV,GTEX-ZT9X-1826-SM-4V2KV_rep,GTEX-ZT9X-1826-SM-4V2KV_rep2,GTEX-ZVZP-0226-SM-4VEIO,K562_ampure,K562_ampure_70ng,K562_extrawash,K562_extrawashwarm,GTEX-QEG5-0008-SM-3QHW2_ctrl,GTEX-QEG5-0008-SM-3QHW2_exp,GTEX-QV44-0008-SM-3QNG7_ctrl1,GTEX-QV44-0008-SM-3QNG7_ctrl2,GTEX-QV44-0008-SM-3QNG7_exp,GTEX-S4Z8-0008-SM-2Y983_ctrl,GTEX-S4Z8-0008-SM-2Y983_exp1,GTEX-S4Z8-0008-SM-2Y983_exp2,GTEX-S95S-0008-SM-3RQ8B_ctrl,GTEX-S95S-0008-SM-3RQ8B_exp1,GTEX-S95S-0008-SM-3RQ8B_exp2,GTEX-WY7C-0008-SM-3NZB5_ctrl,GTEX-WY7C-0008-SM-3NZB5_exp
0,000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000173848.18,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.271232,0.0,0.0,0.0,0.0,0.0,0.0,0.401559,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.855814,0.0,0.0,0.0,0.34776,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.247011,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.172998,0.0,0.0,0.0,3.568258,4.2275,4.134056,0.0,0.0,0.0,0.334328,0.358385,0.420881,0.97198,0.0,0.0,0.0,0.262969,0.0,0.397173


In [42]:
transcript_TPM_with_ID_df[transcript_TPM_with_ID_df.transcript=='000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000173848.18']

Unnamed: 0,transcript,GTEX-1192X-0011-R10a-SM-4RXXZ,GTEX-11H98-0011-R11b-SM-4SFLZ,GTEX-11TTK-0011-R7b-SM-4TVFS,GTEX-1211K-0826-SM-7LDFQ,GTEX-1313W-0011-R7b-SM-4ZL3U,GTEX-13QBU-0426-SM-5A4VT,GTEX-13QJ3-0726-SM-7LDHS,GTEX-13QJ3-0726-SM-7LDHS_rep,GTEX-13RTJ-0011-R7b-SM-5CTCB,GTEX-13VXU-0011-R11b-SM-5BFQZ,GTEX-13X6J-0011-R10b-SM-5CEKT,GTEX-145MH-0011-R3b-SM-5CTCM,GTEX-14BIL-0011-R10a-SM-5EQV4,GTEX-14BMU-0526-SM-5CA2F,GTEX-14BMU-0526-SM-5CA2F_rep,GTEX-14BMU-0526-SM-5CA2F_rep2,GTEX-14C5O-0011-R7b-SM-5GUPO,GTEX-14XAO-0926-SM-5YQWC,GTEX-15DCD-0011-R10b-SM-5S51M,GTEX-15ER7-0011-R5b-SM-5S51V,GTEX-15ER7-0011-R7a-SM-5QYP2,GTEX-15RIE-1726-SM-5V7WB,GTEX-17F97-0011-R11b-SM-63KY2,GTEX-17MFQ-1926-SM-6659L,GTEX-1C64N-0326-SM-6ZHT1,GTEX-1GN1W-0226-SM-7AGLJ,GTEX-1GN1W-0226-SM-7AGLJ_rep,GTEX-1H11D-1226-SM-9P6XJ,GTEX-1H3NZ-0011-R11b-SM-AUNOV,GTEX-1HBPH-0226-SM-7LLUW,GTEX-1I6K7-0626-SM-AAEQW,GTEX-1I6K7-1226-SM-AAEQX,GTEX-1IDJD-1226-SM-AXRWG,GTEX-1IDJD-0226-SM-AML89,GTEX-1IDJF-0826-SM-ABADH,GTEX-1IDJU-0726-SM-BXZK2,GTEX-1KXAM-0426-SM-CYKMP,GTEX-1KXAM-2426-SM-CYKMT,GTEX-1LVA9-0326-SM-CYRXA,GTEX-OHPL-0326-SM-DPSB8,GTEX-OIZI-0008-SM-2FR3P,GTEX-OXRL-0008-SM-2FR3T,GTEX-PSDG-0008-SM-3NZBI,GTEX-Q2AG-0011-R11A-SM-2EBL2,GTEX-Q2AG-0011-R11A-SM-2EBL2_rep,GTEX-Q2AG-0011-R11A-SM-2EBL2_rep2,GTEX-QDT8-0011-R10A-SM-2FKJB,GTEX-R53T-0326-SM-2K8S4,GTEX-S4P3-1326-SM-2QRBQ,GTEX-R55E-0008-SM-3QNG3,GTEX-RWS6-0008-SM-3QHWG_direct,GTEX-RWS6-0008-SM-3QHWG,GTEX-R55E-0008-SM-3QNG3_direct,GTEX-RWS6-0008-SM-3QHWG_rep,GTEX-T5JC-0011-R11A-SM-2TT24,GTEX-T5JC-0011-R10A-SM-2TT23,GTEX-T5JC-0011-R7A-SM-2TT1Z,GTEX-UTHO-2426-SM-38ZXF,GTEX-WFG7-0008-SM-3ML7A,GTEX-WY7C-1126-SM-3GS2X,GTEX-WY7C-1126-SM-3GS2X_rep,GTEX-WY7C-1126-SM-3GS2X_rep2,GTEX-WY7C-0726-SM-3GLGQ,GTEX-WYJK-2426-SM-3H5V1,GTEX-WYVS-0526-SM-3H5V7,GTEX-Y5LM-0426-SM-3YX99,GTEX-Y5LM-0426-SM-3YX99_rep,GTEX-Y5LM-0426-SM-3YX99_rep2,GTEX-ZF29-2026-SM-4TVXH,GTEX-ZPU1-0826-SM-4UJSC,GTEX-ZT9X-0326-SM-4U9QG,GTEX-ZT9X-1826-SM-4V2KV,GTEX-ZT9X-1826-SM-4V2KV_rep,GTEX-ZT9X-1826-SM-4V2KV_rep2,GTEX-ZVZP-0226-SM-4VEIO,K562_ampure,K562_ampure_70ng,K562_extrawash,K562_extrawashwarm,GTEX-QEG5-0008-SM-3QHW2_ctrl,GTEX-QEG5-0008-SM-3QHW2_exp,GTEX-QV44-0008-SM-3QNG7_ctrl1,GTEX-QV44-0008-SM-3QNG7_ctrl2,GTEX-QV44-0008-SM-3QNG7_exp,GTEX-S4Z8-0008-SM-2Y983_ctrl,GTEX-S4Z8-0008-SM-2Y983_exp1,GTEX-S4Z8-0008-SM-2Y983_exp2,GTEX-S95S-0008-SM-3RQ8B_ctrl,GTEX-S95S-0008-SM-3RQ8B_exp1,GTEX-S95S-0008-SM-3RQ8B_exp2,GTEX-WY7C-0008-SM-3NZB5_ctrl,GTEX-WY7C-0008-SM-3NZB5_exp
0,000187c4-a488-40f0-a69c-0a89582f3241_ENSG00000173848.18,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.275591,0.0,0.0,0.0,0.0,0.0,0.0,0.409973,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.858561,0.0,0.0,0.0,0.348678,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.247905,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.174879,0.0,0.0,0.0,3.569575,4.230351,4.136672,0.0,0.0,0.0,0.335124,0.359675,0.421937,0.974555,0.0,0.0,0.0,0.263975,0.0,0.39919
