# load packages

In [None]:
import pandas as pd

In [None]:
from sklearn.preprocessing import StandardScaler, MinMaxScaler

In [None]:
import seaborn as sns

In [None]:
import matplotlib.pyplot as plt

In [None]:
import numpy as np

# read in input files

In [None]:
# Load the ADSP gene-score table (tab-separated; the .gz suffix lets pandas
# infer the compression).
gene_score_adsp_path = 'common_var_gene_score/igap_adsp_gene_score/merged_outputs/AOU_ALL.UKBB.metasoft.ADSP.all.VEP_v113.gene_by_position.r2_0.1_clump_variants_excluded.RE_pval_threshold_0.05.gene_symbol.average_gene_score.merged.common_id.transpose.txt.gz'
gene_score_adsp = pd.read_csv(gene_score_adsp_path, sep='\t')
print(gene_score_adsp.shape)

# Overall min/max of the score values: rows whose GENE entry is one of the
# covariate labels are excluded and the remainder is cast to float first.
covariate_labels = ['ALZ_STATUS', 'AGE', 'SEX', 'PC1', 'PC2', 'PC3', 'PC4', 'PC5', 'PC6', 'PC7', 'PC8']
gene_score_values = (
    gene_score_adsp[~gene_score_adsp['GENE'].isin(covariate_labels)]
    .drop(columns=['GENE'])
    .astype(float)
)
print(gene_score_values.min().min())
print(gene_score_values.max().max())

In [None]:
# Load the ROSMAP RNA-seq table (tab-separated; compression inferred from .gz).
rnaseq_rosmap_path = 'pathway_score/gene_mapping/ROSMAP.RNAseq.TPM5_log2norm.individualids.codinggenes.VEP_v113_genes.gene_symbol.common_id.duplicate_ids_removed.transpose.txt.gz'
rnaseq_rosmap = pd.read_csv(rnaseq_rosmap_path, sep='\t')

# Overall min/max across every column except GENE, then the table shape.
rnaseq_rosmap_values = rnaseq_rosmap.drop(columns=['GENE'])
print(rnaseq_rosmap_values.min().min())
print(rnaseq_rosmap_values.max().max())
print(rnaseq_rosmap.shape)

In [None]:
# Load the MSBB RNA-seq BA_10 table (tab-separated).
rnaseq_10_msbb_path = 'pathway_score/msbb/MSBB.RNAseq.BA_10.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.txt'
rnaseq_10_msbb = pd.read_csv(rnaseq_10_msbb_path, sep='\t')
print(rnaseq_10_msbb.shape)

# Overall min/max across every column except GENE.
rnaseq_10_msbb_values = rnaseq_10_msbb.drop(columns=['GENE'])
print(rnaseq_10_msbb_values.min().min())
print(rnaseq_10_msbb_values.max().max())

In [None]:
# Load the MSBB RNA-seq BA_22 table (tab-separated).
rnaseq_22_msbb_path = 'pathway_score/msbb/MSBB.RNAseq.BA_22.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.txt'
rnaseq_22_msbb = pd.read_csv(rnaseq_22_msbb_path, sep='\t')
print(rnaseq_22_msbb.shape)

# Overall min/max across every column except GENE.
rnaseq_22_msbb_values = rnaseq_22_msbb.drop(columns=['GENE'])
print(rnaseq_22_msbb_values.min().min())
print(rnaseq_22_msbb_values.max().max())

In [None]:
# Load the MSBB RNA-seq BA_36 table (tab-separated).
rnaseq_36_msbb_path = 'pathway_score/msbb/MSBB.RNAseq.BA_36.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.txt'
rnaseq_36_msbb = pd.read_csv(rnaseq_36_msbb_path, sep='\t')
print(rnaseq_36_msbb.shape)

# Overall min/max across every column except GENE.
rnaseq_36_msbb_values = rnaseq_36_msbb.drop(columns=['GENE'])
print(rnaseq_36_msbb_values.min().min())
print(rnaseq_36_msbb_values.max().max())

In [None]:
# Load the MSBB RNA-seq BA_44 table (tab-separated).
rnaseq_44_msbb_path = 'pathway_score/msbb/MSBB.RNAseq.BA_44.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.txt'
rnaseq_44_msbb = pd.read_csv(rnaseq_44_msbb_path, sep='\t')
print(rnaseq_44_msbb.shape)

# Overall min/max across every column except GENE.
rnaseq_44_msbb_values = rnaseq_44_msbb.drop(columns=['GENE'])
print(rnaseq_44_msbb_values.min().min())
print(rnaseq_44_msbb_values.max().max())

In [None]:
# Load the ROSMAP array-methylation table (tab-separated).
methyl_rosmap_path = 'pathway_score/rosmap/ROSMAP_arrayMethylation_imputed.gene_symbol.individualID.mvalue_norm.weighted_gene_average.common_id.transpose.txt'
methyl_rosmap = pd.read_csv(methyl_rosmap_path, sep='\t')
print(methyl_rosmap.shape)

# Overall min/max across every column except GENE.
methyl_rosmap_values = methyl_rosmap.drop(columns=['GENE'])
print(methyl_rosmap_values.min().min())
print(methyl_rosmap_values.max().max())

In [None]:
# Load the MSBB array-methylation table (tab-separated).
methyl_msbb_path = 'pathway_score/msbb/MSBB.methylation_array.19batch.gene_symbol.individualID.mvalue_norm.weighted_gene_average.common_id.transpose.txt'
methyl_msbb = pd.read_csv(methyl_msbb_path, sep='\t')
print(methyl_msbb.shape)

# Overall min/max across every column except GENE.
methyl_msbb_values = methyl_msbb.drop(columns=['GENE'])
print(methyl_msbb_values.min().min())
print(methyl_msbb_values.max().max())

In [None]:
# Load the ROSMAP proteomics table (tab-separated; compression inferred from .gz).
somoscan_rosmap_path = 'pathway_score/rosmap/ROSMAP.proteomics.somoscan.individualID.entrez_gene_symbol.common_id.transpose.txt.gz'
somoscan_rosmap = pd.read_csv(somoscan_rosmap_path, sep='\t')
print(somoscan_rosmap.shape)

# Overall min/max across every column except GENE.
somoscan_rosmap_values = somoscan_rosmap.drop(columns=['GENE'])
print(somoscan_rosmap_values.min().min())
print(somoscan_rosmap_values.max().max())

In [None]:
# Load the MSBB TMT proteomics table (tab-separated).
tmt_msbb_path = 'pathway_score/msbb/MSBB.TMT_proteomics.19batch.normalized.gene_symbol.individualID.log2_transformed.common_id.transpose.txt'
tmt_msbb = pd.read_csv(tmt_msbb_path, sep='\t')
print(tmt_msbb.shape)

# Overall min/max across every column except GENE.
tmt_msbb_values = tmt_msbb.drop(columns=['GENE'])
print(tmt_msbb_values.min().min())
print(tmt_msbb_values.max().max())

# clean up dfs

## gene scores

In [None]:
# Keep only the rows whose GENE value is not one of the covariate labels
# (status, age, sex, PC1-PC8). The surviving rows keep their original row labels.
covariate_labels = ['ALZ_STATUS', 'AGE', 'SEX', 'PC1', 'PC2', 'PC3', 'PC4', 'PC5', 'PC6', 'PC7', 'PC8']
is_covariate_row = gene_score_adsp['GENE'].isin(covariate_labels)
gene_score_adsp_clean = gene_score_adsp[~is_covariate_row]
gene_score_adsp_clean.head()

## replace inf with missing in methylation

In [None]:
# Turn +inf / -inf entries into NaN so they are treated as missing values.
non_finite_values = [np.inf, -np.inf]
methyl_rosmap_clean = methyl_rosmap.replace(to_replace=non_finite_values, value=np.nan)

In [None]:
# Turn +inf / -inf entries into NaN so they are treated as missing values.
non_finite_values = [np.inf, -np.inf]
methyl_msbb_clean = methyl_msbb.replace(to_replace=non_finite_values, value=np.nan)

# scale

## gene score

In [None]:
# Standardise every non-GENE column of the cleaned gene-score table.
# NOTE(review): StandardScaler works column-wise, so each non-GENE column is
# scaled across the rows (GENE entries) - confirm this is the intended axis.
input_df = gene_score_adsp_clean.copy()

scaler = StandardScaler()
predictors = [col for col in input_df.columns if col != 'GENE']
gene = input_df[['GENE']]

# Cast to float, as the range check in the loading cell does for these rows.
input_values = input_df[predictors].astype(float)

# gene_score_adsp_clean is a row-filtered frame, so it keeps its original
# (possibly non-contiguous) row labels. The scaled array must carry the same
# index: pd.concat(axis=1) aligns on index labels, and a fresh 0..n-1 index
# would shift GENE against the values and pad the result with NaN rows.
scaled_values = pd.DataFrame(
    scaler.fit_transform(input_values),
    index=input_df.index,
    columns=predictors,
)
output_df = pd.concat([gene, scaled_values], axis=1)
# Same column order as the input, with labels attached by name, not position.
output_df = output_df[input_df.columns]

# Sanity check: average column mean / std before scaling ...
print(input_values.mean().mean())
print(input_values.std().mean())

# ... and after scaling.
print(output_df[predictors].mean().mean())
print(output_df[predictors].std().mean())

gene_score_adsp_scaled_df = output_df.copy()
gene_score_adsp_scaled_df.head()

In [None]:
# Min-max rescale every non-GENE column of the cleaned gene-score table into a
# fixed target interval.
# NOTE(review): the interval bounds are hard-coded; their origin is not visible
# in this notebook - confirm which reference data they were taken from.
input_df = gene_score_adsp_clean.copy()

scaler = MinMaxScaler(feature_range = (-14.472073470708509, 28.78601705422015))
predictors = [col for col in input_df.columns if col != 'GENE']
gene = input_df[['GENE']]

# Cast to float, as the range check in the loading cell does for these rows.
input_values = input_df[predictors].astype(float)

# gene_score_adsp_clean is a row-filtered frame, so it keeps its original
# (possibly non-contiguous) row labels. The scaled array must carry the same
# index: pd.concat(axis=1) aligns on index labels, and a fresh 0..n-1 index
# would shift GENE against the values and pad the result with NaN rows.
scaled_values = pd.DataFrame(
    scaler.fit_transform(input_values),
    index=input_df.index,
    columns=predictors,
)
output_df = pd.concat([gene, scaled_values], axis=1)
# Same column order as the input, with labels attached by name, not position.
output_df = output_df[input_df.columns]

# Sanity check: overall min / max before scaling ...
print(input_values.min().min())
print(input_values.max().max())

# ... and after scaling.
print(output_df[predictors].min().min())
print(output_df[predictors].max().max())

gene_score_adsp_minmax_scaled_df = output_df.copy()
gene_score_adsp_minmax_scaled_df.head()

## rosmap rnaseq

In [None]:
# Standardise every non-GENE column of rnaseq_rosmap with StandardScaler.
input_df = rnaseq_rosmap.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

scaler = StandardScaler()
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: average column mean and std, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].mean().mean())
    print(frame[predictors].std().mean())

rnaseq_rosmap_scaled_df = output_df.copy()
rnaseq_rosmap_scaled_df.head()

In [None]:
# Min-max rescale every non-GENE column of rnaseq_rosmap into a fixed interval.
input_df = rnaseq_rosmap.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

# NOTE(review): hard-coded interval bounds; origin not visible in this notebook.
target_range = (-14.472073470708509, 28.78601705422015)
scaler = MinMaxScaler(feature_range=target_range)
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: overall min and max, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].min().min())
    print(frame[predictors].max().max())

rnaseq_rosmap_minmax_scaled_df = output_df.copy()
rnaseq_rosmap_minmax_scaled_df.head()

## msbb rnaseq 10

In [None]:
# Standardise every non-GENE column of rnaseq_10_msbb with StandardScaler.
input_df = rnaseq_10_msbb.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

scaler = StandardScaler()
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: average column mean and std, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].mean().mean())
    print(frame[predictors].std().mean())

rnaseq_10_msbb_scaled_df = output_df.copy()
rnaseq_10_msbb_scaled_df.head()

In [None]:
# Min-max rescale every non-GENE column of rnaseq_10_msbb into a fixed interval.
input_df = rnaseq_10_msbb.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

# NOTE(review): hard-coded interval bounds; origin not visible in this notebook.
target_range = (-14.472073470708509, 28.78601705422015)
scaler = MinMaxScaler(feature_range=target_range)
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: overall min and max, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].min().min())
    print(frame[predictors].max().max())

rnaseq_10_msbb_minmax_scaled_df = output_df.copy()
rnaseq_10_msbb_minmax_scaled_df.head()

## msbb rnaseq 22

In [None]:
# Standardise every non-GENE column of rnaseq_22_msbb with StandardScaler.
input_df = rnaseq_22_msbb.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

scaler = StandardScaler()
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: average column mean and std, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].mean().mean())
    print(frame[predictors].std().mean())

rnaseq_22_msbb_scaled_df = output_df.copy()
rnaseq_22_msbb_scaled_df.head()

In [None]:
# Min-max rescale every non-GENE column of rnaseq_22_msbb into a fixed interval.
input_df = rnaseq_22_msbb.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

# NOTE(review): hard-coded interval bounds; origin not visible in this notebook.
target_range = (-14.472073470708509, 28.78601705422015)
scaler = MinMaxScaler(feature_range=target_range)
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: overall min and max, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].min().min())
    print(frame[predictors].max().max())

rnaseq_22_msbb_minmax_scaled_df = output_df.copy()
rnaseq_22_msbb_minmax_scaled_df.head()

## msbb rnaseq 36

In [None]:
# Standardise every non-GENE column of rnaseq_36_msbb with StandardScaler.
input_df = rnaseq_36_msbb.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

scaler = StandardScaler()
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: average column mean and std, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].mean().mean())
    print(frame[predictors].std().mean())

rnaseq_36_msbb_scaled_df = output_df.copy()
rnaseq_36_msbb_scaled_df.head()

In [None]:
# Min-max rescale every non-GENE column of rnaseq_36_msbb into a fixed interval.
input_df = rnaseq_36_msbb.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

# NOTE(review): hard-coded interval bounds; origin not visible in this notebook.
target_range = (-14.472073470708509, 28.78601705422015)
scaler = MinMaxScaler(feature_range=target_range)
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: overall min and max, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].min().min())
    print(frame[predictors].max().max())

rnaseq_36_msbb_minmax_scaled_df = output_df.copy()
rnaseq_36_msbb_minmax_scaled_df.head()

## msbb rnaseq 44

In [None]:
# Standardise every non-GENE column of rnaseq_44_msbb with StandardScaler.
input_df = rnaseq_44_msbb.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

scaler = StandardScaler()
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: average column mean and std, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].mean().mean())
    print(frame[predictors].std().mean())

rnaseq_44_msbb_scaled_df = output_df.copy()
rnaseq_44_msbb_scaled_df.head()

In [None]:
# Min-max rescale every non-GENE column of rnaseq_44_msbb into a fixed interval.
input_df = rnaseq_44_msbb.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

# NOTE(review): hard-coded interval bounds; origin not visible in this notebook.
target_range = (-14.472073470708509, 28.78601705422015)
scaler = MinMaxScaler(feature_range=target_range)
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: overall min and max, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].min().min())
    print(frame[predictors].max().max())

rnaseq_44_msbb_minmax_scaled_df = output_df.copy()
rnaseq_44_msbb_minmax_scaled_df.head()

## methyl rosmap

In [None]:
# Standardise every non-GENE column of methyl_rosmap_clean with StandardScaler.
input_df = methyl_rosmap_clean.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

scaler = StandardScaler()
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: average column mean and std, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].mean().mean())
    print(frame[predictors].std().mean())

methyl_rosmap_scaled_df = output_df.copy()
print(methyl_rosmap_scaled_df.shape)

In [None]:
# Min-max rescale every non-GENE column of methyl_rosmap_clean into a fixed interval.
input_df = methyl_rosmap_clean.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

# NOTE(review): hard-coded interval bounds; origin not visible in this notebook.
target_range = (-14.472073470708509, 28.78601705422015)
scaler = MinMaxScaler(feature_range=target_range)
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: overall min and max, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].min().min())
    print(frame[predictors].max().max())

methyl_rosmap_minmax_scaled_df = output_df.copy()
methyl_rosmap_minmax_scaled_df.head()

## methyl msbb

In [None]:
# Standardise every non-GENE column of methyl_msbb_clean with StandardScaler.
input_df = methyl_msbb_clean.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

scaler = StandardScaler()
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: average column mean and std, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].mean().mean())
    print(frame[predictors].std().mean())

methyl_msbb_scaled_df = output_df.copy()
print(methyl_msbb_scaled_df.shape)

In [None]:
# Min-max rescale every non-GENE column of methyl_msbb_clean into a fixed interval.
input_df = methyl_msbb_clean.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

# NOTE(review): hard-coded interval bounds; origin not visible in this notebook.
target_range = (-14.472073470708509, 28.78601705422015)
scaler = MinMaxScaler(feature_range=target_range)
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: overall min and max, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].min().min())
    print(frame[predictors].max().max())

methyl_msbb_minmax_scaled_df = output_df.copy()
methyl_msbb_minmax_scaled_df.head()

## rosmap somoscan

In [None]:
# Standardise every non-GENE column of somoscan_rosmap with StandardScaler.
input_df = somoscan_rosmap.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

scaler = StandardScaler()
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: average column mean and std, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].mean().mean())
    print(frame[predictors].std().mean())

somoscan_rosmap_scaled_df = output_df.copy()
somoscan_rosmap_scaled_df.head()

In [None]:
# Min-max rescale every non-GENE column of somoscan_rosmap into a fixed interval.
input_df = somoscan_rosmap.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

# NOTE(review): hard-coded interval bounds; origin not visible in this notebook.
target_range = (-14.472073470708509, 28.78601705422015)
scaler = MinMaxScaler(feature_range=target_range)
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: overall min and max, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].min().min())
    print(frame[predictors].max().max())

somoscan_rosmap_minmax_scaled_df = output_df.copy()
somoscan_rosmap_minmax_scaled_df.head()

## tmt msbb

In [None]:
# Standardise every non-GENE column of tmt_msbb with StandardScaler.
input_df = tmt_msbb.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

scaler = StandardScaler()
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: average column mean and std, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].mean().mean())
    print(frame[predictors].std().mean())

tmt_msbb_scaled_df = output_df.copy()
tmt_msbb_scaled_df.head()

In [None]:
# Min-max rescale every non-GENE column of tmt_msbb into a fixed interval.
input_df = tmt_msbb.copy()
predictors = [name for name in input_df if name != 'GENE']
gene = input_df[['GENE']]

# NOTE(review): hard-coded interval bounds; origin not visible in this notebook.
target_range = (-14.472073470708509, 28.78601705422015)
scaler = MinMaxScaler(feature_range=target_range)
scaled_values = pd.DataFrame(scaler.fit_transform(input_df[predictors]))
# The join is positional in effect: it relies on input_df having the default
# 0..n-1 index, and the relabelling below on GENE being its first column.
output_df = pd.concat([gene, scaled_values], axis=1)
output_df.columns = input_df.columns

# Sanity check: overall min and max, before and then after scaling.
for frame in (input_df, output_df):
    print(frame[predictors].min().min())
    print(frame[predictors].max().max())

tmt_msbb_minmax_scaled_df = output_df.copy()
tmt_msbb_minmax_scaled_df.head()

# export

## gene score

In [None]:
# Write the standard-scaled gene scores as a tab-separated file without the row index.
gene_score_adsp_scaled_path = 'common_var_gene_score/igap_adsp_gene_score/merged_outputs/AOU_ALL.UKBB.metasoft.ADSP.all.VEP_v113.gene_by_position.r2_0.1_clump_variants_excluded.RE_pval_threshold_0.05.gene_symbol.average_gene_score.merged.common_id.transpose.scaled.txt'
gene_score_adsp_scaled_df.to_csv(gene_score_adsp_scaled_path, sep='\t', index=None)

In [None]:
# Write the min-max-scaled gene scores as a tab-separated file without the row index.
gene_score_adsp_minmax_path = 'common_var_gene_score/igap_adsp_gene_score/merged_outputs/AOU_ALL.UKBB.metasoft.ADSP.all.VEP_v113.gene_by_position.r2_0.1_clump_variants_excluded.RE_pval_threshold_0.05.gene_symbol.average_gene_score.merged.common_id.transpose.minmax.scaled.txt'
gene_score_adsp_minmax_scaled_df.to_csv(gene_score_adsp_minmax_path, sep='\t', index=None)

## rosmap rnaseq

In [None]:
# Write the standard-scaled ROSMAP RNA-seq table as a tab-separated file without the row index.
rnaseq_rosmap_scaled_path = 'pathway_score/gene_mapping/ROSMAP.RNAseq.TPM5_log2norm.individualids.codinggenes.VEP_v113_genes.gene_symbol.common_id.duplicate_ids_removed.transpose.scaled.txt'
rnaseq_rosmap_scaled_df.to_csv(rnaseq_rosmap_scaled_path, sep='\t', index=None)

In [None]:
# Write the min-max-scaled ROSMAP RNA-seq table as a tab-separated file without the row index.
rnaseq_rosmap_minmax_path = 'pathway_score/gene_mapping/ROSMAP.RNAseq.TPM5_log2norm.individualids.codinggenes.VEP_v113_genes.gene_symbol.common_id.duplicate_ids_removed.transpose.minmax.scaled.txt'
rnaseq_rosmap_minmax_scaled_df.to_csv(rnaseq_rosmap_minmax_path, sep='\t', index=None)

## msbb 10 rnaseq

In [None]:
# Write the standard-scaled MSBB BA_10 RNA-seq table as a tab-separated file without the row index.
rnaseq_10_msbb_scaled_path = 'pathway_score/msbb/MSBB.RNAseq.BA_10.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.scaled.txt'
rnaseq_10_msbb_scaled_df.to_csv(rnaseq_10_msbb_scaled_path, sep='\t', index=None)

In [None]:
# Write the min-max-scaled MSBB BA_10 RNA-seq table as a tab-separated file without the row index.
rnaseq_10_msbb_minmax_path = 'pathway_score/msbb/MSBB.RNAseq.BA_10.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.minmax.scaled.txt'
rnaseq_10_msbb_minmax_scaled_df.to_csv(rnaseq_10_msbb_minmax_path, sep='\t', index=None)

## msbb 22 rnaseq

In [None]:
# Write the standard-scaled MSBB BA_22 RNA-seq table as a tab-separated file without the row index.
rnaseq_22_msbb_scaled_path = 'pathway_score/msbb/MSBB.RNAseq.BA_22.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.scaled.txt'
rnaseq_22_msbb_scaled_df.to_csv(rnaseq_22_msbb_scaled_path, sep='\t', index=None)

In [None]:
# Write the min-max-scaled MSBB BA_22 RNA-seq table as a tab-separated file without the row index.
rnaseq_22_msbb_minmax_path = 'pathway_score/msbb/MSBB.RNAseq.BA_22.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.minmax.scaled.txt'
rnaseq_22_msbb_minmax_scaled_df.to_csv(rnaseq_22_msbb_minmax_path, sep='\t', index=None)

## msbb 36 rnaseq

In [None]:
# Write the standard-scaled MSBB BA_36 RNA-seq table as a tab-separated file without the row index.
rnaseq_36_msbb_scaled_path = 'pathway_score/msbb/MSBB.RNAseq.BA_36.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.scaled.txt'
rnaseq_36_msbb_scaled_df.to_csv(rnaseq_36_msbb_scaled_path, sep='\t', index=None)

In [None]:
# Write the min-max-scaled MSBB BA_36 RNA-seq table as a tab-separated file without the row index.
rnaseq_36_msbb_minmax_path = 'pathway_score/msbb/MSBB.RNAseq.BA_36.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.minmax.scaled.txt'
rnaseq_36_msbb_minmax_scaled_df.to_csv(rnaseq_36_msbb_minmax_path, sep='\t', index=None)

## msbb 44 rnaseq

In [None]:
# Write the standard-scaled MSBB BA_44 RNA-seq table as a tab-separated file without the row index.
rnaseq_44_msbb_scaled_path = 'pathway_score/msbb/MSBB.RNAseq.BA_44.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.scaled.txt'
rnaseq_44_msbb_scaled_df.to_csv(rnaseq_44_msbb_scaled_path, sep='\t', index=None)

In [None]:
# Write the min-max-scaled MSBB BA_44 RNA-seq table as a tab-separated file without the row index.
rnaseq_44_msbb_minmax_path = 'pathway_score/msbb/MSBB.RNAseq.BA_44.19batch.gene_symbol.individualID.mvalue_norm.tpm.log2.coding_genes_only.covar_corrected.common_id.transpose.minmax.scaled.txt'
rnaseq_44_msbb_minmax_scaled_df.to_csv(rnaseq_44_msbb_minmax_path, sep='\t', index=None)

## methyl rosmap

In [None]:
# Write the standard-scaled ROSMAP methylation table as a tab-separated file without the row index.
methyl_rosmap_scaled_path = 'pathway_score/rosmap/ROSMAP_arrayMethylation_imputed.gene_symbol.individualID.mvalue_norm.weighted_gene_average.common_id.transpose.scaled.txt'
methyl_rosmap_scaled_df.to_csv(methyl_rosmap_scaled_path, sep='\t', index=None)

In [None]:
# Write the min-max-scaled ROSMAP methylation table as a tab-separated file without the row index.
methyl_rosmap_minmax_path = 'pathway_score/rosmap/ROSMAP_arrayMethylation_imputed.gene_symbol.individualID.mvalue_norm.weighted_gene_average.common_id.transpose.minmax.scaled.txt'
methyl_rosmap_minmax_scaled_df.to_csv(methyl_rosmap_minmax_path, sep='\t', index=None)

## methyl msbb

In [None]:
# Write the standard-scaled MSBB methylation table as a tab-separated file without the row index.
methyl_msbb_scaled_path = 'pathway_score/msbb/MSBB.methylation_array.19batch.gene_symbol.individualID.mvalue_norm.weighted_gene_average.common_id.transpose.scaled.txt'
methyl_msbb_scaled_df.to_csv(methyl_msbb_scaled_path, sep='\t', index=None)

In [None]:
# Write the min-max-scaled MSBB methylation table as a tab-separated file without the row index.
methyl_msbb_minmax_path = 'pathway_score/msbb/MSBB.methylation_array.19batch.gene_symbol.individualID.mvalue_norm.weighted_gene_average.common_id.transpose.minmax.scaled.txt'
methyl_msbb_minmax_scaled_df.to_csv(methyl_msbb_minmax_path, sep='\t', index=None)

## somoscan rosmap

In [None]:
# Write the standard-scaled ROSMAP proteomics table as a tab-separated file without the row index.
somoscan_rosmap_scaled_path = 'pathway_score/rosmap/ROSMAP.proteomics.somoscan.individualID.entrez_gene_symbol.common_id.transpose.scaled.txt'
somoscan_rosmap_scaled_df.to_csv(somoscan_rosmap_scaled_path, sep='\t', index=None)

In [None]:
# Write the min-max-scaled ROSMAP proteomics table as a tab-separated file without the row index.
somoscan_rosmap_minmax_path = 'pathway_score/rosmap/ROSMAP.proteomics.somoscan.individualID.entrez_gene_symbol.common_id.transpose.minmax.scaled.txt'
somoscan_rosmap_minmax_scaled_df.to_csv(somoscan_rosmap_minmax_path, sep='\t', index=None)

## tmt msbb

In [None]:
# Write the standard-scaled MSBB TMT proteomics table as a tab-separated file without the row index.
tmt_msbb_scaled_path = 'pathway_score/msbb/MSBB.TMT_proteomics.19batch.normalized.gene_symbol.individualID.log2_transformed.common_id.transpose.scaled.txt'
tmt_msbb_scaled_df.to_csv(tmt_msbb_scaled_path, sep='\t', index=None)

In [None]:
# Write the min-max-scaled MSBB TMT proteomics table as a tab-separated file without the row index.
tmt_msbb_minmax_path = 'pathway_score/msbb/MSBB.TMT_proteomics.19batch.normalized.gene_symbol.individualID.log2_transformed.common_id.transpose.minmax.scaled.txt'
tmt_msbb_minmax_scaled_df.to_csv(tmt_msbb_minmax_path, sep='\t', index=None)