In [1]:
import pandas as pd

# Input tables for this analysis, keyed by "<week>_<group>".
files = {
    "Week_0_Normal": "GSE162653_Week_0_Normal_weight_EDITED.txt",
    "Week_0_Obese": "GSE162653_Week_0_Obese_EDITED.txt",
    "Week_12_Normal": "GSE162653_Week_12_Normal_weight_EDITED.txt",
    "Week_12_Obese": "GSE162653_Week_12_Obese_EDITED.txt",
}

# Week 0, normal-weight group: read the tab-separated table and relabel every
# column. The first column becomes 'Gene' (the merge key); the other ten labels
# are presumably sample IDs -- TODO confirm against the input file header.
# Assigning .columns replaces all headers positionally, so it raises if the
# file does not have exactly eleven columns.
df_0_normal = pd.read_csv(files["Week_0_Normal"], sep="\t", skipinitialspace=True)
df_0_normal.columns = ['Gene', '001_V2', '010_V2', '015_V2', '017_V2', '024_V2',
       '028_V2', '034_V2', '040_V2', '042_V2', '043_V2']

# Week 0, obese group: same treatment, with this group's column labels.
df_0_obese = pd.read_csv(files["Week_0_Obese"], sep="\t", skipinitialspace=True)
df_0_obese.columns = ['Gene', '052_V2', '054_V2', '063_V2', '070_V2', '072_V2',
       '078_V2', '085_V2', '092_V2', '099_V2', '100_V2']

# Combine the two week-0 tables. 'Gene' stays an ordinary column in both frames;
# pd.merge joins on it through on='Gene', so no index has to be set first.
# how='outer' keeps genes that occur in only one of the tables. The suffixes
# would only be applied to non-key column names shared by both frames; the
# labels assigned above do not overlap, so they are a safeguard here.
df_0 = pd.merge(df_0_normal, df_0_obese, how='outer', on='Gene',suffixes=('_normal','_obese'))

# Save the combined week-0 table as tab-separated text.
# NOTE(review): to_csv also writes the default integer row index as an unnamed
# first column; pass index=False if downstream readers do not need it.
df_0.to_csv("Monday_df_0_combined.txt", sep="\t")


In [3]:
# Week 12: read the normal-weight and obese tables (tab-separated text).
df_12_normal = pd.read_csv("GSE162653_Week_12_Normal_weight_EDITED.txt", sep="\t", skipinitialspace=True)
df_12_obese = pd.read_csv("GSE162653_Week_12_Obese_EDITED.txt", sep="\t", skipinitialspace=True)

# Relabel every column of each table. The first column becomes 'Gene' (the
# merge key); the other ten labels are presumably sample IDs -- TODO confirm
# against the input file headers. Assigning .columns replaces all headers
# positionally, so it raises if a file does not have exactly eleven columns.
df_12_normal.columns = ['Gene', '001_V4', '010_V4', '015_V4', '017_V4', '024_V4',
       '028_V4', '034_V4', '040_V4', '042_V4', '043_V4']

df_12_obese.columns = ['Gene', '052_V4', '054_V4', '063_V4', '070_V4', '072_V4',
       '078_V4', '085_V4', '092_V4', '099_V4', '100_V4']

# Combine the two week-12 tables. 'Gene' stays an ordinary column in both
# frames; pd.merge joins on it through on='Gene', so no index has to be set
# first. how='outer' keeps genes that occur in only one of the tables. The
# suffixes would only be applied to non-key column names shared by both frames;
# the labels assigned above do not overlap, so they are a safeguard here.
df_12 = pd.merge(df_12_normal, df_12_obese, how='outer', on='Gene',suffixes=('_normal','_obese'))

# Save the combined week-12 table as tab-separated text.
# NOTE(review): to_csv also writes the default integer row index as an unnamed
# first column; pass index=False if downstream readers do not need it.
df_12.to_csv("Monday_df_12_combined.txt", sep="\t")


In [5]:
# Combine the week-0 and week-12 tables into a single frame, joined on the
# 'Gene' column. how='outer' keeps genes that occur in only one of the two
# tables; the '_0' / '_12' suffixes are applied only if the two frames share a
# non-key column name.
df_main = pd.merge(df_0, df_12, how='outer',on='Gene',suffixes=('_0','_12'))

# Save the combined table twice: tab-separated text and comma-separated CSV.
# NOTE(review): both calls also write the default integer row index as an
# unnamed first column; pass index=False if downstream readers do not need it.
df_main.to_csv("Monday_ALL_combined.txt", sep="\t")
df_main.to_csv("Monday_ALL_combined.csv")

# Kept as the final expression of the cell so the notebook actually displays
# the (rows, columns) of the combined table; a bare expression anywhere else in
# a cell is evaluated and thrown away.
df_main.shape

In [7]:
# Also export the combined table as an Excel workbook, in case the data is
# easier to browse casually in a spreadsheet than in the text files.

# openpyxl is not referenced directly below; presumably it is imported so a
# missing Excel dependency fails here, before the export -- TODO confirm.
import openpyxl

excel_path = 'Monday_ALL_combined.xlsx'
df_main.to_excel(excel_path)