In [None]:
#Bowel Movement Frequency
#Metabolomics Analysis
#James Johnson
#Credit to Christian Diener, PhD as noted
#v 12-22-22

# Use this Arivale snapshot path
#frozen_ss_path='/shared-data/snapshots/arivale_snapshot_ISB_2020-03-16_2156'

# Load libraries
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import statsmodels.api as sm
import statsmodels.formula.api as smf
import seaborn as sns

# Get the library
from arivale_data_interface import *
import arivale_data_interface as adi

# Set display options
pd.set_option('display.max_rows', 200)
pd.set_option('display.max_columns', 200)
pd.set_option('display.width', 1000)
from IPython.display import display

# Apply these settings so the library knows where the data is
adi.apply_isb_config()

# If you want plots to show up in the notebook you need to run this
%matplotlib inline
plt.rcParams["figure.figsize"] = [10, 10]

In [None]:
#Obtain Bowel Movement Frequency (BMF) data:
bowel = adi.get_snapshot('assessments')
bowel = bowel.sort_values('days_in_program',ascending=True) # Sort df by days first
bowel = bowel.drop(columns = ['vendor','days_in_program','days_since_first_call','days_since_first_draw']) # Drop days and vendor, unneeded from this point
bowel = bowel.drop_duplicates(subset='public_client_id') # Keep only the first timepoint for each public_client_id
bowel = bowel.fillna(0) # Fill in empty BMF data with zero
bowel = bowel.set_index('public_client_id') # Arrange df by index of PCI
bowel = bowel[['assessment:digestion:bowel-movements:enum']]
bowel = bowel.rename(columns={"assessment:digestion:bowel-movements:enum":"bowel"}) # rename column to "bowel"
bowel = bowel[bowel['bowel'] != 0] #remove participants with no bowel data, reduce from 5764 -> 3955 individuals
bowel_list = ['(1) 2 or fewer times per week', '(2) 3-6 times per week', '(3) 1-3 times daily', '(4) 4+ times daily']
bowel_r = [1,2,3,4] #convert bowel responses to bowel movement frequency per week (minimum of each range, 1x, 3x, 7x, 28x)
bowel.bowel = bowel.bowel.replace(to_replace = bowel_list, value = bowel_r)
bowel = bowel.reset_index() # 3955 individuals
bowel

  t = pandas.to_datetime(x.str.replace("^arivale_snapshot.*(\\d{4}-\\d{2}-\\d{2}_\\d{4})$", "\\1"), format="%Y-%m-%d_%H%M")
  colnames = hdr.loc[~hdr.str.contains("^#")].head(1).str.replace("\n$","")
  hdr = hdr.loc[hdr.str.contains("^#")].str.replace("\n$","")
  fields = hdr.str.replace("^# [^:]+: *(.*)$",r"\1")
  fields.index = hdr.str.replace("^# ([^:]+):.*$",r"\1")
  return "\n".join(list(hdr.loc[hdr.index >= i].str.replace("^# ","")))


Unnamed: 0,public_client_id,bowel
0,01092042,3
1,01568974,3
2,01684342,2
3,01601230,3
4,01124029,3
...,...,...
3950,01395286,3
3951,01232614,3
3952,01181682,3
3953,01380110,3


In [None]:
#Obtain "eGFR" calculated GFR data (credit: Alexandra Ralevski) code chunk below:
################################################################################################
chems = adi.get_snapshot('chemistries', clean=True)
cl = adi.get_snapshot('clients', clean=True)
chems_dems = join_clients(cl, chems)
#these are the relevant column names
[col for col in chems.columns if 'CREAT' in col]
[col for col in chems.columns if 'GFR' in col]
def f(sex, age, creatinine): 
    if sex == 'F':
        if (creatinine/0.7) <=1:
            return 142*(((creatinine/0.7)**-0.241) * (0.9938**age) * 1.012)
        else:
            return 142*(((creatinine/0.7)**-1.200) * (0.9938**age) * 1.012)
    if sex == 'M':
        if (creatinine/0.9) <=1:
            return 142*(((creatinine/0.9)**-0.302) * (0.9938**age))
        else:
            return 142*(((creatinine/0.7)**-1.200) * (0.9938**age))

creat_calc = chems_dems[['public_client_id','sex', 'age', 'CREATININE_ENZ__SER']]

creat_calc['eGFR'] = creat_calc.apply(lambda x: f(x.sex, x.age, x.CREATININE_ENZ__SER), axis=1)
creat_calc.to_csv('eGFR.csv',index = False)
################################################################################################

#prepare eGFR dataframe:
eGFR = creat_calc
#eGFR = eGFR.set_index('public_client_id')
eGFR = eGFR[['public_client_id','eGFR']] #select relevant columns
#drop duplicate entries to reduce 12316 entries across all individuals
#to 6133 individuals
eGFR = eGFR.dropna()
eGFR = eGFR.drop_duplicates('public_client_id')
eGFR

  t = pandas.to_datetime(x.str.replace("^arivale_snapshot.*(\\d{4}-\\d{2}-\\d{2}_\\d{4})$", "\\1"), format="%Y-%m-%d_%H%M")
  colnames = hdr.loc[~hdr.str.contains("^#")].head(1).str.replace("\n$","")
  hdr = hdr.loc[hdr.str.contains("^#")].str.replace("\n$","")
  fields = hdr.str.replace("^# [^:]+: *(.*)$",r"\1")
  fields.index = hdr.str.replace("^# ([^:]+):.*$",r"\1")
  return "\n".join(list(hdr.loc[hdr.index >= i].str.replace("^# ","")))
  x.columns = x.columns.str.replace("[^a-zA-Z0-9]","_").str.replace("^([0-9])","_\\1")
  x.columns = x.columns.str.replace("[^a-zA-Z0-9]","_").str.replace("^([0-9])","_\\1")
  t = pandas.to_datetime(x.str.replace("^arivale_snapshot.*(\\d{4}-\\d{2}-\\d{2}_\\d{4})$", "\\1"), format="%Y-%m-%d_%H%M")
  colnames = hdr.loc[~hdr.str.contains("^#")].head(1).str.replace("\n$","")
  hdr = hdr.loc[hdr.str.contains("^#")].str.replace("\n$","")
  fields = hdr.str.replace("^# [^:]+: *(.*)$",r"\1")
  fields.index = hdr.str.replace("^# ([^:]+):.*$",r"\1")
  return "

Unnamed: 0,public_client_id,eGFR
3,01001298,99.024207
4,01001467,100.959522
6,01001548,105.411124
7,01001621,69.439409
9,01001661,120.947576
...,...,...
12307,QIRL,111.687296
12311,ZU273983,118.179626
12312,ZU612255,70.256126
12313,ZU621944,120.472213


In [5]:
# Blood plasma serum metabolites snapshot:
# Get the metabolomics data:
rawmet=adi.get_snapshot('metabolomics_corrected')
rawmet = rawmet.sort_values('days_in_program',ascending=True) # Sort by days
rawmet = rawmet.sort_values('public_client_id',ascending=True) # Sort by PCI
rawmet=rawmet.drop(columns={"sample_id","days_in_program","days_since_first_call","days_since_first_draw","month","weekday","season"}) # Drop unneeded columns
rawmet = rawmet.drop_duplicates('public_client_id') # This line drops duplicates from this snapshot from 3305 participants -> 2043
met_zerocounts=(rawmet == 0).sum() # sum up times any columns have zero values
met_nonnancounts=(~rawmet.isna()).sum() # sum up times any columns have non-NA values
rawmet = rawmet.loc[:, met_nonnancounts/rawmet.shape[0] >= 0.70] #this sum of zero values/num of total rows should less than 30% to proceed with the cohort
rawmet = rawmet.dropna(axis = 0, how = 'all') # Drop patients with all NaN values
rawmet = rawmet.dropna(axis = 1, how = 'all') # Drop patients with all NaN values
rawmet = rawmet.fillna(rawmet.median()) # Fill df NaNs with very small values instead of 0
#rawmet = rawmet.set_index('public_client_id') # arrange index by PCI
rawmet
#2043 individuals

  t = pandas.to_datetime(x.str.replace("^arivale_snapshot.*(\\d{4}-\\d{2}-\\d{2}_\\d{4})$", "\\1"), format="%Y-%m-%d_%H%M")
  colnames = hdr.loc[~hdr.str.contains("^#")].head(1).str.replace("\n$","")
  hdr = hdr.loc[hdr.str.contains("^#")].str.replace("\n$","")
  fields = hdr.str.replace("^# [^:]+: *(.*)$",r"\1")
  fields.index = hdr.str.replace("^# ([^:]+):.*$",r"\1")
  return "\n".join(list(hdr.loc[hdr.index >= i].str.replace("^# ","")))
  rawmet = rawmet.fillna(rawmet.median()) # Fill df NaNs with very small values instead of 0


Unnamed: 0,public_client_id,35,50,55,62,93,98,111,112,132,136,158,171,179,180,181,182,189,192,194,197,209,212,229,231,234,235,240,241,244,250,252,254,266,267,273,275,278,279,297,302,310,313,330,331,338,339,340,342,344,355,356,358,361,363,376,391,397,407,409,415,424,432,439,444,445,452,460,461,480,482,491,498,501,503,504,512,519,533,535,537,561,563,564,565,566,572,796,798,799,800,803,806,811,815,821,823,825,827,849,...,999946616,999946620,999946623,999946624,999946627,999946632,999946633,999946636,999946639,999946645,999946646,999946657,999946666,999946673,999946674,999946681,999946685,999946690,999946695,999946700,999946701,999946705,999946707,999946710,999946902,999946905,999946911,999946966,999946970,999946972,999946973,999946977,999946986,999946997,999946998,999947006,999947011,999947417,999947437,999947478,999947493,999947642,999947650,999947654,999947670,999947671,999947687,999947708,999947788,999947790,999947802,999947804,999947818,999947820,999947905,999947929,999947955,999947959,999947971,999947977,999947988,999947993,999948001,999948009,999948047,999948076,999948081,999948094,999949463,999949512,999949515,999949517,999949521,999949555,999949557,999949592,999949637,999949679,999949681,999949883,999952025,999952286,999952483,999952501,999952502,999952504,999952524,999952533,999952640,999952661,999952843,999952865,999952867,999952870,999952877,999952909,999953114,999953157,999953267,999954840
0,01000261,0.972222,2.568898,1.155771,0.824435,0.947589,0.772955,0.716831,1.193115,5.372793,24.532961,1.289964,1.135706,0.815813,0.710183,0.986860,0.603223,1.421159,1.128161,1.186826,1.186918,2.183882,1.129249,0.920111,1.374374,1.891255,0.819227,1.204927,1.203517,1.017136,0.921926,1.530622,0.389302,1.364602,1.437235,1.702655,0.954904,2.320103,0.708487,4.268696,2.899063,0.816147,3.386740,1.101887,0.785114,0.943850,0.875629,1.076899,1.014633,1.051367,1.239469,2.139945,1.987275,3.027573,1.165933,1.031538,1.053787,1.165150,1.364448,1.219670,1.115540,0.832081,1.370398,0.920689,1.555217,1.408812,0.800073,1.035181,0.934017,1.245427,1.512853,0.951191,1.512646,4.848959,1.096566,2.289297,1.570808,1.039696,0.889427,0.980195,1.237122,0.948468,1.329892,1.461135,1.029702,1.077272,0.924483,0.496321,1.188124,0.933092,1.196293,0.796418,0.744728,1.375578,0.748462,0.972041,1.600477,1.164032,0.553433,1.373963,...,2.695183,0.819572,0.606842,1.380649,5.777018,1.152754,1.220782,0.167234,0.506707,1.376055,0.585078,0.733665,15.507542,7.548603,0.989995,1.449365,0.960719,1.252370,0.953545,1.799173,2.910742,0.965338,0.651738,0.378580,0.571384,1.854875,2.604398,1.030214,1.039960,1.128947,0.927640,0.924388,1.142827,0.730759,4.020639,1.009418,2.206431,0.885257,1.115327,2.592638,1.835164,0.588192,0.298005,3.765115,1.168743,0.467600,0.918908,2.920539,1.087581,1.021349,0.739217,0.754325,0.462004,0.689655,1.012121,1.000043,0.891436,1.069549,0.671550,0.446172,0.809453,1.266994,4.729395,1.144651,0.790954,1.018050,1.053664,0.997330,0.546438,1.206396,1.436551,1.013768,1.585908,0.483140,0.494334,0.689787,1.214707,1.310367,0.523531,0.570142,0.878512,1.266454,0.934197,1.365642,1.165906,0.659998,0.999463,1.371351,1.089485,1.493849,0.856545,1.678183,1.144330,1.292103,0.715138,1.114859,1.045152,0.592175,0.923405,0.980653
1,01001621,1.819302,0.704097,0.619724,1.014908,1.334809,1.341022,0.971382,0.977802,0.437747,0.597480,0.981717,0.373895,2.085763,0.567837,0.650733,0.983778,1.036290,0.888782,1.192718,0.666124,1.047442,1.219334,0.663285,1.661423,0.694435,2.090090,1.321783,0.546186,0.927013,0.484962,1.264994,0.683409,0.999556,1.063370,0.955280,1.053888,0.834389,0.813427,0.566890,1.378451,1.030161,0.557247,1.359100,1.121047,1.189167,2.339233,1.287490,0.819302,1.526069,0.914017,0.778223,1.437623,0.681799,0.851270,0.929102,1.152256,0.817847,0.871570,1.169466,0.909120,0.644457,1.023283,1.009925,1.015428,0.987975,0.379701,0.962439,1.500350,1.197596,0.760786,0.951191,0.820892,0.538089,0.999284,0.765463,1.128796,0.533141,1.162388,0.894506,1.426137,0.529222,1.009188,1.318555,0.915440,0.804123,0.996878,0.693355,1.003074,0.849613,1.615323,0.603969,0.592127,1.113037,0.968207,1.119836,0.838256,0.836145,1.734544,3.448607,...,2.841334,0.614300,0.992375,0.687927,0.997586,1.173688,1.005829,1.607427,1.486123,1.030870,1.722813,1.324431,1.017005,17.098502,0.989995,0.990457,1.085562,0.665675,2.055824,1.180362,1.080516,0.667261,0.769920,1.957673,2.227080,1.389496,0.970008,0.781084,2.302494,0.591117,1.199069,1.224311,1.254009,0.982351,0.247112,1.001132,1.001347,0.734604,3.553576,1.063844,0.984213,2.135471,2.320744,0.961425,0.814772,1.462328,0.894339,0.996005,1.288771,1.021349,0.753729,0.661740,2.258629,1.251819,1.479819,2.515144,1.096075,0.997352,1.830214,0.686897,2.077862,0.990652,0.526165,0.992708,0.980669,1.078174,1.028737,1.011223,1.013171,1.454377,0.872246,1.013768,10.215746,1.694952,0.627407,0.558186,0.808554,0.991109,1.203914,1.281067,0.988128,0.718099,0.516304,1.284870,1.022681,0.679225,0.713206,0.994872,2.363626,0.940232,0.820114,0.961806,1.015091,1.016476,1.742466,0.525021,0.983414,0.737648,0.844609,0.980653
3,01002183,0.528804,2.260729,0.425073,2.299795,0.850577,1.737810,0.984920,2.335956,3.769524,3.896395,1.051881,1.459102,1.823657,2.978882,2.421741,1.466470,1.207379,1.758998,1.133902,1.520067,1.886599,1.093981,1.201631,0.740414,1.339688,0.990273,0.979290,0.319515,1.098019,1.325594,1.753197,32.210346,1.100406,1.230342,0.895924,1.038174,1.514974,2.536602,2.710388,0.470894,3.014329,2.526205,1.322621,0.462182,0.870719,1.617798,0.998268,1.873371,0.925059,0.775723,1.065127,2.299804,3.634989,1.590725,0.803890,1.125505,0.784719,0.929209,1.258474,0.828234,2.270925,1.441238,2.466381,1.180070,1.721624,5.867892,0.814355,1.072046,0.979631,1.208090,1.548912,1.124846,1.943683,0.936875,0.464060,1.677937,3.414667,1.381473,1.047617,1.146355,0.802923,0.934881,0.955544,0.658789,0.866354,0.930874,2.272248,1.548701,0.911506,0.969242,0.906317,1.556853,0.874275,0.961637,1.151840,1.251795,1.459896,0.701073,0.023024,...,1.692679,0.261399,8.741517,0.753129,9.556887,0.965060,1.335196,5.975684,1.035380,0.486720,0.501176,0.958028,0.059995,1.006791,1.296573,0.999665,1.336956,1.329022,1.203016,0.831101,1.538813,5.268829,0.569734,0.177557,0.460412,9.419514,0.505720,2.618249,0.668784,1.426144,0.985807,0.841155,0.585205,1.642595,1.355057,9.323010,0.282722,1.442073,0.940509,2.624852,1.876157,0.861270,4.439497,0.166112,0.563895,0.966311,1.028446,1.386704,1.019769,2.251398,1.921009,1.806371,0.951667,1.312641,1.706791,2.319721,1.096288,2.016603,1.219276,0.711310,1.514662,1.223954,1.927196,0.977777,9.023102,1.842714,1.037084,4.320820,1.076432,0.608346,1.000454,0.830907,0.319562,1.448167,0.551810,1.201820,1.319489,0.991109,1.765913,0.786596,0.640124,1.012736,0.743734,0.758288,1.507977,0.602664,1.372594,0.752198,0.632819,1.231781,0.979239,0.666351,0.505361,0.315999,0.643624,1.456737,0.772146,3.109291,0.896029,0.932469
4,01002412,0.863152,0.535317,1.008430,1.300685,0.877139,0.772371,1.052063,1.128991,1.276539,0.338884,0.912151,1.371908,0.993805,1.363787,1.691931,1.149111,1.695642,1.353985,0.946088,0.739603,0.837236,1.219042,1.627303,0.896095,1.232910,0.635565,0.824078,1.354499,0.696302,0.850491,0.116368,1.331680,1.330306,1.336548,1.707707,0.970455,2.454634,1.285158,2.004822,0.874492,0.463814,1.506055,1.478072,0.644207,1.102536,0.699082,0.762516,0.667225,0.665948,1.119785,1.968280,0.740929,2.525954,0.973392,0.893094,0.902797,0.961872,1.004920,1.253473,0.809371,1.442111,0.966668,1.253539,0.962945,0.987827,2.745546,0.932228,1.008731,0.748856,2.432967,0.331273,1.425743,2.298414,0.827643,0.052189,0.981442,1.920976,1.034740,1.116247,1.259668,0.695022,0.832403,0.809243,0.921793,0.870250,1.016423,1.322008,1.365583,0.647609,1.114263,0.833467,1.375467,0.959994,0.939378,0.888631,2.022399,1.381412,0.542122,0.370307,...,0.993954,0.990161,0.375014,0.247210,0.997586,1.657402,0.988605,1.231948,5.352143,0.432327,2.105681,1.460228,2.133159,0.988333,1.756289,0.922048,1.400946,1.269941,0.830175,1.021127,1.136340,0.754905,1.012129,0.403511,1.536304,0.990189,0.952409,0.986874,0.314467,1.095291,1.854689,1.010113,1.586589,0.388884,0.261917,0.677321,0.299104,1.249010,0.354919,1.629255,0.916581,0.700685,1.823693,0.110104,1.154961,1.927119,0.953554,0.362096,0.684793,1.718999,1.165320,1.042208,1.512897,1.099416,1.071476,0.898256,1.077274,0.767719,0.961963,0.661606,1.105208,0.541328,0.556993,0.905297,1.010583,1.353932,2.052933,1.910046,2.137562,0.931497,0.998001,1.013768,1.217739,1.048890,1.108697,0.884804,1.009820,0.291430,1.409572,1.325102,1.166231,1.353643,2.557282,0.884912,0.988793,1.549910,0.601601,1.370806,0.564907,0.767939,0.934401,0.744207,0.922136,0.981230,1.143238,1.350473,0.725215,1.702258,1.010258,0.639387
6,01002471,2.064995,0.986490,1.308322,0.773852,0.760033,1.120927,0.864391,0.303651,1.272669,0.315599,0.995144,0.656958,0.964420,1.697865,1.024676,1.289724,2.051666,0.824469,1.151999,0.931829,0.660730,0.860587,2.224214,0.912627,0.781160,1.258297,0.815119,1.081719,1.136016,0.705771,0.804477,0.336264,1.139861,0.902644,1.039865,1.020039,0.995660,0.826441,0.589480,0.802184,1.277612,0.563587,0.582758,1.560815,1.026992,0.474899,1.603208,0.374648,0.676397,0.890703,1.300481,0.956750,0.730311,0.553297,1.064050,0.950831,1.008005,1.070929,0.615761,0.863889,1.417916,0.788280,1.720298,0.977289,0.693026,2.019326,0.955565,0.907692,1.073787,0.690338,1.025866,0.885360,0.435372,0.995659,0.744475,0.839650,1.611892,1.025128,1.195571,0.874040,0.950650,0.972500,0.968054,1.039965,1.030774,0.951808,0.988564,0.829006,0.823075,1.336834,0.830718,0.699213,0.944482,0.796977,1.052902,0.767993,0.945428,1.220494,1.124982,...,0.424669,1.074053,1.061026,1.623698,0.103251,1.183251,1.300748,0.157823,6.638761,2.703289,0.963890,0.581882,1.826102,1.006791,1.773629,1.582059,0.920416,0.544685,0.818892,0.588983,0.792668,0.997951,1.256255,0.182453,0.785908,0.787675,0.357447,0.202418,1.269296,0.809168,0.641894,1.065702,0.637479,1.114242,0.833660,0.693932,4.641100,0.923287,1.067618,1.300248,1.383848,0.427153,0.844063,0.355064,0.994877,1.219488,1.235941,0.680863,1.231617,1.021349,0.525346,0.574549,0.493011,0.850680,1.326200,0.880279,0.988154,0.997352,0.651892,1.537800,1.074156,1.010185,1.106668,1.404952,0.651197,0.871550,0.821550,0.553413,1.327705,2.160051,1.800796,0.934822,2.194548,0.723246,0.925423,1.113210,0.756221,1.279691,0.834587,0.835386,0.248901,0.816067,0.354885,1.293357,0.894301,1.332717,0.584096,0.622946,0.673490,1.647810,2.823129,0.822285,0.449556,1.873760,0.846569,1.708918,0.983414,0.865380,1.153715,0.980653
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3300,HX409129,0.293945,1.169026,2.116840,0.888013,0.994897,0.685195,2.681062,0.842799,1.212464,0.191386,0.924692,1.498795,0.775644,1.463832,1.410570,0.741907,0.754003,0.985389,1.000957,0.853879,0.985995,0.884191,1.363257,0.794610,1.049076,0.334771,0.791397,1.012681,0.907027,0.733194,0.999376,1.039812,1.016732,0.950115,1.174212,0.771902,1.272168,0.336448,1.932395,0.515055,0.291243,1.957355,1.209582,0.930509,0.768473,0.325320,0.870067,0.171186,0.802546,1.026871,0.860504,1.638939,1.161628,1.054982,0.936356,0.699198,1.134129,1.056094,1.200610,0.917835,1.772614,1.240209,1.359660,0.985741,1.196599,2.376415,0.984309,0.914006,0.882419,1.376412,1.137091,0.755141,0.787131,1.155326,1.046611,1.054763,1.783531,0.770417,0.891620,0.571094,1.042764,0.916201,0.973237,0.748718,1.109750,0.878201,1.667638,1.222129,1.008472,0.781168,1.337876,0.878307,0.978517,1.005622,0.677396,1.100451,1.059340,0.952044,0.834551,...,0.410554,0.994271,0.490613,3.310144,0.997586,0.595945,1.046722,0.285591,0.676871,0.770590,0.216563,0.873380,1.017005,0.582037,0.791514,0.359549,0.671983,1.052018,0.646661,1.002885,0.287626,2.428708,0.334983,0.657411,0.956441,1.382889,5.221789,0.986874,0.982858,1.182890,1.000685,0.726752,0.992763,0.423556,0.297706,0.956572,1.001347,0.361518,0.927303,1.016359,0.984213,1.339607,0.328432,0.961425,1.160430,1.270745,0.702943,0.996005,0.716331,0.143873,1.645232,1.858631,0.467638,1.642978,0.845299,0.635652,0.978217,0.753862,1.013957,0.931314,0.949513,2.396748,0.213364,0.992708,1.245224,0.707155,1.026085,1.115858,1.013171,0.782362,0.787242,0.498829,0.052159,1.725756,0.610755,0.860259,0.750734,0.509069,1.418470,1.594174,0.942591,0.343925,0.907863,1.123352,1.052340,0.993945,1.132403,0.994872,0.958700,1.208956,0.795302,1.132065,2.370099,0.665257,1.230591,1.374512,0.271015,1.016984,1.010258,0.943314
3301,HX460562,0.967099,1.137992,1.731506,0.676390,0.804149,1.313167,1.003930,0.842896,1.034660,4.892710,1.349325,0.590254,0.773872,0.660153,0.810674,2.134438,1.411470,0.812872,1.117198,1.053634,0.901961,1.180933,0.808491,1.213340,1.191766,0.476361,1.417045,1.003818,1.226775,0.916593,1.060786,0.516050,0.989456,0.908439,0.746589,0.851187,0.934748,0.951570,1.020632,1.925098,1.664708,1.167862,0.777275,1.137106,0.874898,0.750916,0.988063,4.855933,0.852488,0.978802,0.648442,0.942340,0.989756,0.907819,1.058649,0.820754,1.094881,1.328300,0.854746,1.141695,0.873659,1.340750,0.840141,1.075907,1.168893,1.007298,1.162655,0.858106,1.023615,0.722871,0.951191,0.698737,0.675141,1.071068,2.123250,1.123728,0.843348,0.835169,1.028974,1.364395,1.044989,1.059805,1.549351,1.096307,1.214988,1.188926,1.696757,1.419263,0.856461,1.325343,1.686169,0.814738,1.152513,1.313716,1.300659,0.938338,0.949432,1.926365,1.886206,...,0.748818,1.311752,0.812088,0.899447,2.316296,1.372724,0.896752,0.787117,1.049491,0.373941,1.209983,0.967430,1.017005,1.006791,0.989995,0.879710,1.311278,0.697377,0.423724,0.657753,1.019636,0.997951,0.710309,4.851325,0.813197,0.569748,0.970008,0.986874,0.982858,0.830176,1.123124,1.242655,0.295063,0.595950,1.066278,1.009418,1.001347,0.670436,0.311704,0.431748,0.564371,1.172605,0.884355,1.493247,0.837906,0.669872,1.194474,0.674922,0.683711,0.998965,0.556303,0.992172,4.747186,1.100764,1.183830,1.000043,0.978217,0.997352,0.364934,0.490303,1.178855,0.990652,0.833629,0.931017,0.736767,1.297460,1.026085,0.696111,1.109097,1.488904,0.848086,0.388493,0.361643,1.002261,0.628152,0.650280,0.735295,1.149918,1.052895,1.036297,0.871674,0.818190,0.675211,1.529002,1.111636,1.514023,0.592653,0.771967,0.344492,1.457742,1.196898,0.637983,1.280635,1.552814,0.681650,1.256991,1.027760,0.947308,1.123345,0.854447
3302,HX794171,0.847237,0.739835,0.660610,0.742720,0.994897,1.022540,0.984920,0.892882,0.556806,1.020689,1.271883,0.908899,0.562607,1.606326,1.081211,0.566162,0.842122,0.921913,1.014110,0.813691,0.263425,0.852257,0.999842,0.644714,0.737477,1.012418,1.666856,1.175950,1.213544,1.147164,0.697014,3.227658,1.022125,0.764084,1.008475,1.134923,1.501059,0.681087,0.421655,0.494839,0.825173,0.357887,1.202161,1.440885,0.495096,1.136502,0.927470,0.952889,0.881206,0.866427,0.656156,0.956750,0.989756,0.777884,1.104414,1.006929,0.977068,0.860101,1.037788,0.959999,1.228826,0.608739,1.139937,1.052226,1.527722,1.686543,0.870300,1.009112,1.407180,1.103513,1.003782,0.738829,0.993264,0.999600,0.085900,0.660701,1.199279,0.745457,0.896482,2.946901,0.677493,0.883825,1.034886,0.872393,1.049007,0.895331,1.978742,1.037701,0.900396,1.387039,1.029819,0.998073,0.902280,0.813330,1.004686,1.071418,0.465846,0.771074,0.145891,...,0.674068,1.132728,0.916876,1.392433,0.997586,1.411063,1.303827,0.297318,0.903516,0.141576,2.294990,2.063530,0.330872,0.862191,0.989995,3.297034,1.525793,1.052018,0.690899,1.389069,1.153200,0.835391,1.930300,12.494666,1.246260,1.229625,0.970008,0.743217,0.648438,1.656908,1.629688,0.885974,0.727675,0.870340,0.365335,1.432755,0.658996,0.908713,0.442705,0.741779,0.806280,2.874496,1.281355,0.914997,1.361995,1.826027,0.831349,0.996005,0.808922,0.241492,1.878353,1.674086,1.619529,2.006647,0.887967,1.747914,1.013042,1.235154,1.497222,0.931314,0.833656,0.574115,0.486881,0.992708,0.941280,1.394025,1.026085,1.301059,1.294317,1.412740,0.541051,0.586660,1.251593,1.924372,1.005923,0.864534,1.174404,1.832098,1.392178,1.514256,0.633108,1.216083,1.037989,1.563296,1.632232,0.675297,0.988642,1.097448,0.833378,0.940232,1.126640,1.023881,1.296063,0.553423,0.969611,1.285084,1.733623,0.935738,1.010258,1.124675
3303,INEW,0.958132,2.187877,1.635473,0.793053,0.826271,2.112935,1.446977,1.236833,2.500101,4.786991,0.888386,2.051927,0.436781,0.904626,1.013039,1.232329,3.505438,0.811308,0.900621,1.412596,1.981013,0.720299,1.135925,0.876337,1.276568,2.785307,1.378173,1.118191,1.891294,0.526987,1.658525,0.561925,1.233850,1.435658,1.123733,1.145211,0.714259,1.354412,3.973211,0.817582,1.382921,4.777693,1.118794,0.786007,0.885228,0.919234,0.843833,2.441447,0.984592,0.993432,1.569950,0.808409,1.858431,1.474923,1.203146,0.937171,1.174463,0.993878,1.331893,1.048720,0.986489,1.975936,0.801913,1.034652,1.108172,1.169664,1.130142,0.920667,1.152048,1.423575,1.335704,1.281314,0.302595,0.736015,1.973289,1.157142,1.022229,1.375249,1.013729,0.506573,1.171922,0.883873,1.013466,1.122071,1.359226,0.964647,0.564049,1.016824,0.824540,1.043635,0.821326,0.588487,1.105307,0.955032,0.972875,1.143334,1.271508,0.561454,4.925820,...,2.038145,1.546206,0.907311,1.458233,0.085822,1.009130,1.118734,2.487615,0.376692,3.337197,1.067689,0.517654,2.432184,0.751093,0.917748,0.582558,0.741585,0.545501,1.630514,0.694774,1.104264,0.258609,0.665797,0.241260,0.983612,1.566991,0.174873,0.153320,0.816234,0.971794,1.259316,2.006549,0.775108,1.270336,1.008525,1.332353,1.483697,0.738098,1.596064,0.257389,0.620371,0.836804,0.476419,3.334104,0.757069,1.102936,1.397552,0.806825,0.682566,0.403907,0.797098,0.984870,0.678347,1.140204,0.915967,1.355472,0.972091,1.547769,0.677287,0.958792,1.087288,0.964500,1.401698,1.404048,1.248806,0.769752,0.997274,1.339972,2.100294,0.999283,0.893002,2.616666,0.064125,0.936390,1.492462,0.885103,0.989237,0.991109,0.548039,0.909615,0.567963,1.305335,1.063255,0.798746,0.531192,1.083452,1.911078,1.535510,1.963208,0.874430,0.459620,0.639348,0.670493,3.087680,0.970384,1.066472,0.983414,1.161242,0.629977,0.629693


In [5]:
#Get BMI data
bmi = adi.get_snapshot('weight_monthly')
bmi = bmi[['public_client_id','days_in_program','BMI_CALC']] # Keep relevant columns
bmi = bmi.sort_values('days_in_program',ascending=True) # Sort by days in program
bmi = bmi.sort_values('public_client_id',ascending=True) # Sort by PCI
bmi = bmi.drop('days_in_program', axis=1) # Drop days column (unneeded at this point)
bmi = bmi.drop_duplicates('public_client_id') # Drop duplicate PCI
#bmi = bmi.set_index('public_client_id') # Arrange index by PCI
bmi = bmi.dropna() # Drop PCI with no BMI data
bmi #5567 individuals

  t = pandas.to_datetime(x.str.replace("^arivale_snapshot.*(\\d{4}-\\d{2}-\\d{2}_\\d{4})$", "\\1"), format="%Y-%m-%d_%H%M")
  colnames = hdr.loc[~hdr.str.contains("^#")].head(1).str.replace("\n$","")
  hdr = hdr.loc[hdr.str.contains("^#")].str.replace("\n$","")
  fields = hdr.str.replace("^# [^:]+: *(.*)$",r"\1")
  fields.index = hdr.str.replace("^# ([^:]+):.*$",r"\1")
  return "\n".join(list(hdr.loc[hdr.index >= i].str.replace("^# ","")))


Unnamed: 0,public_client_id,BMI_CALC
0,01000261,22.594123
3,01000552,31.619378
5,01001181,39.047808
8,01001298,25.948604
14,01001548,36.119222
...,...,...
46475,QIRL,31.942410
46562,ZU273983,32.042139
46566,ZU612255,36.045023
46569,ZU621944,51.577264


In [6]:
#Now, get the Assessments data
bio=adi.get_snapshot('clients')
a = bio['sex']
b = bio['age']
c = bio['public_client_id']
biodf = pd.DataFrame({'sex':a, 'age':b, 'public_client_id':c}) # Get df with desired columns
biodf = biodf[['sex','age','public_client_id']]
#biodf = biodf.set_index('public_client_id') # Arrange index by PCI
biodf = biodf.dropna()
biodf = biodf.replace(to_replace = 'F', value = 'W') # Replace F with W so R Studio doesn't interpret women as a boolean
biodf #6133 individuals

  t = pandas.to_datetime(x.str.replace("^arivale_snapshot.*(\\d{4}-\\d{2}-\\d{2}_\\d{4})$", "\\1"), format="%Y-%m-%d_%H%M")
  colnames = hdr.loc[~hdr.str.contains("^#")].head(1).str.replace("\n$","")
  hdr = hdr.loc[hdr.str.contains("^#")].str.replace("\n$","")
  fields = hdr.str.replace("^# [^:]+: *(.*)$",r"\1")
  fields.index = hdr.str.replace("^# ([^:]+):.*$",r"\1")
  return "\n".join(list(hdr.loc[hdr.index >= i].str.replace("^# ","")))


Unnamed: 0,sex,age,public_client_id
0,M,54.0,01000552
1,W,52.0,01000978
2,W,48.0,01001181
3,W,61.0,01001298
4,W,31.0,01001467
...,...,...,...
6128,W,44.0,QIRL
6129,W,32.0,ZU273983
6130,W,35.0,ZU612255
6131,W,37.0,ZU621944


In [7]:
# Merge dfs
output_df = pd.merge(biodf,bmi)
output_df = pd.merge(output_df,eGFR)
output_df = pd.merge(output_df,bowel)
output_df = pd.merge(output_df,rawmet)
metab = output_df

metab = metab.set_index('public_client_id')

#Metadata for R Studio - LIMMA:
metab.iloc[:,:5].to_csv('metab_meta.csv')

#Metabolite count data for R Studio - LIMMA
metab.iloc[:,5:].transpose().to_csv('metab_counts.csv')

#Full dataframe:
metab.to_csv('metab_full.csv')

#Rearrange df for metabolite heatmap
metab_hm = metab
metab_hm = metab_hm.reset_index() # Remove PCI from the index
metab_hm = metab_hm.drop(columns = ['public_client_id','sex','age','BMI_CALC']) # Drop columns that aren't metabolite or bowel
metab_hm = metab_hm.set_index('bowel') # Arrange index by bowel (BMF)
metab_hm.to_csv('metab_hm.csv')

metab

Unnamed: 0_level_0,sex,age,BMI_CALC,eGFR,bowel,35,50,55,62,93,98,111,112,132,136,158,171,179,180,181,182,189,192,194,197,209,212,229,231,234,235,240,241,244,250,252,254,266,267,273,275,278,279,297,302,310,313,330,331,338,339,340,342,344,355,356,358,361,363,376,391,397,407,409,415,424,432,439,444,445,452,460,461,480,482,491,498,501,503,504,512,519,533,535,537,561,563,564,565,566,572,796,798,799,800,803,806,811,815,821,...,999946616,999946620,999946623,999946624,999946627,999946632,999946633,999946636,999946639,999946645,999946646,999946657,999946666,999946673,999946674,999946681,999946685,999946690,999946695,999946700,999946701,999946705,999946707,999946710,999946902,999946905,999946911,999946966,999946970,999946972,999946973,999946977,999946986,999946997,999946998,999947006,999947011,999947417,999947437,999947478,999947493,999947642,999947650,999947654,999947670,999947671,999947687,999947708,999947788,999947790,999947802,999947804,999947818,999947820,999947905,999947929,999947955,999947959,999947971,999947977,999947988,999947993,999948001,999948009,999948047,999948076,999948081,999948094,999949463,999949512,999949515,999949517,999949521,999949555,999949557,999949592,999949637,999949679,999949681,999949883,999952025,999952286,999952483,999952501,999952502,999952504,999952524,999952533,999952640,999952661,999952843,999952865,999952867,999952870,999952877,999952909,999953114,999953157,999953267,999954840
public_client_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1,Unnamed: 177_level_1,Unnamed: 178_level_1,Unnamed: 179_level_1,Unnamed: 180_level_1,Unnamed: 181_level_1,Unnamed: 182_level_1,Unnamed: 183_level_1,Unnamed: 184_level_1,Unnamed: 185_level_1,Unnamed: 186_level_1,Unnamed: 187_level_1,Unnamed: 188_level_1,Unnamed: 189_level_1,Unnamed: 190_level_1,Unnamed: 191_level_1,Unnamed: 192_level_1,Unnamed: 193_level_1,Unnamed: 194_level_1,Unnamed: 195_level_1,Unnamed: 196_level_1,Unnamed: 197_level_1,Unnamed: 198_level_1,Unnamed: 199_level_1,Unnamed: 200_level_1,Unnamed: 201_level_1
01001621,W,54.0,23.627456,69.439409,2,1.819302,0.704097,0.619724,1.014908,1.334809,1.341022,0.971382,0.977802,0.437747,0.597480,0.981717,0.373895,2.085763,0.567837,0.650733,0.983778,1.036290,0.888782,1.192718,0.666124,1.047442,1.219334,0.663285,1.661423,0.694435,2.090090,1.321783,0.546186,0.927013,0.484962,1.264994,0.683409,0.999556,1.063370,0.955280,1.053888,0.834389,0.813427,0.566890,1.378451,1.030161,0.557247,1.359100,1.121047,1.189167,2.339233,1.287490,0.819302,1.526069,0.914017,0.778223,1.437623,0.681799,0.851270,0.929102,1.152256,0.817847,0.871570,1.169466,0.909120,0.644457,1.023283,1.009925,1.015428,0.987975,0.379701,0.962439,1.500350,1.197596,0.760786,0.951191,0.820892,0.538089,0.999284,0.765463,1.128796,0.533141,1.162388,0.894506,1.426137,0.529222,1.009188,1.318555,0.915440,0.804123,0.996878,0.693355,1.003074,0.849613,1.615323,0.603969,0.592127,1.113037,0.968207,1.119836,...,2.841334,0.614300,0.992375,0.687927,0.997586,1.173688,1.005829,1.607427,1.486123,1.030870,1.722813,1.324431,1.017005,17.098502,0.989995,0.990457,1.085562,0.665675,2.055824,1.180362,1.080516,0.667261,0.769920,1.957673,2.227080,1.389496,0.970008,0.781084,2.302494,0.591117,1.199069,1.224311,1.254009,0.982351,0.247112,1.001132,1.001347,0.734604,3.553576,1.063844,0.984213,2.135471,2.320744,0.961425,0.814772,1.462328,0.894339,0.996005,1.288771,1.021349,0.753729,0.661740,2.258629,1.251819,1.479819,2.515144,1.096075,0.997352,1.830214,0.686897,2.077862,0.990652,0.526165,0.992708,0.980669,1.078174,1.028737,1.011223,1.013171,1.454377,0.872246,1.013768,10.215746,1.694952,0.627407,0.558186,0.808554,0.991109,1.203914,1.281067,0.988128,0.718099,0.516304,1.284870,1.022681,0.679225,0.713206,0.994872,2.363626,0.940232,0.820114,0.961806,1.015091,1.016476,1.742466,0.525021,0.983414,0.737648,0.844609,0.980653
01002471,W,56.0,30.509302,82.686835,3,2.064995,0.986490,1.308322,0.773852,0.760033,1.120927,0.864391,0.303651,1.272669,0.315599,0.995144,0.656958,0.964420,1.697865,1.024676,1.289724,2.051666,0.824469,1.151999,0.931829,0.660730,0.860587,2.224214,0.912627,0.781160,1.258297,0.815119,1.081719,1.136016,0.705771,0.804477,0.336264,1.139861,0.902644,1.039865,1.020039,0.995660,0.826441,0.589480,0.802184,1.277612,0.563587,0.582758,1.560815,1.026992,0.474899,1.603208,0.374648,0.676397,0.890703,1.300481,0.956750,0.730311,0.553297,1.064050,0.950831,1.008005,1.070929,0.615761,0.863889,1.417916,0.788280,1.720298,0.977289,0.693026,2.019326,0.955565,0.907692,1.073787,0.690338,1.025866,0.885360,0.435372,0.995659,0.744475,0.839650,1.611892,1.025128,1.195571,0.874040,0.950650,0.972500,0.968054,1.039965,1.030774,0.951808,0.988564,0.829006,0.823075,1.336834,0.830718,0.699213,0.944482,0.796977,1.052902,...,0.424669,1.074053,1.061026,1.623698,0.103251,1.183251,1.300748,0.157823,6.638761,2.703289,0.963890,0.581882,1.826102,1.006791,1.773629,1.582059,0.920416,0.544685,0.818892,0.588983,0.792668,0.997951,1.256255,0.182453,0.785908,0.787675,0.357447,0.202418,1.269296,0.809168,0.641894,1.065702,0.637479,1.114242,0.833660,0.693932,4.641100,0.923287,1.067618,1.300248,1.383848,0.427153,0.844063,0.355064,0.994877,1.219488,1.235941,0.680863,1.231617,1.021349,0.525346,0.574549,0.493011,0.850680,1.326200,0.880279,0.988154,0.997352,0.651892,1.537800,1.074156,1.010185,1.106668,1.404952,0.651197,0.871550,0.821550,0.553413,1.327705,2.160051,1.800796,0.934822,2.194548,0.723246,0.925423,1.113210,0.756221,1.279691,0.834587,0.835386,0.248901,0.816067,0.354885,1.293357,0.894301,1.332717,0.584096,0.622946,0.673490,1.647810,2.823129,0.822285,0.449556,1.873760,0.846569,1.708918,0.983414,0.865380,1.153715,0.980653
01003555,M,47.0,28.478009,63.708606,2,0.713570,0.897179,0.976676,0.820367,1.964455,1.415588,0.843104,1.389681,1.421328,0.537021,1.359196,1.014580,0.918333,1.054004,0.759117,1.049928,1.375178,0.845334,0.981321,1.252526,1.476926,1.238355,1.361816,1.348515,1.394327,1.818558,1.177932,1.726719,1.113264,0.812268,1.508218,0.512731,1.428186,0.951118,0.816564,1.101993,1.339927,0.977231,2.119731,0.589790,0.905860,1.874549,1.365351,1.694305,1.294768,1.354593,0.983640,0.131881,1.475468,0.981385,0.788895,1.286581,1.091763,1.010909,0.973068,1.410487,0.902712,0.975781,1.201931,0.969104,0.970873,1.338672,1.058174,1.071675,1.862286,0.523392,0.985914,0.668120,0.982488,1.071656,0.944810,1.247801,0.729379,0.847234,0.107208,1.416709,0.899301,0.978225,1.137825,1.320800,1.387588,0.996499,0.942360,0.984776,0.805358,1.292644,0.802839,0.977959,0.949317,0.718971,1.118957,1.182887,1.044560,1.241617,1.102927,...,0.991387,0.845887,1.419193,0.971489,3.899467,1.243230,1.045731,0.145278,0.389913,1.030870,0.923509,0.967430,0.146579,0.699347,1.065783,1.733403,1.095966,0.329736,1.623750,0.989430,1.579610,0.476885,1.236641,1.322971,0.976375,0.965286,1.641501,0.821471,1.917424,0.814441,1.663249,1.173894,0.274558,0.799619,1.203418,0.987991,0.640598,0.789030,2.509215,0.528743,0.984213,0.761631,1.491240,0.961425,1.476512,1.630495,0.983273,0.915848,0.809503,1.001555,0.849102,1.136716,0.951667,1.262799,1.302637,1.000043,1.676921,0.997352,1.430802,4.679011,0.665931,0.990652,1.201188,0.992708,1.554672,1.095746,1.026085,1.181587,1.971323,1.292997,3.009653,2.107568,9.145998,0.901270,1.324128,0.508566,1.259130,1.139569,0.576665,0.482035,0.997160,1.115130,1.000361,0.785112,0.534536,1.050690,1.646978,1.107560,0.972626,0.940232,2.205788,1.282597,0.753864,0.818380,1.411935,1.283322,1.126584,1.009515,1.041174,1.781095
01003758,W,33.0,25.821855,115.064998,3,1.067010,2.168985,1.537199,1.013175,0.756108,0.562948,0.428667,1.224927,0.366127,0.462658,1.295006,0.150034,0.775881,0.867852,0.855136,0.674270,0.748127,1.569472,0.677684,1.044402,1.152995,0.589538,1.210516,0.930204,0.940145,0.621822,0.640778,0.772121,0.488692,3.129046,0.749586,1.692857,0.896615,1.119981,0.925403,0.733014,0.849183,0.649744,1.142193,0.734443,0.413235,1.293695,0.901920,0.545643,1.160859,0.802013,1.502427,0.356585,0.996642,0.620162,0.655730,1.102649,0.588964,1.146353,0.803743,0.862584,0.779088,0.732137,1.010273,0.913282,0.772737,1.186139,0.783715,0.742832,0.852776,0.984365,0.901400,0.754456,0.782378,0.710058,2.477820,0.883111,0.928833,1.049833,1.683627,1.290540,0.825076,0.754360,0.994064,0.802964,0.675195,1.056781,0.992867,0.841595,0.780347,0.944063,0.820807,0.368460,1.125684,1.147881,1.082632,0.848912,0.992055,0.720489,0.877495,...,0.796038,1.027894,0.379700,0.553727,0.997586,0.922785,0.972484,0.627501,1.164141,0.851734,0.390711,1.234045,0.287741,1.449629,1.468004,1.054282,0.910643,0.206883,1.282742,0.583285,1.224186,0.997951,1.292729,0.814920,0.647673,0.666988,3.348634,0.986874,0.982858,0.633363,1.008151,0.322529,0.526762,0.628932,0.634019,0.638055,1.380316,0.913146,0.865701,1.016359,0.984213,2.249568,0.800398,1.777224,1.122156,3.276764,0.770233,0.853634,0.813877,1.021349,1.285427,1.073307,0.434133,1.391757,0.490760,0.965698,0.547810,1.005952,0.464385,0.931314,1.389376,0.610523,0.288600,1.195711,0.694499,0.907431,1.026085,1.417172,4.233176,0.492691,1.128916,0.575542,3.527939,1.327478,1.160205,0.992546,1.052884,2.944504,2.547333,1.119906,0.602167,0.917149,1.064515,0.506051,0.501626,1.389399,0.640876,0.330888,0.958700,1.502846,1.088446,0.602580,0.444576,1.571371,1.610660,0.463138,0.983414,0.698853,1.042826,0.356784
01004551,W,35.0,31.952683,108.136716,1,0.924290,0.783514,0.819616,0.865116,0.996610,0.659450,0.486425,0.791334,0.461329,0.743150,1.374979,1.435289,1.048871,0.536022,0.984939,0.973936,0.878626,1.187911,0.948794,0.588183,0.514478,1.082091,0.459974,1.227662,0.579511,1.168911,0.720258,0.947287,0.991814,0.347021,1.145647,0.408127,1.154793,0.562955,0.483398,0.996915,0.508651,1.414554,1.233232,0.643116,0.928997,0.953524,1.061203,0.501286,1.094705,2.212527,1.476387,1.311195,0.803089,0.935156,0.453224,2.016072,1.211724,0.960567,0.940896,1.048062,0.896067,1.120463,1.000725,1.087456,0.568373,0.467972,0.545831,1.079642,1.028315,1.111456,0.887262,1.000402,1.086979,1.163601,0.951191,0.836500,0.378969,1.266804,0.327363,0.738912,0.823866,0.931847,0.887833,1.610089,0.438380,1.038204,1.429244,0.938744,0.854963,0.896906,0.507715,0.314437,1.041597,0.844394,1.358281,0.690816,1.109174,0.953029,1.014453,...,1.341862,0.672256,0.535020,0.880689,0.997586,0.595036,0.573543,0.253140,1.049491,0.827686,0.669609,0.737971,1.404561,0.806951,0.528285,0.955262,0.515337,0.873213,0.697856,0.505139,0.583253,2.489396,1.065657,0.159338,1.502045,1.054228,0.137080,1.510755,0.927190,0.800731,1.319549,1.267136,0.327576,0.982351,0.851250,0.864204,0.962607,1.155048,0.541076,1.016359,0.984213,1.944418,0.594811,0.961425,0.445658,0.826722,1.131721,1.162101,0.781572,1.021349,0.481466,0.439164,0.951667,0.530844,1.601412,1.000043,1.002634,0.734719,4.310923,0.931314,0.969495,0.912360,0.322138,0.691514,0.778879,0.527209,0.529235,0.406135,3.042761,1.253389,0.802074,0.847684,0.549907,0.462941,0.578404,0.617351,0.678313,1.663775,0.969487,0.999338,1.272280,1.872679,0.370907,1.240225,1.063716,1.200804,1.696334,1.418185,2.263225,0.940232,0.986138,1.023881,0.564303,1.173441,0.969611,0.269416,0.983414,0.654025,0.338930,0.876061
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
01998999,M,57.0,18.783706,100.993545,3,2.508696,1.795655,1.650015,1.347469,0.966869,1.069195,0.863598,1.075435,0.196224,0.395478,0.881317,0.604372,0.964420,0.712967,0.889432,1.249995,1.126224,1.320210,1.211493,0.830784,0.536195,1.589204,0.909554,0.984077,0.531973,1.438702,0.927149,1.806263,0.654396,1.949552,1.038978,0.638326,1.296966,1.156078,0.935015,1.081554,0.579501,0.741122,0.579581,1.004136,0.782254,0.611950,1.376768,0.941985,1.444692,0.772254,1.019604,0.316845,1.465209,1.057891,1.087244,0.956750,0.558618,1.270739,0.831071,1.073354,0.952736,0.993423,1.208977,0.993319,0.815774,1.180858,0.760556,0.921711,1.449046,1.139077,1.265083,0.842730,0.793005,0.814779,1.850678,1.319570,0.445153,0.829684,1.615393,0.987449,1.062912,1.075204,0.858863,0.671010,0.494076,1.073192,0.911766,1.155252,0.904768,0.995699,0.745505,1.039798,1.411075,0.977694,0.710814,1.463846,1.073576,0.766515,1.269176,...,1.539688,1.002253,20.053540,0.367076,0.997586,0.806152,0.678568,0.756975,1.334511,1.861676,2.030724,0.933575,3.728086,1.006791,0.989995,0.400730,1.020503,12.257630,0.811382,1.073906,2.096620,2.942871,1.398205,0.890606,0.976375,1.208060,0.227507,0.986874,0.899228,1.346519,1.008151,0.966306,0.452115,0.733195,2.533991,1.288400,0.887183,1.292428,1.399023,0.458055,0.984213,1.534976,2.012718,10.873986,0.568048,0.774962,1.383787,2.452739,1.486011,0.459433,1.317110,1.473895,0.587802,1.356544,1.662648,1.165203,0.959254,0.875942,0.707158,0.789669,1.251459,1.537558,1.677781,0.928571,1.291811,0.985679,0.930923,0.945103,0.195948,1.248705,1.885807,1.807789,1.987864,1.566631,1.032821,0.857585,1.528057,1.059655,0.995406,1.125263,1.276904,1.507432,1.334403,2.060474,1.556957,0.993945,3.918230,0.830448,2.351900,0.940232,1.055523,1.333549,0.690017,1.016476,1.369746,1.260805,0.983414,2.033027,1.010258,0.996457
HX344502,W,44.0,26.927286,114.368652,3,0.958132,0.328335,1.378031,1.085398,1.017652,1.026411,2.659871,0.716476,0.526556,0.193007,1.064625,1.726289,0.784984,1.674860,1.699388,0.454474,0.616601,0.812281,0.834688,0.513354,0.588382,0.470242,0.911506,0.823500,0.683931,0.250738,1.046513,0.724800,0.893319,0.729063,0.910272,8.925657,1.058197,0.503429,0.863477,0.822236,1.131487,0.469579,0.836323,0.699158,0.315727,0.825738,1.189764,0.706820,0.602780,0.867663,1.032199,0.942461,1.153447,0.841459,0.806228,0.956750,1.500843,0.790383,0.913130,1.150227,0.974718,0.928717,0.820447,0.838576,1.524940,0.523966,1.267656,1.139770,0.879645,2.231031,0.851949,0.958683,0.847188,1.605974,0.930248,0.596140,1.486393,1.226515,0.173168,0.648306,1.713089,0.938782,0.767580,2.265104,0.578348,0.972979,1.269775,0.666839,1.109542,0.904396,1.842826,0.804778,1.094852,0.795559,1.006802,0.998073,0.815495,0.653424,0.637053,...,0.463037,0.996104,0.992375,0.902055,1.236390,0.959643,1.005829,0.550839,1.049491,0.141374,1.534063,0.698622,0.546947,0.850108,0.826627,1.248228,0.746160,1.052018,0.526074,1.021127,1.019636,0.523639,0.582503,0.996968,0.790610,2.165350,4.091047,0.812006,0.982858,1.110274,0.442719,0.604789,0.992763,0.395443,1.022473,1.009418,0.345277,0.755476,0.418543,1.016359,0.984213,1.515164,1.101401,0.961425,0.387223,0.916668,0.630210,0.996005,0.247199,1.364434,2.167576,2.443513,0.951667,1.677750,0.724815,1.000043,0.978217,0.997352,2.607406,1.179918,0.367036,1.395897,1.011033,0.534604,1.337429,0.769548,1.026085,1.434100,1.261288,0.616300,0.919501,0.299344,0.998299,1.765674,0.266097,1.037445,0.609443,1.239690,1.380517,1.312319,0.738349,0.344999,0.805630,0.968207,1.507689,0.993945,0.482679,0.994872,0.392112,1.123720,0.875749,0.693498,0.584476,0.876747,0.377163,0.540882,0.595506,0.863708,0.718484,0.660657
HX409129,W,47.0,29.635969,110.039613,3,0.293945,1.169026,2.116840,0.888013,0.994897,0.685195,2.681062,0.842799,1.212464,0.191386,0.924692,1.498795,0.775644,1.463832,1.410570,0.741907,0.754003,0.985389,1.000957,0.853879,0.985995,0.884191,1.363257,0.794610,1.049076,0.334771,0.791397,1.012681,0.907027,0.733194,0.999376,1.039812,1.016732,0.950115,1.174212,0.771902,1.272168,0.336448,1.932395,0.515055,0.291243,1.957355,1.209582,0.930509,0.768473,0.325320,0.870067,0.171186,0.802546,1.026871,0.860504,1.638939,1.161628,1.054982,0.936356,0.699198,1.134129,1.056094,1.200610,0.917835,1.772614,1.240209,1.359660,0.985741,1.196599,2.376415,0.984309,0.914006,0.882419,1.376412,1.137091,0.755141,0.787131,1.155326,1.046611,1.054763,1.783531,0.770417,0.891620,0.571094,1.042764,0.916201,0.973237,0.748718,1.109750,0.878201,1.667638,1.222129,1.008472,0.781168,1.337876,0.878307,0.978517,1.005622,0.677396,...,0.410554,0.994271,0.490613,3.310144,0.997586,0.595945,1.046722,0.285591,0.676871,0.770590,0.216563,0.873380,1.017005,0.582037,0.791514,0.359549,0.671983,1.052018,0.646661,1.002885,0.287626,2.428708,0.334983,0.657411,0.956441,1.382889,5.221789,0.986874,0.982858,1.182890,1.000685,0.726752,0.992763,0.423556,0.297706,0.956572,1.001347,0.361518,0.927303,1.016359,0.984213,1.339607,0.328432,0.961425,1.160430,1.270745,0.702943,0.996005,0.716331,0.143873,1.645232,1.858631,0.467638,1.642978,0.845299,0.635652,0.978217,0.753862,1.013957,0.931314,0.949513,2.396748,0.213364,0.992708,1.245224,0.707155,1.026085,1.115858,1.013171,0.782362,0.787242,0.498829,0.052159,1.725756,0.610755,0.860259,0.750734,0.509069,1.418470,1.594174,0.942591,0.343925,0.907863,1.123352,1.052340,0.993945,1.132403,0.994872,0.958700,1.208956,0.795302,1.132065,2.370099,0.665257,1.230591,1.374512,0.271015,1.016984,1.010258,0.943314
HX460562,W,48.0,45.708683,108.943104,3,0.967099,1.137992,1.731506,0.676390,0.804149,1.313167,1.003930,0.842896,1.034660,4.892710,1.349325,0.590254,0.773872,0.660153,0.810674,2.134438,1.411470,0.812872,1.117198,1.053634,0.901961,1.180933,0.808491,1.213340,1.191766,0.476361,1.417045,1.003818,1.226775,0.916593,1.060786,0.516050,0.989456,0.908439,0.746589,0.851187,0.934748,0.951570,1.020632,1.925098,1.664708,1.167862,0.777275,1.137106,0.874898,0.750916,0.988063,4.855933,0.852488,0.978802,0.648442,0.942340,0.989756,0.907819,1.058649,0.820754,1.094881,1.328300,0.854746,1.141695,0.873659,1.340750,0.840141,1.075907,1.168893,1.007298,1.162655,0.858106,1.023615,0.722871,0.951191,0.698737,0.675141,1.071068,2.123250,1.123728,0.843348,0.835169,1.028974,1.364395,1.044989,1.059805,1.549351,1.096307,1.214988,1.188926,1.696757,1.419263,0.856461,1.325343,1.686169,0.814738,1.152513,1.313716,1.300659,...,0.748818,1.311752,0.812088,0.899447,2.316296,1.372724,0.896752,0.787117,1.049491,0.373941,1.209983,0.967430,1.017005,1.006791,0.989995,0.879710,1.311278,0.697377,0.423724,0.657753,1.019636,0.997951,0.710309,4.851325,0.813197,0.569748,0.970008,0.986874,0.982858,0.830176,1.123124,1.242655,0.295063,0.595950,1.066278,1.009418,1.001347,0.670436,0.311704,0.431748,0.564371,1.172605,0.884355,1.493247,0.837906,0.669872,1.194474,0.674922,0.683711,0.998965,0.556303,0.992172,4.747186,1.100764,1.183830,1.000043,0.978217,0.997352,0.364934,0.490303,1.178855,0.990652,0.833629,0.931017,0.736767,1.297460,1.026085,0.696111,1.109097,1.488904,0.848086,0.388493,0.361643,1.002261,0.628152,0.650280,0.735295,1.149918,1.052895,1.036297,0.871674,0.818190,0.675211,1.529002,1.111636,1.514023,0.592653,0.771967,0.344492,1.457742,1.196898,0.637983,1.280635,1.552814,0.681650,1.256991,1.027760,0.947308,1.123345,0.854447


In [8]:
#Output the metabolomics metatadata df from Arivale
meta = adi.get_snapshot('metabolomics_metadata')
meta.to_csv('metabolomics_fullmetadata.csv')

  t = pandas.to_datetime(x.str.replace("^arivale_snapshot.*(\\d{4}-\\d{2}-\\d{2}_\\d{4})$", "\\1"), format="%Y-%m-%d_%H%M")
  colnames = hdr.loc[~hdr.str.contains("^#")].head(1).str.replace("\n$","")
  hdr = hdr.loc[hdr.str.contains("^#")].str.replace("\n$","")
  fields = hdr.str.replace("^# [^:]+: *(.*)$",r"\1")
  fields.index = hdr.str.replace("^# ([^:]+):.*$",r"\1")
  return "\n".join(list(hdr.loc[hdr.index >= i].str.replace("^# ","")))
