In [2]:
import sys
import os
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from tqdm import trange,tqdm
import argparse
import xlrd
from datetime import datetime,timedelta
import dateparser
import re

In [3]:
pd.set_option('display.max_columns',None)

In [4]:
def getloclist(wd,end,filter_out):
    loc_list = []
    EIRA_found = False
    for root, dirs, files in os.walk(wd):
        for file in files:
            if file.endswith(end) and not file.endswith(filter_out):
                loc = os.path.join(root, file)
                loc_list.append(loc) #get bim file location
#     if EIRA_found == True:""
#         print("EIRA detected!")
#     else:
#         print("Warning! No EIRA bim detected! Use first scanned cohort as ref!")
    return loc_list

In [5]:
def openfile(file,n=0,sep=','):
    if file.endswith((".csv",".CSV")):
        clinical = pd.read_csv(file,sep=sep,skiprows=n)
    elif file.endswith((".xlsx",".xls")):
        clinical = pd.read_excel(file,skiprows=n)
    elif file.endswith(".dta"):
        clinical = pd.read_stata(file)
    else:
#         raise ValueError("no clinical file detected!")
        clinical = pd.DataFrame()
    return clinical
def search(columns,patterns=["sjc","crp","sdai","cdai","mtx","Methotrexate"]):
    list_found = []
    for i in trange(len(columns)):
        for j in patterns:
            if j.lower() in columns[i].lower():
                print("Found pattern",j ,"in column num",i,columns[i])
                list_found.append(columns[i])
    return list_found
def search_folder(loc):
    list_found = []
    for root, dirs, files in os.walk(loc):
        for file in files:
            path = os.path.join(root, file)
            opened = openfile(path)
            print("openning file ",file)
            list_found.append(search(opened.columns))
    return list_found

In [6]:
def todatetime(a):
    b = dateparser.parse(a)
#     b = datetime.strptime(b,"%d-%b-%y")
    return b

In [7]:
def countRemission(fam):
    count_case = len(fam[fam[5]==2])
    count_control = len(fam[fam[5]==1])
    count_miss = len(fam[fam[5]==-9])+len(fam[fam[5]==0])
    plt.bar(["case",'control','missing'],[count_case,count_control,count_miss])
    return count_case,count_control,count_miss

In [8]:
# The primary outcome measure to model response trajectories was the disease activity score based on the 2-component DAS28, computed as 
# sqrt (SJC) + (0.6*ln[CRP+1]).
def TwocompDAS(sjc,crp):
    DAS = np.sqrt(sjc)+(0.6*np.log(crp+1))
    return DAS

In [9]:
def cDAI_S(cdai):
# sDAI <=3.3 case, >3.3 control
# cDAI <=2.8 case, >2.8 control
# ('1' = control, '2' = case)
    if cdai == -9:
        state = 0
    elif cdai <= 2.8:
        state = 2
    elif cdai > 2.8:
        state = 1
    return state

In [10]:
def sDAI_S(cdai):
# sDAI <=3.3 case, >3.3 control
# cDAI <=2.8 case, >2.8 control
# ('1' = control, '2' = case)
    if cdai == -9:
        state = 0
    elif cdai > 3.3:
        state = 1
    elif cdai <= 3.3:
        state = 2
    return state

## RAMS


In [16]:
RAMS_fam = pd.read_csv('./Pipelinerun_withPC/RAMS/mergedChr/RAMS_merged.fam',sep='\s',header=None)
RAMS_fam

  return func(*args, **kwargs)


Unnamed: 0,0,1,2,3,4,5
0,RAMS_1_RAMS_1,RAMS_1_RAMS_1,0,0,0,1
1,RAMS_10_RAMS_10,RAMS_10_RAMS_10,0,0,0,1
2,RAMS_100_RAMS_100,RAMS_100_RAMS_100,0,0,0,1
3,RAMS_102_RAMS_102,RAMS_102_RAMS_102,0,0,0,1
4,RAMS_103_RAMS_103,RAMS_103_RAMS_103,0,0,0,1
...,...,...,...,...,...,...
240,RAMS_89_RAMS_89,RAMS_89_RAMS_89,0,0,0,1
241,RAMS_91_RAMS_91,RAMS_91_RAMS_91,0,0,0,1
242,RAMS_93_RAMS_93,RAMS_93_RAMS_93,0,0,0,2
243,RAMS_95_RAMS_95,RAMS_95_RAMS_95,0,0,0,1


In [17]:
RAMS_pheno = openfile("/exports/reum/knevel_lab/RAMS/clinical/pheno.csv")
RAMS_pheno

Unnamed: 0,fid_anon,iid_anon,fupno,start_dose_mtx,steroids,vaspat,tjc28_value,sjc28_value,DAS28_CRP,sex,age_baseline,disease_duration_at_baseline_mths,logCRP,smoke_baseline
0,RAMS_1,RAMS_1,6 Mo,,No,78.0,27.0,16.0,7.087547,,,,2.793616,
1,RAMS_1,RAMS_1,Baseline,15.0,No,77.0,24.0,11.0,6.549305,F,56.92845,17.311480,2.331172,current
2,RAMS_3,RAMS_3,Baseline,15.0,No,50.0,5.0,7.0,4.952939,M,43.01267,14.032790,3.610918,current
3,RAMS_3,RAMS_3,3 Mo,,,30.0,3.0,2.0,3.695989,,,,2.639057,
4,RAMS_3,RAMS_3,6 Mo,,No,90.0,0.0,0.0,3.378795,,,,3.218876,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
912,RAMS_526,RAMS_526,Baseline,7.5,Yes,26.0,2.0,0.0,3.047825,F,48.36700,4.524590,2.588516,never
913,RAMS_527,RAMS_527,3 Mo,,,24.0,5.0,0.0,3.193232,,,,1.791759,
914,RAMS_527,RAMS_527,Baseline,10.0,No,50.0,16.0,10.0,5.430471,M,77.39542,7.606557,1.791759,never
915,RAMS_527,RAMS_527,12 Mo,,No,28.0,0.0,0.0,1.997033,,,,1.791759,


In [18]:
RAMS_pheno['CRP']=RAMS_pheno['logCRP'].map(np.exp)

In [20]:
RAMS_pheno['2COMPDAS']=TwocompDAS(RAMS_pheno['sjc28_value'],RAMS_pheno['CRP'])

In [23]:
RAMS_pheno['id'] = RAMS_pheno['fid_anon']+"_"+RAMS_pheno['iid_anon']

In [24]:
RAMS_pheno

Unnamed: 0,fid_anon,iid_anon,fupno,start_dose_mtx,steroids,vaspat,tjc28_value,sjc28_value,DAS28_CRP,sex,age_baseline,disease_duration_at_baseline_mths,logCRP,smoke_baseline,CRP,2COMPDAS,id
0,RAMS_1,RAMS_1,6 Mo,,No,78.0,27.0,16.0,7.087547,,,,2.793616,,16.339999,5.711810,RAMS_1_RAMS_1
1,RAMS_1,RAMS_1,Baseline,15.0,No,77.0,24.0,11.0,6.549305,F,56.92845,17.311480,2.331172,current,10.289994,4.770975,RAMS_1_RAMS_1
2,RAMS_3,RAMS_3,Baseline,15.0,No,50.0,5.0,7.0,4.952939,M,43.01267,14.032790,3.610918,current,37.000003,4.828303,RAMS_3_RAMS_3
3,RAMS_3,RAMS_3,3 Mo,,,30.0,3.0,2.0,3.695989,,,,2.639057,,13.999995,3.039043,RAMS_3_RAMS_3
4,RAMS_3,RAMS_3,6 Mo,,No,90.0,0.0,0.0,3.378795,,,,3.218876,,25.000004,1.954858,RAMS_3_RAMS_3
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
912,RAMS_526,RAMS_526,Baseline,7.5,Yes,26.0,2.0,0.0,3.047825,F,48.36700,4.524590,2.588516,never,13.310005,1.596575,RAMS_526_RAMS_526
913,RAMS_527,RAMS_527,3 Mo,,,24.0,5.0,0.0,3.193232,,,,1.791759,,5.999997,1.167546,RAMS_527_RAMS_527
914,RAMS_527,RAMS_527,Baseline,10.0,No,50.0,16.0,10.0,5.430471,M,77.39542,7.606557,1.791759,never,5.999997,4.329824,RAMS_527_RAMS_527
915,RAMS_527,RAMS_527,12 Mo,,No,28.0,0.0,0.0,1.997033,,,,1.791759,,5.999997,1.167546,RAMS_527_RAMS_527


In [27]:
merge_RAMS = pd.merge(RAMS_fam,RAMS_pheno[RAMS_pheno['fupno']=='6 Mo'],how='inner',left_on=0,right_on='id')
merge_RAMS

Unnamed: 0,0,1,2,3,4,5,fid_anon,iid_anon,fupno,start_dose_mtx,steroids,vaspat,tjc28_value,sjc28_value,DAS28_CRP,sex,age_baseline,disease_duration_at_baseline_mths,logCRP,smoke_baseline,CRP,2COMPDAS,id
0,RAMS_1_RAMS_1,RAMS_1_RAMS_1,0,0,0,1,RAMS_1,RAMS_1,6 Mo,,No,78.0,27.0,16.0,7.087547,,,,2.793616,,16.339999,5.711810,RAMS_1_RAMS_1
1,RAMS_10_RAMS_10,RAMS_10_RAMS_10,0,0,0,1,RAMS_10,RAMS_10,6 Mo,,No,100.0,21.0,13.0,6.731171,,,,2.209373,,9.110003,4.993666,RAMS_10_RAMS_10
2,RAMS_100_RAMS_100,RAMS_100_RAMS_100,0,0,0,1,RAMS_100,RAMS_100,6 Mo,,,60.0,4.0,4.0,4.164221,,,,1.900614,,6.690001,3.223953,RAMS_100_RAMS_100
3,RAMS_102_RAMS_102,RAMS_102_RAMS_102,0,0,0,1,RAMS_102,RAMS_102,6 Mo,,No,50.0,4.0,2.0,3.571480,,,,1.098612,,2.999999,2.245990,RAMS_102_RAMS_102
4,RAMS_103_RAMS_103,RAMS_103_RAMS_103,0,0,0,1,RAMS_103,RAMS_103,6 Mo,,No,75.0,0.0,1.0,2.639480,,,,0.970779,,2.640000,1.775190,RAMS_103_RAMS_103
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
240,RAMS_89_RAMS_89,RAMS_89_RAMS_89,0,0,0,1,RAMS_89,RAMS_89,6 Mo,,Yes,37.0,2.0,0.0,3.135811,,,,2.405142,,11.080004,1.494931,RAMS_89_RAMS_89
241,RAMS_91_RAMS_91,RAMS_91_RAMS_91,0,0,0,1,RAMS_91,RAMS_91,6 Mo,,Yes,71.0,26.0,2.0,6.567739,,,,3.784190,,44.000016,3.698211,RAMS_91_RAMS_91
242,RAMS_93_RAMS_93,RAMS_93_RAMS_93,0,0,0,2,RAMS_93,RAMS_93,6 Mo,,No,4.0,0.0,0.0,1.284808,,,,0.746688,,2.110000,0.680774,RAMS_93_RAMS_93
243,RAMS_95_RAMS_95,RAMS_95_RAMS_95,0,0,0,1,RAMS_95,RAMS_95,6 Mo,,No,87.0,4.0,1.0,4.278013,,,,1.944481,,6.990003,2.246915,RAMS_95_RAMS_95


In [28]:
# 245 samples
merge_RAMS.loc[:,[0,1,2,3,4,'2COMPDAS']].to_csv("/exports/reum/CKe/Pipelinerun_withPC/TwoCompDAS/RAMS_merged_2cDAS.fam",sep='\t',index=False,header=False)

### Vienna

In [26]:
vienna_fam = pd.read_csv('./Pipelinerun_withPC/Vienna/mergedChr/vienna_merged.fam',sep='\s',header=None)
vienna_fam

  return func(*args, **kwargs)


Unnamed: 0,0,1,2,3,4,5
0,10_1130820744,10_1130820744,0,0,0,2
1,1012_1041715812,1012_1041715812,0,0,0,2
2,1014_1131619222,1014_1131619222,0,0,0,2
3,1015_1150204122,1015_1150204122,0,0,0,1
4,1017_1041664226,1017_1041664226,0,0,0,1
...,...,...,...,...,...,...
401,967_1153937793,967_1153937793,0,0,0,-9
402,988_1153942083,988_1153942083,0,0,0,1
403,989_1085427379,989_1085427379,0,0,0,2
404,990_1150146097,990_1150146097,0,0,0,2


In [27]:
Vienna = openfile("/exports/reum/knevel_lab/Vienna/clinical/Rachel_data_ready_to deliver.csv",sep=';')
Vienna

Unnamed: 0,desc,patient,followup,visit_nr,Eintrt_datum,sex,age,Beschwerdebeginn,Beschwerdedauer,Erstdiagnose,Krankenheitsdauer,Nikotin,Nikotin_text,Analgetika,Kortison,Kortison_merkmal,KortisonStoss,KortisonDosis,NSAIDs,CRP,ESR,PGA,EGA,PAIN,HAQ,SJC28,TJC28,TJC32,SJC32,RF,CCP,DAS_esr,DAS_ESR_S,DAS_crp,SDAI,SDAI_S,CDAI,CDAI_S,rf_pos,ccp_pos,DMARD_Start,MTX_DOSIS,Arava_DOSIS,Salazopyrin_DOSIS,trtment,tr_visit,tr_dur,tr_b,tr_e,trt_course,DMARD__cat,care_dur,RRECEPT_B,locality,PTPN_22,STAT_4,CTLA_4,TRAF1_C5,TNFAIP3,AFF3,IRF5,PADI4,hla1,hla2,shared_epitope,@___merge,filter__,discrib,SampleID_last,@_merge
0,clin,2,4/11/2007,1,4/11/2007,F,495,4/1/2007,0,4/11/2007,0,0,nein,False,1,ja,False,50,True,",3",16,36,34,41,",25",4,7,7,4,12,11,448643283976402,MDA,400468670419933,183,MDA,18,MDA,0,0,8/2/2007,20,,,Mtx,1,8,4/11/2007,12/6/2007,1,MTX,0,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,1,BOTH,1085421526,3
1,both,2,4/26/2007,2,4/11/2007,F,496,4/1/2007,",1",4/11/2007,0,0,nein,False,1,ja,False,5,True,",32",17,32,31,46,",625",4,9,10,4,12,14,467124934083935,MDA,416463042910416,1962,MDA,193,MDA,0,0,8/2/2007,20,,,Mtx,2,8,4/11/2007,12/6/2007,1,MTX,0,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1085421526,3
2,clin,2,8/2/2007,3,4/11/2007,F,498,4/1/2007,",3",4/11/2007,",3",0,nein,False,1,ja,False,5,True,",34",16,24,6,31,",5",0,3,3,0,,17,324676055780642,MDA,279932608697129,634,LDA,6,LDA,0,0,8/2/2007,15,,,Mtx,3,8,4/11/2007,12/6/2007,1,MTX,3,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1085421526,3
3,both,2,12/6/2007,4,4/11/2007,F,502,4/1/2007,",7",4/11/2007,",7",0,nein,False,1,ja,False,5,True,",42",22,31,3,33,",625",0,4,4,0,12,1,371772971735082,MDA,310751710521146,782,LDA,74,LDA,0,0,8/2/2007,,,,,1,9,12/6/2007,9/1/2008,2,,7,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1085421526,3
4,both,4,3/14/2007,1,3/14/2007,W,513,,,,,2,,False,1,ja,False,75,False,",68",54,74,8,72,",625",0,6,6,0,12,13,520000308855357,HDA,410719880008898,1488,MDA,142,MDA,0,0,3/14/2007,10,,,Mtx,1,351,3/14/2007,1/29/2010,1,MTX,0,1,W,GG,GG,AA,AG,GG,AT,CT,TT,DRB1*07:01:01:01,DRB1*12:01:01Â,0,3,1,BOTH,1031467068,3
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2208,clin,4239,5/21/2014,2,2/14/2014,W,454,2/1/2012,23,2/14/2014,",3",1,ja,False,1,ja,False,625,False,109,28,56,9,24,1375,1,1,2,1,77,,395654315712264,MDA,347555382404229,959,LDA,85,LDA,1,1,2/14/2014,25,,,Mtx,2,151,2/14/2014,5/13/2015,1,MTX,3,,,,,,,,,,,,,,1,0,BOTH,1095887411,3
2209,clin,4239,6/25/2014,3,2/14/2014,W,455,2/1/2012,24,2/14/2014,",4",1,ja,False,0,nein,False,,False,",53",19,0,0,0,0,0,0,0,0,38,,206110728541651,REM,16225978680231,",53",REM,0,REM,1,1,2/14/2014,25,,,Mtx,3,151,2/14/2014,5/13/2015,1,MTX,4,,,,,,,,,,,,,,1,0,BOTH,1095887411,3
2210,clin,4239,9/17/2014,4,2/14/2014,W,457,2/1/2012,26,2/14/2014,",6",1,ja,False,0,nein,False,,False,",67",21,34,0,36,",625",0,2,2,0,88,,339912530133533,MDA,29627989133184,607,LDA,54,LDA,1,1,2/14/2014,25,,,Mtx,4,151,2/14/2014,5/13/2015,1,MTX,7,,,,,,,,,,,,,,1,0,BOTH,1095887411,3
2211,clin,4239,1/14/2015,5,2/14/2014,W,461,2/1/2012,3,2/14/2014,",9",1,ja,False,0,nein,False,,False,",25",21,52,0,1,",125",0,0,0,0,,,28591657064064,LDA,213899466865833,545,LDA,52,LDA,1,1,2/14/2014,25,,,Mtx,5,151,2/14/2014,5/13/2015,1,MTX,11,,,,,,,,,,,,,,1,0,BOTH,1095887411,3


In [11]:
search(Vienna.columns)

100%|████████████████████████████████████████| 70/70 [00:00<00:00, 44552.55it/s]

Found pattern crp in column num 19 CRP
Found pattern sjc in column num 25 SJC28
Found pattern sjc in column num 28 SJC32
Found pattern crp in column num 33 DAS_crp
Found pattern sdai in column num 34 SDAI
Found pattern sdai in column num 35 SDAI_S
Found pattern cdai in column num 36 CDAI
Found pattern cdai in column num 37 CDAI_S
Found pattern mtx in column num 41 MTX_DOSIS





['CRP',
 'SJC28',
 'SJC32',
 'DAS_crp',
 'SDAI',
 'SDAI_S',
 'CDAI',
 'CDAI_S',
 'MTX_DOSIS']

In [28]:
Vienna['CRP'] = Vienna['CRP'].str.replace(',','.').replace(' ',0).astype(np.float)
Vienna['followup'] = Vienna['followup'].map(todatetime)
Vienna['Eintrt_datum'] = Vienna['Eintrt_datum'].map(todatetime)

Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations
  Vienna['CRP'] = Vienna['CRP'].str.replace(',','.').replace(' ',0).astype(np.float)
  date_obj = stz.localize(date_obj)


In [29]:
Vienna['SJC28'] = Vienna['SJC28'].str.replace(',','.').replace(' ',0).astype(np.float)

Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations
  Vienna['SJC28'] = Vienna['SJC28'].str.replace(',','.').replace(' ',0).astype(np.float)


In [30]:
Vienna

Unnamed: 0,desc,patient,followup,visit_nr,Eintrt_datum,sex,age,Beschwerdebeginn,Beschwerdedauer,Erstdiagnose,Krankenheitsdauer,Nikotin,Nikotin_text,Analgetika,Kortison,Kortison_merkmal,KortisonStoss,KortisonDosis,NSAIDs,CRP,ESR,PGA,EGA,PAIN,HAQ,SJC28,TJC28,TJC32,SJC32,RF,CCP,DAS_esr,DAS_ESR_S,DAS_crp,SDAI,SDAI_S,CDAI,CDAI_S,rf_pos,ccp_pos,DMARD_Start,MTX_DOSIS,Arava_DOSIS,Salazopyrin_DOSIS,trtment,tr_visit,tr_dur,tr_b,tr_e,trt_course,DMARD__cat,care_dur,RRECEPT_B,locality,PTPN_22,STAT_4,CTLA_4,TRAF1_C5,TNFAIP3,AFF3,IRF5,PADI4,hla1,hla2,shared_epitope,@___merge,filter__,discrib,SampleID_last,@_merge
0,clin,2,2007-04-11,1,2007-04-11,F,495,4/1/2007,0,4/11/2007,0,0,nein,False,1,ja,False,50,True,0.30,16,36,34,41,",25",4.0,7,7,4,12,11,448643283976402,MDA,400468670419933,183,MDA,18,MDA,0,0,8/2/2007,20,,,Mtx,1,8,4/11/2007,12/6/2007,1,MTX,0,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,1,BOTH,1085421526,3
1,both,2,2007-04-26,2,2007-04-11,F,496,4/1/2007,",1",4/11/2007,0,0,nein,False,1,ja,False,5,True,0.32,17,32,31,46,",625",4.0,9,10,4,12,14,467124934083935,MDA,416463042910416,1962,MDA,193,MDA,0,0,8/2/2007,20,,,Mtx,2,8,4/11/2007,12/6/2007,1,MTX,0,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1085421526,3
2,clin,2,2007-08-02,3,2007-04-11,F,498,4/1/2007,",3",4/11/2007,",3",0,nein,False,1,ja,False,5,True,0.34,16,24,6,31,",5",0.0,3,3,0,,17,324676055780642,MDA,279932608697129,634,LDA,6,LDA,0,0,8/2/2007,15,,,Mtx,3,8,4/11/2007,12/6/2007,1,MTX,3,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1085421526,3
3,both,2,2007-12-06,4,2007-04-11,F,502,4/1/2007,",7",4/11/2007,",7",0,nein,False,1,ja,False,5,True,0.42,22,31,3,33,",625",0.0,4,4,0,12,1,371772971735082,MDA,310751710521146,782,LDA,74,LDA,0,0,8/2/2007,,,,,1,9,12/6/2007,9/1/2008,2,,7,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1085421526,3
4,both,4,2007-03-14,1,2007-03-14,W,513,,,,,2,,False,1,ja,False,75,False,0.68,54,74,8,72,",625",0.0,6,6,0,12,13,520000308855357,HDA,410719880008898,1488,MDA,142,MDA,0,0,3/14/2007,10,,,Mtx,1,351,3/14/2007,1/29/2010,1,MTX,0,1,W,GG,GG,AA,AG,GG,AT,CT,TT,DRB1*07:01:01:01,DRB1*12:01:01Â,0,3,1,BOTH,1031467068,3
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2208,clin,4239,2014-05-21,2,2014-02-14,W,454,2/1/2012,23,2/14/2014,",3",1,ja,False,1,ja,False,625,False,1.09,28,56,9,24,1375,1.0,1,2,1,77,,395654315712264,MDA,347555382404229,959,LDA,85,LDA,1,1,2/14/2014,25,,,Mtx,2,151,2/14/2014,5/13/2015,1,MTX,3,,,,,,,,,,,,,,1,0,BOTH,1095887411,3
2209,clin,4239,2014-06-25,3,2014-02-14,W,455,2/1/2012,24,2/14/2014,",4",1,ja,False,0,nein,False,,False,0.53,19,0,0,0,0,0.0,0,0,0,38,,206110728541651,REM,16225978680231,",53",REM,0,REM,1,1,2/14/2014,25,,,Mtx,3,151,2/14/2014,5/13/2015,1,MTX,4,,,,,,,,,,,,,,1,0,BOTH,1095887411,3
2210,clin,4239,2014-09-17,4,2014-02-14,W,457,2/1/2012,26,2/14/2014,",6",1,ja,False,0,nein,False,,False,0.67,21,34,0,36,",625",0.0,2,2,0,88,,339912530133533,MDA,29627989133184,607,LDA,54,LDA,1,1,2/14/2014,25,,,Mtx,4,151,2/14/2014,5/13/2015,1,MTX,7,,,,,,,,,,,,,,1,0,BOTH,1095887411,3
2211,clin,4239,2015-01-14,5,2014-02-14,W,461,2/1/2012,3,2/14/2014,",9",1,ja,False,0,nein,False,,False,0.25,21,52,0,1,",125",0.0,0,0,0,,,28591657064064,LDA,213899466865833,545,LDA,52,LDA,1,1,2/14/2014,25,,,Mtx,5,151,2/14/2014,5/13/2015,1,MTX,11,,,,,,,,,,,,,,1,0,BOTH,1095887411,3


In [31]:
Vienna['2COMPDAS']=TwocompDAS(Vienna['SJC28'],Vienna['CRP'])

In [32]:
Vienna_select = Vienna[(Vienna['followup']-Vienna['Eintrt_datum']<=timedelta(180))]
Vienna_select

Unnamed: 0,desc,patient,followup,visit_nr,Eintrt_datum,sex,age,Beschwerdebeginn,Beschwerdedauer,Erstdiagnose,Krankenheitsdauer,Nikotin,Nikotin_text,Analgetika,Kortison,Kortison_merkmal,KortisonStoss,KortisonDosis,NSAIDs,CRP,ESR,PGA,EGA,PAIN,HAQ,SJC28,TJC28,TJC32,SJC32,RF,CCP,DAS_esr,DAS_ESR_S,DAS_crp,SDAI,SDAI_S,CDAI,CDAI_S,rf_pos,ccp_pos,DMARD_Start,MTX_DOSIS,Arava_DOSIS,Salazopyrin_DOSIS,trtment,tr_visit,tr_dur,tr_b,tr_e,trt_course,DMARD__cat,care_dur,RRECEPT_B,locality,PTPN_22,STAT_4,CTLA_4,TRAF1_C5,TNFAIP3,AFF3,IRF5,PADI4,hla1,hla2,shared_epitope,@___merge,filter__,discrib,SampleID_last,@_merge,2COMPDAS
0,clin,2,2007-04-11,1,2007-04-11,F,495,4/1/2007,0,4/11/2007,0,0,nein,False,1,ja,False,50,True,0.30,16,36,34,41,",25",4.0,7,7,4,12,11,448643283976402,MDA,400468670419933,183,MDA,18,MDA,0,0,8/2/2007,20,,,Mtx,1,8,4/11/2007,12/6/2007,1,MTX,0,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,1,BOTH,1085421526,3,2.157419
1,both,2,2007-04-26,2,2007-04-11,F,496,4/1/2007,",1",4/11/2007,0,0,nein,False,1,ja,False,5,True,0.32,17,32,31,46,",625",4.0,9,10,4,12,14,467124934083935,MDA,416463042910416,1962,MDA,193,MDA,0,0,8/2/2007,20,,,Mtx,2,8,4/11/2007,12/6/2007,1,MTX,0,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1085421526,3,2.166579
2,clin,2,2007-08-02,3,2007-04-11,F,498,4/1/2007,",3",4/11/2007,",3",0,nein,False,1,ja,False,5,True,0.34,16,24,6,31,",5",0.0,3,3,0,,17,324676055780642,MDA,279932608697129,634,LDA,6,LDA,0,0,8/2/2007,15,,,Mtx,3,8,4/11/2007,12/6/2007,1,MTX,3,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1085421526,3,0.175602
4,both,4,2007-03-14,1,2007-03-14,W,513,,,,,2,,False,1,ja,False,75,False,0.68,54,74,8,72,",625",0.0,6,6,0,12,13,520000308855357,HDA,410719880008898,1488,MDA,142,MDA,0,0,3/14/2007,10,,,Mtx,1,351,3/14/2007,1/29/2010,1,MTX,0,1,W,GG,GG,AA,AG,GG,AT,CT,TT,DRB1*07:01:01:01,DRB1*12:01:01Â,0,3,1,BOTH,1031467068,3,0.311276
5,both,4,2007-07-18,2,2007-03-14,W,516,,,,,2,,False,0,nein,False,,False,0.28,27,87,1,55,125,0.0,0,0,0,12,1,352508580620303,MDA,265860038402364,908,LDA,88,LDA,0,0,3/14/2007,20,,,Mtx,2,351,3/14/2007,1/29/2010,1,MTX,4,1,W,GG,GG,AA,AG,GG,AT,CT,TT,DRB1*07:01:01:01,DRB1*12:01:01Â,0,3,0,BOTH,1031467068,3,0.148116
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2203,clin,4236,2005-05-19,2,2005-03-17,F,678,3/1/2003,22,3/17/2005,",2",0,nein,False,1,ja,False,5,True,1.21,49,0,0,0,0,0.0,0,0,0,,,272427420867744,LDA,188614040287456,121,REM,0,REM,0,0,3/17/2005,,,,Resochin,2,46,3/17/2005,8/2/2005,1,csDMARD,2,,W,GG,GG,,AA,GG,TT,TT,CT,DRB1*04:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1031466324,3,0.475796
2204,clin,4236,2005-08-02,3,2005-03-17,F,68,3/1/2003,24,3/17/2005,",4",0,nein,True,1,ja,False,5,True,1.38,18,0,0,28,0,0.0,0,0,0,12,,202326023052732,REM,193006578507722,138,REM,0,REM,0,0,3/17/2005,10,,,Mtx,1,698,8/2/2005,4/26/2011,2,MTX,4,,W,GG,GG,,AA,GG,TT,TT,CT,DRB1*04:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1031466324,3,0.520260
2207,both,4239,2014-02-14,1,2014-02-14,W,452,2/1/2012,2,2/14/2014,0,1,ja,False,2,,False,,False,0.33,24,17,9,5,",5",2.0,1,1,2,123,,341861747870803,MDA,267908120563629,593,LDA,56,LDA,1,1,2/14/2014,20,,,Mtx,1,151,2/14/2014,5/13/2015,1,MTX,0,,,,,,,,,,,,,,1,1,BOTH,1095887411,3,1.585321
2208,clin,4239,2014-05-21,2,2014-02-14,W,454,2/1/2012,23,2/14/2014,",3",1,ja,False,1,ja,False,625,False,1.09,28,56,9,24,1375,1.0,1,2,1,77,,395654315712264,MDA,347555382404229,959,LDA,85,LDA,1,1,2/14/2014,25,,,Mtx,2,151,2/14/2014,5/13/2015,1,MTX,3,,,,,,,,,,,,,,1,0,BOTH,1095887411,3,1.442298


In [33]:
Vienna_select['CDAI_S'] = Vienna_select['CDAI_S'].map({"MDA":1,"LDA":1,"HDA":1,"REM":2," ":0})
Vienna_select['SDAI_S'] = Vienna_select['SDAI_S'].map({"MDA":1,"LDA":1,"HDA":1,"REM":2," ":0})

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  Vienna_select['CDAI_S'] = Vienna_select['CDAI_S'].map({"MDA":1,"LDA":1,"HDA":1,"REM":2," ":0})
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  Vienna_select['SDAI_S'] = Vienna_select['SDAI_S'].map({"MDA":1,"LDA":1,"HDA":1,"REM":2," ":0})


In [34]:
Vienna_select

Unnamed: 0,desc,patient,followup,visit_nr,Eintrt_datum,sex,age,Beschwerdebeginn,Beschwerdedauer,Erstdiagnose,Krankenheitsdauer,Nikotin,Nikotin_text,Analgetika,Kortison,Kortison_merkmal,KortisonStoss,KortisonDosis,NSAIDs,CRP,ESR,PGA,EGA,PAIN,HAQ,SJC28,TJC28,TJC32,SJC32,RF,CCP,DAS_esr,DAS_ESR_S,DAS_crp,SDAI,SDAI_S,CDAI,CDAI_S,rf_pos,ccp_pos,DMARD_Start,MTX_DOSIS,Arava_DOSIS,Salazopyrin_DOSIS,trtment,tr_visit,tr_dur,tr_b,tr_e,trt_course,DMARD__cat,care_dur,RRECEPT_B,locality,PTPN_22,STAT_4,CTLA_4,TRAF1_C5,TNFAIP3,AFF3,IRF5,PADI4,hla1,hla2,shared_epitope,@___merge,filter__,discrib,SampleID_last,@_merge,2COMPDAS
0,clin,2,2007-04-11,1,2007-04-11,F,495,4/1/2007,0,4/11/2007,0,0,nein,False,1,ja,False,50,True,0.30,16,36,34,41,",25",4.0,7,7,4,12,11,448643283976402,MDA,400468670419933,183,1,18,1,0,0,8/2/2007,20,,,Mtx,1,8,4/11/2007,12/6/2007,1,MTX,0,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,1,BOTH,1085421526,3,2.157419
1,both,2,2007-04-26,2,2007-04-11,F,496,4/1/2007,",1",4/11/2007,0,0,nein,False,1,ja,False,5,True,0.32,17,32,31,46,",625",4.0,9,10,4,12,14,467124934083935,MDA,416463042910416,1962,1,193,1,0,0,8/2/2007,20,,,Mtx,2,8,4/11/2007,12/6/2007,1,MTX,0,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1085421526,3,2.166579
2,clin,2,2007-08-02,3,2007-04-11,F,498,4/1/2007,",3",4/11/2007,",3",0,nein,False,1,ja,False,5,True,0.34,16,24,6,31,",5",0.0,3,3,0,,17,324676055780642,MDA,279932608697129,634,1,6,1,0,0,8/2/2007,15,,,Mtx,3,8,4/11/2007,12/6/2007,1,MTX,3,,W,GG,GG,AG,AA,GG,TT,TT,CT,DRB1*01:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1085421526,3,0.175602
4,both,4,2007-03-14,1,2007-03-14,W,513,,,,,2,,False,1,ja,False,75,False,0.68,54,74,8,72,",625",0.0,6,6,0,12,13,520000308855357,HDA,410719880008898,1488,1,142,1,0,0,3/14/2007,10,,,Mtx,1,351,3/14/2007,1/29/2010,1,MTX,0,1,W,GG,GG,AA,AG,GG,AT,CT,TT,DRB1*07:01:01:01,DRB1*12:01:01Â,0,3,1,BOTH,1031467068,3,0.311276
5,both,4,2007-07-18,2,2007-03-14,W,516,,,,,2,,False,0,nein,False,,False,0.28,27,87,1,55,125,0.0,0,0,0,12,1,352508580620303,MDA,265860038402364,908,1,88,1,0,0,3/14/2007,20,,,Mtx,2,351,3/14/2007,1/29/2010,1,MTX,4,1,W,GG,GG,AA,AG,GG,AT,CT,TT,DRB1*07:01:01:01,DRB1*12:01:01Â,0,3,0,BOTH,1031467068,3,0.148116
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2203,clin,4236,2005-05-19,2,2005-03-17,F,678,3/1/2003,22,3/17/2005,",2",0,nein,False,1,ja,False,5,True,1.21,49,0,0,0,0,0.0,0,0,0,,,272427420867744,LDA,188614040287456,121,2,0,2,0,0,3/17/2005,,,,Resochin,2,46,3/17/2005,8/2/2005,1,csDMARD,2,,W,GG,GG,,AA,GG,TT,TT,CT,DRB1*04:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1031466324,3,0.475796
2204,clin,4236,2005-08-02,3,2005-03-17,F,68,3/1/2003,24,3/17/2005,",4",0,nein,True,1,ja,False,5,True,1.38,18,0,0,28,0,0.0,0,0,0,12,,202326023052732,REM,193006578507722,138,2,0,2,0,0,3/17/2005,10,,,Mtx,1,698,8/2/2005,4/26/2011,2,MTX,4,,W,GG,GG,,AA,GG,TT,TT,CT,DRB1*04:01:01,DRB1*15:01:01:01Â,1,3,0,BOTH,1031466324,3,0.520260
2207,both,4239,2014-02-14,1,2014-02-14,W,452,2/1/2012,2,2/14/2014,0,1,ja,False,2,,False,,False,0.33,24,17,9,5,",5",2.0,1,1,2,123,,341861747870803,MDA,267908120563629,593,1,56,1,1,1,2/14/2014,20,,,Mtx,1,151,2/14/2014,5/13/2015,1,MTX,0,,,,,,,,,,,,,,1,1,BOTH,1095887411,3,1.585321
2208,clin,4239,2014-05-21,2,2014-02-14,W,454,2/1/2012,23,2/14/2014,",3",1,ja,False,1,ja,False,625,False,1.09,28,56,9,24,1375,1.0,1,2,1,77,,395654315712264,MDA,347555382404229,959,1,85,1,1,1,2/14/2014,25,,,Mtx,2,151,2/14/2014,5/13/2015,1,MTX,3,,,,,,,,,,,,,,1,0,BOTH,1095887411,3,1.442298


In [35]:
vienna_fam['id'] = vienna_fam[0].str.split("_",expand=True)[1]
vienna_fam

Unnamed: 0,0,1,2,3,4,5,id
0,10_1130820744,10_1130820744,0,0,0,2,1130820744
1,1012_1041715812,1012_1041715812,0,0,0,2,1041715812
2,1014_1131619222,1014_1131619222,0,0,0,2,1131619222
3,1015_1150204122,1015_1150204122,0,0,0,1,1150204122
4,1017_1041664226,1017_1041664226,0,0,0,1,1041664226
...,...,...,...,...,...,...,...
401,967_1153937793,967_1153937793,0,0,0,-9,1153937793
402,988_1153942083,988_1153942083,0,0,0,1,1153942083
403,989_1085427379,989_1085427379,0,0,0,2,1085427379
404,990_1150146097,990_1150146097,0,0,0,2,1150146097


In [36]:
vienna_merge = pd.merge(vienna_fam, Vienna_select, left_on="id",right_on="SampleID_last",how='left')
vienna_merge

Unnamed: 0,0,1,2,3,4,5,id,desc,patient,followup,visit_nr,Eintrt_datum,sex,age,Beschwerdebeginn,Beschwerdedauer,Erstdiagnose,Krankenheitsdauer,Nikotin,Nikotin_text,Analgetika,Kortison,Kortison_merkmal,KortisonStoss,KortisonDosis,NSAIDs,CRP,ESR,PGA,EGA,PAIN,HAQ,SJC28,TJC28,TJC32,SJC32,RF,CCP,DAS_esr,DAS_ESR_S,DAS_crp,SDAI,SDAI_S,CDAI,CDAI_S,rf_pos,ccp_pos,DMARD_Start,MTX_DOSIS,Arava_DOSIS,Salazopyrin_DOSIS,trtment,tr_visit,tr_dur,tr_b,tr_e,trt_course,DMARD__cat,care_dur,RRECEPT_B,locality,PTPN_22,STAT_4,CTLA_4,TRAF1_C5,TNFAIP3,AFF3,IRF5,PADI4,hla1,hla2,shared_epitope,@___merge,filter__,discrib,SampleID_last,@_merge,2COMPDAS
0,10_1130820744,10_1130820744,0,0,0,2,1130820744,both,3147.0,2011-09-27,1.0,2011-09-27,W,416,5/1/2011,",4",12/15/2011,"-,2",0.0,nein,False,2,,False,,True,1.60,24,17,14,6,,3.0,3,3,4,59,157,391756035960142,MDA,367287948221809,107,1.0,91,1.0,1.0,1,12/15/2011,,,,,,26,9/27/2011,12/15/2011,,,0.0,1,W,GG,GG,GG,AA,GG,AA,TT,CT,DRB1*01:01:01,DRB1*13:02:01Â,1,3.0,1.0,BOTH,1130820744,3.0,2.305358
1,10_1130820744,10_1130820744,0,0,0,2,1130820744,clin,3147.0,2011-12-15,2.0,2011-09-27,W,419,5/1/2011,",6",12/15/2011,0,0.0,nein,False,1,ja,True,625,True,0.63,20,37,8,29,,2.0,5,6,4,128,163,426319045635214,MDA,384181263019991,1213,1.0,115,1.0,1.0,1,12/15/2011,10,,,Mtx,1,86,12/15/2011,8/28/2012,1,MTX,2.0,1,W,GG,GG,GG,AA,GG,AA,TT,CT,DRB1*01:01:01,DRB1*13:02:01Â,1,3.0,0.0,BOTH,1130820744,3.0,1.707362
2,10_1130820744,10_1130820744,0,0,0,2,1130820744,both,3147.0,2012-03-20,3.0,2011-09-27,W,421,5/1/2011,",9",12/15/2011,",3",0.0,nein,False,0,nein,False,,True,0.48,21,0,0,0,0,0.0,0,0,0,38,78,21311657064064,REM,159282885031885,",48",2.0,0,2.0,1.0,1,12/15/2011,20,,,Mtx,2,86,12/15/2011,8/28/2012,1,MTX,5.0,1,W,GG,GG,GG,AA,GG,AA,TT,CT,DRB1*01:01:01,DRB1*13:02:01Â,1,3.0,0.0,BOTH,1130820744,3.0,0.235225
3,1012_1041715812,1012_1041715812,0,0,0,2,1041715812,clin,1614.0,2002-08-22,1.0,2002-08-22,F,563,10/1/2001,",9",6/1/2002,",2",1.0,ja,False,0,nein,False,,True,0.50,8,45,37,45,1875,5.0,5,5,5,883,,396390618027571,MDA,411333051002192,187,1.0,182,1.0,1.0,1,8/22/2002,,,2000,Salazopyrin,1,17,8/22/2002,1/13/2004,1,csDMARD,0.0,,,,,,,,,,,,,,1.0,1.0,BOTH,1041715812,3.0,2.479347
4,1012_1041715812,1012_1041715812,0,0,0,2,1041715812,clin,1614.0,2003-02-07,2.0,2002-08-22,F,568,10/1/2001,14,6/1/2002,",7",1.0,ja,False,0,nein,False,,False,0.50,7,33,23,35,",25",2.0,3,3,2,291,,319006535404176,LDA,343296165862514,111,1.0,106,1.0,1.0,1,8/22/2002,,,3000,Salazopyrin,2,17,8/22/2002,1/13/2004,1,csDMARD,5.0,,,,,,,,,,,,,,1.0,0.0,BOTH,1041715812,3.0,1.657493
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1021,990_1150146097,990_1150146097,0,0,0,2,1150146097,clin,3357.0,1998-01-21,1.0,1998-01-21,F,252,4/30/1997,",7",9/1/1997,",4",2.0,,False,1,ja,False,5,True,0.50,13,12,9,3,0,0.0,1,1,0,12,,252346455022308,REM,23330334089221,36,1.0,31,1.0,0.0,0,3/1/1997,,,3000,Salazopyrin,1,285,1/21/1998,5/26/2000,1,csDMARD,0.0,,W,AG,GG,GG,GG,GG,AT,CT,CT,DRB1*04:04:01,DRB1*08:01:01Â,1,3.0,1.0,BOTH,1150146097,3.0,0.243279
1022,990_1150146097,990_1150146097,0,0,0,2,1150146097,clin,3357.0,1998-03-13,2.0,1998-01-21,F,254,4/30/1997,",9",9/1/1997,",5",2.0,,False,1,ja,False,25,False,0.50,6,10,4,0,",375",0.0,0,0,0,,,139423162845964,REM,17450334089221,19,2.0,14,2.0,0.0,0,3/1/1997,,,2500,Salazopyrin,2,285,1/21/1998,5/26/2000,1,csDMARD,1.0,,W,AG,GG,GG,GG,GG,AT,CT,CT,DRB1*04:04:01,DRB1*08:01:01Â,1,3.0,0.0,BOTH,1150146097,3.0,0.243279
1023,991_1131615031,991_1131615031,0,0,0,1,1131615031,both,2100.0,2012-07-24,1.0,2012-07-24,W,422,5/24/2012,",2",8/20/2012,"-,1",1.0,ja,False,1,ja,True,625,False,1.05,21,58,45,56,",25",4.0,5,5,4,12,23,475536377380628,MDA,44634430001328,2035,1.0,193,1.0,0.0,0,10/9/2012,,,,,,26,7/24/2012,10/9/2012,,,0.0,,,,,,,,,,,,,,1.0,1.0,BOTH,1131615031,3.0,2.430704
1024,991_1131615031,991_1131615031,0,0,0,1,1131615031,both,2100.0,2012-08-20,2.0,2012-07-24,W,423,5/24/2012,",2",8/20/2012,0,1.0,ja,False,1,ja,False,5,False,0.62,20,44,19,50,,3.0,6,,,12,2,456970107356566,MDA,414335765144579,1592,1.0,153,1.0,0.0,0,10/9/2012,,,,,,26,7/24/2012,10/9/2012,,,0.0,,,,,,,,,,,,,,1.0,0.0,BOTH,1131615031,3.0,2.021506


In [37]:
vienna_merge = vienna_merge.drop_duplicates('id',keep='last')
vienna_merge

Unnamed: 0,0,1,2,3,4,5,id,desc,patient,followup,visit_nr,Eintrt_datum,sex,age,Beschwerdebeginn,Beschwerdedauer,Erstdiagnose,Krankenheitsdauer,Nikotin,Nikotin_text,Analgetika,Kortison,Kortison_merkmal,KortisonStoss,KortisonDosis,NSAIDs,CRP,ESR,PGA,EGA,PAIN,HAQ,SJC28,TJC28,TJC32,SJC32,RF,CCP,DAS_esr,DAS_ESR_S,DAS_crp,SDAI,SDAI_S,CDAI,CDAI_S,rf_pos,ccp_pos,DMARD_Start,MTX_DOSIS,Arava_DOSIS,Salazopyrin_DOSIS,trtment,tr_visit,tr_dur,tr_b,tr_e,trt_course,DMARD__cat,care_dur,RRECEPT_B,locality,PTPN_22,STAT_4,CTLA_4,TRAF1_C5,TNFAIP3,AFF3,IRF5,PADI4,hla1,hla2,shared_epitope,@___merge,filter__,discrib,SampleID_last,@_merge,2COMPDAS
2,10_1130820744,10_1130820744,0,0,0,2,1130820744,both,3147.0,2012-03-20,3.0,2011-09-27,W,421,5/1/2011,",9",12/15/2011,",3",0.0,nein,False,0,nein,False,,True,0.48,21,0,0,0,0,0.0,0,0,0,38,78,21311657064064,REM,159282885031885,",48",2.0,0,2.0,1.0,1,12/15/2011,20,,,Mtx,2,86,12/15/2011,8/28/2012,1,MTX,5.0,1,W,GG,GG,GG,AA,GG,AA,TT,CT,DRB1*01:01:01,DRB1*13:02:01Â,1,3.0,0.0,BOTH,1130820744,3.0,0.235225
4,1012_1041715812,1012_1041715812,0,0,0,2,1041715812,clin,1614.0,2003-02-07,2.0,2002-08-22,F,568,10/1/2001,14,6/1/2002,",7",1.0,ja,False,0,nein,False,,False,0.50,7,33,23,35,",25",2.0,3,3,2,291,,319006535404176,LDA,343296165862514,111,1.0,106,1.0,1.0,1,8/22/2002,,,3000,Salazopyrin,2,17,8/22/2002,1/13/2004,1,csDMARD,5.0,,,,,,,,,,,,,,1.0,0.0,BOTH,1041715812,3.0,1.657493
8,1014_1131619222,1014_1131619222,0,0,0,2,1131619222,both,326.0,2006-12-27,4.0,2006-08-23,W,614,7/15/2006,",5",7/1/2006,",5",0.0,nein,False,1,ja,False,9375,True,0.11,8,34,9,40,",125",0.0,1,1,0,12,13,249160907917588,REM,226309744410258,541,1.0,53,1.0,0.0,0,8/23/2006,20,,,Mtx,3,34,10/19/2006,8/4/2009,1,MTX,4.0,1,W,GG,GG,AG,GG,GG,TT,CT,CT,DRB1*04:04:01,DRB1*13:01:01Â,1,3.0,0.0,BOTH,1131619222,3.0,0.062616
11,1015_1150204122,1015_1150204122,0,0,0,1,1150204122,clin,2018.0,2005-08-19,3.0,2005-04-08,M,449,12/14/2004,",7",4/8/2005,",4",1.0,ja,False,1,ja,False,125,False,4.00,69,68,24,39,0,0.0,4,4,0,208,,503587455321808,MDA,436888594401355,172,1.0,132,1.0,1.0,0,4/8/2005,25,,,Mtx,3,10,4/8/2005,2/3/2006,1,MTX,4.0,,,,,,,,,,,,,,1.0,0.0,BOTH,1150204122,3.0,0.965663
15,1017_1041664226,1017_1041664226,0,0,0,1,1041664226,clin,2829.0,2008-07-16,4.0,2008-04-10,W,769,1/15/2007,15,5/1/2007,12,0.0,nein,False,1,ja,False,625,False,1.53,22,37,16,29,0,8.0,0,0,8,12,340,347368931227975,MDA,327477903374151,1483,1.0,133,1.0,1.0,1,4/10/2008,,20,,Arava,1,62,7/16/2008,1/19/2009,2,csDMARD,3.0,5,W,GG,GG,AG,GG,GG,AT,CT,TT,DRB1*01:01:01,DRB1*04:01:01Â,2,3.0,0.0,BOTH,1041664226,3.0,3.385359
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1015,967_1153937793,967_1153937793,0,0,0,-9,1153937793,,,NaT,,NaT,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1017,988_1153942083,988_1153942083,0,0,0,1,1153942083,clin,2763.0,2014-06-06,2.0,2014-01-08,F,505,6/1/2013,1,1/8/2014,",4",0.0,nein,False,0,nein,True,,False,0.94,,22,10,31,",625",2.0,4,4,2,12,",5",,,36270298876775,1014,1.0,92,1.0,0.0,0,6/6/2014,10,,,Mtx,1,136,6/6/2014,7/20/2015,1,MTX,4.0,,,,,,,,,,,,,,1.0,0.0,BOTH,1153942083,3.0,1.811826
1020,989_1085427379,989_1085427379,0,0,0,2,1085427379,clin,2894.0,2009-01-29,3.0,2008-09-25,W,42,12/1/2007,12,9/25/2008,",3",0.0,nein,False,1,ja,False,5,False,0.00,,7,14,9,",125",2.0,3,3,2,,,,,,,0.0,71,1.0,1.0,1,9/5/2008,25,,,Mtx,3,1257,9/25/2008,1/23/2019,1,MTX,4.0,2,W,GG,GT,AG,AA,GG,AA,CT,CC,DRB1*01:01:01,DRB1*16:01:01Â,1,3.0,0.0,BOTH,1085427379,3.0,1.414214
1022,990_1150146097,990_1150146097,0,0,0,2,1150146097,clin,3357.0,1998-03-13,2.0,1998-01-21,F,254,4/30/1997,",9",9/1/1997,",5",2.0,,False,1,ja,False,25,False,0.50,6,10,4,0,",375",0.0,0,0,0,,,139423162845964,REM,17450334089221,19,2.0,14,2.0,0.0,0,3/1/1997,,,2500,Salazopyrin,2,285,1/21/1998,5/26/2000,1,csDMARD,1.0,,W,AG,GG,GG,GG,GG,AT,CT,CT,DRB1*04:04:01,DRB1*08:01:01Â,1,3.0,0.0,BOTH,1150146097,3.0,0.243279


In [38]:
vienna_merge['2COMPDAS'] = vienna_merge['2COMPDAS'].fillna(-9)
vienna_merge['SDAI_S'] = vienna_merge['SDAI_S'].fillna(-9)
vienna_merge['CDAI_S'] = vienna_merge['CDAI_S'].fillna(-9)

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  vienna_merge['2COMPDAS'] = vienna_merge['2COMPDAS'].fillna(-9)
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  vienna_merge['SDAI_S'] = vienna_merge['SDAI_S'].fillna(-9)
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  vienna_merge['CDAI_S'] = vienna_merge['CDAI_S'].fillna(-9)


In [39]:
vienna_fam_2cDAS = vienna_merge.loc[:,[0,1,2,3,4,'2COMPDAS']]
vienna_fam_sDAI = vienna_merge.loc[:,[0,1,2,3,4,'SDAI_S']]
vienna_fam_cDAI = vienna_merge.loc[:,[0,1,2,3,4,'CDAI_S']]

In [47]:
vienna_fam_sDAI['SDAI_S'] = vienna_fam_sDAI['SDAI_S'].astype(int)
vienna_fam_cDAI['CDAI_S'] = vienna_fam_cDAI['CDAI_S'].astype(int)

In [48]:
#398 samples 
vienna_fam_2cDAS.to_csv("/exports/reum/CKe/Pipelinerun_withPC/TwoCompDAS/Vienna_merged_2cDAS.fam",sep='\t',index=False,header=False)
vienna_fam_sDAI.to_csv("/exports/reum/CKe/Pipelinerun_withPC/TwoCompDAS/Vienna_merged_sDAI.fam",sep='\t',index=False,header=False)
vienna_fam_cDAI.to_csv("/exports/reum/CKe/Pipelinerun_withPC/TwoCompDAS/Vienna_merged_cDAI.fam",sep='\t',index=False,header=False)

### Madrid

In [17]:
Madrid = openfile("/exports/reum/knevel_lab/Madrid/clinical/Clinical_data_GWAS_patients_HUP.dta")
Madrid_additional = openfile("/exports/reum/knevel_lab/Scripts_Samantha/GWAS_runscripts/GWAS_scripts/input_files_used/madrid/Additional clincal data pacients GWAS HUP.xls")

In [66]:
Madrid

Unnamed: 0,codigo2,tabaco,fr,fechaini,sexo,cort_v1,dosis_mtx_v1,dosis_leflu_v1,dosis_antipal_v1,dosis_szp_v1,dosis_oro_v1,dosis_csa_v1,a_tnf_v1,aba_v1,toci_v1,ritu_v1,cort_v2,dosis_mtx_v2,dosis_leflu_v2,dosis_antipal_v2,dosis_szp_v2,dosis_oro_v2,dosis_csa_v2,a_tnf_v2,aba_v2,toci_v2,ritu_v2,vgepac_v3,vgemed_v3,nad_v3,nat_v3,vsg_v3,pcr_v3,cort_v3,dosis_mtx_v3,dosis_leflu_v3,dosis_antipal_v3,dosis_szp_v3,dosis_oro_v3,dosis_csa_v3,a_tnf_v3,aba_v3,toci_v3,ritu_v3,das28_v3,das28pcr_v3,das28cat_v3,das28pcrcat_v3,sdai_v3,cdai_v3,cort_v4,edadinienf,tevol_v1,tevol_v3,ccpsn,hupi_v3,hupicat_v3,cortic_1yr
0,536,1.0,1,2012-08-15,Mujer,0.0,0.0,0,0,0,0,0,0,0,0,0,,,,,,,,,,,,12.0,14.0,0.0,0.0,29.0,0.30,0.0,17.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.525107,1.627066,Remision,Remision,2.900000,2.600000,0.0,65.180824,2.266667,14.400000,1.0,1.0,Remision,0.000
1,539,0.0,0,2012-08-20,Mujer,0.0,0.0,0,0,0,0,0,0,0,0,0,0.0,17.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,52.0,45.0,6.0,1.0,21.0,0.10,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.510880,3.589247,Act. moderada,Act. baja,16.799999,16.700001,0.0,48.515068,3.133333,15.866667,1.0,7.0,Act. moderada,100.000
2,541,2.0,1,2012-03-15,Mujer,0.0,0.0,0,0,0,0,0,0,0,0,0,2.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,16.0,25.0,0.0,3.0,13.0,0.60,0.0,20.0,8.7,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.504439,2.369502,Remision,Act. baja,7.700000,7.100000,0.0,60.082191,8.666667,22.366667,1.0,3.5,Act. leve,1528.125
3,542,1.0,0,2012-06-21,Mujer,0.0,0.0,0,0,0,0,0,0,0,0,0,5.0,15.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,0.0,0.0,13.0,0.10,2.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.879465,1.293533,Remision,Remision,0.700000,0.600000,0.0,62.964382,6.533333,19.500000,0.0,0.0,Remision,1642.500
4,545,0.0,1,2012-03-01,Mujer,0.0,0.0,0,0,0,0,0,0,0,0,0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,18.0,0.0,2.0,56.0,0.20,5.0,20.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.255726,1.793480,Act. moderada,Remision,4.300000,4.100000,0.0,69.490410,10.866667,23.733334,1.0,2.5,Act. leve,75.000
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
118,836,1.0,1,2019-05-15,Mujer,0.0,0.0,0,0,0,0,0,0,0,0,0,0.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,45.0,5.0,3.0,0.0,25.0,0.23,0.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.853162,2.989761,Act. moderada,Act. baja,8.230000,8.000000,,63.967125,0.400000,13.233334,1.0,5.0,Act. leve,0.000
119,839,2.0,1,2018-06-15,Hombre,0.0,0.0,0,0,0,0,0,0,0,0,0,2.5,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,60.0,75.0,12.0,7.0,79.0,1.26,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.590000,,Act. alta,,33.259998,,,62.526028,12.066667,,1.0,11.5,Act. alta,
120,842,1.0,1,2019-05-15,Mujer,0.0,0.0,0,0,0,0,0,0,0,0,0,0.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,2.0,0.06,0.0,0.0,0.0,0.0,1250.0,0.0,0.0,0.0,0.0,0.0,0.0,0.485203,1.129201,Remision,Remision,0.360000,0.300000,,31.545206,1.233333,13.233334,1.0,0.0,Remision,0.000
121,843,0.0,1,2019-05-15,Mujer,0.0,15.0,0,0,0,0,0,0,0,0,0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,38.980824,1.566667,,1.0,,,0.000


In [72]:
Madrid_additional

Unnamed: 0,codigo2,fechaini,vgepac_v1,vgemed_v1,nad_v1,nat_v1,vsg_v1,pcr_v1,das28_v1,das28pcr_v1,das28cat_v1,das28pcrcat_v1,sdai_v1,cdai_v1,vgepac_v2,vgemed_v2,nad_v2,nat_v2,vsg_v2,pcr_v2,das28_v2,das28pcr_v2,das28cat_v2,das28pcrcat_v2,sdai_v2,cdai_v2,vgepac_v3,vgemed_v3,nad_v3,nat_v3,vsg_v3,pcr_v3,das28_v3,das28pcr_v3,das28cat_v3,das28pcrcat_v3,sdai_v3,cdai_v3,peso,talla,bmi,edadinienf,tevol_v1,tevol_v2,tevol_v3,fecha1fme,hupi_v1,hupicat_v1,hupi_v2,hupicat_v2,hupi_v3,hupicat_v3,CDAI_S,SDAI_S
0,536,2012-08-15,47,25,1,2,46.0,0.60,4.294029,3.274508,Act. moderada,Act. baja,10.800000,10.200000,,,,,,,,,,,-9.00,-9.0,12.0,14.0,0.0,0.0,29.0,0.30,2.525107,1.627066,Remision,Remision,2.900000,2.600000,92.5,1.610,35.685352,65.180824,2.266667,,14.400000,2012-10-23,6.0,Act. moderada,,,1.0,Remision,2,2
1,539,2012-08-20,27,22,2,2,19.0,0.10,3.627047,2.775472,Act. moderada,Act. baja,9.000000,8.900000,81.0,54.0,9.0,4.0,15.0,0.10,5.269635,4.583533,Act. alta,Act. moderada,26.60,26.5,52.0,45.0,6.0,1.0,21.0,0.10,4.510880,3.589247,Act. moderada,Act. baja,16.799999,16.700001,60.0,1.720,20.281233,48.515068,3.133333,9.433333,15.866667,2012-11-24,3.5,Act. leve,8.0,Act. moderada,7.0,Act. moderada,1,1
2,541,2012-03-15,45,58,2,9,50.0,4.00,5.000376,4.558846,Act. moderada,Act. moderada,25.299999,21.299999,29.0,35.0,0.0,3.0,20.0,0.30,2.987987,2.350040,Act. baja,Act. baja,9.70,9.4,16.0,25.0,0.0,3.0,13.0,0.60,2.504439,2.369502,Remision,Act. baja,7.700000,7.100000,55.0,1.470,25.452358,60.082191,8.666667,13.900000,22.366667,2012-12-05,9.0,Act. moderada,3.5,Act. leve,3.5,Act. leve,1,1
3,542,2012-06-21,55,75,10,10,17.0,0.20,5.409563,4.781814,Act. alta,Act. moderada,33.200001,33.000000,12.0,14.0,0.0,1.0,14.0,0.00,2.295340,1.408000,Remision,Remision,3.60,3.6,6.0,0.0,0.0,0.0,13.0,0.10,1.879465,1.293533,Remision,Remision,0.700000,0.600000,57.0,1.640,21.192743,62.964382,6.533333,14.233334,19.500000,2013-01-08,9.5,Act. alta,1.0,Remision,0.0,Remision,1,1
4,545,2012-03-01,65,49,7,9,40.0,1.30,5.813837,5.141681,Act. alta,Act. alta,28.700001,27.400000,8.0,10.0,0.0,1.0,37.0,0.10,2.919642,1.601533,Act. baja,Remision,2.90,2.8,3.0,18.0,0.0,2.0,56.0,0.20,3.255726,1.793480,Act. moderada,Remision,4.300000,4.100000,55.5,1.480,25.337837,69.490410,10.866667,16.933332,23.733334,2013-01-22,11.5,Act. alta,2.5,Act. leve,2.5,Act. leve,2,2
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
118,836,2019-05-15,66,25,10,1,31.0,0.50,5.378666,4.579909,Act. alta,Act. moderada,20.600000,20.100000,44.0,13.0,4.0,0.0,46.0,0.27,4.416049,3.167000,Act. moderada,Act. baja,9.97,9.7,45.0,5.0,3.0,0.0,25.0,0.23,3.853162,2.989761,Act. moderada,Act. baja,8.230000,8.000000,63.0,1.510,27.630367,63.967125,0.400000,6.233333,13.233334,2019-05-28,8.5,Act. moderada,5.5,Act. moderada,5.0,Act. leve,1,1
119,839,2018-06-15,55,37,9,4,58.0,0.37,5.852310,4.527122,Act. alta,Act. moderada,22.570000,22.200001,,,,,,,,,,,-9.00,-9.0,,,,,,,,,,,,,66.0,1.665,23.807590,62.526028,12.066667,,,2019-06-14,9.5,Act. alta,,,,,2,2
120,842,2019-05-15,91,65,14,9,16.0,0.76,6.150140,5.943963,Act. alta,Act. alta,39.360001,38.599998,2.0,0.0,0.0,0.0,6.0,0.06,1.282232,1.157201,Remision,Remision,0.26,0.2,0.0,3.0,0.0,0.0,2.0,0.06,0.485203,1.129201,Remision,Remision,0.360000,0.300000,58.0,1.560,23.833004,31.545206,1.233333,6.700000,13.233334,2019-06-24,10.0,Act. alta,0.0,Remision,0.0,Remision,2,2
121,843,2019-05-15,90,65,0,10,35.0,0.71,4.634181,3.858509,Act. moderada,Act. moderada,26.209999,25.500000,10.0,5.0,0.0,1.0,10.0,0.56,2.031810,2.059345,Remision,Remision,3.06,2.5,,,,,,,,,,,,,63.5,1.560,26.093031,38.980824,1.566667,8.566667,,2019-07-02,8.0,Act. moderada,1.5,Remision,,,2,2


In [18]:
Madrid_fam = pd.read_csv('./Pipelinerun_withPC/Madrid/mergedChr/madrid_merged.fam',sep='\s',header=None)
Madrid_fam

  return func(*args, **kwargs)


Unnamed: 0,0,1,2,3,4,5
0,1018_ARC796,1018_ARC796,0,0,0,-9
1,1020_ARC552,1020_ARC552,0,0,0,1
2,1042_HCSC06,1042_HCSC06,0,0,0,-9
3,1044_ARC602,1044_ARC602,0,0,0,1
4,1068_ARC646,1068_ARC646,0,0,0,2
...,...,...,...,...,...,...
136,922_ARC560,922_ARC560,0,0,0,1
137,944_HCSC12,944_HCSC12,0,0,0,-9
138,946_ARC611,946_ARC611,0,0,0,1
139,970_ARC666,970_ARC666,0,0,0,2


In [19]:
#V2 6month
Madrid_additional['sdai_v2'] = Madrid_additional['sdai_v2'].fillna(-9)
Madrid_additional['cdai_v2'] = Madrid_additional['cdai_v2'].fillna(-9)

In [20]:
Madrid_additional['CDAI_S'] = Madrid_additional['cdai_v2'].map(cDAI_S)
Madrid_additional['SDAI_S'] = Madrid_additional['sdai_v2'].map(sDAI_S)

In [22]:
Madrid_fam['id'] = Madrid_fam[0].str.replace('^.*_',"").str.replace("^.*C","").str.lstrip("0").astype(int)
Madrid_select = pd.merge(Madrid_additional,Madrid_fam,how='right',left_on='codigo2',right_on='id')
Madrid_select['CDAI_S'] = Madrid_select['CDAI_S'].fillna(-9)
Madrid_select['SDAI_S'] = Madrid_select['SDAI_S'].fillna(-9)
Madrid_select

  Madrid_fam['id'] = Madrid_fam[0].str.replace('^.*_',"").str.replace("^.*C","").str.lstrip("0").astype(int)


Unnamed: 0,codigo2,fechaini,vgepac_v1,vgemed_v1,nad_v1,nat_v1,vsg_v1,pcr_v1,das28_v1,das28pcr_v1,das28cat_v1,das28pcrcat_v1,sdai_v1,cdai_v1,vgepac_v2,vgemed_v2,nad_v2,nat_v2,vsg_v2,pcr_v2,das28_v2,das28pcr_v2,das28cat_v2,das28pcrcat_v2,sdai_v2,cdai_v2,vgepac_v3,vgemed_v3,nad_v3,nat_v3,vsg_v3,pcr_v3,das28_v3,das28pcr_v3,das28cat_v3,das28pcrcat_v3,sdai_v3,cdai_v3,peso,talla,bmi,edadinienf,tevol_v1,tevol_v2,tevol_v3,fecha1fme,hupi_v1,hupicat_v1,hupi_v2,hupicat_v2,hupi_v3,hupicat_v3,CDAI_S,SDAI_S,0,1,2,3,4,5,id
0,796.0,2018-07-01,78.0,55.0,5.0,6.0,50.0,2.9,5.768471,5.214486,Act. alta,Act. alta,27.200001,24.299999,0.0,15.0,2.0,1.0,3.0,0.15,1.840988,2.361824,Remision,Act. baja,4.650000,4.500000,,,,,,,,,,,,,64.0,1.55,26.638918,78.717812,0.733333,6.566667,,NaT,11.0,Act. alta,2.0,Remision,,,1.0,1.0,1018_ARC796,1018_ARC796,0,0,0,-9,796
1,552.0,2012-02-01,76.0,52.0,6.0,8.0,82.0,4.3,6.312377,5.549982,Act. alta,Act. alta,31.100000,26.799999,48.0,15.0,6.0,1.0,25.0,0.30,4.576927,3.782780,Act. moderada,Act. baja,13.600000,13.300000,56.0,25.0,1.0,1.0,37.0,0.30,4.151642,3.083066,Act. moderada,Act. baja,10.400000,10.100000,60.0,1.52,25.969528,77.271233,12.866667,18.366667,24.900000,2013-02-22,11.0,Act. alta,6.0,Act. moderada,6.5,Act. moderada,1.0,1.0,1020_ARC552,1020_ARC552,0,0,0,1,552
2,,NaT,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,NaT,,,,,,,-9.0,-9.0,1042_HCSC06,1042_HCSC06,0,0,0,-9,6
3,602.0,2014-02-01,85.0,49.0,9.0,6.0,54.0,0.6,6.348146,5.216385,Act. alta,Act. alta,29.000000,28.400000,50.0,14.0,0.0,0.0,23.0,0.20,2.894846,2.055501,Act. baja,Remision,6.600000,6.400000,55.0,10.0,0.0,1.0,6.0,0.20,2.304232,2.405500,Remision,Act. baja,7.700000,7.500000,66.0,1.52,28.566483,73.539726,2.866667,8.233334,15.000000,2014-04-29,11.0,Act. alta,3.0,Act. leve,4.0,Act. leve,1.0,1.0,1044_ARC602,1044_ARC602,0,0,0,1,602
4,646.0,2015-01-15,0.0,25.0,0.0,1.0,14.0,0.1,2.127340,1.489533,Remision,Remision,3.600000,3.500000,3.0,2.0,0.0,0.0,11.0,0.10,1.720527,1.251533,Remision,Remision,0.600000,0.500000,0.0,0.0,0.0,0.0,22.0,0.30,2.163730,1.459066,Remision,Remision,0.300000,0.000000,57.5,1.60,22.460938,63.191780,6.433333,12.500000,18.100000,2015-07-29,1.0,Remision,0.0,Remision,1.0,Remision,2.0,2.0,1068_ARC646,1068_ARC646,0,0,0,2,646
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
136,560.0,2013-03-15,39.0,25.0,6.0,5.0,7.0,2.9,3.905950,4.728244,Act. moderada,Act. moderada,20.299999,17.400000,20.0,9.0,4.0,0.0,13.0,1.00,3.195465,3.223242,Act. baja,Act. baja,7.900000,6.900000,32.0,15.0,2.0,0.0,12.0,1.50,2.979394,3.198092,Act. baja,Act. baja,8.200000,6.700000,70.0,1.72,23.661438,73.008217,4.066667,8.733334,15.266666,2014-03-15,9.5,Act. alta,5.0,Act. leve,5.5,Act. moderada,1.0,1.0,922_ARC560,922_ARC560,0,0,0,1,560
137,,NaT,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,NaT,,,,,,,-9.0,-9.0,944_HCSC12,944_HCSC12,0,0,0,-9,12
138,611.0,2014-07-01,75.0,49.0,12.0,8.0,,3.0,,5.978092,,Act. alta,35.400002,32.400002,50.0,12.0,3.0,0.0,13.0,0.50,3.465413,3.274982,Act. moderada,Act. baja,9.700000,9.200000,25.0,3.0,0.0,0.0,4.0,0.10,1.320406,1.559533,Remision,Remision,2.900000,2.800000,72.0,1.52,31.163435,80.093147,1.733333,6.733333,14.566667,2014-08-23,12.0,Act. alta,4.0,Act. leve,1.0,Remision,1.0,1.0,946_ARC611,946_ARC611,0,0,0,1,611
139,666.0,2015-08-15,15.0,30.0,1.0,4.0,20.0,0.2,3.427013,2.685500,Act. moderada,Act. baja,9.700000,9.500000,19.0,5.0,0.0,0.0,28.0,0.10,2.598543,1.475533,Remision,Remision,2.500000,2.400000,30.0,15.0,0.0,1.0,33.0,0.14,3.147555,1.975169,Act. baja,Remision,5.640000,5.500000,69.5,1.64,25.840273,67.884933,6.133333,11.033334,18.266666,2016-02-16,3.5,Act. leve,2.0,Remision,3.5,Act. leve,2.0,2.0,970_ARC666,970_ARC666,0,0,0,2,666


In [23]:
Madrid_fam_cDAI = Madrid_select.loc[:,[0,1,2,3,4,'CDAI_S']]
Madrid_fam_sDAI = Madrid_select.loc[:,[0,1,2,3,4,'SDAI_S']]

In [49]:
Madrid_fam_sDAI['SDAI_S'] = Madrid_fam_sDAI['SDAI_S'].astype(int)
Madrid_fam_cDAI['CDAI_S'] = Madrid_fam_cDAI['CDAI_S'].astype(int)

In [51]:
Madrid_fam_cDAI

Unnamed: 0,0,1,2,3,4,CDAI_S
0,1018_ARC796,1018_ARC796,0,0,0,1
1,1020_ARC552,1020_ARC552,0,0,0,1
2,1042_HCSC06,1042_HCSC06,0,0,0,-9
3,1044_ARC602,1044_ARC602,0,0,0,1
4,1068_ARC646,1068_ARC646,0,0,0,2
...,...,...,...,...,...,...
136,922_ARC560,922_ARC560,0,0,0,1
137,944_HCSC12,944_HCSC12,0,0,0,-9
138,946_ARC611,946_ARC611,0,0,0,1
139,970_ARC666,970_ARC666,0,0,0,2


In [50]:
Madrid_fam_sDAI.to_csv("/exports/reum/CKe/Pipelinerun_withPC/TwoCompDAS/Madrid_merged_sDAI.fam",sep='\t',index=False,header=False)
Madrid_fam_cDAI.to_csv("/exports/reum/CKe/Pipelinerun_withPC/TwoCompDAS/Madrid_merged_cDAI.fam",sep='\t',index=False,header=False)

## TACERA

In [11]:
Tacera = openfile("/exports/reum/CKe/Tacera/RA-MAP_data_clinical.csv")
keyfile = openfile("/exports/reum/CKe/Tacera/OpenPseudonymised_RA-MAP DNA_IDs deidentified to date 02Dec16_with_HLA.xlsx")
Tacera_fam = pd.read_csv("/exports/reum/CKe/Pipelinerun_withPC/Tacera/Final_imputed/TACERA_HRCv1_1_FINAL.fam",sep='\s',header=None)

  return func(*args, **kwargs)


In [115]:
keyfile

Unnamed: 0,Digest,sample_id,Study,notes,sample_id.1,HLA_A_1,HLA_B_1,HLA_C_1,HLA_DPA1_1,HLA_DPB1_1,HLA_DRB1_1,HLA_DQA1_1,HLA_DQB1_1,HLA_A_2,HLA_B_2,HLA_C_2,HLA_DPA1_2,HLA_DPB1_2,HLA_DRB1_2,HLA_DQA1_2,HLA_DQB1_2
0,D3A02019792FDA6C8C6B9CA21512801610FB7176BAE732...,D-21781-1,RAMAP-tacera,exclude: duplicate subject IDs but genotypes d...,D-21781-1,3201,5501,303,103,401,401,301,302,301,1518,704,103,201,1101,501,301
1,D3A02019792FDA6C8C6B9CA21512801610FB7176BAE732...,D-21863-1,RAMAP-tacera,exclude: duplicate subject IDs but genotypes d...,D-21863-1,301,5701,602,201,1301,701,201,303,201,702,702,103,402,1103,501,301
2,,D-21919-1,RAMAP-tacera,exclude: subjects unknown,D-21919-1,101,5701,602,201,1001,1501,102,602,201,1501,303,103,401,401,301,302
3,,D-21955-1,RAMAP-tacera,exclude: subjects unknown,D-21955-1,2301,4403,401,103,201,701,201,202,301,1501,102,201,1001,101,101,501
4,,D-22960-1,RAMAP-tacera,exclude: subjects unknown,D-22960-1,1101,3501,401,201,101,101,101,501,101,702,702,103,401,1101,501,301
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
290,F77FCE78B9C12C4011E3C22AC81BD7EA93519F47769081...,D-23010-1,Vaccine,,D-23010-1,201,4402,704,103,401,101,101,501,301,702,702,103,601,1501,102,602
291,E09DBC4609157185B2C8110022C52378534EAEFA20BA83...,D-33052-1,Vaccine,,D-33052-1,6801,702,702,103,401,1501,102,602,1101,5601,102,201,1101,701,201,202
292,335879869F16C038AE5E619D36C979021B7D761AC80B84...,Z-21686-1,RAMAP-tacera,,Z-21686-1,1101,4001,304,103,201,1501,102,502,2402,1301,304,103,401,1501,102,601
293,BF9D48FEB435B3F585DDDBF5D966C024E2027C62F82C48...,Z-21746-1,RAMAP-tacera,,Z-21746-1,301,3501,401,103,401,401,301,301,1101,5101,1502,103,601,404,301,302


In [112]:
Tacera

Unnamed: 0,Subject ID,\RAMAP\RAMAP\Clinical Data\.ACPA/RF Eligibility\ACPA\ACPA Unit\,\RAMAP\RAMAP\Clinical Data\.ACPA/RF Eligibility\ACPA\ACPA Value\,\RAMAP\RAMAP\Clinical Data\.ACPA/RF Eligibility\ACPA\ACPA positive\,\RAMAP\RAMAP\Clinical Data\.ACPA/RF Eligibility\Rheumatoid Factor\RF Unit\,\RAMAP\RAMAP\Clinical Data\.ACPA/RF Eligibility\Rheumatoid Factor\RF Value\,\RAMAP\RAMAP\Clinical Data\.ACPA/RF Eligibility\Rheumatoid Factor\Rheum Factor positive\,\RAMAP\RAMAP\Clinical Data\.Screening\ACPA\ACPA Unit SCR\,\RAMAP\RAMAP\Clinical Data\.Screening\ACPA\ACPA Value SCR\,\RAMAP\RAMAP\Clinical Data\.Screening\ACPA\ACPA positive SCR\,\RAMAP\RAMAP\Clinical Data\.Screening\Rheumatoid Factor\RF Unit SCR\,\RAMAP\RAMAP\Clinical Data\.Screening\Rheumatoid Factor\RF Value SCR\,\RAMAP\RAMAP\Clinical Data\.Screening\Rheumatoid Factor\Rheum Factor positive SCR\,\RAMAP\RAMAP\Clinical Data\00 Baseline\ACPA\ACPA Unit 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\ACPA\ACPA Value 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\ACPA\ACPA positive 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Blood count\Basophils 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Blood count\Date of FBC 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Blood count\Eosinophils 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Blood count\GL 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Blood count\Gdl 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Blood count\HB 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Blood count\Lymphocytes 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Blood count\Monocytes 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Blood count\Neutrophils 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Blood count\PLT 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Blood count\WBC 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\CRP Value (mg/L) 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\ESR Value 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\Evaluator global 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\Fatique 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\Outside 2 week window 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\Pain score 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\Patient global 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\Total 66/68 Swollen Joints 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\Total 66/68 Tender Joints 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\Total Swollen 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\Total Tender 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\Components\Use of sign '<' 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\DAS-28 CRP 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\DAS28 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\DAS\DAS28 relative 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\HAQ\Metrologist's score 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Rheumatoid Factor\RF Unit 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Rheumatoid Factor\RF Value 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\Rheumatoid Factor\Rheum Factor positive 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\SDAI\SDAI <= 3.3 00BL\,\RAMAP\RAMAP\Clinical Data\00 Baseline\SDAI\SDAI score 00BL\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\CRP Value (mg/L) 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\ESR Value 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\Evaluator global 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\Fatique 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\Outside 2 week window 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\Pain score 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\Patient global 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\Total 66/68 Swollen Joints 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\Total 66/68 Tender Joints 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\Total Swollen 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\Total Tender 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\Components\Use of sign '<' 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\DAS-28 CRP 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\DAS28 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\DAS\DAS28 relative 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\HAQ\Metrologist's score 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\SDAI\SDAI <= 3.3 03M\,\RAMAP\RAMAP\Clinical Data\03 Months\SDAI\SDAI score 03M\,\RAMAP\RAMAP\Clinical Data\06 Months\Blood count\Basophils 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\Blood count\Date of FBC 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\Blood count\Eosinophils 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\Blood count\GL 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\Blood count\Gdl 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\Blood count\HB 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\Blood count\Lymphocytes 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\Blood count\Monocytes 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\Blood count\Neutrophils 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\Blood count\PLT 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\Blood count\WBC 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\CRP Value (mg/L) 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\ESR Value 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\Evaluator global 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\Fatique 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\Outside 2 week window 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\Pain score 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\Patient global 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\Total 66/68 Swollen Joints 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\Total 66/68 Tender Joints 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\Total Swollen 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\Total Tender 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\Components\Use of sign '<' 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\DAS-28 CRP 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\DAS28 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\DAS\DAS28 relative 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\HAQ\Metrologist's score 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\SDAI\SDAI <= 3.3 06M\,\RAMAP\RAMAP\Clinical Data\06 Months\SDAI\SDAI score 06M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\CRP Value (mg/L) 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\ESR Value 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\Evaluator global 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\Fatique 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\Outside 2 week window 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\Pain score 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\Patient global 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\Total 66/68 Swollen Joints 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\Total 66/68 Tender Joints 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\Total Swollen 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\Total Tender 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\Components\Use of sign '<' 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\DAS-28 CRP 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\DAS28 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\DAS\DAS28 relative 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\HAQ\Metrologist's score 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\SDAI\SDAI <= 3.3 09M\,\RAMAP\RAMAP\Clinical Data\09 Months\SDAI\SDAI score 09M\,\RAMAP\RAMAP\Clinical Data\12 Months\Blood count\Basophils 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\Blood count\Date of FBC 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\Blood count\Eosinophils 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\Blood count\GL 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\Blood count\Gdl 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\Blood count\HB 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\Blood count\Lymphocytes 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\Blood count\Monocytes 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\Blood count\Neutrophils 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\Blood count\PLT 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\Blood count\WBC 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\CRP Value (mg/L) 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\ESR Value 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\Evaluator global 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\Fatique 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\Outside 2 week window 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\Pain score 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\Patient global 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\Total 66/68 Swollen Joints 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\Total 66/68 Tender Joints 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\Total Swollen 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\Total Tender 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\Components\Use of sign '<' 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\DAS-28 CRP 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\DAS28 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\DAS\DAS28 relative 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\HAQ\Metrologist's score 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\SDAI\SDAI <= 3.3 12M\,\RAMAP\RAMAP\Clinical Data\12 Months\SDAI\SDAI score 12M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\CRP Value (mg/L) 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\ESR Value 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\Evaluator global 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\Fatique 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\Outside 2 week window 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\Pain score 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\Patient global 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\Total 66/68 Swollen Joints 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\Total 66/68 Tender Joints 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\Total Swollen 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\Total Tender 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\Components\Use of sign '<' 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\DAS-28 CRP 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\DAS28 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\DAS\DAS28 relative 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\HAQ\Metrologist's score 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\SDAI\SDAI <= 3.3 15M\,\RAMAP\RAMAP\Clinical Data\15 Months\SDAI\SDAI score 15M\,\RAMAP\RAMAP\Clinical Data\18 Months\Blood count\Basophils 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\Blood count\Date of FBC 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\Blood count\Eosinophils 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\Blood count\GL 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\Blood count\Gdl 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\Blood count\HB 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\Blood count\Lymphocytes 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\Blood count\Monocytes 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\Blood count\Neutrophils 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\Blood count\PLT 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\Blood count\WBC 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\CRP Value (mg/L) 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\ESR Value 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\Evaluator global 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\Fatique 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\Outside 2 week window 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\Pain score 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\Patient global 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\Total 66/68 Swollen Joints 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\Total 66/68 Tender Joints 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\Total Swollen 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\Total Tender 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\Components\Use of sign '<' 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\DAS-28 CRP 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\DAS28 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\DAS\DAS28 relative 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\HAQ\Metrologist's score 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\SDAI\SDAI <= 3.3 18M\,\RAMAP\RAMAP\Clinical Data\18 Months\SDAI\SDAI score 18M\,\RAMAP\RAMAP\Clinical Data\VACCINE Serology\Date processed\,\RAMAP\RAMAP\Clinical Data\VACCINE Serology\HBVAX (mIU/ml)\,\RAMAP\RAMAP\Clinical Data\VACCINE Serology\HBVAX range (mIU/ml)\,\RAMAP\RAMAP\Clinical Data\VACCINE Serology\Hub\,\RAMAP\RAMAP\Medication\00 Baseline\Folic Acid 00BL\,\RAMAP\RAMAP\Medication\00 Baseline\Hydroxychloroquine 00BL\,\RAMAP\RAMAP\Medication\00 Baseline\Methotrexate 00BL\,\RAMAP\RAMAP\Medication\00 Baseline\Prednisolone 00BL\,\RAMAP\RAMAP\Medication\00 Baseline\Sulfasalazine 00BL\,\RAMAP\RAMAP\Medication\03 Months\Folic Acid 03M\,\RAMAP\RAMAP\Medication\03 Months\Hydroxychloroquine 03M\,\RAMAP\RAMAP\Medication\03 Months\Leflunomide 03M\,\RAMAP\RAMAP\Medication\03 Months\Methotrexate 03M\,\RAMAP\RAMAP\Medication\03 Months\Prednisolone 03M\,\RAMAP\RAMAP\Medication\03 Months\Sulfasalazine 03M\,\RAMAP\RAMAP\Medication\06 Months\Folic Acid 06M\,\RAMAP\RAMAP\Medication\06 Months\Hydroxychloroquine 06M\,\RAMAP\RAMAP\Medication\06 Months\Leflunomide 06M\,\RAMAP\RAMAP\Medication\06 Months\Methotrexate 06M\,\RAMAP\RAMAP\Medication\06 Months\Prednisolone 06M\,\RAMAP\RAMAP\Medication\06 Months\Sulfasalazine 06M\,\RAMAP\RAMAP\Medication\09 Months\Certolizumab 09M\,\RAMAP\RAMAP\Medication\09 Months\Etanercept 09M\,\RAMAP\RAMAP\Medication\09 Months\Folic Acid 09M\,\RAMAP\RAMAP\Medication\09 Months\Golimumab 09M\,\RAMAP\RAMAP\Medication\09 Months\Hydroxychloroquine 09M\,\RAMAP\RAMAP\Medication\09 Months\Methotrexate 09M\,\RAMAP\RAMAP\Medication\09 Months\Prednisolone 09M\,\RAMAP\RAMAP\Medication\09 Months\Sulfasalazine 09M\,\RAMAP\RAMAP\Medication\12 Months\Adalimumab 12M\,\RAMAP\RAMAP\Medication\12 Months\Certolizumab 12M\,\RAMAP\RAMAP\Medication\12 Months\Etanercept 12M\,\RAMAP\RAMAP\Medication\12 Months\Folic Acid 12M\,\RAMAP\RAMAP\Medication\12 Months\Golimumab 12M\,\RAMAP\RAMAP\Medication\12 Months\Hydroxychloroquine 12M\,\RAMAP\RAMAP\Medication\12 Months\Leflunomide 12M\,\RAMAP\RAMAP\Medication\12 Months\Methotrexate 12M\,\RAMAP\RAMAP\Medication\12 Months\Prednisolone 12M\,\RAMAP\RAMAP\Medication\12 Months\Sulfasalazine 12M\,\RAMAP\RAMAP\Medication\15 Months\Adalimumab 15M\,\RAMAP\RAMAP\Medication\15 Months\Certolizumab 15M\,\RAMAP\RAMAP\Medication\15 Months\Etanercept 15M\,\RAMAP\RAMAP\Medication\15 Months\Folic Acid 15M\,\RAMAP\RAMAP\Medication\15 Months\Hydroxychloroquine 15M\,\RAMAP\RAMAP\Medication\15 Months\Leflunomide 15M\,\RAMAP\RAMAP\Medication\15 Months\Methotrexate 15M\,\RAMAP\RAMAP\Medication\15 Months\Sulfasalazine 15M\,\RAMAP\RAMAP\Medication\15 Months\Tocilizumab 15M\,\RAMAP\RAMAP\Medication\18 Months\Adalimumab 18M\,\RAMAP\RAMAP\Medication\18 Months\Certolizumab 18M\,\RAMAP\RAMAP\Medication\18 Months\Etanercept 18M\,\RAMAP\RAMAP\Medication\18 Months\Folic Acid 18M\,\RAMAP\RAMAP\Medication\18 Months\Hydroxychloroquine 18M\,\RAMAP\RAMAP\Medication\18 Months\Leflunomide 18M\,\RAMAP\RAMAP\Medication\18 Months\Methotrexate 18M\,\RAMAP\RAMAP\Medication\18 Months\Sulfasalazine 18M\,\RAMAP\RAMAP\Medication\18 Months\Tocilizumab 18M\,\RAMAP\RAMAP\Site\,\RAMAP\RAMAP\Steroid Injections\03 Months\Dexamethasone 03M\,\RAMAP\RAMAP\Steroid Injections\03 Months\Methylprednisolone 03M\,\RAMAP\RAMAP\Steroid Injections\03 Months\Methylprednisolone Acetate 03M\,\RAMAP\RAMAP\Steroid Injections\03 Months\Triamcinolone (Kenalog) 03M\,\RAMAP\RAMAP\Steroid Injections\06 Months\Dexamethasone 06M\,\RAMAP\RAMAP\Steroid Injections\06 Months\Methylprednisolone 06M\,\RAMAP\RAMAP\Steroid Injections\06 Months\Methylprednisolone Acetate 06M\,\RAMAP\RAMAP\Steroid Injections\06 Months\Triamcinolone (Kenalog) 06M\,\RAMAP\RAMAP\Steroid Injections\09 Months\Methylprednisolone 09M\,\RAMAP\RAMAP\Steroid Injections\09 Months\Methylprednisolone Acetate 09M\,\RAMAP\RAMAP\Steroid Injections\09 Months\Triamcinolone (Kenalog) 09M\,\RAMAP\RAMAP\Steroid Injections\12 Months\Dexamethasone 12M\,\RAMAP\RAMAP\Steroid Injections\12 Months\Methylprednisolone 12M\,\RAMAP\RAMAP\Steroid Injections\12 Months\Methylprednisolone Acetate 12M\,\RAMAP\RAMAP\Steroid Injections\12 Months\Triamcinolone (Kenalog) 12M\,\RAMAP\RAMAP\Steroid Injections\15 Months\Dexamethasone 15M\,\RAMAP\RAMAP\Steroid Injections\15 Months\Methylprednisolone 15M\,\RAMAP\RAMAP\Steroid Injections\15 Months\Methylprednisolone Acetate 15M\,\RAMAP\RAMAP\Steroid Injections\15 Months\Triamcinolone (Kenalog) 15M\,\RAMAP\RAMAP\Steroid Injections\18 Months\Methylprednisolone 18M\,\RAMAP\RAMAP\Steroid Injections\18 Months\Methylprednisolone Acetate 18M\,\RAMAP\RAMAP\Steroid Injections\18 Months\Triamcinolone (Kenalog) 18M\,\RAMAP\RAMAP\Study\,\RAMAP\RAMAP\Study\SOMAScan\,\RAMAP\RAMAP\Subjects\Demographics\Age\,\RAMAP\RAMAP\Subjects\Demographics\Height\,\RAMAP\RAMAP\Subjects\Demographics\Race\,\RAMAP\RAMAP\Subjects\Demographics\Sex\,\RAMAP\RAMAP\Subjects\Demographics\Weight\,\RAMAP\RAMAP\Subjects\Medical History\Alcohol History\Consumption frequency\,\RAMAP\RAMAP\Subjects\Medical History\Alcohol History\Drinks alcohol\,\RAMAP\RAMAP\Subjects\Medical History\Alcohol History\Units of alcohol consumption per week (if over 20)\,\RAMAP\RAMAP\Subjects\Medical History\Alcohol History\Units of alcohol consumption per week Range\,\RAMAP\RAMAP\Subjects\Medical History\Alcohol History\Units of alcohol consumption per week\,\RAMAP\RAMAP\Subjects\Medical History\Any intramuscular steroid injections\,\RAMAP\RAMAP\Subjects\Medical History\Corticosteroid treatment for current episode\,\RAMAP\RAMAP\Subjects\Medical History\DMARD and TNF inhibitor naive\,\RAMAP\RAMAP\Subjects\Medical History\Date of Assessment\,\RAMAP\RAMAP\Subjects\Medical History\Date of symptom onset\,\RAMAP\RAMAP\Subjects\Medical History\Smoking History\If previous or current smoker Other Type\,\RAMAP\RAMAP\Subjects\Medical History\Smoking History\If previous or current smoker Type\,\RAMAP\RAMAP\Subjects\Medical History\Smoking History\If previous smoker date stopped smoking\,\RAMAP\RAMAP\Subjects\Medical History\Smoking History\Number of cigarettes per day\,\RAMAP\RAMAP\Subjects\Medical History\Smoking History\Number of years smoked\,\RAMAP\RAMAP\Subjects\Medical History\Smoking History\Smoking status\,\RAMAP\RAMAP\Subjects\Status\Date of Report\,\RAMAP\RAMAP\Subjects\Status\Enrollment\,\RAMAP\RAMAP\XRAY\Annualised Progression\,\RAMAP\RAMAP\XRAY\Erosive\,\RAMAP\RAMAP\XRAY\Final Score\,\RAMAP\RAMAP\XRAY\Initial Score\,\RAMAP\RAMAP\XRAY\Only 6 Month X-Rays\,\RAMAP\RAMAP\XRAY\Unadjusted Progression\,SDAI_S
0,0A0B0E97239BE7AB5F473C8C046A69142C2213BC4ABADC...,U/ml,109.0,Yes,U/ml,49.0,Yes,U/ml,109.0,Yes,U/ml,49.0,Yes,,,,0.01,9/6/2013,0.08,Yes,No,148.0,1.29,0.73,8.55,233.0,10.66,10.0,1.0,40.0,70.0,No,45.0,46.0,1.0,3.0,1.0,3.0,No,3.72,1.89,1.0,0.875,,,,No,13.60,5.0,5.0,18.0,77.0,,8.0,25.0,0.0,0.0,0.0,0.0,Yes,1.96,1.48,0.783069,0.000,No,4.80,0.00,2014-03-26,0.10,Yes,No,145.0,1.20,0.50,6.00,253.0,7.70,14.0,7.0,81.0,66.0,No,64.0,80.0,4.0,19.0,4.0,3.0,No,4.58,4.01,2.121693,1.625,No,24.5,6.0,2.0,33.0,29.0,No,2.0,21.0,3.0,0.0,3.0,0.0,No,2.44,1.26,0.666667,0.125,No,9.00,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,3.0,2.0,41.0,45.0,No,27.0,42.0,13.0,7.0,12.0,6.0,No,4.39,3.41,1.804233,0.500,No,26.6,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,No,Yes,No,No,No,Yes,Yes,No,Yes,No,No,,,,,,,No,No,No,No,Yes,No,No,Yes,,,,,,,,,,,No,No,No,Yes,Yes,No,Yes,No,No,,,,,,,,,,,No,No,Yes,No,,,,,No,Yes,No,,,,,No,Yes,No,Yes,,,,TACERA,No,26,180.0,White- British,Male,88.0,1-2 days a month,Yes,,,1-5,No,No,Yes,9/6/2013,3/31/2013,,,,,,Never Smoked,6/22/2015,Withdrawn -lost to follow up,,,,,,,1
1,747FC68D04F159A9D79B21F8228350946727DCD2E3C966...,U/ml,600.0,Yes,U/ml,426.0,Yes,U/ml,600.0,Yes,U/ml,426.0,Yes,,,,0.10,8/23/2013,0.20,Yes,No,144.0,2.80,0.60,3.40,157.0,6.90,7.0,32.0,76.0,70.0,,71.0,73.0,13.0,11.0,6.0,4.0,No,4.54,5.25,1.0,1.500,,,,No,25.60,11.0,58.0,10.0,7.0,,1.0,3.0,4.0,9.0,4.0,2.0,No,3.25,4.24,0.807619,0.375,No,8.40,0.00,2014-03-06,0.10,Yes,No,134.0,2.40,0.30,3.90,159.0,6.80,5.0,22.0,25.0,4.0,No,0.0,0.0,4.0,6.0,3.0,2.0,Yes,2.88,3.44,0.655238,0.375,No,8.0,2.0,22.0,41.0,9.0,No,8.0,3.0,6.0,18.0,6.0,8.0,No,3.67,4.48,0.853333,0.375,No,18.60,-99.00,2014-08-26,0.20,Yes,No,127.0,2.20,2.20,5.80,181.0,8.50,4.0,34.0,72.0,70.0,No,17.0,33.0,20.0,26.0,14.0,13.0,No,5.07,6.00,1.142857,0.750,No,37.9,1.0,17.0,36.0,65.0,No,1.0,29.0,7.0,12.0,4.0,0.0,Yes,2.18,2.95,0.561905,0.875,No,10.6,-99.00,2015-02-19,0.20,Yes,No,129.0,2.70,0.20,3.60,172.0,6.70,2.0,22.0,32.0,41.0,No,0.0,30.0,7.0,17.0,7.0,5.0,No,3.77,4.58,0.872381,1.0,No,18.4,,,,,Yes,Yes,Yes,No,No,Yes,Yes,No,Yes,No,No,Yes,Yes,No,Yes,No,No,No,No,Yes,No,Yes,Yes,No,No,No,No,No,Yes,No,Yes,No,Yes,No,No,No,Yes,No,Yes,Yes,No,Yes,No,No,No,Yes,No,Yes,Yes,No,Yes,No,No,KCL,No,No,Yes,No,,,,,Yes,No,No,No,Yes,No,No,No,Yes,No,No,,,,TACERA,No,48,292.0,White- British,Female,79.5,1-2 days a month,Yes,,,1-5,No,No,Yes,8/23/2013,2/23/2013,,Cigarrette,,5,30.0,Current Smoker,4/16/2015,Completed,0.0,No,1.0,1.0,No,0.0,1
2,F7347C9F21B34DCE309FEDEFE6C3C8C4FFDA7B339BEBCB...,u/ml,600.0,Yes,u/ml,93.0,Yes,u/ml,600.0,Yes,u/ml,93.0,Yes,,,,0.00,8/13/2013,0.40,Yes,No,145.0,1.60,0.50,5.10,238.0,7.80,9.0,9.0,19.0,13.0,Yes,49.0,44.0,2.0,11.0,0.0,3.0,No,3.37,3.12,1.0,0.000,,,,No,10.20,5.0,5.0,3.0,8.0,,3.0,3.0,1.0,2.0,0.0,0.0,Yes,1.65,1.17,0.375000,0.000,Yes,1.10,0.10,2014-01-29,0.30,Yes,No,141.0,1.30,0.50,3.30,198.0,5.30,5.0,5.0,0.0,5.0,No,1.0,1.0,0.0,0.0,0.0,0.0,No,1.62,1.14,0.365385,0.000,Yes,0.6,1.0,2.0,0.0,5.0,No,0.0,0.0,0.0,0.0,0.0,0.0,No,1.21,0.49,0.157051,0.000,Yes,0.10,0.00,2014-08-13,0.20,Yes,No,138.0,1.50,0.40,2.60,181.0,4.70,2.0,6.0,0.0,2.0,No,4.0,3.0,0.0,0.0,0.0,0.0,No,1.40,1.30,0.416667,0.000,Yes,0.5,1.0,5.0,1.0,11.0,No,2.0,1.0,0.0,0.0,0.0,0.0,No,1.22,1.14,0.365385,0.000,Yes,0.3,,2015-02-11,0.30,Yes,No,142.0,1.60,0.50,4.50,248.0,6.80,4.0,13.0,11.0,11.0,No,12.0,14.0,0.0,2.0,0.0,0.0,No,1.74,1.99,0.637821,0.0,Yes,2.9,,,,,Yes,Yes,Yes,No,No,Yes,Yes,No,Yes,No,No,Yes,Yes,No,Yes,No,No,No,No,Yes,No,Yes,Yes,No,No,No,No,No,Yes,No,Yes,No,Yes,No,No,No,No,No,Yes,Yes,No,Yes,No,No,No,No,No,Yes,Yes,No,Yes,No,No,KCL,,,,,,,,,,,,,,,,,,,,,,,TACERA,No,51,179.0,White- British,Male,75.7,5 or more days a week,Yes,40.0,,more than 20,No,No,Yes,8/13/2013,2/13/2013,,Hand-rolled tobacco,1985-1-1,6,4.0,Previous Smoker,2/20/2015,Completed,1.0,Yes,11.0,11.0,No,1.0,2
3,87F62B63D5BAB1DE4A7C3955B6C0D81C9B13D1E48EF10A...,U/mL,96.0,Yes,lU/mL,24.0,Yes,U/mL,96.0,Yes,IU/mL,24.0,Yes,U/mL,96.0,Yes,0.03,8/13/2013,0.43,Yes,No,122.0,2.00,0.51,4.84,344.0,7.80,14.6,11.0,80.0,0.0,,65.0,86.0,5.0,19.0,5.0,10.0,No,5.55,5.28,1.0,0.625,lU/mL,24.0,Yes,No,33.06,2.8,4.0,1.0,21.0,,1.0,0.0,0.0,2.0,0.0,2.0,No,2.23,1.76,0.333333,0.000,Yes,2.38,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,Yes,No,Yes,No,No,Yes,Yes,No,Yes,No,No,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,UCL,,,,,,,,,,,,,,,,,,,,,,,TACERA,No,30,163.0,White- British,Female,89.0,1-2 days a month,Yes,,,1-5,No,No,Yes,8/6/2013,3/1/2013,,,,,,Never Smoked,10/7/2014,Withdrawn,,,,,,,0
4,1D64D145CB205919CFE0070487BC628EFA2D08E7AA7AB3...,u/Ml,340.0,Yes,IU/ml,210.0,Yes,u/Ml,340.0,Yes,IU/ml,210.0,Yes,,,,0.01,7/19/2013,0.10,Yes,No,120.0,1.23,0.24,2.99,144.0,4.57,2.0,27.0,34.0,25.0,,33.0,23.0,3.0,13.0,3.0,9.0,Yes,3.84,4.79,1.0,0.750,,,,No,17.90,2.0,24.0,23.0,34.0,,28.0,13.0,0.0,3.0,0.0,2.0,Yes,2.33,3.20,0.668058,0.375,No,5.80,0.01,2014-01-16,0.12,Yes,No,120.0,0.95,0.21,2.63,180.0,3.91,2.0,14.0,21.0,27.0,,16.0,19.0,0.0,14.0,0.0,6.0,Yes,2.99,3.49,0.728601,0.500,No,10.2,2.4,23.0,20.0,26.0,No,17.0,19.0,2.0,0.0,2.0,0.0,No,2.06,2.86,0.597077,0.125,No,6.14,0.01,2014-09-09,0.09,Yes,No,124.0,1.08,0.17,2.87,173.0,4.22,2.0,12.0,6.0,40.0,No,9.0,10.0,0.0,0.0,0.0,0.0,Yes,1.50,1.88,0.392484,0.375,Yes,1.8,2.0,14.0,3.0,32.0,No,10.0,5.0,0.0,0.0,0.0,0.0,No,1.43,1.92,0.400835,0.375,Yes,1.0,0.01,2015-01-27,0.07,Yes,No,135.0,1.15,0.21,2.79,175.0,4.23,2.0,19.0,2.0,25.0,No,3.0,4.0,0.0,0.0,0.0,0.0,Yes,1.41,2.12,0.442589,0.5,Yes,0.8,,,,,,,,,,,,,,,,Yes,Yes,No,Yes,No,No,No,No,Yes,No,Yes,Yes,No,No,No,No,No,Yes,No,Yes,No,Yes,No,No,No,No,No,Yes,Yes,No,Yes,No,No,No,No,No,Yes,Yes,No,Yes,No,No,KCL,No,No,Yes,No,,,,,,,,,,,,,,,,,,,TACERA,No,28,165.0,Asian or Asian British - Bangladeshi,Female,95.9,,No,,,,No,No,Yes,7/19/2013,6/1/2013,,,,,,Never Smoked,1/27/2015,Completed,0.0,No,0.0,0.0,No,0.0,1
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
312,AB7756B59517FA3F38CB5DE631C230754ED9A7B857B1BF...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,29/04/2014,204.55,,Birmingham,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,VACCINE,Yes,23,170.0,White - any other White background,Female,53.0,1-2 days a month,Yes,,,1-5,,,,,,,,,,,Never Smoked,,,,,,,,,0
313,E51979E95D393C236E82B066C3AE3ED481277ECDBB8CBB...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,29/04/2014,,>1000,Birmingham,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,VACCINE,Yes,35,181.0,White- British,Male,82.0,3 - 4 days a week,Yes,,,11-15,,,,,,,Cigarette,2000,16-20,5.0,Previous Smoker,,,,,,,,,0
314,57B99734B63A693AF7C102F614FCE87AA399C1A822CD76...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1/10/2015,887.60,,Birmingham,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,VACCINE,Yes,23,163.0,Asian or Asian British - Pakistani,Male,58.4,,No,,,,,,,,,,,,,,Never Smoked,,,,,,,,,0
315,1128C09C073469B5538BB880AC4BB70354F6277EEEAE91...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,29/04/2014,610.56,,Birmingham,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,VACCINE,Yes,27,158.0,White- British,Female,66.0,1-2 days a month,Yes,,,6-10,,,,,,,Cigarette,2010,1-5,1.0,Previous Smoker,,,,,,,,,0


In [12]:
Tacera['SDAI_S'] = Tacera.iloc[:,93].fillna(-9)
Tacera['SDAI_S'] = Tacera['SDAI_S'].map({'Yes':2,'No':1,-9:0})

In [13]:
Tacera_fam

Unnamed: 0,0,1,2,3,4,5
0,D-12945-1_D-12945-1,D-12945-1_D-12945-1,0,0,0,-9
1,D-21657-1_D-21657-1,D-21657-1_D-21657-1,0,0,1,1
2,D-21658-1_D-21658-1,D-21658-1_D-21658-1,0,0,2,2
3,D-21659-1_D-21659-1,D-21659-1_D-21659-1,0,0,2,2
4,D-21660-1_D-21660-1,D-21660-1_D-21660-1,0,0,2,1
...,...,...,...,...,...,...
290,D-23461-1_D-23461-1,D-23461-1_D-23461-1,0,0,0,-9
291,D-33052-1_D-33052-1,D-33052-1_D-33052-1,0,0,0,-9
292,Z-21686-1_Z-21686-1,Z-21686-1_Z-21686-1,0,0,2,1
293,Z-21746-1_Z-21746-1,Z-21746-1_Z-21746-1,0,0,2,1


In [14]:
Tacera = Tacera.merge(keyfile,how='left',left_on="Subject ID",right_on='Digest')

In [15]:
Tacera_fam['id'] = Tacera_fam[0].str.split("_",expand=True)[0]
Tacera_fam_sdai = pd.merge(Tacera_fam,Tacera,how='left',left_on='id',right_on='sample_id').loc[:,[0,1,2,3,4,'SDAI_S']]
Tacera_fam_sdai['SDAI_S'] = Tacera_fam_sdai['SDAI_S'].fillna(-9)
Tacera_fam_sdai

Unnamed: 0,0,1,2,3,4,SDAI_S
0,D-12945-1_D-12945-1,D-12945-1_D-12945-1,0,0,0,0.0
1,D-21657-1_D-21657-1,D-21657-1_D-21657-1,0,0,1,1.0
2,D-21658-1_D-21658-1,D-21658-1_D-21658-1,0,0,2,2.0
3,D-21659-1_D-21659-1,D-21659-1_D-21659-1,0,0,2,2.0
4,D-21660-1_D-21660-1,D-21660-1_D-21660-1,0,0,2,1.0
...,...,...,...,...,...,...
290,D-23461-1_D-23461-1,D-23461-1_D-23461-1,0,0,0,-9.0
291,D-33052-1_D-33052-1,D-33052-1_D-33052-1,0,0,0,0.0
292,Z-21686-1_Z-21686-1,Z-21686-1_Z-21686-1,0,0,2,1.0
293,Z-21746-1_Z-21746-1,Z-21746-1_Z-21746-1,0,0,2,1.0


In [52]:
Tacera_fam_sdai['SDAI_S'] = Tacera_fam_sdai['SDAI_S'].astype(int)

In [53]:
Tacera_fam_sdai.to_csv("/exports/reum/CKe/Pipelinerun_withPC/TwoCompDAS/Tacera_merged_sDAI.fam",sep='\t',index=False,header=False)

## SERA

In [123]:
SERA_fam = pd.read_csv('./Pipelinerun_withPC/SERA/mergedChr/sera_merged.fam',sep='\s',header=None)
SERA_fam

  return func(*args, **kwargs)


Unnamed: 0,0,1,2,3,4,5
0,1_215284670,1_215284670,0,0,0,-9
1,100_215285060,100_215285060,0,0,0,1
2,1005_215284880,1005_215284880,0,0,0,2
3,1006_215293700,1006_215293700,0,0,0,-9
4,1007_215287480,1007_215287480,0,0,0,-9
...,...,...,...,...,...,...
663,984_215294600,984_215294600,0,0,0,2
664,985_215299420,985_215299420,0,0,0,2
665,986_215294170,986_215294170,0,0,0,2
666,987_215292670,987_215292670,0,0,0,-9


In [145]:
webjointfindings = openfile("/exports/reum/knevel_lab/SERA/Data/webJointFindings.CSV")
webjointfindings

Unnamed: 0,JFSNo,JFVisitID,ttlJntSwnTndr,ttlLrgJntSwnTndr,ttlSmllJntSwnTndr,ttlTndrJnt,ttlSwnJnt,sjc28,tjc28,upprLmbInvlvd,lwrLmbInvlvd,hasSymmetry,hasSmllJntHndFt
0,100,Baseline Visit,7,2,5,6,6,6,6,Yes,No,Yes,Yes
1,100,Month 12,2,1,1,1,1,1,1,Yes,Yes,No,Yes
2,100,Month 6,1,0,1,1,1,1,1,Yes,No,No,Yes
3,101,Baseline Visit,17,2,15,9,17,11,5,Yes,Yes,Yes,Yes
4,101,Month 12,0,0,0,0,0,0,0,No,No,No,No
...,...,...,...,...,...,...,...,...,...,...,...,...,...
2696,1317,Month 6,17,1,16,17,15,15,17,Yes,No,Yes,Yes
2697,1318,Baseline Visit,22,2,20,22,20,20,22,Yes,No,Yes,Yes
2698,1318,Month 6,5,0,5,5,1,1,5,Yes,No,Yes,Yes
2699,1319,Baseline Visit,16,0,16,12,14,14,12,Yes,No,Yes,Yes


In [146]:
webjointfindings = webjointfindings[webjointfindings['JFVisitID']=='Month 6']
webjointfindings

Unnamed: 0,JFSNo,JFVisitID,ttlJntSwnTndr,ttlLrgJntSwnTndr,ttlSmllJntSwnTndr,ttlTndrJnt,ttlSwnJnt,sjc28,tjc28,upprLmbInvlvd,lwrLmbInvlvd,hasSymmetry,hasSmllJntHndFt
2,100,Month 6,1,0,1,1,1,1,1,Yes,No,No,Yes
5,101,Month 6,5,0,5,4,1,1,4,Yes,No,Yes,Yes
7,102,Month 6,2,0,2,0,2,2,0,Yes,No,No,No
10,103,Month 6,24,4,20,24,11,11,23,Yes,Yes,Yes,Yes
13,104,Month 6,5,0,5,5,0,0,5,Yes,No,Yes,Yes
...,...,...,...,...,...,...,...,...,...,...,...,...,...
2691,1315,Month 6,6,0,6,4,3,3,4,Yes,No,Yes,Yes
2694,1316,Month 6,1,0,1,0,1,1,0,Yes,No,No,Yes
2696,1317,Month 6,17,1,16,17,15,15,17,Yes,No,Yes,Yes
2698,1318,Month 6,5,0,5,5,1,1,5,Yes,No,Yes,Yes


In [141]:
webDisease = openfile("/exports/reum/knevel_lab/SERA/Data/webDisease.CSV")
webDisease

Unnamed: 0,DiseaseSNo,DiseaseVisitID,ESR,DasVAS,CRP,GlobalVAS,PainVAS,RFMeasureType,RFFigure,RFTitrePosNeg,RFTitreUpper,RFTitreLower,CCPMeasureType,CCPFigure,CCPTitrePosNeg,CCPTitreUpper,CCPTiteLower,MrnStffnssID,IsESRDoneYN,IsCRPDoneYN,IsRFDoneYN,IsCCPDoneYN,RFFigureOperator,CCPFigureOperator,CRPFigureOperator,IsPainVASDoneYN,IsGlobalVASDoneYN,IsMrnStiffnessDoneYN,ESRNAYN,CRPNAYN,RFNAYN,CCPNAYN,PainVASNAYN,GlobalVASNAYN
0,100,Baseline Visit,24.0,17,11.0,60.0,11.0,Figure,197.0,,,,Figure,141.0,,,,> 30 mins,Yes,Yes,Yes,Yes,=,=,=,Yes,Yes,Yes,,,,,,
1,100,Month 12,5.0,1,0.6,5.0,1.0,,,,,,,,,,,,Yes,Yes,,,=,=,=,Yes,Yes,Yes,No,No,No,No,No,No
2,100,Month 6,7.0,2,1.1,10.0,2.0,,,,,,,,,,,,Yes,Yes,,,=,=,=,Yes,Yes,Yes,No,No,No,No,No,No
3,101,Baseline Visit,35.0,59,15.0,60.0,38.0,Figure,218.0,,,,Figure,91.0,,,,>= 60 mins,Yes,Yes,Yes,Yes,=,=,=,Yes,Yes,Yes,,,,,,
4,101,Month 12,13.0,2,1.8,5.0,1.0,,,,,,,,,,,,Yes,Yes,,,=,=,=,Yes,Yes,Yes,No,No,No,No,No,No
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2696,1317,Month 6,,65,,25.0,73.0,,,,,,,,,,,,No,Yes,,,=,=,=,Yes,Yes,Yes,No,Yes,No,No,No,No
2697,1318,Baseline Visit,,95,4.0,50.0,100.0,,,,,,Figure,0.6,,,,>= 60 mins,No,Yes,No,Yes,=,=,<,Yes,Yes,Yes,No,No,No,No,No,No
2698,1318,Month 6,,5,4.0,5.0,0.0,,,,,,,,,,,,No,Yes,,,=,=,<,Yes,Yes,Yes,No,No,No,No,No,No
2699,1319,Baseline Visit,,79,79.0,35.0,78.0,,,,,,Figure,0.4,,,,>= 60 mins,No,Yes,No,Yes,=,>,=,Yes,Yes,Yes,No,No,No,No,No,No


In [143]:
webDisease = webDisease[webDisease['DiseaseVisitID']=='Month 6']
webDisease

Unnamed: 0,DiseaseSNo,DiseaseVisitID,ESR,DasVAS,CRP,GlobalVAS,PainVAS,RFMeasureType,RFFigure,RFTitrePosNeg,RFTitreUpper,RFTitreLower,CCPMeasureType,CCPFigure,CCPTitrePosNeg,CCPTitreUpper,CCPTiteLower,MrnStffnssID,IsESRDoneYN,IsCRPDoneYN,IsRFDoneYN,IsCCPDoneYN,RFFigureOperator,CCPFigureOperator,CRPFigureOperator,IsPainVASDoneYN,IsGlobalVASDoneYN,IsMrnStiffnessDoneYN,ESRNAYN,CRPNAYN,RFNAYN,CCPNAYN,PainVASNAYN,GlobalVASNAYN
2,100,Month 6,7.0,2,1.1,10.0,2.0,,,,,,,,,,,,Yes,Yes,,,=,=,=,Yes,Yes,Yes,No,No,No,No,No,No
5,101,Month 6,12.0,1,2.6,10.0,3.0,,,,,,,,,,,,Yes,Yes,,,=,=,=,Yes,Yes,Yes,No,No,No,No,No,No
7,102,Month 6,5.0,0,0.7,5.0,0.0,,,,,,,,,,,,Yes,Yes,,,=,=,=,Yes,Yes,Yes,No,No,No,No,No,No
10,103,Month 6,100.0,47,97.0,70.0,49.0,,,,,,,,,,,,Yes,Yes,,,=,=,=,Yes,Yes,Yes,No,No,No,No,No,No
13,104,Month 6,7.0,86,1.4,50.0,84.0,,,,,,,,,,,,Yes,Yes,,,=,=,=,Yes,Yes,Yes,No,No,No,No,No,No
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2691,1315,Month 6,5.0,25,6.0,10.0,10.0,,,,,,,,,,,,Yes,Yes,,,=,=,=,Yes,Yes,Yes,No,No,No,No,No,No
2694,1316,Month 6,,20,0.7,10.0,20.0,,,,,,,,,,,,No,Yes,,,=,=,=,Yes,Yes,Yes,No,No,No,No,No,No
2696,1317,Month 6,,65,,25.0,73.0,,,,,,,,,,,,No,Yes,,,=,=,=,Yes,Yes,Yes,No,Yes,No,No,No,No
2698,1318,Month 6,,5,4.0,5.0,0.0,,,,,,,,,,,,No,Yes,,,=,=,<,Yes,Yes,Yes,No,No,No,No,No,No


In [151]:
SERA_merge = pd.merge(webjointfindings,webDisease,how='inner',left_on='JFSNo',right_on='DiseaseSNo').loc[:,['JFSNo','sjc28','CRP']]
SERA_merge['2cDAS'] = TwocompDAS(SERA_merge['sjc28'],SERA_merge['CRP'])
SERA_merge

Unnamed: 0,JFSNo,sjc28,CRP,2cDAS
0,100,1,1.1,1.445162
1,101,1,2.6,1.768560
2,102,2,0.7,1.732591
3,103,11,97.0,6.067605
4,104,0,1.4,0.525281
...,...,...,...,...
869,1315,3,6.0,2.899597
870,1316,1,0.7,1.318377
871,1317,15,,
872,1318,1,4.0,1.965663


In [152]:
def processdcID(row):
    row = str(row).replace(" ","").lstrip("0")
    return row
def processFAM(row):
    row = str(row).split("_")[1]
    return row

In [153]:
SERA_pheno = openfile("/exports/reum/knevel_lab/SERA/Data/SERA Final Leiden Manifest.xlsx",n=2)
SERA_pheno['ID'] = SERA_pheno['dcID'].map(processdcID)
SERA_pheno

  warn(msg)


Unnamed: 0,StudyNo,Location,dcID,Barcode original,Plate,ID
0,434,"(1, 1)",02 1528731 0,NTBJ386054,74501.0,215287310
1,625,"(1, 10)",02 1528740 0,NTBJ391302,74501.0,215287400
2,517,"(1, 11)",02 1528741 0,NTBJ385994,74501.0,215287410
3,419,"(1, 12)",02 1528742 0,NTBJ386203,74501.0,215287420
4,533,"(1, 4)",02 1528734 0,NTBJ386522,74501.0,215287340
...,...,...,...,...,...,...
691,226,"(6, 9)",02 1529866 0,E0000000102,74514.0,215298660
692,326,"(6, 10)",02 1529867 0,E0000000459,74514.0,215298670
693,230,"(6, 11)",02 1529868 0,E0000000219,74514.0,215298680
694,286,"(6, 12)",02 1528752 0,E0000000704,74514.0,215287520


In [155]:
SERA_pheno_2cDAS = pd.merge(SERA_pheno,SERA_merge,how='inner',left_on='StudyNo',right_on='JFSNo')
SERA_pheno_2cDAS

Unnamed: 0,StudyNo,Location,dcID,Barcode original,Plate,ID,JFSNo,sjc28,CRP,2cDAS
0,625,"(1, 10)",02 1528740 0,NTBJ391302,74501.0,215287400,625,4,35.00,4.150111
1,517,"(1, 11)",02 1528741 0,NTBJ385994,74501.0,215287410,517,0,,
2,419,"(1, 12)",02 1528742 0,NTBJ386203,74501.0,215287420,419,0,8.00,1.318335
3,641,"(1, 5)",02 1528735 0,NTBJ386610,74501.0,215287350,641,0,4.00,0.965663
4,431,"(1, 6)",02 1528736 0,NTBJ385684,74501.0,215287360,431,2,,
...,...,...,...,...,...,...,...,...,...,...
466,1158,"(6, 4)",02 1529460 0,E0000002263,74514.0,215294600,1158,0,11.70,1.524961
467,228,"(6, 7)",02 1529864 0,E0000000131,74514.0,215298640,228,0,1.00,0.415888
468,954,"(6, 8)",02 1529865 0,E0000001949,74514.0,215298650,954,2,8.00,2.732548
469,286,"(6, 12)",02 1528752 0,E0000000704,74514.0,215287520,286,0,3.91,0.954764


In [154]:
SERA_fam['ID'] = SERA_fam[0].map(processFAM)
SERA_fam

Unnamed: 0,0,1,2,3,4,5,ID
0,1_215284670,1_215284670,0,0,0,-9,215284670
1,100_215285060,100_215285060,0,0,0,1,215285060
2,1005_215284880,1005_215284880,0,0,0,2,215284880
3,1006_215293700,1006_215293700,0,0,0,-9,215293700
4,1007_215287480,1007_215287480,0,0,0,-9,215287480
...,...,...,...,...,...,...,...
663,984_215294600,984_215294600,0,0,0,2,215294600
664,985_215299420,985_215299420,0,0,0,2,215299420
665,986_215294170,986_215294170,0,0,0,2,215294170
666,987_215292670,987_215292670,0,0,0,-9,215292670


In [160]:
SERA_2cDAS = pd.merge(SERA_pheno_2cDAS,SERA_fam,how='inner',left_on='ID',right_on='ID')
SERA_2cDAS['2cDAS'].fillna(0,inplace=True)
SERA_2cDAS

Unnamed: 0,StudyNo,Location,dcID,Barcode original,Plate,ID,JFSNo,sjc28,CRP,2cDAS,0,1,2,3,4,5
0,625,"(1, 10)",02 1528740 0,NTBJ391302,74501.0,215287400,625,4,35.00,4.150111,1156_215287400,1156_215287400,0,0,0,1
1,517,"(1, 11)",02 1528741 0,NTBJ385994,74501.0,215287410,517,0,,0.000000,1967_215287410,1967_215287410,0,0,0,2
2,419,"(1, 12)",02 1528742 0,NTBJ386203,74501.0,215287420,419,0,8.00,1.318335,2014_215287420,2014_215287420,0,0,0,2
3,641,"(1, 5)",02 1528735 0,NTBJ386610,74501.0,215287350,641,0,4.00,0.965663,717_215287350,717_215287350,0,0,0,1
4,431,"(1, 6)",02 1528736 0,NTBJ385684,74501.0,215287360,431,2,,0.000000,764_215287360,764_215287360,0,0,0,1
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
462,1158,"(6, 4)",02 1529460 0,E0000002263,74514.0,215294600,1158,0,11.70,1.524961,984_215294600,984_215294600,0,0,0,2
463,228,"(6, 7)",02 1529864 0,E0000000131,74514.0,215298640,228,0,1.00,0.415888,1815_215298640,1815_215298640,0,0,0,2
464,954,"(6, 8)",02 1529865 0,E0000001949,74514.0,215298650,954,2,8.00,2.732548,1768_215298650,1768_215298650,0,0,0,1
465,286,"(6, 12)",02 1528752 0,E0000000704,74514.0,215287520,286,0,3.91,0.954764,1155_215287520,1155_215287520,0,0,0,2


In [162]:
SERA_2cDAS.loc[:,[0,1,2,3,4,'2cDAS']].to_csv("/exports/reum/CKe/Pipelinerun_withPC/TwoCompDAS/sera_meged_2cDAS.fam",sep='\t',index=False,header=False)

### SERA2-GLASGOW

In [166]:
SERA2_fam = pd.read_csv("/exports/reum/CKe/Pipelinerun_withPC/Glasgow/mergedChr/Glasgow_merged.fam",sep='\s',header=None)
SERA2_fam['ID'] = SERA2_fam[0].map(processFAM)
SERA2_fam

  return func(*args, **kwargs)


Unnamed: 0,0,1,2,3,4,5,ID
0,3_215289020,3_215289020,0,0,1,1,215289020
1,4_215285720,4_215285720,0,0,1,2,215285720
2,5_215287570,5_215287570,0,0,0,-9,215287570
3,6_215286070,6_215286070,0,0,2,2,215286070
4,10_215286430,10_215286430,0,0,1,2,215286430
...,...,...,...,...,...,...,...
339,568_215288500,568_215288500,0,0,2,1,215288500
340,569_215291730,569_215291730,0,0,2,1,215291730
341,572_215286600,572_215286600,0,0,2,1,215286600
342,574_215285670,574_215285670,0,0,2,2,215285670


In [167]:
SERA2_pheno = openfile("/exports/reum/knevel_lab/SERA/Data/Leiden Manifest 14 December 20.xlsx")
SERA2_pheno['ID'] = SERA2_pheno['dcID'].map(processdcID)
SERA2_pheno

Unnamed: 0,Box Number,StudyNo,dcID,Barcode original,Updated location,Scanned barcode,ID
0,Box 1 SERA Decode DNA,206,02 1528607 0,NTBI991424,A1,,215286070
1,Box 1 SERA Decode DNA,179,02 1528608 0,NUFY858106,A2,,215286080
2,Box 1 SERA Decode DNA,154,02 1528609 0,NUFY853350,A3,,215286090
3,Box 1 SERA Decode DNA,139,02 1528610 0,NUFY851945,A4,,215286100
4,Box 1 SERA Decode DNA,120,02 1528611 0,NUFY850894,A5,,215286110
...,...,...,...,...,...,...,...
338,74505,453,02 1529086 0,NTBI997002,"(7, 2)",,215290860
339,74505,403,02 1529087 0,NTBI981782,"(7, 3)",,215290870
340,74505,457,02 1529088 0,NTBI997491,"(7, 4)",,215290880
341,74505,327,02 1529089 0,NTBI989137,"(7, 5)",,215290890
