# Perform prediction

## Import libraries

In [1]:
import os

import logging
import sys

# Shared "Pipeline" logger: INFO and above is echoed to the notebook's stdout.
log = logging.getLogger("Pipeline")
log.setLevel(logging.INFO)

# Named `formatter` rather than `format` so the builtin format() is not shadowed
# for the rest of the notebook session.
formatter = logging.Formatter("%(asctime)s - %(name)s - %(levelname)s - %(message)s")

ch = logging.StreamHandler(sys.stdout)
ch.setFormatter(formatter)

# logging.getLogger returns the same object on every call, so re-running this
# cell would otherwise stack another stdout handler and print each record twice.
# Only plain stdout StreamHandlers are dropped; any other handler is kept.
for staleHandler in list(log.handlers):
    if type(staleHandler) is logging.StreamHandler and getattr(staleHandler, "stream", None) is sys.stdout:
        log.removeHandler(staleHandler)
log.addHandler(ch)

import warnings

# Blanket filter: every warning category is ignored from here on.
# NOTE(review): this also hides deprecation and numerical warnings raised by the pipeline.
warnings.simplefilter('ignore', Warning)

# Put the notebook's parent directory on the import path
# (presumably where the project module imported below lives).
module_path = os.path.abspath('../')
if not (module_path in sys.path):
    sys.path.append(module_path)

import predict_mortality as pm

## Define data directory

A top-level directory that stores all the data for this experiment.

In [2]:
import os

# Root directory of the experiment data. The original location remains the default,
# but it can be overridden through the MORTALITY_DATA_DIR environment variable so the
# notebook is runnable on another machine without editing this cell.
# os.path.join(..., '') guarantees the trailing separator that the later
# `dataDirName + '<file>'` concatenations rely on.
dataDirName = os.path.join(
    os.environ.get(
        'MORTALITY_DATA_DIR',
        '/home/yram0006/phd/chapter_2/workspace/mortality_data/imbalance_experiment/',
    ),
    '',
)

## Read data matrix

In [3]:
import pandas as pd

# Lift the column display limit so the wide feature matrix is rendered in full.
pd.set_option('display.max_columns', None)

# Load the standardised data matrix from the experiment directory.
standardisedMatrixPath = dataDirName + 'data_matrix/data_matrix_standardised.csv'
dataMatrix = pd.read_csv(standardisedMatrixPath)
dataMatrix

Unnamed: 0,person_id,age,gender,ethnicity_WHITE,ethnicity_BLACK,ethnicity_UNKNOWN,ethnicity_OTHER,ethnicity_HISPANIC,ethnicity_ASIAN,ethnicity_UNABLE_TO_OBTAIN,ethnicity_AMERICAN_INDIAN,anchor_time,death_datetime,heartrate_min,sysbp_min,diabp_min,meanbp_min,resprate_min,tempc_min,spo2_min,gcseye_min,gcsverbal_min,gcsmotor_min,heartrate_max,sysbp_max,diabp_max,meanbp_max,resprate_max,tempc_max,spo2_max,gcseye_max,gcsverbal_max,gcsmotor_max,heartrate_avg,sysbp_avg,diabp_avg,meanbp_avg,resprate_avg,tempc_avg,spo2_avg,gcseye_avg,gcsverbal_avg,gcsmotor_avg,heartrate_stddev,sysbp_stddev,diabp_stddev,meanbp_stddev,resprate_stddev,tempc_stddev,spo2_stddev,gcseye_stddev,gcsverbal_stddev,gcsmotor_stddev,heartrate_first,sysbp_first,diabp_first,meanbp_first,resprate_first,tempc_first,spo2_first,gcseye_first,gcsverbal_first,gcsmotor_first,heartrate_last,sysbp_last,diabp_last,meanbp_last,resprate_last,tempc_last,spo2_last,gcseye_last,gcsverbal_last,gcsmotor_last,chloride_serum_min,creatinine_min,sodium_serum_min,hemoglobin_min,platelet_count_min,urea_nitrogen_min,glucose_serum_min,bicarbonate_min,potassium_serum_min,anion_gap_min,leukocytes_blood_manual_min,hematocrit_min,chloride_serum_max,creatinine_max,sodium_serum_max,hemoglobin_max,platelet_count_max,urea_nitrogen_max,glucose_serum_max,bicarbonate_max,potassium_serum_max,anion_gap_max,leukocytes_blood_manual_max,hematocrit_max,chloride_serum_avg,creatinine_avg,sodium_serum_avg,hemoglobin_avg,platelet_count_avg,urea_nitrogen_avg,glucose_serum_avg,bicarbonate_avg,potassium_serum_avg,anion_gap_avg,leukocytes_blood_manual_avg,hematocrit_avg,chloride_serum_stddev,creatinine_stddev,sodium_serum_stddev,hemoglobin_stddev,glucose_serum_stddev,bicarbonate_stddev,potassium_serum_stddev,chloride_serum_first,creatinine_first,sodium_serum_first,hemoglobin_first,platelet_count_first,urea_nitrogen_first,glucose_serum_first,bicarbonate_first,potassium_serum_first,anion_gap_first,leukocytes_blood_manual_first,hematocrit_first,chloride_serum_l
ast,creatinine_last,sodium_serum_last,hemoglobin_last,platelet_count_last,urea_nitrogen_last,glucose_serum_last,bicarbonate_last,potassium_serum_last,anion_gap_last,leukocytes_blood_manual_last,hematocrit_last
0,-2144679073,82.0,0,0,0,0,1,0,0,0,0,2190-01-30 19:22:00,2194-04-23 19:27:00,-0.272794,1.217771,0.923258,0.861968,0.878048,0.189353,0.317249,0.412549,1.239978,0.878154,-0.030099,-0.001925,0.069606,0.021527,-0.309282,-0.058429,-0.021341,0.370578,0.669108,0.341538,-0.671766,0.838925,0.734657,0.755136,0.000510,-0.003616,-0.100585,0.595497,1.041441,0.658405,-0.047481,-0.000154,0.026722,-0.025099,-0.700168,-0.113932,-0.042762,-0.054623,-0.696918,-0.769890,-1.241070,-0.100946,-0.093761,-0.277365,-0.176019,-0.090217,-0.015482,0.729111,0.910102,0.608975,-0.521863,1.715295,0.616779,0.846636,-0.029003,-0.048489,0.009782,0.659401,0.896608,0.536315,1.093242,-0.663478,0.163419,0.285937,0.076969,-0.734973,-0.012647,0.669296,-0.124032,-0.915664,-0.348052,0.099873,0.214809,-0.011713,-0.309154,-0.534404,0.297850,-0.994593,-0.024332,-0.000648,-1.025656,-0.767333,-0.018388,-0.395681,-0.007656,-0.014171,-0.015245,-0.012701,0.347919,-0.948893,-0.020354,0.019154,-0.013272,-1.114836,-0.162093,-0.233373,-0.012429,-0.011540,-0.590509,-0.011974,-0.030961,-0.601701,-1.056430,0.743687,-0.694348,-0.191987,-0.406075,0.116251,-0.789275,-0.022292,0.207578,-0.788282,-1.346000,-0.054095,-0.572535,0.656699,-0.695650,-0.087780,0.157334,-0.178773,-0.863655,-0.015096,0.214490,-0.408989,-0.979015,-0.516496,0.100735
1,-2142084288,84.0,1,1,0,0,0,0,0,0,0,2161-07-10 08:07:00,,-0.073643,-0.427373,0.222451,-1.935422,1.165394,0.217516,-0.256040,1.199315,1.239978,0.878154,-0.004134,-0.014919,-0.026310,-0.053989,-0.057963,-0.040074,-0.021341,0.370578,0.669108,0.341538,-0.134094,-0.066312,0.750897,0.395390,0.617088,0.086249,-0.167731,0.860623,1.041441,0.658405,-0.001199,0.007246,0.014587,0.037638,-0.347862,-0.101546,-0.018473,-1.069636,-0.696918,-0.769890,-0.299599,0.244989,0.060789,0.378146,0.701921,0.305525,-0.056425,0.729111,0.910102,0.608975,-0.313804,0.682207,1.280328,1.020767,1.692185,-0.021452,0.236984,0.659401,0.896608,0.536315,0.793315,-0.435926,0.507737,0.487113,-0.000699,-0.477509,-0.012129,0.066001,-0.301095,-0.563366,-0.060979,0.502304,0.510556,-0.011635,0.431631,0.320511,0.179330,-0.090891,-0.021989,-0.009273,0.292875,-0.091176,-0.000665,0.390295,-0.009259,-0.013774,0.012011,-0.012045,-0.067964,-0.387671,-0.018131,-0.019468,-0.011258,-0.206481,-0.083122,0.450207,-0.012014,-0.011498,-0.343805,-0.011836,-0.029291,-0.226259,0.125189,0.474016,-0.173894,0.614182,0.464202,-0.020737,-0.276849,-0.022242,0.012654,-0.025925,0.043446,-0.216607,0.465424,0.183603,-0.508245,0.112531,0.430555,0.701722,-0.447977,-0.013025,-0.196256,-0.900551,0.024266,0.217026,0.473387
2,-2133944014,50.0,1,1,0,0,0,0,0,0,0,2141-03-25 16:45:00,,-0.173219,0.630220,0.572854,0.478013,-0.989699,0.147108,-0.419837,-0.374217,-0.932920,0.421726,-0.020620,-0.006257,-0.012100,-0.044139,-0.215037,-0.080454,-0.030567,0.370578,0.669108,0.341538,-0.322070,0.427622,0.130176,0.083759,-0.701402,-0.062385,-0.402458,0.571394,0.394775,0.594702,-0.024181,-0.001278,-0.048238,-0.064594,-0.313192,-0.119714,-0.001438,0.388982,1.970708,-0.371864,-0.770334,0.201747,-0.117538,-0.327789,-0.803119,0.165851,-0.008658,-0.907586,-1.251107,0.069738,-0.230580,0.086196,-0.227737,-0.198151,-0.315867,-0.055249,-0.217421,0.659401,0.896608,0.536315,-2.655837,-0.663478,-1.213852,1.694168,0.872452,-0.476000,-0.007468,2.680281,-1.717605,-0.397756,1.230034,1.542830,-2.151170,-0.011679,-0.494351,1.507893,0.455851,-0.444643,-0.017503,0.094229,-0.366390,-0.828988,0.024072,0.916153,-0.031538,-0.014085,-0.072093,-0.010550,0.218245,-0.646831,-0.012610,0.170743,-0.014433,-0.872370,-0.000619,1.647657,-0.011455,-0.011504,0.964784,-0.011819,-0.027636,-0.299876,0.896400,-2.627203,-0.463035,-1.481858,1.160423,0.739696,-0.305407,-0.020149,2.156819,-1.768456,-0.126777,0.737925,1.165595,-2.339573,-0.695650,-1.690266,1.523437,0.575731,-0.612072,-0.001803,2.062846,-0.408989,-0.658492,0.160877,1.557531
3,-2133227983,52.0,0,1,0,0,0,0,0,0,0,2120-09-22 10:15:00,2121-08-28 15:15:00,0.025933,-1.073680,0.485253,-1.441765,0.447029,0.133026,0.235350,0.412549,-0.389695,0.421726,-0.017735,-0.020334,-0.008548,-0.040856,0.161941,-0.003364,-0.021341,0.370578,0.669108,0.341538,-0.203561,-0.427533,0.646238,0.240893,-0.310939,-0.113208,-0.015195,0.754573,-0.007318,0.281090,-0.021139,-0.007731,0.012835,0.008907,-0.018688,-0.066404,-0.042251,-0.338743,0.659022,-0.068008,0.312356,0.763893,0.476888,1.941287,0.952761,0.212409,-0.008658,0.729111,0.369800,0.069738,-0.188968,0.046461,-0.348382,-0.024020,-0.029003,-0.041730,0.577788,0.659401,-0.730035,0.536315,-0.256426,-0.891030,0.163419,-0.166709,0.670751,-0.731453,-0.011784,1.272592,-2.071733,-0.638644,0.063069,-0.119478,-0.228812,-0.011739,0.061238,-0.011956,1.143237,-0.712930,-0.023036,0.033853,0.622508,-0.514545,-0.017100,-0.103317,-0.014468,-0.014352,0.003250,-0.012580,0.950606,-0.886384,-0.018743,0.068637,-0.013154,-0.659500,-0.175868,0.104515,-0.011562,-0.011538,-0.013936,-0.011738,-0.030063,-0.282218,2.463369,-0.469833,-0.867833,-0.191987,0.159605,0.750668,-0.891840,-0.022641,0.792351,-0.897190,-0.373601,0.148029,0.173951,0.183603,-0.883055,0.513153,-0.498395,0.946249,-0.749180,-0.011385,1.446727,-0.900551,-1.200746,-0.014856,-0.475707
4,-2132499549,68.0,0,1,0,0,0,0,0,0,0,2205-11-16 13:07:00,,0.274872,-0.662394,-0.127953,0.148908,0.878048,0.161190,0.153452,0.412549,1.239978,0.878154,-0.007843,-0.019251,-0.072492,-0.099956,-0.183622,-0.098809,-0.021341,0.370578,0.669108,0.341538,-0.038396,-0.330845,0.125592,-0.222650,-0.361032,-0.180333,0.001048,0.507121,1.041441,0.658405,-0.010829,-0.007087,-0.032613,-0.041233,-0.560680,-0.134095,-0.023838,0.051502,-0.696918,-0.769890,-0.017158,-0.187430,0.048901,0.075602,0.325661,-0.113496,-0.008658,0.729111,0.910102,0.608975,0.726492,0.006727,-0.107092,-0.067553,1.118455,-0.001174,0.123383,-0.255992,0.896608,0.536315,1.393168,0.322582,0.163419,-0.217003,0.273945,0.984810,-0.013252,-0.939492,-0.124032,0.062941,-0.121743,-0.197396,0.362682,-0.011601,-0.494351,0.035539,0.156544,0.329004,-0.025130,-0.086899,-0.696023,1.220035,0.012420,0.164904,-0.006054,-0.013275,-0.023033,-0.012630,0.006333,0.343322,-0.021086,-0.108780,-0.012621,0.272497,0.315003,-0.175926,-0.012592,-0.011538,-0.698913,-0.011672,-0.031460,-1.112750,-0.219378,1.013358,0.057419,0.130480,0.203119,-0.207427,0.379972,-0.023489,-1.351814,-0.243741,0.017912,-0.110297,0.278954,0.814397,0.116439,-0.488402,-0.553039,0.463571,0.272386,-0.015010,-1.428493,-0.736697,0.140620,0.490582,-0.508395
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2966,2142664100,65.0,1,1,0,0,0,0,0,0,0,2180-08-11 04:23:00,,0.922114,0.042668,0.923258,0.478013,0.590702,0.147108,-0.911228,1.199315,0.696753,0.878154,0.005757,0.012152,0.066053,0.005111,0.193356,-0.021719,-0.021341,0.370578,0.669108,0.341538,0.787906,0.176275,1.271708,0.677604,1.480574,-0.004342,-0.016273,0.860623,0.995843,0.658405,0.008134,0.010750,0.050465,0.005370,-0.074307,-0.069785,0.021901,-1.069636,-0.299347,-0.769890,1.159680,0.028780,0.144009,0.428570,1.454441,0.212409,0.004989,0.729111,0.910102,0.608975,0.518433,1.198751,1.400973,1.020767,0.257862,-0.075527,-0.103820,0.659401,0.896608,0.536315,-0.406390,-0.435926,-0.525217,-0.367884,-0.880643,-0.593669,-0.010576,0.468198,-0.478159,-0.512178,-0.135230,-0.414490,-0.672433,-0.011670,-0.494351,-0.296928,-0.630374,-0.760493,-0.020095,0.016602,-0.696023,-0.391233,-0.000369,-0.288525,-0.016472,-0.013880,-0.040554,-0.013052,-0.742526,-0.717218,-0.016265,0.019958,-0.012700,-0.209341,-0.086127,-0.386152,-0.011885,-0.011525,0.060371,-0.011835,-0.027643,0.316081,-0.427042,0.069509,-0.405207,0.130480,-0.101478,-0.497942,-0.758304,-0.019750,0.207578,-0.570466,-0.026771,-0.490395,-0.095195,-1.077985,-0.383308,-1.289645,-0.389107,-1.005746,-0.521972,-0.006292,0.214490,0.082574,0.061587,0.718153,-0.414065
2967,2144053271,71.0,0,1,0,0,0,0,0,0,0,2139-06-14 18:06:00,,-0.770673,-0.309863,-1.266765,0.203759,-0.989699,-0.289426,0.153452,-1.160983,-0.932920,-1.403987,-0.006195,-0.017626,-0.097359,-0.086823,-0.152207,-0.095138,-0.021341,-2.337273,-1.693958,0.341538,-0.392198,-0.085976,-0.199819,-0.157516,-0.607566,-0.704260,0.203160,-2.261975,-1.329666,-0.781980,0.027312,0.004955,-0.021687,-0.074604,0.230779,-0.051405,-0.022380,-0.524861,-0.696918,2.324226,0.171136,0.677409,-0.117538,-1.033723,0.701921,0.119293,-0.042777,-1.725934,-1.251107,-2.087210,-0.272192,-0.907158,-0.408705,0.672505,-0.029003,-0.048489,0.577788,-2.086777,-1.272249,0.536315,-0.406390,0.246731,-0.525217,0.436819,-0.264909,0.821883,-0.015064,-0.738393,-0.478159,0.526649,0.214830,0.322694,-0.672433,-0.011316,-0.679547,-0.154442,0.201483,0.676810,-0.023983,0.033853,-0.586146,-0.074734,-0.011540,-0.188810,-0.017731,-0.012278,-0.053070,-0.012299,0.139068,0.787500,-0.020678,-0.006364,-0.012291,0.406005,0.082395,0.265825,-0.011921,-0.011205,-0.108793,-0.011934,-0.029347,3.064577,-0.380575,0.069509,1.618781,-0.836923,-0.188505,0.068022,1.442229,-0.022292,-0.572118,-0.134833,-0.099116,0.159315,-0.189184,-1.077985,0.053970,-0.488402,0.594487,-0.032757,0.391649,-0.013456,1.446727,-0.081281,-0.438956,-0.033435,0.564168
2968,2144497079,65.0,1,1,0,0,0,0,0,0,0,2150-04-26 14:47:00,,-1.019612,0.512710,-0.565958,0.094057,0.590702,0.076699,-0.256040,0.412549,1.239978,0.878154,-0.024741,-0.018709,0.009214,0.514026,-0.057963,-0.091467,-0.021341,0.370578,0.669108,0.341538,-0.518790,0.179749,-0.911257,0.063392,-0.454063,-0.207270,0.026637,0.779046,1.041441,0.658405,-0.022060,-0.031759,-0.065296,0.342646,-0.375325,-0.118352,-0.037418,-0.441552,-0.696918,-0.769890,-2.229614,0.201747,-0.272089,-0.781604,-0.552279,-0.113496,-0.042777,0.729111,0.910102,0.608975,-0.022521,-0.390614,-1.011931,-0.546413,-0.459299,0.012345,0.009782,0.659401,0.896608,0.536315,-1.606095,1.232790,-1.730329,0.587701,-0.683765,0.512624,-0.011180,-1.341689,-0.301095,1.896696,-0.401998,0.279656,-1.855423,-0.011238,-1.420333,1.127931,-0.764876,2.620960,-0.017553,-0.000648,1.611406,1.663956,-0.045848,1.050925,-0.026598,-0.011229,-0.112234,-0.011756,-0.688077,2.200226,-0.012913,-0.050189,-0.010504,1.899387,-0.263500,0.504531,-0.012078,-0.011282,0.503888,-0.011802,-0.026767,1.913836,1.704332,-1.683354,1.792265,-1.643092,1.203937,-0.637141,2.378993,-0.018703,-0.961966,2.043330,2.101017,-0.185685,1.126822,-1.866477,0.866059,-1.289645,0.867708,-0.538783,0.261505,-0.005688,0.009117,0.737990,1.598340,-0.298061,0.631974
2969,2144648302,91.0,0,1,0,0,0,0,0,0,0,2143-12-22 17:48:00,2143-12-24 05:35:00,-3.459217,-3.247620,-1.704770,-1.935422,-0.989699,-0.021873,-0.911228,0.412549,-0.932920,0.421726,-0.005371,-0.031704,-0.086702,-0.122939,-0.120793,-0.128177,-0.021341,0.370578,0.078342,0.341538,0.678164,-1.085512,-0.395568,-0.793937,-0.022948,-0.587398,-1.195107,0.012219,-0.539297,0.097823,0.065100,0.016414,0.021569,0.079971,0.223881,-0.115571,0.078197,-0.095112,1.301948,-0.164944,0.830165,-0.100946,0.108344,0.680689,-1.053958,-0.439401,-0.138311,0.729111,0.369800,0.608975,-3.559525,-3.529610,-2.459673,-2.723052,-2.897648,-0.109323,-0.899028,-0.255992,-0.730035,-0.060988,0.493389,1.612044,0.679896,2.096520,-0.831423,2.574353,-0.011180,-0.336196,2.886052,1.896696,1.065230,2.344742,0.066935,-0.011420,-0.309154,1.080435,-1.184207,1.840625,-0.023933,-0.052399,1.171896,0.636361,0.007900,1.332044,-0.010381,-0.012015,0.000330,-0.010586,-1.028378,2.287762,-0.019127,-0.060986,-0.006756,1.328147,0.299922,2.027906,-0.011878,-0.011485,-1.443223,-0.011992,-0.031491,-0.790454,-0.482464,0.204345,1.271811,0.291714,1.160423,-1.128429,2.177884,-0.021893,-0.377194,1.607697,1.037123,0.299594,1.307862,0.499000,1.178401,0.112531,1.960590,-0.897985,2.046090,-0.013629,-1.017747,2.048824,0.939732,0.841330,2.294428


## Perform predictions

### Calculate target variable

In [4]:
# Parse both timestamp columns in one vectorised call each instead of a per-row
# `apply`; missing death dates become NaT.
timestampFormat = '%Y-%m-%d %H:%M:%S'
for timeColumn in ['anchor_time', 'death_datetime']:
    dataMatrix[timeColumn] = pd.to_datetime(dataMatrix[timeColumn], format=timestampFormat)

# Target is True when a death timestamp exists and falls before anchor_time + 7 days.
# A comparison against NaT evaluates to False, so patients without a recorded death
# land in the negative class. The result is assigned directly: the previous
# `dataMatrix.target.fillna(..., inplace=True)` was a chained in-place call on a
# temporary Series, which does not update the frame under pandas copy-on-write.
dataMatrix['target'] = (
    dataMatrix['death_datetime'] < (dataMatrix['anchor_time'] + pd.Timedelta(days=7))
).fillna(False).astype(bool)

### Check class counts

In [5]:
# Number of rows per target class (True / False).
dataMatrix['target'].value_counts()

target
False    2524
True      447
Name: count, dtype: int64

### Separate positive and negative classes

In [6]:
# Split the matrix by target class: rows flagged True go to the positive frame,
# rows flagged False go to the negative frame.
dataMatrixPositive = dataMatrix.loc[dataMatrix['target'].eq(True)]
dataMatrixNegative = dataMatrix.loc[dataMatrix['target'].eq(False)]

### Simulate different data imbalances and predict

In [7]:
totalSamples = 1200
# Fixed seed: without it every run draws different subsets and the results
# cannot be reproduced.
randomSeed = 42

for proportion in [65, 70, 75, 80, 85, 90, 95]:
    # `proportion` is the percentage of negative-class rows in the simulated set.
    # Integer arithmetic plus a complement guarantees the two class sizes always
    # add up to exactly `totalSamples` (independent truncation could drop a row).
    negativeSize = totalSamples * proportion // 100
    positiveSize = totalSamples - negativeSize

    # Draw each class without replacement, then shuffle the combined rows.
    sampledDataMatrix = (
        pd.concat([
            dataMatrixPositive.sample(n=positiveSize, random_state=randomSeed),
            dataMatrixNegative.sample(n=negativeSize, random_state=randomSeed),
        ])
        .sample(frac=1, random_state=randomSeed)
        .reset_index(drop=True)
    )

    # The file is overwritten on every iteration.
    # NOTE(review): presumably this is the file the pipeline reads from `dirPath` - confirm.
    sampledDataMatrix.to_csv(dataDirName + 'data_matrix.csv', index=False)

    pm.runPredictionsForAllTargets(
        label=str(proportion) + '_' + str(100 - proportion) + '_samples',
        dirPath = dataDirName,
        vitalsBefore = 0,
        vitalsAfter = 72,
        labsBefore = 0,
        labsAfter = 72,
        targetList = [7],
    )


2023-09-22 21:37:51,776 - Pipeline - INFO - dirName: 65_35_samples_icd_vb_0_va_72_lb_0_la_72
2023-09-22 21:37:51,777 - Pipeline - INFO - Running Predictions for vb_0_va_72_lb_0_la_72, targetStart : 0, targetEnd : 7
2023-09-22 21:37:51,778 - Pipeline - INFO - Reading data
2023-09-22 21:37:51,994 - Pipeline - INFO - Formatting data
2023-09-22 21:37:52,000 - Pipeline - INFO - Performing SFS
2023-09-22 21:39:21,566 - Pipeline - INFO - Building XGBoost model with all the features
2023-09-22 21:39:21,568 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 21:39:21,592 - Pipeline - INFO - Building the model
2023-09-22 21:39:21,593 - Pipeline - INFO - Hyperparameter optimisation for: {'max_depth': range(1, 10), 'scale_pos_weight': [0.1, 0.15, 0.2, 0.25, 0.3, 0.35, 0.4]}
2023-09-22 21:40:21,996 - Pipeline - INFO - Hyperparameter optimisation for: {'n_estimators': range(50, 250, 10)}
2023-09-22 21:40:48,713 - Pipeline - INFO - Hyperparameter optimisation for: {'min_child_weight

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 
R[write to console]: 

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, character.only = FALSE,  :
R[write to console]: 
 
R[write to console]:  libraries ‘/usr/local/lib/R/site-library’, ‘/usr/lib/R/site-library’ contain no packages

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, characte

2023-09-22 22:11:34,658 - Pipeline - INFO - Building Ensemble LR model with all the features
2023-09-22 22:11:34,659 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 22:11:35,294 - Pipeline - INFO - Building the model
2023-09-22 22:11:35,296 - Pipeline - INFO - Performing cross-validation
2023-09-22 22:11:36,134 - Pipeline - INFO - Saving the CV results for all the models
2023-09-22 22:11:36,137 - Pipeline - INFO - Completed !!!
2023-09-22 22:11:36,349 - Pipeline - INFO - dirName: 80_20_samples_icd_vb_0_va_72_lb_0_la_72
2023-09-22 22:11:36,350 - Pipeline - INFO - Running Predictions for vb_0_va_72_lb_0_la_72, targetStart : 0, targetEnd : 7
2023-09-22 22:11:36,351 - Pipeline - INFO - Reading data
2023-09-22 22:11:36,615 - Pipeline - INFO - Formatting data
2023-09-22 22:11:36,623 - Pipeline - INFO - Performing SFS
2023-09-22 22:13:11,328 - Pipeline - INFO - Building XGBoost model with all the features
2023-09-22 22:13:11,329 - Pipeline - INFO - Performing Hyperparame

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 
R[write to console]: 

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, character.only = FALSE,  :
R[write to console]: 
 
R[write to console]:  libraries ‘/usr/local/lib/R/site-library’, ‘/usr/lib/R/site-library’ contain no packages

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, characte

2023-09-22 22:17:45,141 - Pipeline - INFO - Building LR model with all the features
2023-09-22 22:17:45,142 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 22:17:48,256 - Pipeline - INFO - Building the model
2023-09-22 22:17:48,258 - Pipeline - INFO - Performing cross-validation
2023-09-22 22:17:49,379 - Pipeline - INFO - Building LR model with the selected features
2023-09-22 22:17:49,381 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 22:17:50,155 - Pipeline - INFO - Building the model
2023-09-22 22:17:50,156 - Pipeline - INFO - Performing cross-validation
2023-09-22 22:17:51,209 - Pipeline - INFO - Building LGBM model with all the features
2023-09-22 22:17:51,211 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 22:18:10,096 - Pipeline - INFO - Building the model
2023-09-22 22:18:10,101 - Pipeline - INFO - Performing cross-validation
2023-09-22 22:18:13,198 - Pipeline - INFO - Building LGBM model with the selected featu

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 
R[write to console]: 

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, character.only = FALSE,  :
R[write to console]: 
 
R[write to console]:  libraries ‘/usr/local/lib/R/site-library’, ‘/usr/lib/R/site-library’ contain no packages

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, characte

2023-09-22 22:22:27,480 - Pipeline - INFO - Building Ensemble LR model with all the features
2023-09-22 22:22:27,481 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 22:22:28,066 - Pipeline - INFO - Building the model
2023-09-22 22:22:28,068 - Pipeline - INFO - Performing cross-validation
2023-09-22 22:22:28,919 - Pipeline - INFO - Saving the CV results for all the models
2023-09-22 22:22:28,921 - Pipeline - INFO - Completed !!!
2023-09-22 22:22:29,112 - Pipeline - INFO - dirName: 85_15_samples_icd_vb_0_va_72_lb_0_la_72
2023-09-22 22:22:29,114 - Pipeline - INFO - Running Predictions for vb_0_va_72_lb_0_la_72, targetStart : 0, targetEnd : 7
2023-09-22 22:22:29,114 - Pipeline - INFO - Reading data
2023-09-22 22:22:29,357 - Pipeline - INFO - Formatting data
2023-09-22 22:22:29,365 - Pipeline - INFO - Performing SFS
2023-09-22 22:24:08,423 - Pipeline - INFO - Building XGBoost model with all the features
2023-09-22 22:24:08,424 - Pipeline - INFO - Performing Hyperparame

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 
R[write to console]: 

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, character.only = FALSE,  :
R[write to console]: 
 
R[write to console]:  libraries ‘/usr/local/lib/R/site-library’, ‘/usr/lib/R/site-library’ contain no packages

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, characte

2023-09-22 23:00:57,209 - Pipeline - INFO - Building LR model with all the features
2023-09-22 23:00:57,210 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 23:01:00,483 - Pipeline - INFO - Building the model
2023-09-22 23:01:00,485 - Pipeline - INFO - Performing cross-validation
2023-09-22 23:01:01,477 - Pipeline - INFO - Building LR model with the selected features
2023-09-22 23:01:01,478 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 23:01:02,078 - Pipeline - INFO - Building the model
2023-09-22 23:01:02,079 - Pipeline - INFO - Performing cross-validation
2023-09-22 23:01:02,985 - Pipeline - INFO - Building LGBM model with all the features
2023-09-22 23:01:02,987 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 23:01:21,099 - Pipeline - INFO - Building the model
2023-09-22 23:01:21,101 - Pipeline - INFO - Performing cross-validation
2023-09-22 23:01:24,217 - Pipeline - INFO - Building LGBM model with the selected featu

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 
R[write to console]: 

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, character.only = FALSE,  :
R[write to console]: 
 
R[write to console]:  libraries ‘/usr/local/lib/R/site-library’, ‘/usr/lib/R/site-library’ contain no packages

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, characte

2023-09-22 23:05:50,519 - Pipeline - INFO - Building Ensemble LR model with all the features
2023-09-22 23:05:50,519 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 23:05:51,069 - Pipeline - INFO - Building the model
2023-09-22 23:05:51,071 - Pipeline - INFO - Performing cross-validation
2023-09-22 23:05:51,943 - Pipeline - INFO - Saving the CV results for all the models
2023-09-22 23:05:51,947 - Pipeline - INFO - Completed !!!
2023-09-22 23:05:52,150 - Pipeline - INFO - dirName: 95_5_samples_icd_vb_0_va_72_lb_0_la_72
2023-09-22 23:05:52,151 - Pipeline - INFO - Running Predictions for vb_0_va_72_lb_0_la_72, targetStart : 0, targetEnd : 7
2023-09-22 23:05:52,151 - Pipeline - INFO - Reading data
2023-09-22 23:05:52,411 - Pipeline - INFO - Formatting data
2023-09-22 23:05:52,419 - Pipeline - INFO - Performing SFS
2023-09-22 23:07:17,134 - Pipeline - INFO - Building XGBoost model with all the features
2023-09-22 23:07:17,136 - Pipeline - INFO - Performing Hyperparamet

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: 1: 
R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, character.only = FALSE,  :
R[write to console]: 
 
R[write to console]:  libraries ‘/usr/local/lib/R/site-library’, ‘/usr/lib/R/site-library’ contain no packages

R[write to console]: 2: 
R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, character.only = FALSE,  :
R[write to console]: 
 
R[write to console]:  libraries ‘/usr/local/lib/R/site-library’, ‘/usr/lib/R/site-library’ contain no packages

R[write to console]: 3: 
R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, character.only = FALSE,  :
R[write to console]: 
 
R[write to console]:  libraries ‘/usr/local/lib/R/site-library’, ‘/usr/lib/R/site-library’ contain no pa

2023-09-22 23:09:35,547 - Pipeline - INFO - Building XGBoost model with the selected features
2023-09-22 23:09:35,548 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 23:09:35,548 - Pipeline - INFO - Building the model
2023-09-22 23:09:35,549 - Pipeline - INFO - Hyperparameter optimisation for: {'max_depth': range(1, 10), 'scale_pos_weight': [0.1, 0.15, 0.2, 0.25, 0.3, 0.35, 0.4]}
2023-09-22 23:09:59,737 - Pipeline - INFO - Hyperparameter optimisation for: {'n_estimators': range(50, 250, 10)}
2023-09-22 23:10:11,704 - Pipeline - INFO - Hyperparameter optimisation for: {'min_child_weight': range(1, 10)}
2023-09-22 23:10:15,206 - Pipeline - INFO - Hyperparameter optimisation for: {'gamma': [0.0, 0.1, 0.2, 0.3, 0.4]}
2023-09-22 23:10:17,937 - Pipeline - INFO - Hyperparameter optimisation for: {'subsample': [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9], 'colsample_bytree': [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9]}
2023-09-22 23:10:51,444 - Pipeline - INFO - Hyperp

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 
R[write to console]: 

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, character.only = FALSE,  :
R[write to console]: 
 
R[write to console]:  libraries ‘/usr/local/lib/R/site-library’, ‘/usr/lib/R/site-library’ contain no packages

R[write to console]: Error in ROCR::prediction(predictor, response) : 
  Number of classes is not equal to 2.
ROCR currently supports only evaluation of binary classification tasks.

R[write to console]: In addition: 

R[write to console]: In (function (package, help, pos = 2, lib.loc = NULL, characte

2023-09-22 23:14:54,307 - Pipeline - INFO - Building Ensemble LR model with all the features
2023-09-22 23:14:54,308 - Pipeline - INFO - Performing Hyperparameter optimisation
2023-09-22 23:14:54,866 - Pipeline - INFO - Building the model
2023-09-22 23:14:54,867 - Pipeline - INFO - Performing cross-validation
2023-09-22 23:14:55,801 - Pipeline - INFO - Saving the CV results for all the models
2023-09-22 23:14:55,803 - Pipeline - INFO - Completed !!!


## Remove the data matrix file from the working directory

In [8]:
import os

# Delete the temporary sampled matrix written by the simulation loop.
# os.remove is used instead of building an `rm` shell command: no shell is spawned,
# so spaces or shell metacharacters in the path cannot change what is executed.
sampledMatrixPath = dataDirName + 'data_matrix.csv'
try:
    os.remove(sampledMatrixPath)
except FileNotFoundError:
    # Nothing to clean up (e.g. the cell was re-run); keep the cleanup best-effort.
    pass

0