# Based
- https://www.kaggle.com/code/honganzhu/cmi-piu-competition?scriptVersionId=201912528 Version44 LB0.492

 If you find this notebook useful, please upvote this and the based one.

In [56]:
import numpy as np
import pandas as pd
import os
import re
from sklearn.base import clone
from sklearn.metrics import cohen_kappa_score
from sklearn.model_selection import StratifiedKFold
from scipy.optimize import minimize
from concurrent.futures import ThreadPoolExecutor
from tqdm import tqdm
import polars as pl
import polars.selectors as cs
import matplotlib.pyplot as plt
from matplotlib.ticker import MaxNLocator, FormatStrFormatter, PercentFormatter
import seaborn as sns

from sklearn.preprocessing import StandardScaler
import matplotlib.pyplot as plt
import torch
import torch.nn as nn
import torch.optim as optim

from colorama import Fore, Style
from IPython.display import clear_output
import warnings
from lightgbm import LGBMRegressor
from xgboost import XGBRegressor
from catboost import CatBoostRegressor
from sklearn.ensemble import VotingRegressor, RandomForestRegressor, GradientBoostingRegressor
from sklearn.impute import SimpleImputer, KNNImputer
from sklearn.pipeline import Pipeline
from pytorch_tabnet.tab_model import TabNetRegressor
warnings.filterwarnings('ignore')
pd.options.display.max_columns = None
pd.set_option('display.max_rows', 500)
pd.set_option('display.max_columns', 500)
pd.set_option('display.max_colwidth', None)

pl.Config.set_tbl_rows(-1)
pl.Config.set_tbl_cols(-1)
pl.Config.set_fmt_str_lengths(10000)

polars.config.Config

In [2]:
SEED = 42
n_splits = 5

# Feature Engineering

- **Feature Selection**: The dataset contains features related to physical characteristics (e.g., BMI, Height, Weight), behavioral aspects (e.g., internet usage), and fitness data (e.g., endurance time). 
- **Categorical Feature Encoding**: Categorical features are mapped to numerical values using custom mappings for each unique category within the dataset. This ensures compatibility with machine learning algorithms that require numerical input.
- **Time Series Aggregation**: Time series statistics (e.g., mean, standard deviation) from the actigraphy data are computed and merged into the main dataset to create additional features for model training.


In [3]:
def process_file(id_folder, dirname):
    files = os.listdir(os.path.join(path, dirname, id_folder))
    if len(files) > 1:
        df_list = []
        for file in files:
            df = pd.read_parquet(os.path.join(dirname, id_folder, file))
            df_list.append(df)
        df = pd.concat(df_list, ignore_index=True)
    else:
        df = pd.read_parquet(os.path.join(dirname, id_folder, files[0]))
    
    df.drop('step', axis=1, inplace=True)

    describe_df = df.describe(percentiles=[0.01] + [i*0.5/10 + 0.05 for i in range(19)])
    count_mean = describe_df.loc['count', :].mean()
    describe_df.drop('count', axis=0, inplace=True)
    
    return np.append(describe_df.values.reshape(-1), count_mean), id_folder.split('=')[1]

def load_time_series(dirname) -> pd.DataFrame:
    ids = os.listdir(dirname)
    
    with ThreadPoolExecutor() as executor:
        results = list(tqdm(executor.map(lambda fname: process_file(fname, dirname), ids), total=len(ids)))
    
    stats, indexes = zip(*results)
    
    df = pd.DataFrame(stats, columns=[f"stat_{i}" for i in range(len(stats[0]))])
    df['id'] = indexes
    return df


class AutoEncoder(nn.Module):
    def __init__(self, input_dim, encoding_dim):
        super(AutoEncoder, self).__init__()
        self.encoder = nn.Sequential(
            nn.Linear(input_dim, encoding_dim*4),
            nn.ReLU(),
            nn.Linear(encoding_dim*4, encoding_dim*2),
            nn.ReLU(),
            nn.Linear(encoding_dim*2, encoding_dim),
            nn.ReLU()
        )
        self.decoder = nn.Sequential(
            nn.Linear(encoding_dim, encoding_dim*2),
            nn.ReLU(),
            nn.Linear(encoding_dim*2, encoding_dim*4),
            nn.ReLU(),
            nn.Linear(encoding_dim*4, input_dim),
            nn.Sigmoid()
        )
        
    def forward(self, x):
        encoded = self.encoder(x)
        decoded = self.decoder(encoded)
        return decoded


def perform_autoencoder(df, encoding_dim=50, epochs=50, batch_size=32):
    scaler = StandardScaler()
    df_scaled = scaler.fit_transform(df)
    
    data_tensor = torch.FloatTensor(df_scaled)
    
    input_dim = data_tensor.shape[1]
    autoencoder = AutoEncoder(input_dim, encoding_dim)
    
    criterion = nn.MSELoss()
    optimizer = optim.Adam(autoencoder.parameters())
    
    for epoch in range(epochs):
        for i in range(0, len(data_tensor), batch_size):
            batch = data_tensor[i : i + batch_size]
            optimizer.zero_grad()
            reconstructed = autoencoder(batch)
            loss = criterion(reconstructed, batch)
            loss.backward()
            optimizer.step()
            
        if (epoch + 1) % 10 == 0:
            print(f'Epoch [{epoch + 1}/{epochs}], Loss: {loss.item():.4f}]')
                 
    with torch.no_grad():
        encoded_data = autoencoder.encoder(data_tensor).numpy()
        
    df_encoded = pd.DataFrame(encoded_data, columns=[f'Enc_{i + 1}' for i in range(encoded_data.shape[1])])
    
    return df_encoded

def feature_engineering(df):
    df['BMI_Age'] = df['Physical-BMI'] * df['Basic_Demos-Age']
    df['Internet_Hours_Age'] = df['PreInt_EduHx-computerinternet_hoursday'] * df['Basic_Demos-Age']
    df['BMI_Internet_Hours'] = df['Physical-BMI'] * df['PreInt_EduHx-computerinternet_hoursday']
    df['BFP_BMI'] = df['BIA-BIA_Fat'] / df['BIA-BIA_BMI']
    df['FFMI_BFP'] = df['BIA-BIA_FFMI'] / df['BIA-BIA_Fat']
    df['FMI_BFP'] = df['BIA-BIA_FMI'] / df['BIA-BIA_Fat']
    df['LST_TBW'] = df['BIA-BIA_LST'] / df['BIA-BIA_TBW']
    df['BFP_BMR'] = df['BIA-BIA_Fat'] * df['BIA-BIA_BMR']
    df['BFP_DEE'] = df['BIA-BIA_Fat'] * df['BIA-BIA_DEE']
    df['BMR_Weight'] = df['BIA-BIA_BMR'] / df['Physical-Weight']
    df['DEE_Weight'] = df['BIA-BIA_DEE'] / df['Physical-Weight']
    df['SMM_Height'] = df['BIA-BIA_SMM'] / df['Physical-Height']
    df['Muscle_to_Fat'] = df['BIA-BIA_SMM'] / df['BIA-BIA_FMI']
    df['Hydration_Status'] = df['BIA-BIA_TBW'] / df['Physical-Weight']
    df['ICW_TBW'] = df['BIA-BIA_ICW'] / df['BIA-BIA_TBW']
    
    return df

In [4]:
path = "I:/Kaggle/child-mind-institute-problematic-internet-use/"

In [5]:
train = pd.read_csv(path + 'train.csv')
test = pd.read_csv(path + 'test.csv')
sample = pd.read_csv(path + 'sample_submission.csv')

In [6]:
train_ts = load_time_series(path + "series_train.parquet")
test_ts = load_time_series(path + "series_test.parquet")

100%|████████████████████████████████████████████████████████████████████████████████| 996/996 [00:29<00:00, 34.24it/s]
100%|████████████████████████████████████████████████████████████████████████████████████| 2/2 [00:00<00:00, 16.21it/s]


In [9]:
concat_ts = pd.concat([train_ts, test_ts], ignore_index=True)
df_concat = concat_ts.drop('id', axis=1)

In [11]:
for col in df_concat.columns:
    if df_concat[col].std() == 0:
        df_concat.drop(col, axis=1, inplace=True)

In [12]:
time_series_cols = df_concat.columns.tolist()
df_concat["id"] = concat_ts["id"]
train_ts = df_concat.head(train_ts.shape[0]).reset_index(drop=True)
test_ts = df_concat.tail(test_ts.shape[0]).reset_index(drop=True)
train_merge = pd.merge(train, train_ts, how="left", on='id')
test_merge = pd.merge(test, test_ts, how="left", on='id')

In [13]:
data_dict = pd.read_csv(path + 'data_dictionary.csv')
print(data_dict.shape)
data_dict

(81, 6)


Unnamed: 0,Instrument,Field,Description,Type,Values,Value Labels
0,Identifier,id,Participant's ID,str,,
1,Demographics,Basic_Demos-Enroll_Season,Season of enrollment,str,"Spring, Summer, Fall, Winter",
2,Demographics,Basic_Demos-Age,Age of participant,float,,
3,Demographics,Basic_Demos-Sex,Sex of participant,categorical int,01,"0=Male, 1=Female"
4,Children's Global Assessment Scale,CGAS-Season,Season of participation,str,"Spring, Summer, Fall, Winter",
5,Children's Global Assessment Scale,CGAS-CGAS_Score,Children's Global Assessment Scale Score,int,,
6,Physical Measures,Physical-Season,Season of participation,str,"Spring, Summer, Fall, Winter",
7,Physical Measures,Physical-BMI,Body Mass Index (kg/m^2),float,,
8,Physical Measures,Physical-Height,Height (in),float,,
9,Physical Measures,Physical-Weight,Weight (lbs),float,,


In [14]:
cat_cols = []
for i in range(data_dict.shape[0]):
    col = data_dict['Field'][i]
    if col == 'id':
        continue
    if (data_dict['Type'][i] == 'str') | ('categori' in data_dict['Type'][i]):
        cat_cols.append(col)

In [15]:
ordinal_variables = ['FGC-FGC_CU_Zone', 'FGC-FGC_CU_Zone', 'FGC-FGC_GSND_Zone', 'FGC-FGC_GSD_Zone', 'FGC-FGC_PU_Zone',
                     'FGC-FGC_SRL_Zone', 'FGC-FGC_SRR_Zone', 'FGC-FGC_TL_Zone', 'BIA-BIA_Activity_Level_num', 'BIA-BIA_Frame_num',
                     'PreInt_EduHx-computerinternet_hoursday']

ordinal_variables += [col for col in cat_cols if (('PCIAT' in col)&('Season' not in col))]
print(len(ordinal_variables))
ordinal_variables

31


['FGC-FGC_CU_Zone',
 'FGC-FGC_CU_Zone',
 'FGC-FGC_GSND_Zone',
 'FGC-FGC_GSD_Zone',
 'FGC-FGC_PU_Zone',
 'FGC-FGC_SRL_Zone',
 'FGC-FGC_SRR_Zone',
 'FGC-FGC_TL_Zone',
 'BIA-BIA_Activity_Level_num',
 'BIA-BIA_Frame_num',
 'PreInt_EduHx-computerinternet_hoursday',
 'PCIAT-PCIAT_01',
 'PCIAT-PCIAT_02',
 'PCIAT-PCIAT_03',
 'PCIAT-PCIAT_04',
 'PCIAT-PCIAT_05',
 'PCIAT-PCIAT_06',
 'PCIAT-PCIAT_07',
 'PCIAT-PCIAT_08',
 'PCIAT-PCIAT_09',
 'PCIAT-PCIAT_10',
 'PCIAT-PCIAT_11',
 'PCIAT-PCIAT_12',
 'PCIAT-PCIAT_13',
 'PCIAT-PCIAT_14',
 'PCIAT-PCIAT_15',
 'PCIAT-PCIAT_16',
 'PCIAT-PCIAT_17',
 'PCIAT-PCIAT_18',
 'PCIAT-PCIAT_19',
 'PCIAT-PCIAT_20']

In [16]:
cat_cols = list(set(cat_cols) - set(ordinal_variables))
print(len(cat_cols))
cat_cols

12


['Basic_Demos-Sex',
 'FGC-Season',
 'PreInt_EduHx-Season',
 'Fitness_Endurance-Season',
 'PAQ_C-Season',
 'PCIAT-Season',
 'CGAS-Season',
 'SDS-Season',
 'Basic_Demos-Enroll_Season',
 'Physical-Season',
 'BIA-Season',
 'PAQ_A-Season']

In [17]:
train_nonan = train_merge.dropna(subset=['sii'], ignore_index=True)
print(train_nonan.shape)
train_nonan.head()

(2736, 368)


Unnamed: 0,id,Basic_Demos-Enroll_Season,Basic_Demos-Age,Basic_Demos-Sex,CGAS-Season,CGAS-CGAS_Score,Physical-Season,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Season,Fitness_Endurance-Max_Stage,Fitness_Endurance-Time_Mins,Fitness_Endurance-Time_Sec,FGC-Season,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-Season,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_A-Season,PAQ_A-PAQ_A_Total,PAQ_C-Season,PAQ_C-PAQ_C_Total,PCIAT-Season,PCIAT-PCIAT_01,PCIAT-PCIAT_02,PCIAT-PCIAT_03,PCIAT-PCIAT_04,PCIAT-PCIAT_05,PCIAT-PCIAT_06,PCIAT-PCIAT_07,PCIAT-PCIAT_08,PCIAT-PCIAT_09,PCIAT-PCIAT_10,PCIAT-PCIAT_11,PCIAT-PCIAT_12,PCIAT-PCIAT_13,PCIAT-PCIAT_14,PCIAT-PCIAT_15,PCIAT-PCIAT_16,PCIAT-PCIAT_17,PCIAT-PCIAT_18,PCIAT-PCIAT_19,PCIAT-PCIAT_20,PCIAT-PCIAT_Total,SDS-Season,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-Season,PreInt_EduHx-computerinternet_hoursday,sii,stat_0,stat_1,stat_2,stat_3,stat_4,stat_5,stat_6,stat_7,stat_8,stat_9,stat_10,stat_11,stat_12,stat_13,stat_14,stat_15,stat_16,stat_17,stat_18,stat_19,stat_20,stat_21,stat_22,stat_23,stat_24,stat_25,stat_26,stat_27,stat_28,stat_31,stat_32,stat_33,stat_34,stat_35,stat_36,stat_37,stat_38,stat_39,stat_40,stat_42,stat_43,stat_44,stat_45,stat_46,stat_47,stat_48,stat_49,stat_50,stat_51,stat_52,stat_53,stat_54,stat_55,stat_56,stat_57,stat_58,stat_59,stat_60,stat_61,stat_62,stat_63,stat_64,stat_65,stat_66,stat_67,stat_68,stat_69,stat_70,stat_71,stat_72,stat_73,stat_74,stat_75,stat_76,stat_77,stat_78,stat_79,stat_80,stat_81,stat_82,stat_83,stat_84,stat_85,stat_86,stat_87,stat_88,stat_89,stat_90,stat_91,stat_92,stat_93,stat_94,stat_95,stat_96,stat_97,stat_98,stat_99,stat_100,stat_101,stat_102,stat_103,stat_104,stat_105,stat_106,stat_107,stat_108,stat_109,stat_110,stat_111,stat_112,stat_113,stat_114,stat_115,stat_116,stat_117,stat_118,stat_119,stat_120,stat_121,stat_122,stat_123,stat_124,stat_125,stat_126,stat_127,stat_128,stat_129,stat_130,stat_131,stat_132,stat_133,stat_134,stat_135,stat_136,stat_137,stat_138,stat_139,stat_140,stat_141,stat_142,stat_143,stat_144,stat_145,stat_146,stat_147,stat_148,stat_149,stat_150,stat_151,stat_152,stat_153,stat_154,stat_155,stat_156,stat_157,stat_158,stat_159,stat_160,stat_161,stat_162,stat_163,stat_164,stat_165,stat_166,stat_167,stat_168,stat_169,stat_170,stat_171,stat_172,stat_173,stat_174,stat_175,stat_176,stat_177,stat_178,stat_179,stat_180,stat_181,stat_182,stat_183,stat_184,stat_185,stat_186,stat_187,stat_188,stat_189,stat_190,stat_191,stat_192,stat_193,stat_194,stat_195,stat_196,stat_197,stat_198,stat_199,stat_200,stat_201,stat_202,stat_203,stat_204,stat_205,stat_206,stat_207,stat_208,stat_209,stat_210,stat_211,stat_212,stat_213,stat_214,stat_215,stat_216,stat_217,stat_218,stat_219,stat_220,stat_221,stat_222,stat_223,stat_224,stat_225,stat_226,stat_227,stat_228,stat_229,stat_230,stat_231,stat_232,stat_233,stat_234,stat_235,stat_236,stat_237,stat_238,stat_239,stat_240,stat_241,stat_242,stat_243,stat_244,stat_245,stat_246,stat_247,stat_248,stat_249,stat_250,stat_251,stat_252,stat_253,stat_254,stat_255,stat_256,stat_257,stat_258,stat_259,stat_260,stat_261,stat_262,stat_263,stat_264,stat_265,stat_266,stat_267,stat_268,stat_269,stat_270,stat_271,stat_272,stat_273,stat_274,stat_275,stat_276,stat_277,stat_278,stat_279,stat_280,stat_281,stat_282,stat_283,stat_284,stat_285,stat_286,stat_287,stat_288
0,00008ff9,Fall,5,0,Winter,51.0,Fall,16.877316,46.0,50.8,,,,,,,,,Fall,0.0,0.0,,,,,0.0,0.0,7.0,0.0,6.0,0.0,6.0,1.0,Fall,2.0,2.66855,16.8792,932.498,1492.0,8.25598,41.5862,13.8177,3.06143,9.21377,1.0,24.4349,8.89536,38.9177,19.5413,32.6909,,,,,Fall,5.0,4.0,4.0,0.0,4.0,0.0,0.0,4.0,0.0,0.0,4.0,0.0,4.0,4.0,4.0,4.0,4.0,4.0,2.0,4.0,55.0,,,,Fall,3.0,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,000fd460,Summer,9,0,,,Fall,14.03559,48.0,46.0,22.0,75.0,70.0,122.0,,,,,Fall,3.0,0.0,,,,,5.0,0.0,11.0,1.0,11.0,1.0,3.0,0.0,Winter,2.0,2.57949,14.0371,936.656,1498.65,6.01993,42.0291,12.8254,1.21172,3.97085,1.0,21.0352,14.974,39.4497,15.4107,27.0552,,,Fall,2.34,Fall,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Fall,46.0,64.0,Summer,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,00105258,Summer,10,1,Fall,71.0,Fall,16.648696,56.5,75.6,,65.0,94.0,117.0,Fall,5.0,7.0,33.0,Fall,20.0,1.0,10.2,1.0,14.7,2.0,7.0,1.0,10.0,1.0,10.0,1.0,5.0,0.0,,,,,,,,,,,,,,,,,,,,Summer,2.17,Fall,5.0,2.0,2.0,1.0,2.0,1.0,1.0,2.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,0.0,2.0,2.0,1.0,1.0,28.0,Fall,38.0,54.0,Summer,2.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,00115b9f,Winter,9,0,Fall,71.0,Summer,18.292347,56.0,81.6,,60.0,97.0,117.0,Summer,6.0,9.0,37.0,Summer,18.0,1.0,,,,,5.0,0.0,7.0,0.0,7.0,0.0,7.0,1.0,Summer,3.0,3.84191,18.2943,1131.43,1923.44,15.5925,62.7757,14.074,4.22033,18.8243,2.0,30.4041,16.779,58.9338,26.4798,45.9966,,,Winter,2.451,Summer,4.0,2.0,4.0,0.0,5.0,1.0,0.0,3.0,2.0,2.0,3.0,0.0,3.0,0.0,0.0,3.0,4.0,3.0,4.0,1.0,44.0,Summer,31.0,45.0,Winter,0.0,1.0,-0.316384,0.016009,-0.16789,0.047388,-10.580416,0.0,42.29631,4053.579102,50462150000000.0,4.470182,3.0,53.201683,0.453665,0.502702,0.58571,0.106351,42.94717,0.0,208.168976,112.404045,19428420000000.0,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,3824.0,55000000000.0,1.0,3.0,41.0,-0.957459,-0.977749,-1.010391,0.0,-87.332067,0.000752,3829.0,4861450000000.0,1.0,3.0,41.0,-0.914427,-0.877531,-0.957112,0.0,-72.609234,0.0,0.265511,3835.0,9944500000000.0,1.0,3.0,41.0,-0.871721,-0.730302,-0.89797,0.000332,-62.206067,0.0,0.666667,3838.0,24635000000000.0,1.0,3.0,41.0,-0.811414,-0.584147,-0.821275,0.001527,-55.807169,0.0,1.197513,3850.75,28650000000000.0,2.0,3.0,42.0,-0.745521,-0.430516,-0.736979,0.003707,-48.233392,0.0,1.673629,4000.0,33450000000000.0,2.0,3.0,42.0,-0.68418,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,36890000000000.0,3.0,3.0,42.0,-0.625026,-0.224424,-0.565164,0.009337,-35.302367,0.0,3.083734,4035.0,39525000000000.0,4.0,3.0,43.0,-0.567314,-0.136134,-0.489798,0.012539,-30.223173,0.0,3.996364,4041.0,41905000000000.0,4.0,3.0,44.0,-0.508016,-0.054089,-0.415141,0.016204,-25.410971,0.0,4.979007,4058.0,47205000000000.0,4.0,3.0,47.0,-0.437547,-0.01013,-0.330755,0.020108,-20.352911,0.0,5.972977,4064.0,49735000000000.0,5.0,3.0,47.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,53477500000000.0,5.0,3.0,50.0,-0.306484,0.068776,-0.164221,0.026687,-10.005749,0.0,7.581349,4093.0,57440000000000.0,5.0,3.0,51.0,-0.255599,0.12263,-0.079078,0.029139,-4.908399,0.0,8.729453,4099.0,59292000000000.0,5.0,3.0,51.0,-0.193461,0.20526,0.001529,0.031696,-0.057997,0.0,10.158665,4129.0,61180000000000.0,5.0,3.0,52.0,-0.108544,0.309391,0.085911,0.035379,4.938907,0.0,12.0,4140.0,63705000000000.0,6.0,3.0,52.0,-0.010677,0.400677,0.204727,0.04142,12.220764,0.0,15.0,4147.0,66408750000000.0,6.0,3.0,53.0,0.046125,0.495396,0.358109,0.051887,21.963189,0.0,19.178272,4152.0,68645000000000.0,6.0,3.0,56.0,0.138923,0.593706,0.552839,0.070719,35.773787,0.0,27.5,4158.0,71480000000000.0,7.0,3.0,80.0,0.380755,0.702779,0.863568,0.10543,62.185143,0.0,53.025919,4170.0,73980000000000.0,7.0,3.0,82.0,0.540839,0.812206,0.952578,0.180468,74.499702,0.0,97.554999,4175.0,76885000000000.0,7.0,3.0,83.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.25,4188.5,86110000000000.0,7.0,3.0,85.0,43330.0
4,001f3379,Spring,13,1,Winter,50.0,Summer,22.279952,59.5,112.2,,60.0,73.0,102.0,,,,,Summer,12.0,0.0,16.5,2.0,17.9,2.0,6.0,0.0,10.0,1.0,11.0,1.0,8.0,0.0,Summer,2.0,4.33036,30.1865,1330.97,1996.45,30.2124,84.0285,16.6877,13.4988,67.9715,2.0,32.9141,20.902,79.6982,35.3804,63.1265,,,Spring,4.11,Summer,3.0,3.0,3.0,0.0,2.0,1.0,0.0,2.0,2.0,1.0,0.0,1.0,3.0,3.0,2.0,1.0,3.0,1.0,2.0,1.0,34.0,Summer,40.0,56.0,Spring,0.0,1.0,-0.004272,0.016859,-0.631731,0.011926,-55.630768,0.655708,16.771982,3838.189453,43212120000000.0,3.909848,3.0,79.435593,0.351545,0.303812,0.623476,0.024331,50.303635,0.468723,95.327438,155.573868,24972640000000.0,1.946892,0.0,6.634319,-1.038711,-1.52269,-1.018787,0.0,-88.761833,3098.166748,0.0,1.0,3.0,68.0,-0.964537,-0.820831,-1.011376,0.0,-88.692085,0.035338,3343.0,860000000000.0,1.0,3.0,68.0,-0.739749,-0.485981,-1.010633,0.000174,-88.553625,0.0,0.204995,3630.0,4305000000000.0,1.0,3.0,69.0,-0.356717,-0.213008,-1.010164,0.001036,-88.48362,0.0,0.37858,3695.0,8615000000000.0,1.0,3.0,70.0,-0.053221,-0.046249,-1.009839,0.003185,-88.464142,0.0,0.464152,3709.333252,12925000000000.0,2.0,3.0,71.0,-0.052986,-0.045577,-1.009578,0.007479,-88.452377,0.0,0.5,3732.333252,17230000000000.0,2.0,3.0,73.0,-0.052803,-0.044517,-1.009344,0.008622,-88.386049,0.0,0.5,3747.0,21540000000000.0,2.0,3.0,74.0,-0.052581,-0.044065,-1.009109,0.008955,-88.308716,0.0,0.538311,3763.75,25850000000000.0,3.0,3.0,75.0,-0.044075,-0.037731,-1.008875,0.009198,-86.990927,0.655556,0.598203,3782.0,30160000000000.0,3.0,3.0,76.0,-0.043265,-0.034616,-1.008614,0.009423,-86.843826,1.0,0.658255,3788.0,34465000000000.0,3.0,3.0,77.0,-0.042494,-0.03132,-1.008276,0.009639,-86.74559,1.0,0.764178,3800.0,38945000000000.0,3.0,3.0,78.0,-0.020622,-0.028179,-1.007728,0.009831,-86.119919,1.0,0.879005,3812.0,43310000000000.0,4.0,3.0,79.0,-0.020152,0.015679,-1.007129,0.01,-86.118622,1.0,0.994175,3826.333252,47620000000000.0,4.0,3.0,81.0,-0.019904,0.016843,-1.006673,0.010157,-86.11805,1.0,1.585408,3847.0,51930000000000.0,4.0,3.0,82.0,-0.019682,0.017282,-1.006139,0.010315,-86.080246,1.0,2.484425,3876.0,56235000000000.0,5.0,3.0,83.0,-0.01942,0.017528,-0.728903,0.010482,-47.183479,1.0,4.0,3917.0,60545000000000.0,5.0,3.0,84.0,-0.019081,0.020307,-0.294459,0.010668,-17.483364,1.0,6.141348,3951.187561,64855000000000.0,6.0,3.0,85.0,-0.01814,0.022414,0.076976,0.010894,4.400664,1.0,9.18595,3982.0,69165000000000.0,6.0,3.0,86.0,0.123577,0.086863,0.264927,0.011239,15.523324,1.0,14.444445,4008.583252,73470000000000.0,6.0,3.0,87.0,0.474932,0.313599,0.466737,0.012207,28.323949,1.0,36.802221,4067.0,77780000000000.0,7.0,3.0,89.0,0.780661,0.773137,0.749808,0.026261,49.306727,1.0,74.0,4103.583496,82090000000000.0,7.0,3.0,90.0,1.034351,1.946303,1.146284,2.952888,89.476036,1.0,2597.800049,4175.0,86395000000000.0,7.0,3.0,91.0,396396.0


In [18]:
train_one_hot = train_nonan.copy()
test_one_hot = test_merge.copy()

In [19]:
for col in cat_cols:
    if 'PCIAT' not in col:
        train_sr = train_one_hot[col].fillna('Missing').apply(str)        
        test_sr = test_one_hot[col].fillna('Missing').apply(str)
        train_one_hot[col] = train_sr
        test_one_hot[col] = test_sr
        concat_sr = pd.concat([train_sr, test_sr])
        unique_list = sorted(concat_sr.unique().tolist())

        for v in unique_list:
            new_col_name = col + '_' + v
            train_one_hot[new_col_name] = pd.Series(train_one_hot[col] == v).astype(int)
            test_one_hot[new_col_name] = pd.Series(test_one_hot[col] == v).astype(int)
    else:
        train_sr = train_one_hot[col].fillna('Missing').apply(str)
        train_one_hot[col] = train_sr
        unique_list = sorted(train_sr.unique().tolist())

        for v in unique_list:
            new_col_name = col + '_' + v
            train_one_hot[new_col_name] = pd.Series(train_one_hot[col] == v).astype(int)

train_one_hot.drop(cat_cols, axis=1, inplace=True)
test_one_hot.drop([col for col in cat_cols if 'PCIAT' not in col], axis=1, inplace=True)

In [26]:
print(train_ts.shape)
train_ts.head()

(996, 287)


Unnamed: 0,stat_0,stat_1,stat_2,stat_3,stat_4,stat_5,stat_6,stat_7,stat_8,stat_9,stat_10,stat_11,stat_12,stat_13,stat_14,stat_15,stat_16,stat_17,stat_18,stat_19,stat_20,stat_21,stat_22,stat_23,stat_24,stat_25,stat_26,stat_27,stat_28,stat_31,stat_32,stat_33,stat_34,stat_35,stat_36,stat_37,stat_38,stat_39,stat_40,stat_42,stat_43,stat_44,stat_45,stat_46,stat_47,stat_48,stat_49,stat_50,stat_51,stat_52,stat_53,stat_54,stat_55,stat_56,stat_57,stat_58,stat_59,stat_60,stat_61,stat_62,stat_63,stat_64,stat_65,stat_66,stat_67,stat_68,stat_69,stat_70,stat_71,stat_72,stat_73,stat_74,stat_75,stat_76,stat_77,stat_78,stat_79,stat_80,stat_81,stat_82,stat_83,stat_84,stat_85,stat_86,stat_87,stat_88,stat_89,stat_90,stat_91,stat_92,stat_93,stat_94,stat_95,stat_96,stat_97,stat_98,stat_99,stat_100,stat_101,stat_102,stat_103,stat_104,stat_105,stat_106,stat_107,stat_108,stat_109,stat_110,stat_111,stat_112,stat_113,stat_114,stat_115,stat_116,stat_117,stat_118,stat_119,stat_120,stat_121,stat_122,stat_123,stat_124,stat_125,stat_126,stat_127,stat_128,stat_129,stat_130,stat_131,stat_132,stat_133,stat_134,stat_135,stat_136,stat_137,stat_138,stat_139,stat_140,stat_141,stat_142,stat_143,stat_144,stat_145,stat_146,stat_147,stat_148,stat_149,stat_150,stat_151,stat_152,stat_153,stat_154,stat_155,stat_156,stat_157,stat_158,stat_159,stat_160,stat_161,stat_162,stat_163,stat_164,stat_165,stat_166,stat_167,stat_168,stat_169,stat_170,stat_171,stat_172,stat_173,stat_174,stat_175,stat_176,stat_177,stat_178,stat_179,stat_180,stat_181,stat_182,stat_183,stat_184,stat_185,stat_186,stat_187,stat_188,stat_189,stat_190,stat_191,stat_192,stat_193,stat_194,stat_195,stat_196,stat_197,stat_198,stat_199,stat_200,stat_201,stat_202,stat_203,stat_204,stat_205,stat_206,stat_207,stat_208,stat_209,stat_210,stat_211,stat_212,stat_213,stat_214,stat_215,stat_216,stat_217,stat_218,stat_219,stat_220,stat_221,stat_222,stat_223,stat_224,stat_225,stat_226,stat_227,stat_228,stat_229,stat_230,stat_231,stat_232,stat_233,stat_234,stat_235,stat_236,stat_237,stat_238,stat_239,stat_240,stat_241,stat_242,stat_243,stat_244,stat_245,stat_246,stat_247,stat_248,stat_249,stat_250,stat_251,stat_252,stat_253,stat_254,stat_255,stat_256,stat_257,stat_258,stat_259,stat_260,stat_261,stat_262,stat_263,stat_264,stat_265,stat_266,stat_267,stat_268,stat_269,stat_270,stat_271,stat_272,stat_273,stat_274,stat_275,stat_276,stat_277,stat_278,stat_279,stat_280,stat_281,stat_282,stat_283,stat_284,stat_285,stat_286,stat_287,stat_288,id
0,-0.316384,0.016009,-0.16789,0.047388,-10.580416,0.0,42.29631,4053.579102,50462150000000.0,4.470182,3.0,53.201683,0.453665,0.502702,0.58571,0.106351,42.94717,0.0,208.168976,112.404045,19428420000000.0,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,3824.0,55000000000.0,1.0,3.0,41.0,-0.957459,-0.977749,-1.010391,0.0,-87.332067,0.000752,3829.0,4861450000000.0,1.0,3.0,41.0,-0.914427,-0.877531,-0.957112,0.0,-72.609234,0.0,0.265511,3835.0,9944500000000.0,1.0,3.0,41.0,-0.871721,-0.730302,-0.89797,0.000332,-62.206067,0.0,0.666667,3838.0,24635000000000.0,1.0,3.0,41.0,-0.811414,-0.584147,-0.821275,0.001527,-55.807169,0.0,1.197513,3850.75,28650000000000.0,2.0,3.0,42.0,-0.745521,-0.430516,-0.736979,0.003707,-48.233392,0.0,1.673629,4000.0,33450000000000.0,2.0,3.0,42.0,-0.68418,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,36890000000000.0,3.0,3.0,42.0,-0.625026,-0.224424,-0.565164,0.009337,-35.302367,0.0,3.083734,4035.0,39525000000000.0,4.0,3.0,43.0,-0.567314,-0.136134,-0.489798,0.012539,-30.223173,0.0,3.996364,4041.0,41905000000000.0,4.0,3.0,44.0,-0.508016,-0.054089,-0.415141,0.016204,-25.410971,0.0,4.979007,4058.0,47205000000000.0,4.0,3.0,47.0,-0.437547,-0.01013,-0.330755,0.020108,-20.352911,0.0,5.972977,4064.0,49735000000000.0,5.0,3.0,47.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,53477500000000.0,5.0,3.0,50.0,-0.306484,0.068776,-0.164221,0.026687,-10.005749,0.0,7.581349,4093.0,57440000000000.0,5.0,3.0,51.0,-0.255599,0.12263,-0.079078,0.029139,-4.908399,0.0,8.729453,4099.0,59292000000000.0,5.0,3.0,51.0,-0.193461,0.20526,0.001529,0.031696,-0.057997,0.0,10.158665,4129.0,61180000000000.0,5.0,3.0,52.0,-0.108544,0.309391,0.085911,0.035379,4.938907,0.0,12.0,4140.0,63705000000000.0,6.0,3.0,52.0,-0.010677,0.400677,0.204727,0.04142,12.220764,0.0,15.0,4147.0,66408750000000.0,6.0,3.0,53.0,0.046125,0.495396,0.358109,0.051887,21.963189,0.0,19.178272,4152.0,68645000000000.0,6.0,3.0,56.0,0.138923,0.593706,0.552839,0.070719,35.773787,0.0,27.5,4158.0,71480000000000.0,7.0,3.0,80.0,0.380755,0.702779,0.863568,0.10543,62.185143,0.0,53.025919,4170.0,73980000000000.0,7.0,3.0,82.0,0.540839,0.812206,0.952578,0.180468,74.499702,0.0,97.554999,4175.0,76885000000000.0,7.0,3.0,83.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.25,4188.5,86110000000000.0,7.0,3.0,85.0,43330.0,00115b9f
1,-0.004272,0.016859,-0.631731,0.011926,-55.630768,0.655708,16.771982,3838.189453,43212120000000.0,3.909848,3.0,79.435593,0.351545,0.303812,0.623476,0.024331,50.303635,0.468723,95.327438,155.573868,24972640000000.0,1.946892,0.0,6.634319,-1.038711,-1.52269,-1.018787,0.0,-88.761833,3098.166748,0.0,1.0,3.0,68.0,-0.964537,-0.820831,-1.011376,0.0,-88.692085,0.035338,3343.0,860000000000.0,1.0,3.0,68.0,-0.739749,-0.485981,-1.010633,0.0001744766,-88.553625,0.0,0.204995,3630.0,4305000000000.0,1.0,3.0,69.0,-0.356717,-0.213008,-1.010164,0.001036,-88.48362,0.0,0.37858,3695.0,8615000000000.0,1.0,3.0,70.0,-0.053221,-0.046249,-1.009839,0.003185,-88.464142,0.0,0.464152,3709.333252,12925000000000.0,2.0,3.0,71.0,-0.052986,-0.045577,-1.009578,0.007479,-88.452377,0.0,0.5,3732.333252,17230000000000.0,2.0,3.0,73.0,-0.052803,-0.044517,-1.009344,0.008622,-88.386049,0.0,0.5,3747.0,21540000000000.0,2.0,3.0,74.0,-0.052581,-0.044065,-1.009109,0.008955,-88.308716,0.0,0.538311,3763.75,25850000000000.0,3.0,3.0,75.0,-0.044075,-0.037731,-1.008875,0.009198,-86.990927,0.655556,0.598203,3782.0,30160000000000.0,3.0,3.0,76.0,-0.043265,-0.034616,-1.008614,0.009423,-86.843826,1.0,0.658255,3788.0,34465000000000.0,3.0,3.0,77.0,-0.042494,-0.03132,-1.008276,0.009639,-86.74559,1.0,0.764178,3800.0,38945000000000.0,3.0,3.0,78.0,-0.020622,-0.028179,-1.007728,0.009831,-86.119919,1.0,0.879005,3812.0,43310000000000.0,4.0,3.0,79.0,-0.020152,0.015679,-1.007129,0.01,-86.118622,1.0,0.994175,3826.333252,47620000000000.0,4.0,3.0,81.0,-0.019904,0.016843,-1.006673,0.010157,-86.11805,1.0,1.585408,3847.0,51930000000000.0,4.0,3.0,82.0,-0.019682,0.017282,-1.006139,0.010315,-86.080246,1.0,2.484425,3876.0,56235000000000.0,5.0,3.0,83.0,-0.01942,0.017528,-0.728903,0.010482,-47.183479,1.0,4.0,3917.0,60545000000000.0,5.0,3.0,84.0,-0.019081,0.020307,-0.294459,0.010668,-17.483364,1.0,6.141348,3951.187561,64855000000000.0,6.0,3.0,85.0,-0.01814,0.022414,0.076976,0.010894,4.400664,1.0,9.18595,3982.0,69165000000000.0,6.0,3.0,86.0,0.123577,0.086863,0.264927,0.011239,15.523324,1.0,14.444445,4008.583252,73470000000000.0,6.0,3.0,87.0,0.474932,0.313599,0.466737,0.012207,28.323949,1.0,36.802221,4067.0,77780000000000.0,7.0,3.0,89.0,0.780661,0.773137,0.749808,0.026261,49.306727,1.0,74.0,4103.583496,82090000000000.0,7.0,3.0,90.0,1.034351,1.946303,1.146284,2.952888,89.476036,1.0,2597.800049,4175.0,86395000000000.0,7.0,3.0,91.0,396396.0,001f3379
2,0.208036,0.057094,0.14155,0.030255,6.687338,0.171246,66.563408,3848.583252,43186800000000.0,3.832677,2.0,26.152903,0.486977,0.443755,0.683114,0.104136,52.754208,0.374121,286.916595,166.968582,24948830000000.0,1.951927,0.0,6.932943,-1.952594,-2.361866,-1.016758,0.0,-89.463226,3098.166748,0.0,1.0,2.0,14.0,-0.930746,-0.965952,-0.994755,0.0,-88.614159,0.11009,3354.0,860000000000.0,1.0,2.0,14.0,-0.782689,-0.874661,-0.989987,0.0,-88.582434,0.0,0.5,3630.0,4315000000000.0,1.0,2.0,15.0,-0.516909,-0.618423,-0.986457,0.0,-88.147131,0.0,0.864342,3683.0,8630000000000.0,1.0,2.0,17.0,-0.238382,-0.371091,-0.9464,0.0,-73.107068,0.0,1.280912,3700.0,12945000000000.0,2.0,2.0,18.0,-0.090905,-0.223016,-0.746625,0.0,-48.702155,0.0,1.766406,3730.0,17265000000000.0,2.0,2.0,19.0,-0.012729,-0.110418,-0.420154,1.8e-05,-25.106887,0.0,2.669909,3741.0,21580000000000.0,2.0,2.0,20.0,0.015425,-0.027036,-0.173074,0.000136,-10.153082,0.0,3.671382,3759.0,25895000000000.0,2.0,2.0,21.0,0.021194,-0.021556,0.009641,0.000752,0.539956,0.0,4.522014,3782.0,30215000000000.0,3.0,2.0,23.0,0.039032,-0.010841,0.147738,0.001914,8.546391,0.0,5.2576,3788.0,34530000000000.0,3.0,2.0,24.0,0.102178,0.011493,0.250328,0.00396,14.589791,0.0,6.076707,3800.0,38845000000000.0,3.0,2.0,25.0,0.194404,0.05231,0.333331,0.006382,19.556299,0.0,7.172272,3818.0,43162500000000.0,4.0,2.0,26.0,0.272374,0.093618,0.408543,0.008522,24.346129,0.0,9.265981,3835.0,47480000000000.0,4.0,2.0,27.0,0.315673,0.124312,0.489481,0.011057,29.635003,0.0,11.497269,3859.0,51795000000000.0,4.0,2.0,29.0,0.411518,0.187155,0.567019,0.013664,34.861622,0.0,14.645204,3900.0,56135000000000.0,5.0,2.0,30.0,0.512632,0.252672,0.639735,0.016246,40.165275,0.0,18.016139,3936.666748,60500000000000.0,5.0,2.0,31.0,0.606044,0.334034,0.714392,0.020465,45.880418,0.0,21.5,3970.0,64815000000000.0,6.0,2.0,32.0,0.694278,0.408895,0.781845,0.029201,51.696997,0.0,28.780001,4001.333252,69130000000000.0,6.0,2.0,33.0,0.779318,0.499343,0.857525,0.043111,58.879653,1.0,41.230066,4052.0,73450000000000.0,6.0,2.0,35.0,0.854515,0.629066,0.929214,0.067176,67.014535,1.0,73.534854,4087.0,77765000000000.0,7.0,2.0,36.0,0.942404,0.811867,0.983852,0.11961,77.467896,1.0,180.348525,4134.0,82080000000000.0,7.0,2.0,37.0,1.666465,1.016429,2.239939,4.041167,89.862823,1.0,2611.0,4187.0,86395000000000.0,7.0,2.0,38.0,414384.0,00f332d1
3,-0.343396,-0.055826,-0.254433,0.032946,-17.589041,0.03521,17.800735,3849.649414,43384330000000.0,3.963284,4.0,49.910686,0.516126,0.424303,0.564593,0.083798,39.895645,0.183652,73.023468,171.100159,25133560000000.0,1.994539,0.0,6.204418,-2.284304,-2.276082,-1.022549,0.0,-89.87722,3098.166748,0.0,1.0,4.0,39.0,-0.992976,-0.988491,-0.98684,0.0,-81.817635,0.085859,3331.424963,840000000000.0,1.0,4.0,39.0,-0.964502,-0.844479,-0.953644,8.995334e-07,-73.292234,0.0,0.572475,3612.0,4215000000000.0,1.0,4.0,40.0,-0.929022,-0.661048,-0.911583,5.7e-05,-66.116711,0.0,0.99748,3677.0,8430000000000.0,1.0,4.0,41.0,-0.886122,-0.503952,-0.866768,0.000219,-60.558826,0.0,1.5,3695.0,12645000000000.0,2.0,4.0,42.0,-0.843222,-0.400337,-0.812911,0.000525,-55.368187,0.0,2.024508,3721.0,17060000000000.0,2.0,4.0,43.0,-0.784639,-0.312203,-0.753955,0.001059,-49.667419,0.0,2.5,3740.833252,21475000000000.0,2.0,4.0,45.0,-0.730985,-0.23544,-0.679823,0.001892,-43.726986,0.0,2.896743,3759.0,25890000000000.0,3.0,4.0,46.0,-0.675671,-0.173581,-0.607682,0.002922,-38.285491,0.0,3.660389,3778.187561,30310000000000.0,3.0,4.0,47.0,-0.611833,-0.117684,-0.528835,0.004209,-32.9366,0.0,4.471915,3800.0,34725000000000.0,3.0,4.0,48.0,-0.548113,-0.067261,-0.442599,0.005814,-27.263943,0.0,5.404166,3812.0,39140000000000.0,4.0,4.0,49.0,-0.473294,-0.018973,-0.354672,0.008127,-21.538264,0.0,6.677332,3827.833252,43555000000000.0,4.0,4.0,50.0,-0.386463,0.001452,-0.258003,0.010706,-15.668563,0.0,8.333333,3847.0,47970000000000.0,4.0,4.0,51.0,-0.296473,0.037877,-0.163884,0.013545,-9.998143,0.0,9.542373,3865.0,52390000000000.0,5.0,4.0,52.0,-0.20097,0.086421,-0.072262,0.015904,-4.482165,0.0,12.28486,3894.0,56805000000000.0,5.0,4.0,53.0,-0.090672,0.141728,0.014703,0.020617,0.588443,0.0,14.942121,3945.833252,61105000000000.0,5.0,4.0,54.0,0.068885,0.206397,0.113704,0.026206,6.416064,0.0,17.742268,3982.0,65320000000000.0,6.0,4.0,55.0,0.198282,0.279418,0.250736,0.036677,14.511846,0.0,21.217152,4017.0,69535000000000.0,6.0,4.0,56.0,0.257008,0.368431,0.437619,0.05416,26.081448,0.0,26.111111,4052.0,73750000000000.0,6.0,4.0,57.0,0.444116,0.487777,0.628983,0.086339,39.122147,0.0,33.161469,4093.0,77965000000000.0,7.0,4.0,58.0,0.624922,0.661182,0.855523,0.150929,58.590337,0.0,50.195889,4134.0,82180000000000.0,7.0,4.0,60.0,1.000692,1.011419,1.299293,4.097965,88.478432,1.0,2650.5,4184.0,86395000000000.0,7.0,4.0,61.0,370956.0,01085eb3
4,0.01867,0.07166,-0.061682,0.05828,-5.059758,0.0,54.893394,3974.910645,43435730000000.0,4.168412,4.0,-1.168288,0.595251,0.508311,0.578022,0.197285,39.994808,0.0,230.972397,119.525154,25410390000000.0,2.18161,0.0,1.677293,-2.143912,-3.373025,-1.003249,0.0,-89.308716,3095.0,0.0,1.0,4.0,-4.0,-0.977178,-1.048439,-0.994869,0.0,-86.204402,0.164545,3452.0,805000000000.0,1.0,4.0,-4.0,-0.915178,-0.826581,-0.936907,0.0,-70.131484,0.0,1.0,3755.058362,4040000000000.0,1.0,4.0,-4.0,-0.813863,-0.649036,-0.867607,5e-06,-60.379308,0.0,1.240162,3894.0,8085000000000.0,1.0,4.0,-3.0,-0.722694,-0.480292,-0.779335,0.000134,-52.066652,0.0,1.479419,3903.333252,12130000000000.0,1.0,4.0,-3.0,-0.592835,-0.34633,-0.663955,0.000701,-42.340772,0.0,2.110169,3917.0,16172000000000.0,2.0,4.0,-3.0,-0.5143,-0.254007,-0.562416,0.001604,-35.037018,0.0,2.367827,3940.479187,20468750000000.0,2.0,4.0,-3.0,-0.408334,-0.18151,-0.465326,0.002946,-29.07946,0.0,3.057882,3953.0,25320000000000.0,2.0,4.0,-2.0,-0.309016,-0.09667,-0.360116,0.004658,-22.025704,0.0,4.384615,3964.0,30172250000000.0,3.0,4.0,-2.0,-0.184722,-0.036464,-0.244467,0.006634,-15.000445,0.0,5.0,3976.0,35025000000000.0,4.0,4.0,-2.0,-0.05619,0.019013,-0.141554,0.008687,-8.850805,0.0,5.557957,3988.0,39875750000000.0,4.0,4.0,-1.0,0.036376,0.096187,-0.042274,0.010466,-2.822715,0.0,7.05916,3994.0,44730000000000.0,5.0,4.0,-1.0,0.143034,0.183083,0.030954,0.01324,1.564646,0.0,9.0,4005.0,48815000000000.0,5.0,4.0,-1.0,0.24726,0.233549,0.10924,0.016828,6.048079,0.0,11.312204,4015.0,52860000000000.0,5.0,4.0,-1.0,0.360007,0.294277,0.199131,0.021622,11.139169,0.0,13.64914,4023.0,56900000000000.0,6.0,4.0,0.0,0.444944,0.357776,0.31096,0.028782,17.674466,0.0,16.331638,4035.0,60945000000000.0,6.0,4.0,0.0,0.539581,0.458349,0.394637,0.038781,22.951601,0.0,19.320485,4046.0,65115000000000.0,6.0,4.0,0.0,0.634786,0.544063,0.506286,0.053863,30.292509,0.0,22.562103,4058.0,69965000000000.0,6.0,4.0,1.0,0.732723,0.63475,0.617803,0.077157,38.313799,0.0,28.103143,4070.0,74265000000000.0,7.0,4.0,1.0,0.825133,0.711058,0.7644,0.119666,49.951662,0.0,46.339248,4082.0,78310000000000.0,7.0,4.0,1.0,0.917491,0.828655,0.898812,0.227067,63.216378,0.0,166.443433,4093.0,82355000000000.0,7.0,4.0,1.0,3.34121,4.442658,2.321265,6.307294,88.389679,0.0,2618.0,4157.0,86395000000000.0,7.0,4.0,2.0,97048.0,012cadd8


In [20]:
print(train_one_hot.shape)
train_one_hot.head()

(2736, 411)


Unnamed: 0,id,Basic_Demos-Age,CGAS-CGAS_Score,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Max_Stage,Fitness_Endurance-Time_Mins,Fitness_Endurance-Time_Sec,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_A-PAQ_A_Total,PAQ_C-PAQ_C_Total,PCIAT-PCIAT_01,PCIAT-PCIAT_02,PCIAT-PCIAT_03,PCIAT-PCIAT_04,PCIAT-PCIAT_05,PCIAT-PCIAT_06,PCIAT-PCIAT_07,PCIAT-PCIAT_08,PCIAT-PCIAT_09,PCIAT-PCIAT_10,PCIAT-PCIAT_11,PCIAT-PCIAT_12,PCIAT-PCIAT_13,PCIAT-PCIAT_14,PCIAT-PCIAT_15,PCIAT-PCIAT_16,PCIAT-PCIAT_17,PCIAT-PCIAT_18,PCIAT-PCIAT_19,PCIAT-PCIAT_20,PCIAT-PCIAT_Total,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-computerinternet_hoursday,sii,stat_0,stat_1,stat_2,stat_3,stat_4,stat_5,stat_6,stat_7,stat_8,stat_9,stat_10,stat_11,stat_12,stat_13,stat_14,stat_15,stat_16,stat_17,stat_18,stat_19,stat_20,stat_21,stat_22,stat_23,stat_24,stat_25,stat_26,stat_27,stat_28,stat_31,stat_32,stat_33,stat_34,stat_35,stat_36,stat_37,stat_38,stat_39,stat_40,stat_42,stat_43,stat_44,stat_45,stat_46,stat_47,stat_48,stat_49,stat_50,stat_51,stat_52,stat_53,stat_54,stat_55,stat_56,stat_57,stat_58,stat_59,stat_60,stat_61,stat_62,stat_63,stat_64,stat_65,stat_66,stat_67,stat_68,stat_69,stat_70,stat_71,stat_72,stat_73,stat_74,stat_75,stat_76,stat_77,stat_78,stat_79,stat_80,stat_81,stat_82,stat_83,stat_84,stat_85,stat_86,stat_87,stat_88,stat_89,stat_90,stat_91,stat_92,stat_93,stat_94,stat_95,stat_96,stat_97,stat_98,stat_99,stat_100,stat_101,stat_102,stat_103,stat_104,stat_105,stat_106,stat_107,stat_108,stat_109,stat_110,stat_111,stat_112,stat_113,stat_114,stat_115,stat_116,stat_117,stat_118,stat_119,stat_120,stat_121,stat_122,stat_123,stat_124,stat_125,stat_126,stat_127,stat_128,stat_129,stat_130,stat_131,stat_132,stat_133,stat_134,stat_135,stat_136,stat_137,stat_138,stat_139,stat_140,stat_141,stat_142,stat_143,stat_144,stat_145,stat_146,stat_147,stat_148,stat_149,stat_150,stat_151,stat_152,stat_153,stat_154,stat_155,stat_156,stat_157,stat_158,stat_159,stat_160,stat_161,stat_162,stat_163,stat_164,stat_165,stat_166,stat_167,stat_168,stat_169,stat_170,stat_171,stat_172,stat_173,stat_174,stat_175,stat_176,stat_177,stat_178,stat_179,stat_180,stat_181,stat_182,stat_183,stat_184,stat_185,stat_186,stat_187,stat_188,stat_189,stat_190,stat_191,stat_192,stat_193,stat_194,stat_195,stat_196,stat_197,stat_198,stat_199,stat_200,stat_201,stat_202,stat_203,stat_204,stat_205,stat_206,stat_207,stat_208,stat_209,stat_210,stat_211,stat_212,stat_213,stat_214,stat_215,stat_216,stat_217,stat_218,stat_219,stat_220,stat_221,stat_222,stat_223,stat_224,stat_225,stat_226,stat_227,stat_228,stat_229,stat_230,stat_231,stat_232,stat_233,stat_234,stat_235,stat_236,stat_237,stat_238,stat_239,stat_240,stat_241,stat_242,stat_243,stat_244,stat_245,stat_246,stat_247,stat_248,stat_249,stat_250,stat_251,stat_252,stat_253,stat_254,stat_255,stat_256,stat_257,stat_258,stat_259,stat_260,stat_261,stat_262,stat_263,stat_264,stat_265,stat_266,stat_267,stat_268,stat_269,stat_270,stat_271,stat_272,stat_273,stat_274,stat_275,stat_276,stat_277,stat_278,stat_279,stat_280,stat_281,stat_282,stat_283,stat_284,stat_285,stat_286,stat_287,stat_288,Basic_Demos-Sex_0,Basic_Demos-Sex_1,FGC-Season_Fall,FGC-Season_Missing,FGC-Season_Spring,FGC-Season_Summer,FGC-Season_Winter,PreInt_EduHx-Season_Fall,PreInt_EduHx-Season_Missing,PreInt_EduHx-Season_Spring,PreInt_EduHx-Season_Summer,PreInt_EduHx-Season_Winter,Fitness_Endurance-Season_Fall,Fitness_Endurance-Season_Missing,Fitness_Endurance-Season_Spring,Fitness_Endurance-Season_Summer,Fitness_Endurance-Season_Winter,PAQ_C-Season_Fall,PAQ_C-Season_Missing,PAQ_C-Season_Spring,PAQ_C-Season_Summer,PAQ_C-Season_Winter,PCIAT-Season_Fall,PCIAT-Season_Spring,PCIAT-Season_Summer,PCIAT-Season_Winter,CGAS-Season_Fall,CGAS-Season_Missing,CGAS-Season_Spring,CGAS-Season_Summer,CGAS-Season_Winter,SDS-Season_Fall,SDS-Season_Missing,SDS-Season_Spring,SDS-Season_Summer,SDS-Season_Winter,Basic_Demos-Enroll_Season_Fall,Basic_Demos-Enroll_Season_Spring,Basic_Demos-Enroll_Season_Summer,Basic_Demos-Enroll_Season_Winter,Physical-Season_Fall,Physical-Season_Missing,Physical-Season_Spring,Physical-Season_Summer,Physical-Season_Winter,BIA-Season_Fall,BIA-Season_Missing,BIA-Season_Spring,BIA-Season_Summer,BIA-Season_Winter,PAQ_A-Season_Fall,PAQ_A-Season_Missing,PAQ_A-Season_Spring,PAQ_A-Season_Summer,PAQ_A-Season_Winter
0,00008ff9,5,51.0,16.877316,46.0,50.8,,,,,,,,0.0,0.0,,,,,0.0,0.0,7.0,0.0,6.0,0.0,6.0,1.0,2.0,2.66855,16.8792,932.498,1492.0,8.25598,41.5862,13.8177,3.06143,9.21377,1.0,24.4349,8.89536,38.9177,19.5413,32.6909,,,5.0,4.0,4.0,0.0,4.0,0.0,0.0,4.0,0.0,0.0,4.0,0.0,4.0,4.0,4.0,4.0,4.0,4.0,2.0,4.0,55.0,,,3.0,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0
1,000fd460,9,,14.03559,48.0,46.0,22.0,75.0,70.0,122.0,,,,3.0,0.0,,,,,5.0,0.0,11.0,1.0,11.0,1.0,3.0,0.0,2.0,2.57949,14.0371,936.656,1498.65,6.01993,42.0291,12.8254,1.21172,3.97085,1.0,21.0352,14.974,39.4497,15.4107,27.0552,,2.34,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,46.0,64.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,1,0,1,0,0,0
2,00105258,10,71.0,16.648696,56.5,75.6,,65.0,94.0,117.0,5.0,7.0,33.0,20.0,1.0,10.2,1.0,14.7,2.0,7.0,1.0,10.0,1.0,10.0,1.0,5.0,0.0,,,,,,,,,,,,,,,,,,2.17,5.0,2.0,2.0,1.0,2.0,1.0,1.0,2.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,0.0,2.0,2.0,1.0,1.0,28.0,38.0,54.0,2.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,1,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0
3,00115b9f,9,71.0,18.292347,56.0,81.6,,60.0,97.0,117.0,6.0,9.0,37.0,18.0,1.0,,,,,5.0,0.0,7.0,0.0,7.0,0.0,7.0,1.0,3.0,3.84191,18.2943,1131.43,1923.44,15.5925,62.7757,14.074,4.22033,18.8243,2.0,30.4041,16.779,58.9338,26.4798,45.9966,,2.451,4.0,2.0,4.0,0.0,5.0,1.0,0.0,3.0,2.0,2.0,3.0,0.0,3.0,0.0,0.0,3.0,4.0,3.0,4.0,1.0,44.0,31.0,45.0,0.0,1.0,-0.316384,0.016009,-0.16789,0.047388,-10.580416,0.0,42.29631,4053.579102,50462150000000.0,4.470182,3.0,53.201683,0.453665,0.502702,0.58571,0.106351,42.94717,0.0,208.168976,112.404045,19428420000000.0,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,3824.0,55000000000.0,1.0,3.0,41.0,-0.957459,-0.977749,-1.010391,0.0,-87.332067,0.000752,3829.0,4861450000000.0,1.0,3.0,41.0,-0.914427,-0.877531,-0.957112,0.0,-72.609234,0.0,0.265511,3835.0,9944500000000.0,1.0,3.0,41.0,-0.871721,-0.730302,-0.89797,0.000332,-62.206067,0.0,0.666667,3838.0,24635000000000.0,1.0,3.0,41.0,-0.811414,-0.584147,-0.821275,0.001527,-55.807169,0.0,1.197513,3850.75,28650000000000.0,2.0,3.0,42.0,-0.745521,-0.430516,-0.736979,0.003707,-48.233392,0.0,1.673629,4000.0,33450000000000.0,2.0,3.0,42.0,-0.68418,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,36890000000000.0,3.0,3.0,42.0,-0.625026,-0.224424,-0.565164,0.009337,-35.302367,0.0,3.083734,4035.0,39525000000000.0,4.0,3.0,43.0,-0.567314,-0.136134,-0.489798,0.012539,-30.223173,0.0,3.996364,4041.0,41905000000000.0,4.0,3.0,44.0,-0.508016,-0.054089,-0.415141,0.016204,-25.410971,0.0,4.979007,4058.0,47205000000000.0,4.0,3.0,47.0,-0.437547,-0.01013,-0.330755,0.020108,-20.352911,0.0,5.972977,4064.0,49735000000000.0,5.0,3.0,47.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,53477500000000.0,5.0,3.0,50.0,-0.306484,0.068776,-0.164221,0.026687,-10.005749,0.0,7.581349,4093.0,57440000000000.0,5.0,3.0,51.0,-0.255599,0.12263,-0.079078,0.029139,-4.908399,0.0,8.729453,4099.0,59292000000000.0,5.0,3.0,51.0,-0.193461,0.20526,0.001529,0.031696,-0.057997,0.0,10.158665,4129.0,61180000000000.0,5.0,3.0,52.0,-0.108544,0.309391,0.085911,0.035379,4.938907,0.0,12.0,4140.0,63705000000000.0,6.0,3.0,52.0,-0.010677,0.400677,0.204727,0.04142,12.220764,0.0,15.0,4147.0,66408750000000.0,6.0,3.0,53.0,0.046125,0.495396,0.358109,0.051887,21.963189,0.0,19.178272,4152.0,68645000000000.0,6.0,3.0,56.0,0.138923,0.593706,0.552839,0.070719,35.773787,0.0,27.5,4158.0,71480000000000.0,7.0,3.0,80.0,0.380755,0.702779,0.863568,0.10543,62.185143,0.0,53.025919,4170.0,73980000000000.0,7.0,3.0,82.0,0.540839,0.812206,0.952578,0.180468,74.499702,0.0,97.554999,4175.0,76885000000000.0,7.0,3.0,83.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.25,4188.5,86110000000000.0,7.0,3.0,85.0,43330.0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,1,0,1,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0
4,001f3379,13,50.0,22.279952,59.5,112.2,,60.0,73.0,102.0,,,,12.0,0.0,16.5,2.0,17.9,2.0,6.0,0.0,10.0,1.0,11.0,1.0,8.0,0.0,2.0,4.33036,30.1865,1330.97,1996.45,30.2124,84.0285,16.6877,13.4988,67.9715,2.0,32.9141,20.902,79.6982,35.3804,63.1265,,4.11,3.0,3.0,3.0,0.0,2.0,1.0,0.0,2.0,2.0,1.0,0.0,1.0,3.0,3.0,2.0,1.0,3.0,1.0,2.0,1.0,34.0,40.0,56.0,0.0,1.0,-0.004272,0.016859,-0.631731,0.011926,-55.630768,0.655708,16.771982,3838.189453,43212120000000.0,3.909848,3.0,79.435593,0.351545,0.303812,0.623476,0.024331,50.303635,0.468723,95.327438,155.573868,24972640000000.0,1.946892,0.0,6.634319,-1.038711,-1.52269,-1.018787,0.0,-88.761833,3098.166748,0.0,1.0,3.0,68.0,-0.964537,-0.820831,-1.011376,0.0,-88.692085,0.035338,3343.0,860000000000.0,1.0,3.0,68.0,-0.739749,-0.485981,-1.010633,0.000174,-88.553625,0.0,0.204995,3630.0,4305000000000.0,1.0,3.0,69.0,-0.356717,-0.213008,-1.010164,0.001036,-88.48362,0.0,0.37858,3695.0,8615000000000.0,1.0,3.0,70.0,-0.053221,-0.046249,-1.009839,0.003185,-88.464142,0.0,0.464152,3709.333252,12925000000000.0,2.0,3.0,71.0,-0.052986,-0.045577,-1.009578,0.007479,-88.452377,0.0,0.5,3732.333252,17230000000000.0,2.0,3.0,73.0,-0.052803,-0.044517,-1.009344,0.008622,-88.386049,0.0,0.5,3747.0,21540000000000.0,2.0,3.0,74.0,-0.052581,-0.044065,-1.009109,0.008955,-88.308716,0.0,0.538311,3763.75,25850000000000.0,3.0,3.0,75.0,-0.044075,-0.037731,-1.008875,0.009198,-86.990927,0.655556,0.598203,3782.0,30160000000000.0,3.0,3.0,76.0,-0.043265,-0.034616,-1.008614,0.009423,-86.843826,1.0,0.658255,3788.0,34465000000000.0,3.0,3.0,77.0,-0.042494,-0.03132,-1.008276,0.009639,-86.74559,1.0,0.764178,3800.0,38945000000000.0,3.0,3.0,78.0,-0.020622,-0.028179,-1.007728,0.009831,-86.119919,1.0,0.879005,3812.0,43310000000000.0,4.0,3.0,79.0,-0.020152,0.015679,-1.007129,0.01,-86.118622,1.0,0.994175,3826.333252,47620000000000.0,4.0,3.0,81.0,-0.019904,0.016843,-1.006673,0.010157,-86.11805,1.0,1.585408,3847.0,51930000000000.0,4.0,3.0,82.0,-0.019682,0.017282,-1.006139,0.010315,-86.080246,1.0,2.484425,3876.0,56235000000000.0,5.0,3.0,83.0,-0.01942,0.017528,-0.728903,0.010482,-47.183479,1.0,4.0,3917.0,60545000000000.0,5.0,3.0,84.0,-0.019081,0.020307,-0.294459,0.010668,-17.483364,1.0,6.141348,3951.187561,64855000000000.0,6.0,3.0,85.0,-0.01814,0.022414,0.076976,0.010894,4.400664,1.0,9.18595,3982.0,69165000000000.0,6.0,3.0,86.0,0.123577,0.086863,0.264927,0.011239,15.523324,1.0,14.444445,4008.583252,73470000000000.0,6.0,3.0,87.0,0.474932,0.313599,0.466737,0.012207,28.323949,1.0,36.802221,4067.0,77780000000000.0,7.0,3.0,89.0,0.780661,0.773137,0.749808,0.026261,49.306727,1.0,74.0,4103.583496,82090000000000.0,7.0,3.0,90.0,1.034351,1.946303,1.146284,2.952888,89.476036,1.0,2597.800049,4175.0,86395000000000.0,7.0,3.0,91.0,396396.0,0,1,0,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0


In [21]:
print(test_one_hot.shape)
test_one_hot.head()

(20, 385)


Unnamed: 0,id,Basic_Demos-Age,CGAS-CGAS_Score,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Max_Stage,Fitness_Endurance-Time_Mins,Fitness_Endurance-Time_Sec,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_A-PAQ_A_Total,PAQ_C-PAQ_C_Total,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-computerinternet_hoursday,stat_0,stat_1,stat_2,stat_3,stat_4,stat_5,stat_6,stat_7,stat_8,stat_9,stat_10,stat_11,stat_12,stat_13,stat_14,stat_15,stat_16,stat_17,stat_18,stat_19,stat_20,stat_21,stat_22,stat_23,stat_24,stat_25,stat_26,stat_27,stat_28,stat_31,stat_32,stat_33,stat_34,stat_35,stat_36,stat_37,stat_38,stat_39,stat_40,stat_42,stat_43,stat_44,stat_45,stat_46,stat_47,stat_48,stat_49,stat_50,stat_51,stat_52,stat_53,stat_54,stat_55,stat_56,stat_57,stat_58,stat_59,stat_60,stat_61,stat_62,stat_63,stat_64,stat_65,stat_66,stat_67,stat_68,stat_69,stat_70,stat_71,stat_72,stat_73,stat_74,stat_75,stat_76,stat_77,stat_78,stat_79,stat_80,stat_81,stat_82,stat_83,stat_84,stat_85,stat_86,stat_87,stat_88,stat_89,stat_90,stat_91,stat_92,stat_93,stat_94,stat_95,stat_96,stat_97,stat_98,stat_99,stat_100,stat_101,stat_102,stat_103,stat_104,stat_105,stat_106,stat_107,stat_108,stat_109,stat_110,stat_111,stat_112,stat_113,stat_114,stat_115,stat_116,stat_117,stat_118,stat_119,stat_120,stat_121,stat_122,stat_123,stat_124,stat_125,stat_126,stat_127,stat_128,stat_129,stat_130,stat_131,stat_132,stat_133,stat_134,stat_135,stat_136,stat_137,stat_138,stat_139,stat_140,stat_141,stat_142,stat_143,stat_144,stat_145,stat_146,stat_147,stat_148,stat_149,stat_150,stat_151,stat_152,stat_153,stat_154,stat_155,stat_156,stat_157,stat_158,stat_159,stat_160,stat_161,stat_162,stat_163,stat_164,stat_165,stat_166,stat_167,stat_168,stat_169,stat_170,stat_171,stat_172,stat_173,stat_174,stat_175,stat_176,stat_177,stat_178,stat_179,stat_180,stat_181,stat_182,stat_183,stat_184,stat_185,stat_186,stat_187,stat_188,stat_189,stat_190,stat_191,stat_192,stat_193,stat_194,stat_195,stat_196,stat_197,stat_198,stat_199,stat_200,stat_201,stat_202,stat_203,stat_204,stat_205,stat_206,stat_207,stat_208,stat_209,stat_210,stat_211,stat_212,stat_213,stat_214,stat_215,stat_216,stat_217,stat_218,stat_219,stat_220,stat_221,stat_222,stat_223,stat_224,stat_225,stat_226,stat_227,stat_228,stat_229,stat_230,stat_231,stat_232,stat_233,stat_234,stat_235,stat_236,stat_237,stat_238,stat_239,stat_240,stat_241,stat_242,stat_243,stat_244,stat_245,stat_246,stat_247,stat_248,stat_249,stat_250,stat_251,stat_252,stat_253,stat_254,stat_255,stat_256,stat_257,stat_258,stat_259,stat_260,stat_261,stat_262,stat_263,stat_264,stat_265,stat_266,stat_267,stat_268,stat_269,stat_270,stat_271,stat_272,stat_273,stat_274,stat_275,stat_276,stat_277,stat_278,stat_279,stat_280,stat_281,stat_282,stat_283,stat_284,stat_285,stat_286,stat_287,stat_288,Basic_Demos-Sex_0,Basic_Demos-Sex_1,FGC-Season_Fall,FGC-Season_Missing,FGC-Season_Spring,FGC-Season_Summer,FGC-Season_Winter,PreInt_EduHx-Season_Fall,PreInt_EduHx-Season_Missing,PreInt_EduHx-Season_Spring,PreInt_EduHx-Season_Summer,PreInt_EduHx-Season_Winter,Fitness_Endurance-Season_Fall,Fitness_Endurance-Season_Missing,Fitness_Endurance-Season_Spring,Fitness_Endurance-Season_Summer,Fitness_Endurance-Season_Winter,PAQ_C-Season_Fall,PAQ_C-Season_Missing,PAQ_C-Season_Spring,PAQ_C-Season_Summer,PAQ_C-Season_Winter,CGAS-Season_Fall,CGAS-Season_Missing,CGAS-Season_Spring,CGAS-Season_Summer,CGAS-Season_Winter,SDS-Season_Fall,SDS-Season_Missing,SDS-Season_Spring,SDS-Season_Summer,SDS-Season_Winter,Basic_Demos-Enroll_Season_Fall,Basic_Demos-Enroll_Season_Spring,Basic_Demos-Enroll_Season_Summer,Basic_Demos-Enroll_Season_Winter,Physical-Season_Fall,Physical-Season_Missing,Physical-Season_Spring,Physical-Season_Summer,Physical-Season_Winter,BIA-Season_Fall,BIA-Season_Missing,BIA-Season_Spring,BIA-Season_Summer,BIA-Season_Winter,PAQ_A-Season_Fall,PAQ_A-Season_Missing,PAQ_A-Season_Spring,PAQ_A-Season_Summer,PAQ_A-Season_Winter
0,00008ff9,5,51.0,16.877316,46.0,50.8,,,,,,,,0.0,0.0,,,,,0.0,0.0,7.0,0.0,6.0,0.0,6.0,1.0,2.0,2.66855,16.8792,932.498,1492.0,8.25598,41.5862,13.8177,3.06143,9.21377,1.0,24.4349,8.89536,38.9177,19.5413,32.6909,,,,,3.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0
1,000fd460,9,,14.03559,48.0,46.0,22.0,75.0,70.0,122.0,,,,3.0,0.0,,,,,5.0,0.0,11.0,1.0,11.0,1.0,3.0,0.0,2.0,2.57949,14.0371,936.656,1498.65,6.01993,42.0291,12.8254,1.21172,3.97085,1.0,21.0352,14.974,39.4497,15.4107,27.0552,,2.34,46.0,64.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,1,0,1,0,0,0
2,00105258,10,71.0,16.648696,56.5,75.6,,65.0,94.0,117.0,5.0,7.0,33.0,20.0,1.0,10.2,1.0,14.7,2.0,7.0,1.0,10.0,1.0,10.0,1.0,5.0,0.0,,,,,,,,,,,,,,,,,,2.17,38.0,54.0,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,1,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0
3,00115b9f,9,71.0,18.292347,56.0,81.6,,60.0,97.0,117.0,6.0,9.0,37.0,18.0,1.0,,,,,5.0,0.0,7.0,0.0,7.0,0.0,7.0,1.0,3.0,3.84191,18.2943,1131.43,1923.44,15.5925,62.7757,14.074,4.22033,18.8243,2.0,30.4041,16.779,58.9338,26.4798,45.9966,,2.451,31.0,45.0,0.0,-0.316384,0.016009,-0.16789,0.047388,-10.580416,0.0,42.29631,4053.579102,50462150000000.0,4.470182,3.0,53.201683,0.453665,0.502702,0.58571,0.106351,42.94717,0.0,208.168976,112.404045,19428420000000.0,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,3824.0,55000000000.0,1.0,3.0,41.0,-0.957459,-0.977749,-1.010391,0.0,-87.332067,0.000752,3829.0,4861450000000.0,1.0,3.0,41.0,-0.914427,-0.877531,-0.957112,0.0,-72.609234,0.0,0.265511,3835.0,9944500000000.0,1.0,3.0,41.0,-0.871721,-0.730302,-0.89797,0.000332,-62.206067,0.0,0.666667,3838.0,24635000000000.0,1.0,3.0,41.0,-0.811414,-0.584147,-0.821275,0.001527,-55.807169,0.0,1.197513,3850.75,28650000000000.0,2.0,3.0,42.0,-0.745521,-0.430516,-0.736979,0.003707,-48.233392,0.0,1.673629,4000.0,33450000000000.0,2.0,3.0,42.0,-0.68418,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,36890000000000.0,3.0,3.0,42.0,-0.625026,-0.224424,-0.565164,0.009337,-35.302367,0.0,3.083734,4035.0,39525000000000.0,4.0,3.0,43.0,-0.567314,-0.136134,-0.489798,0.012539,-30.223173,0.0,3.996364,4041.0,41905000000000.0,4.0,3.0,44.0,-0.508016,-0.054089,-0.415141,0.016204,-25.410971,0.0,4.979007,4058.0,47205000000000.0,4.0,3.0,47.0,-0.437547,-0.01013,-0.330755,0.020108,-20.352911,0.0,5.972977,4064.0,49735000000000.0,5.0,3.0,47.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,53477500000000.0,5.0,3.0,50.0,-0.306484,0.068776,-0.164221,0.026687,-10.005749,0.0,7.581349,4093.0,57440000000000.0,5.0,3.0,51.0,-0.255599,0.12263,-0.079078,0.029139,-4.908399,0.0,8.729453,4099.0,59292000000000.0,5.0,3.0,51.0,-0.193461,0.20526,0.001529,0.031696,-0.057997,0.0,10.158665,4129.0,61180000000000.0,5.0,3.0,52.0,-0.108544,0.309391,0.085911,0.035379,4.938907,0.0,12.0,4140.0,63705000000000.0,6.0,3.0,52.0,-0.010677,0.400677,0.204727,0.04142,12.220764,0.0,15.0,4147.0,66408750000000.0,6.0,3.0,53.0,0.046125,0.495396,0.358109,0.051887,21.963189,0.0,19.178272,4152.0,68645000000000.0,6.0,3.0,56.0,0.138923,0.593706,0.552839,0.070719,35.773787,0.0,27.5,4158.0,71480000000000.0,7.0,3.0,80.0,0.380755,0.702779,0.863568,0.10543,62.185143,0.0,53.025919,4170.0,73980000000000.0,7.0,3.0,82.0,0.540839,0.812206,0.952578,0.180468,74.499702,0.0,97.554999,4175.0,76885000000000.0,7.0,3.0,83.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.25,4188.5,86110000000000.0,7.0,3.0,85.0,43330.0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,1,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0
4,0016bb22,18,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.04,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,1,0,1,0,0,0,0,1,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0


In [22]:
train_one_hot.drop('id', axis=1, inplace=True)
test_one_hot.drop('id', axis=1, inplace=True)

In [28]:
train = train_one_hot[test_one_hot.columns.tolist() + ['sii']].copy()
test = test_one_hot.copy()

In [29]:
print(train.shape)
train.head()

(2736, 385)


Unnamed: 0,Basic_Demos-Age,CGAS-CGAS_Score,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Max_Stage,Fitness_Endurance-Time_Mins,Fitness_Endurance-Time_Sec,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_A-PAQ_A_Total,PAQ_C-PAQ_C_Total,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-computerinternet_hoursday,stat_0,stat_1,stat_2,stat_3,stat_4,stat_5,stat_6,stat_7,stat_8,stat_9,stat_10,stat_11,stat_12,stat_13,stat_14,stat_15,stat_16,stat_17,stat_18,stat_19,stat_20,stat_21,stat_22,stat_23,stat_24,stat_25,stat_26,stat_27,stat_28,stat_31,stat_32,stat_33,stat_34,stat_35,stat_36,stat_37,stat_38,stat_39,stat_40,stat_42,stat_43,stat_44,stat_45,stat_46,stat_47,stat_48,stat_49,stat_50,stat_51,stat_52,stat_53,stat_54,stat_55,stat_56,stat_57,stat_58,stat_59,stat_60,stat_61,stat_62,stat_63,stat_64,stat_65,stat_66,stat_67,stat_68,stat_69,stat_70,stat_71,stat_72,stat_73,stat_74,stat_75,stat_76,stat_77,stat_78,stat_79,stat_80,stat_81,stat_82,stat_83,stat_84,stat_85,stat_86,stat_87,stat_88,stat_89,stat_90,stat_91,stat_92,stat_93,stat_94,stat_95,stat_96,stat_97,stat_98,stat_99,stat_100,stat_101,stat_102,stat_103,stat_104,stat_105,stat_106,stat_107,stat_108,stat_109,stat_110,stat_111,stat_112,stat_113,stat_114,stat_115,stat_116,stat_117,stat_118,stat_119,stat_120,stat_121,stat_122,stat_123,stat_124,stat_125,stat_126,stat_127,stat_128,stat_129,stat_130,stat_131,stat_132,stat_133,stat_134,stat_135,stat_136,stat_137,stat_138,stat_139,stat_140,stat_141,stat_142,stat_143,stat_144,stat_145,stat_146,stat_147,stat_148,stat_149,stat_150,stat_151,stat_152,stat_153,stat_154,stat_155,stat_156,stat_157,stat_158,stat_159,stat_160,stat_161,stat_162,stat_163,stat_164,stat_165,stat_166,stat_167,stat_168,stat_169,stat_170,stat_171,stat_172,stat_173,stat_174,stat_175,stat_176,stat_177,stat_178,stat_179,stat_180,stat_181,stat_182,stat_183,stat_184,stat_185,stat_186,stat_187,stat_188,stat_189,stat_190,stat_191,stat_192,stat_193,stat_194,stat_195,stat_196,stat_197,stat_198,stat_199,stat_200,stat_201,stat_202,stat_203,stat_204,stat_205,stat_206,stat_207,stat_208,stat_209,stat_210,stat_211,stat_212,stat_213,stat_214,stat_215,stat_216,stat_217,stat_218,stat_219,stat_220,stat_221,stat_222,stat_223,stat_224,stat_225,stat_226,stat_227,stat_228,stat_229,stat_230,stat_231,stat_232,stat_233,stat_234,stat_235,stat_236,stat_237,stat_238,stat_239,stat_240,stat_241,stat_242,stat_243,stat_244,stat_245,stat_246,stat_247,stat_248,stat_249,stat_250,stat_251,stat_252,stat_253,stat_254,stat_255,stat_256,stat_257,stat_258,stat_259,stat_260,stat_261,stat_262,stat_263,stat_264,stat_265,stat_266,stat_267,stat_268,stat_269,stat_270,stat_271,stat_272,stat_273,stat_274,stat_275,stat_276,stat_277,stat_278,stat_279,stat_280,stat_281,stat_282,stat_283,stat_284,stat_285,stat_286,stat_287,stat_288,Basic_Demos-Sex_0,Basic_Demos-Sex_1,FGC-Season_Fall,FGC-Season_Missing,FGC-Season_Spring,FGC-Season_Summer,FGC-Season_Winter,PreInt_EduHx-Season_Fall,PreInt_EduHx-Season_Missing,PreInt_EduHx-Season_Spring,PreInt_EduHx-Season_Summer,PreInt_EduHx-Season_Winter,Fitness_Endurance-Season_Fall,Fitness_Endurance-Season_Missing,Fitness_Endurance-Season_Spring,Fitness_Endurance-Season_Summer,Fitness_Endurance-Season_Winter,PAQ_C-Season_Fall,PAQ_C-Season_Missing,PAQ_C-Season_Spring,PAQ_C-Season_Summer,PAQ_C-Season_Winter,CGAS-Season_Fall,CGAS-Season_Missing,CGAS-Season_Spring,CGAS-Season_Summer,CGAS-Season_Winter,SDS-Season_Fall,SDS-Season_Missing,SDS-Season_Spring,SDS-Season_Summer,SDS-Season_Winter,Basic_Demos-Enroll_Season_Fall,Basic_Demos-Enroll_Season_Spring,Basic_Demos-Enroll_Season_Summer,Basic_Demos-Enroll_Season_Winter,Physical-Season_Fall,Physical-Season_Missing,Physical-Season_Spring,Physical-Season_Summer,Physical-Season_Winter,BIA-Season_Fall,BIA-Season_Missing,BIA-Season_Spring,BIA-Season_Summer,BIA-Season_Winter,PAQ_A-Season_Fall,PAQ_A-Season_Missing,PAQ_A-Season_Spring,PAQ_A-Season_Summer,PAQ_A-Season_Winter,sii
0,5,51.0,16.877316,46.0,50.8,,,,,,,,0.0,0.0,,,,,0.0,0.0,7.0,0.0,6.0,0.0,6.0,1.0,2.0,2.66855,16.8792,932.498,1492.0,8.25598,41.5862,13.8177,3.06143,9.21377,1.0,24.4349,8.89536,38.9177,19.5413,32.6909,,,,,3.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,2.0
1,9,,14.03559,48.0,46.0,22.0,75.0,70.0,122.0,,,,3.0,0.0,,,,,5.0,0.0,11.0,1.0,11.0,1.0,3.0,0.0,2.0,2.57949,14.0371,936.656,1498.65,6.01993,42.0291,12.8254,1.21172,3.97085,1.0,21.0352,14.974,39.4497,15.4107,27.0552,,2.34,46.0,64.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0.0
2,10,71.0,16.648696,56.5,75.6,,65.0,94.0,117.0,5.0,7.0,33.0,20.0,1.0,10.2,1.0,14.7,2.0,7.0,1.0,10.0,1.0,10.0,1.0,5.0,0.0,,,,,,,,,,,,,,,,,,2.17,38.0,54.0,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,1,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0.0
3,9,71.0,18.292347,56.0,81.6,,60.0,97.0,117.0,6.0,9.0,37.0,18.0,1.0,,,,,5.0,0.0,7.0,0.0,7.0,0.0,7.0,1.0,3.0,3.84191,18.2943,1131.43,1923.44,15.5925,62.7757,14.074,4.22033,18.8243,2.0,30.4041,16.779,58.9338,26.4798,45.9966,,2.451,31.0,45.0,0.0,-0.316384,0.016009,-0.16789,0.047388,-10.580416,0.0,42.29631,4053.579102,50462150000000.0,4.470182,3.0,53.201683,0.453665,0.502702,0.58571,0.106351,42.94717,0.0,208.168976,112.404045,19428420000000.0,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,3824.0,55000000000.0,1.0,3.0,41.0,-0.957459,-0.977749,-1.010391,0.0,-87.332067,0.000752,3829.0,4861450000000.0,1.0,3.0,41.0,-0.914427,-0.877531,-0.957112,0.0,-72.609234,0.0,0.265511,3835.0,9944500000000.0,1.0,3.0,41.0,-0.871721,-0.730302,-0.89797,0.000332,-62.206067,0.0,0.666667,3838.0,24635000000000.0,1.0,3.0,41.0,-0.811414,-0.584147,-0.821275,0.001527,-55.807169,0.0,1.197513,3850.75,28650000000000.0,2.0,3.0,42.0,-0.745521,-0.430516,-0.736979,0.003707,-48.233392,0.0,1.673629,4000.0,33450000000000.0,2.0,3.0,42.0,-0.68418,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,36890000000000.0,3.0,3.0,42.0,-0.625026,-0.224424,-0.565164,0.009337,-35.302367,0.0,3.083734,4035.0,39525000000000.0,4.0,3.0,43.0,-0.567314,-0.136134,-0.489798,0.012539,-30.223173,0.0,3.996364,4041.0,41905000000000.0,4.0,3.0,44.0,-0.508016,-0.054089,-0.415141,0.016204,-25.410971,0.0,4.979007,4058.0,47205000000000.0,4.0,3.0,47.0,-0.437547,-0.01013,-0.330755,0.020108,-20.352911,0.0,5.972977,4064.0,49735000000000.0,5.0,3.0,47.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,53477500000000.0,5.0,3.0,50.0,-0.306484,0.068776,-0.164221,0.026687,-10.005749,0.0,7.581349,4093.0,57440000000000.0,5.0,3.0,51.0,-0.255599,0.12263,-0.079078,0.029139,-4.908399,0.0,8.729453,4099.0,59292000000000.0,5.0,3.0,51.0,-0.193461,0.20526,0.001529,0.031696,-0.057997,0.0,10.158665,4129.0,61180000000000.0,5.0,3.0,52.0,-0.108544,0.309391,0.085911,0.035379,4.938907,0.0,12.0,4140.0,63705000000000.0,6.0,3.0,52.0,-0.010677,0.400677,0.204727,0.04142,12.220764,0.0,15.0,4147.0,66408750000000.0,6.0,3.0,53.0,0.046125,0.495396,0.358109,0.051887,21.963189,0.0,19.178272,4152.0,68645000000000.0,6.0,3.0,56.0,0.138923,0.593706,0.552839,0.070719,35.773787,0.0,27.5,4158.0,71480000000000.0,7.0,3.0,80.0,0.380755,0.702779,0.863568,0.10543,62.185143,0.0,53.025919,4170.0,73980000000000.0,7.0,3.0,82.0,0.540839,0.812206,0.952578,0.180468,74.499702,0.0,97.554999,4175.0,76885000000000.0,7.0,3.0,83.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.25,4188.5,86110000000000.0,7.0,3.0,85.0,43330.0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,1,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0,1.0
4,13,50.0,22.279952,59.5,112.2,,60.0,73.0,102.0,,,,12.0,0.0,16.5,2.0,17.9,2.0,6.0,0.0,10.0,1.0,11.0,1.0,8.0,0.0,2.0,4.33036,30.1865,1330.97,1996.45,30.2124,84.0285,16.6877,13.4988,67.9715,2.0,32.9141,20.902,79.6982,35.3804,63.1265,,4.11,40.0,56.0,0.0,-0.004272,0.016859,-0.631731,0.011926,-55.630768,0.655708,16.771982,3838.189453,43212120000000.0,3.909848,3.0,79.435593,0.351545,0.303812,0.623476,0.024331,50.303635,0.468723,95.327438,155.573868,24972640000000.0,1.946892,0.0,6.634319,-1.038711,-1.52269,-1.018787,0.0,-88.761833,3098.166748,0.0,1.0,3.0,68.0,-0.964537,-0.820831,-1.011376,0.0,-88.692085,0.035338,3343.0,860000000000.0,1.0,3.0,68.0,-0.739749,-0.485981,-1.010633,0.000174,-88.553625,0.0,0.204995,3630.0,4305000000000.0,1.0,3.0,69.0,-0.356717,-0.213008,-1.010164,0.001036,-88.48362,0.0,0.37858,3695.0,8615000000000.0,1.0,3.0,70.0,-0.053221,-0.046249,-1.009839,0.003185,-88.464142,0.0,0.464152,3709.333252,12925000000000.0,2.0,3.0,71.0,-0.052986,-0.045577,-1.009578,0.007479,-88.452377,0.0,0.5,3732.333252,17230000000000.0,2.0,3.0,73.0,-0.052803,-0.044517,-1.009344,0.008622,-88.386049,0.0,0.5,3747.0,21540000000000.0,2.0,3.0,74.0,-0.052581,-0.044065,-1.009109,0.008955,-88.308716,0.0,0.538311,3763.75,25850000000000.0,3.0,3.0,75.0,-0.044075,-0.037731,-1.008875,0.009198,-86.990927,0.655556,0.598203,3782.0,30160000000000.0,3.0,3.0,76.0,-0.043265,-0.034616,-1.008614,0.009423,-86.843826,1.0,0.658255,3788.0,34465000000000.0,3.0,3.0,77.0,-0.042494,-0.03132,-1.008276,0.009639,-86.74559,1.0,0.764178,3800.0,38945000000000.0,3.0,3.0,78.0,-0.020622,-0.028179,-1.007728,0.009831,-86.119919,1.0,0.879005,3812.0,43310000000000.0,4.0,3.0,79.0,-0.020152,0.015679,-1.007129,0.01,-86.118622,1.0,0.994175,3826.333252,47620000000000.0,4.0,3.0,81.0,-0.019904,0.016843,-1.006673,0.010157,-86.11805,1.0,1.585408,3847.0,51930000000000.0,4.0,3.0,82.0,-0.019682,0.017282,-1.006139,0.010315,-86.080246,1.0,2.484425,3876.0,56235000000000.0,5.0,3.0,83.0,-0.01942,0.017528,-0.728903,0.010482,-47.183479,1.0,4.0,3917.0,60545000000000.0,5.0,3.0,84.0,-0.019081,0.020307,-0.294459,0.010668,-17.483364,1.0,6.141348,3951.187561,64855000000000.0,6.0,3.0,85.0,-0.01814,0.022414,0.076976,0.010894,4.400664,1.0,9.18595,3982.0,69165000000000.0,6.0,3.0,86.0,0.123577,0.086863,0.264927,0.011239,15.523324,1.0,14.444445,4008.583252,73470000000000.0,6.0,3.0,87.0,0.474932,0.313599,0.466737,0.012207,28.323949,1.0,36.802221,4067.0,77780000000000.0,7.0,3.0,89.0,0.780661,0.773137,0.749808,0.026261,49.306727,1.0,74.0,4103.583496,82090000000000.0,7.0,3.0,90.0,1.034351,1.946303,1.146284,2.952888,89.476036,1.0,2597.800049,4175.0,86395000000000.0,7.0,3.0,91.0,396396.0,0,1,0,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0,1.0


In [30]:
print(test.shape)
test.head()

(20, 384)


Unnamed: 0,Basic_Demos-Age,CGAS-CGAS_Score,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Max_Stage,Fitness_Endurance-Time_Mins,Fitness_Endurance-Time_Sec,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_A-PAQ_A_Total,PAQ_C-PAQ_C_Total,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-computerinternet_hoursday,stat_0,stat_1,stat_2,stat_3,stat_4,stat_5,stat_6,stat_7,stat_8,stat_9,stat_10,stat_11,stat_12,stat_13,stat_14,stat_15,stat_16,stat_17,stat_18,stat_19,stat_20,stat_21,stat_22,stat_23,stat_24,stat_25,stat_26,stat_27,stat_28,stat_31,stat_32,stat_33,stat_34,stat_35,stat_36,stat_37,stat_38,stat_39,stat_40,stat_42,stat_43,stat_44,stat_45,stat_46,stat_47,stat_48,stat_49,stat_50,stat_51,stat_52,stat_53,stat_54,stat_55,stat_56,stat_57,stat_58,stat_59,stat_60,stat_61,stat_62,stat_63,stat_64,stat_65,stat_66,stat_67,stat_68,stat_69,stat_70,stat_71,stat_72,stat_73,stat_74,stat_75,stat_76,stat_77,stat_78,stat_79,stat_80,stat_81,stat_82,stat_83,stat_84,stat_85,stat_86,stat_87,stat_88,stat_89,stat_90,stat_91,stat_92,stat_93,stat_94,stat_95,stat_96,stat_97,stat_98,stat_99,stat_100,stat_101,stat_102,stat_103,stat_104,stat_105,stat_106,stat_107,stat_108,stat_109,stat_110,stat_111,stat_112,stat_113,stat_114,stat_115,stat_116,stat_117,stat_118,stat_119,stat_120,stat_121,stat_122,stat_123,stat_124,stat_125,stat_126,stat_127,stat_128,stat_129,stat_130,stat_131,stat_132,stat_133,stat_134,stat_135,stat_136,stat_137,stat_138,stat_139,stat_140,stat_141,stat_142,stat_143,stat_144,stat_145,stat_146,stat_147,stat_148,stat_149,stat_150,stat_151,stat_152,stat_153,stat_154,stat_155,stat_156,stat_157,stat_158,stat_159,stat_160,stat_161,stat_162,stat_163,stat_164,stat_165,stat_166,stat_167,stat_168,stat_169,stat_170,stat_171,stat_172,stat_173,stat_174,stat_175,stat_176,stat_177,stat_178,stat_179,stat_180,stat_181,stat_182,stat_183,stat_184,stat_185,stat_186,stat_187,stat_188,stat_189,stat_190,stat_191,stat_192,stat_193,stat_194,stat_195,stat_196,stat_197,stat_198,stat_199,stat_200,stat_201,stat_202,stat_203,stat_204,stat_205,stat_206,stat_207,stat_208,stat_209,stat_210,stat_211,stat_212,stat_213,stat_214,stat_215,stat_216,stat_217,stat_218,stat_219,stat_220,stat_221,stat_222,stat_223,stat_224,stat_225,stat_226,stat_227,stat_228,stat_229,stat_230,stat_231,stat_232,stat_233,stat_234,stat_235,stat_236,stat_237,stat_238,stat_239,stat_240,stat_241,stat_242,stat_243,stat_244,stat_245,stat_246,stat_247,stat_248,stat_249,stat_250,stat_251,stat_252,stat_253,stat_254,stat_255,stat_256,stat_257,stat_258,stat_259,stat_260,stat_261,stat_262,stat_263,stat_264,stat_265,stat_266,stat_267,stat_268,stat_269,stat_270,stat_271,stat_272,stat_273,stat_274,stat_275,stat_276,stat_277,stat_278,stat_279,stat_280,stat_281,stat_282,stat_283,stat_284,stat_285,stat_286,stat_287,stat_288,Basic_Demos-Sex_0,Basic_Demos-Sex_1,FGC-Season_Fall,FGC-Season_Missing,FGC-Season_Spring,FGC-Season_Summer,FGC-Season_Winter,PreInt_EduHx-Season_Fall,PreInt_EduHx-Season_Missing,PreInt_EduHx-Season_Spring,PreInt_EduHx-Season_Summer,PreInt_EduHx-Season_Winter,Fitness_Endurance-Season_Fall,Fitness_Endurance-Season_Missing,Fitness_Endurance-Season_Spring,Fitness_Endurance-Season_Summer,Fitness_Endurance-Season_Winter,PAQ_C-Season_Fall,PAQ_C-Season_Missing,PAQ_C-Season_Spring,PAQ_C-Season_Summer,PAQ_C-Season_Winter,CGAS-Season_Fall,CGAS-Season_Missing,CGAS-Season_Spring,CGAS-Season_Summer,CGAS-Season_Winter,SDS-Season_Fall,SDS-Season_Missing,SDS-Season_Spring,SDS-Season_Summer,SDS-Season_Winter,Basic_Demos-Enroll_Season_Fall,Basic_Demos-Enroll_Season_Spring,Basic_Demos-Enroll_Season_Summer,Basic_Demos-Enroll_Season_Winter,Physical-Season_Fall,Physical-Season_Missing,Physical-Season_Spring,Physical-Season_Summer,Physical-Season_Winter,BIA-Season_Fall,BIA-Season_Missing,BIA-Season_Spring,BIA-Season_Summer,BIA-Season_Winter,PAQ_A-Season_Fall,PAQ_A-Season_Missing,PAQ_A-Season_Spring,PAQ_A-Season_Summer,PAQ_A-Season_Winter
0,5,51.0,16.877316,46.0,50.8,,,,,,,,0.0,0.0,,,,,0.0,0.0,7.0,0.0,6.0,0.0,6.0,1.0,2.0,2.66855,16.8792,932.498,1492.0,8.25598,41.5862,13.8177,3.06143,9.21377,1.0,24.4349,8.89536,38.9177,19.5413,32.6909,,,,,3.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0
1,9,,14.03559,48.0,46.0,22.0,75.0,70.0,122.0,,,,3.0,0.0,,,,,5.0,0.0,11.0,1.0,11.0,1.0,3.0,0.0,2.0,2.57949,14.0371,936.656,1498.65,6.01993,42.0291,12.8254,1.21172,3.97085,1.0,21.0352,14.974,39.4497,15.4107,27.0552,,2.34,46.0,64.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,1,0,1,0,0,0
2,10,71.0,16.648696,56.5,75.6,,65.0,94.0,117.0,5.0,7.0,33.0,20.0,1.0,10.2,1.0,14.7,2.0,7.0,1.0,10.0,1.0,10.0,1.0,5.0,0.0,,,,,,,,,,,,,,,,,,2.17,38.0,54.0,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,1,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0
3,9,71.0,18.292347,56.0,81.6,,60.0,97.0,117.0,6.0,9.0,37.0,18.0,1.0,,,,,5.0,0.0,7.0,0.0,7.0,0.0,7.0,1.0,3.0,3.84191,18.2943,1131.43,1923.44,15.5925,62.7757,14.074,4.22033,18.8243,2.0,30.4041,16.779,58.9338,26.4798,45.9966,,2.451,31.0,45.0,0.0,-0.316384,0.016009,-0.16789,0.047388,-10.580416,0.0,42.29631,4053.579102,50462150000000.0,4.470182,3.0,53.201683,0.453665,0.502702,0.58571,0.106351,42.94717,0.0,208.168976,112.404045,19428420000000.0,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,3824.0,55000000000.0,1.0,3.0,41.0,-0.957459,-0.977749,-1.010391,0.0,-87.332067,0.000752,3829.0,4861450000000.0,1.0,3.0,41.0,-0.914427,-0.877531,-0.957112,0.0,-72.609234,0.0,0.265511,3835.0,9944500000000.0,1.0,3.0,41.0,-0.871721,-0.730302,-0.89797,0.000332,-62.206067,0.0,0.666667,3838.0,24635000000000.0,1.0,3.0,41.0,-0.811414,-0.584147,-0.821275,0.001527,-55.807169,0.0,1.197513,3850.75,28650000000000.0,2.0,3.0,42.0,-0.745521,-0.430516,-0.736979,0.003707,-48.233392,0.0,1.673629,4000.0,33450000000000.0,2.0,3.0,42.0,-0.68418,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,36890000000000.0,3.0,3.0,42.0,-0.625026,-0.224424,-0.565164,0.009337,-35.302367,0.0,3.083734,4035.0,39525000000000.0,4.0,3.0,43.0,-0.567314,-0.136134,-0.489798,0.012539,-30.223173,0.0,3.996364,4041.0,41905000000000.0,4.0,3.0,44.0,-0.508016,-0.054089,-0.415141,0.016204,-25.410971,0.0,4.979007,4058.0,47205000000000.0,4.0,3.0,47.0,-0.437547,-0.01013,-0.330755,0.020108,-20.352911,0.0,5.972977,4064.0,49735000000000.0,5.0,3.0,47.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,53477500000000.0,5.0,3.0,50.0,-0.306484,0.068776,-0.164221,0.026687,-10.005749,0.0,7.581349,4093.0,57440000000000.0,5.0,3.0,51.0,-0.255599,0.12263,-0.079078,0.029139,-4.908399,0.0,8.729453,4099.0,59292000000000.0,5.0,3.0,51.0,-0.193461,0.20526,0.001529,0.031696,-0.057997,0.0,10.158665,4129.0,61180000000000.0,5.0,3.0,52.0,-0.108544,0.309391,0.085911,0.035379,4.938907,0.0,12.0,4140.0,63705000000000.0,6.0,3.0,52.0,-0.010677,0.400677,0.204727,0.04142,12.220764,0.0,15.0,4147.0,66408750000000.0,6.0,3.0,53.0,0.046125,0.495396,0.358109,0.051887,21.963189,0.0,19.178272,4152.0,68645000000000.0,6.0,3.0,56.0,0.138923,0.593706,0.552839,0.070719,35.773787,0.0,27.5,4158.0,71480000000000.0,7.0,3.0,80.0,0.380755,0.702779,0.863568,0.10543,62.185143,0.0,53.025919,4170.0,73980000000000.0,7.0,3.0,82.0,0.540839,0.812206,0.952578,0.180468,74.499702,0.0,97.554999,4175.0,76885000000000.0,7.0,3.0,83.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.25,4188.5,86110000000000.0,7.0,3.0,85.0,43330.0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,1,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0
4,18,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.04,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,1,0,1,0,0,0,0,1,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0


In [32]:
concat_df = pd.concat([train[test.columns], test], ignore_index=True)
print(concat_df.shape)
concat_df.head()

(2756, 384)


Unnamed: 0,Basic_Demos-Age,CGAS-CGAS_Score,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Max_Stage,Fitness_Endurance-Time_Mins,Fitness_Endurance-Time_Sec,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_A-PAQ_A_Total,PAQ_C-PAQ_C_Total,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-computerinternet_hoursday,stat_0,stat_1,stat_2,stat_3,stat_4,stat_5,stat_6,stat_7,stat_8,stat_9,stat_10,stat_11,stat_12,stat_13,stat_14,stat_15,stat_16,stat_17,stat_18,stat_19,stat_20,stat_21,stat_22,stat_23,stat_24,stat_25,stat_26,stat_27,stat_28,stat_31,stat_32,stat_33,stat_34,stat_35,stat_36,stat_37,stat_38,stat_39,stat_40,stat_42,stat_43,stat_44,stat_45,stat_46,stat_47,stat_48,stat_49,stat_50,stat_51,stat_52,stat_53,stat_54,stat_55,stat_56,stat_57,stat_58,stat_59,stat_60,stat_61,stat_62,stat_63,stat_64,stat_65,stat_66,stat_67,stat_68,stat_69,stat_70,stat_71,stat_72,stat_73,stat_74,stat_75,stat_76,stat_77,stat_78,stat_79,stat_80,stat_81,stat_82,stat_83,stat_84,stat_85,stat_86,stat_87,stat_88,stat_89,stat_90,stat_91,stat_92,stat_93,stat_94,stat_95,stat_96,stat_97,stat_98,stat_99,stat_100,stat_101,stat_102,stat_103,stat_104,stat_105,stat_106,stat_107,stat_108,stat_109,stat_110,stat_111,stat_112,stat_113,stat_114,stat_115,stat_116,stat_117,stat_118,stat_119,stat_120,stat_121,stat_122,stat_123,stat_124,stat_125,stat_126,stat_127,stat_128,stat_129,stat_130,stat_131,stat_132,stat_133,stat_134,stat_135,stat_136,stat_137,stat_138,stat_139,stat_140,stat_141,stat_142,stat_143,stat_144,stat_145,stat_146,stat_147,stat_148,stat_149,stat_150,stat_151,stat_152,stat_153,stat_154,stat_155,stat_156,stat_157,stat_158,stat_159,stat_160,stat_161,stat_162,stat_163,stat_164,stat_165,stat_166,stat_167,stat_168,stat_169,stat_170,stat_171,stat_172,stat_173,stat_174,stat_175,stat_176,stat_177,stat_178,stat_179,stat_180,stat_181,stat_182,stat_183,stat_184,stat_185,stat_186,stat_187,stat_188,stat_189,stat_190,stat_191,stat_192,stat_193,stat_194,stat_195,stat_196,stat_197,stat_198,stat_199,stat_200,stat_201,stat_202,stat_203,stat_204,stat_205,stat_206,stat_207,stat_208,stat_209,stat_210,stat_211,stat_212,stat_213,stat_214,stat_215,stat_216,stat_217,stat_218,stat_219,stat_220,stat_221,stat_222,stat_223,stat_224,stat_225,stat_226,stat_227,stat_228,stat_229,stat_230,stat_231,stat_232,stat_233,stat_234,stat_235,stat_236,stat_237,stat_238,stat_239,stat_240,stat_241,stat_242,stat_243,stat_244,stat_245,stat_246,stat_247,stat_248,stat_249,stat_250,stat_251,stat_252,stat_253,stat_254,stat_255,stat_256,stat_257,stat_258,stat_259,stat_260,stat_261,stat_262,stat_263,stat_264,stat_265,stat_266,stat_267,stat_268,stat_269,stat_270,stat_271,stat_272,stat_273,stat_274,stat_275,stat_276,stat_277,stat_278,stat_279,stat_280,stat_281,stat_282,stat_283,stat_284,stat_285,stat_286,stat_287,stat_288,Basic_Demos-Sex_0,Basic_Demos-Sex_1,FGC-Season_Fall,FGC-Season_Missing,FGC-Season_Spring,FGC-Season_Summer,FGC-Season_Winter,PreInt_EduHx-Season_Fall,PreInt_EduHx-Season_Missing,PreInt_EduHx-Season_Spring,PreInt_EduHx-Season_Summer,PreInt_EduHx-Season_Winter,Fitness_Endurance-Season_Fall,Fitness_Endurance-Season_Missing,Fitness_Endurance-Season_Spring,Fitness_Endurance-Season_Summer,Fitness_Endurance-Season_Winter,PAQ_C-Season_Fall,PAQ_C-Season_Missing,PAQ_C-Season_Spring,PAQ_C-Season_Summer,PAQ_C-Season_Winter,CGAS-Season_Fall,CGAS-Season_Missing,CGAS-Season_Spring,CGAS-Season_Summer,CGAS-Season_Winter,SDS-Season_Fall,SDS-Season_Missing,SDS-Season_Spring,SDS-Season_Summer,SDS-Season_Winter,Basic_Demos-Enroll_Season_Fall,Basic_Demos-Enroll_Season_Spring,Basic_Demos-Enroll_Season_Summer,Basic_Demos-Enroll_Season_Winter,Physical-Season_Fall,Physical-Season_Missing,Physical-Season_Spring,Physical-Season_Summer,Physical-Season_Winter,BIA-Season_Fall,BIA-Season_Missing,BIA-Season_Spring,BIA-Season_Summer,BIA-Season_Winter,PAQ_A-Season_Fall,PAQ_A-Season_Missing,PAQ_A-Season_Spring,PAQ_A-Season_Summer,PAQ_A-Season_Winter
0,5,51.0,16.877316,46.0,50.8,,,,,,,,0.0,0.0,,,,,0.0,0.0,7.0,0.0,6.0,0.0,6.0,1.0,2.0,2.66855,16.8792,932.498,1492.0,8.25598,41.5862,13.8177,3.06143,9.21377,1.0,24.4349,8.89536,38.9177,19.5413,32.6909,,,,,3.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0
1,9,,14.03559,48.0,46.0,22.0,75.0,70.0,122.0,,,,3.0,0.0,,,,,5.0,0.0,11.0,1.0,11.0,1.0,3.0,0.0,2.0,2.57949,14.0371,936.656,1498.65,6.01993,42.0291,12.8254,1.21172,3.97085,1.0,21.0352,14.974,39.4497,15.4107,27.0552,,2.34,46.0,64.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,1,0,1,0,0,0
2,10,71.0,16.648696,56.5,75.6,,65.0,94.0,117.0,5.0,7.0,33.0,20.0,1.0,10.2,1.0,14.7,2.0,7.0,1.0,10.0,1.0,10.0,1.0,5.0,0.0,,,,,,,,,,,,,,,,,,2.17,38.0,54.0,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,1,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0
3,9,71.0,18.292347,56.0,81.6,,60.0,97.0,117.0,6.0,9.0,37.0,18.0,1.0,,,,,5.0,0.0,7.0,0.0,7.0,0.0,7.0,1.0,3.0,3.84191,18.2943,1131.43,1923.44,15.5925,62.7757,14.074,4.22033,18.8243,2.0,30.4041,16.779,58.9338,26.4798,45.9966,,2.451,31.0,45.0,0.0,-0.316384,0.016009,-0.16789,0.047388,-10.580416,0.0,42.29631,4053.579102,50462150000000.0,4.470182,3.0,53.201683,0.453665,0.502702,0.58571,0.106351,42.94717,0.0,208.168976,112.404045,19428420000000.0,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,3824.0,55000000000.0,1.0,3.0,41.0,-0.957459,-0.977749,-1.010391,0.0,-87.332067,0.000752,3829.0,4861450000000.0,1.0,3.0,41.0,-0.914427,-0.877531,-0.957112,0.0,-72.609234,0.0,0.265511,3835.0,9944500000000.0,1.0,3.0,41.0,-0.871721,-0.730302,-0.89797,0.000332,-62.206067,0.0,0.666667,3838.0,24635000000000.0,1.0,3.0,41.0,-0.811414,-0.584147,-0.821275,0.001527,-55.807169,0.0,1.197513,3850.75,28650000000000.0,2.0,3.0,42.0,-0.745521,-0.430516,-0.736979,0.003707,-48.233392,0.0,1.673629,4000.0,33450000000000.0,2.0,3.0,42.0,-0.68418,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,36890000000000.0,3.0,3.0,42.0,-0.625026,-0.224424,-0.565164,0.009337,-35.302367,0.0,3.083734,4035.0,39525000000000.0,4.0,3.0,43.0,-0.567314,-0.136134,-0.489798,0.012539,-30.223173,0.0,3.996364,4041.0,41905000000000.0,4.0,3.0,44.0,-0.508016,-0.054089,-0.415141,0.016204,-25.410971,0.0,4.979007,4058.0,47205000000000.0,4.0,3.0,47.0,-0.437547,-0.01013,-0.330755,0.020108,-20.352911,0.0,5.972977,4064.0,49735000000000.0,5.0,3.0,47.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,53477500000000.0,5.0,3.0,50.0,-0.306484,0.068776,-0.164221,0.026687,-10.005749,0.0,7.581349,4093.0,57440000000000.0,5.0,3.0,51.0,-0.255599,0.12263,-0.079078,0.029139,-4.908399,0.0,8.729453,4099.0,59292000000000.0,5.0,3.0,51.0,-0.193461,0.20526,0.001529,0.031696,-0.057997,0.0,10.158665,4129.0,61180000000000.0,5.0,3.0,52.0,-0.108544,0.309391,0.085911,0.035379,4.938907,0.0,12.0,4140.0,63705000000000.0,6.0,3.0,52.0,-0.010677,0.400677,0.204727,0.04142,12.220764,0.0,15.0,4147.0,66408750000000.0,6.0,3.0,53.0,0.046125,0.495396,0.358109,0.051887,21.963189,0.0,19.178272,4152.0,68645000000000.0,6.0,3.0,56.0,0.138923,0.593706,0.552839,0.070719,35.773787,0.0,27.5,4158.0,71480000000000.0,7.0,3.0,80.0,0.380755,0.702779,0.863568,0.10543,62.185143,0.0,53.025919,4170.0,73980000000000.0,7.0,3.0,82.0,0.540839,0.812206,0.952578,0.180468,74.499702,0.0,97.554999,4175.0,76885000000000.0,7.0,3.0,83.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.25,4188.5,86110000000000.0,7.0,3.0,85.0,43330.0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,1,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0
4,13,50.0,22.279952,59.5,112.2,,60.0,73.0,102.0,,,,12.0,0.0,16.5,2.0,17.9,2.0,6.0,0.0,10.0,1.0,11.0,1.0,8.0,0.0,2.0,4.33036,30.1865,1330.97,1996.45,30.2124,84.0285,16.6877,13.4988,67.9715,2.0,32.9141,20.902,79.6982,35.3804,63.1265,,4.11,40.0,56.0,0.0,-0.004272,0.016859,-0.631731,0.011926,-55.630768,0.655708,16.771982,3838.189453,43212120000000.0,3.909848,3.0,79.435593,0.351545,0.303812,0.623476,0.024331,50.303635,0.468723,95.327438,155.573868,24972640000000.0,1.946892,0.0,6.634319,-1.038711,-1.52269,-1.018787,0.0,-88.761833,3098.166748,0.0,1.0,3.0,68.0,-0.964537,-0.820831,-1.011376,0.0,-88.692085,0.035338,3343.0,860000000000.0,1.0,3.0,68.0,-0.739749,-0.485981,-1.010633,0.000174,-88.553625,0.0,0.204995,3630.0,4305000000000.0,1.0,3.0,69.0,-0.356717,-0.213008,-1.010164,0.001036,-88.48362,0.0,0.37858,3695.0,8615000000000.0,1.0,3.0,70.0,-0.053221,-0.046249,-1.009839,0.003185,-88.464142,0.0,0.464152,3709.333252,12925000000000.0,2.0,3.0,71.0,-0.052986,-0.045577,-1.009578,0.007479,-88.452377,0.0,0.5,3732.333252,17230000000000.0,2.0,3.0,73.0,-0.052803,-0.044517,-1.009344,0.008622,-88.386049,0.0,0.5,3747.0,21540000000000.0,2.0,3.0,74.0,-0.052581,-0.044065,-1.009109,0.008955,-88.308716,0.0,0.538311,3763.75,25850000000000.0,3.0,3.0,75.0,-0.044075,-0.037731,-1.008875,0.009198,-86.990927,0.655556,0.598203,3782.0,30160000000000.0,3.0,3.0,76.0,-0.043265,-0.034616,-1.008614,0.009423,-86.843826,1.0,0.658255,3788.0,34465000000000.0,3.0,3.0,77.0,-0.042494,-0.03132,-1.008276,0.009639,-86.74559,1.0,0.764178,3800.0,38945000000000.0,3.0,3.0,78.0,-0.020622,-0.028179,-1.007728,0.009831,-86.119919,1.0,0.879005,3812.0,43310000000000.0,4.0,3.0,79.0,-0.020152,0.015679,-1.007129,0.01,-86.118622,1.0,0.994175,3826.333252,47620000000000.0,4.0,3.0,81.0,-0.019904,0.016843,-1.006673,0.010157,-86.11805,1.0,1.585408,3847.0,51930000000000.0,4.0,3.0,82.0,-0.019682,0.017282,-1.006139,0.010315,-86.080246,1.0,2.484425,3876.0,56235000000000.0,5.0,3.0,83.0,-0.01942,0.017528,-0.728903,0.010482,-47.183479,1.0,4.0,3917.0,60545000000000.0,5.0,3.0,84.0,-0.019081,0.020307,-0.294459,0.010668,-17.483364,1.0,6.141348,3951.187561,64855000000000.0,6.0,3.0,85.0,-0.01814,0.022414,0.076976,0.010894,4.400664,1.0,9.18595,3982.0,69165000000000.0,6.0,3.0,86.0,0.123577,0.086863,0.264927,0.011239,15.523324,1.0,14.444445,4008.583252,73470000000000.0,6.0,3.0,87.0,0.474932,0.313599,0.466737,0.012207,28.323949,1.0,36.802221,4067.0,77780000000000.0,7.0,3.0,89.0,0.780661,0.773137,0.749808,0.026261,49.306727,1.0,74.0,4103.583496,82090000000000.0,7.0,3.0,90.0,1.034351,1.946303,1.146284,2.952888,89.476036,1.0,2597.800049,4175.0,86395000000000.0,7.0,3.0,91.0,396396.0,0,1,0,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0


In [33]:
imputer = KNNImputer(n_neighbors=5)
imputed_data_concat = imputer.fit_transform(concat_df)

In [34]:
concat_imputed = pd.DataFrame(imputed_data_concat, columns=concat_df.columns)
print(concat_imputed.shape)
concat_imputed.head()

(2756, 384)


Unnamed: 0,Basic_Demos-Age,CGAS-CGAS_Score,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Max_Stage,Fitness_Endurance-Time_Mins,Fitness_Endurance-Time_Sec,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_A-PAQ_A_Total,PAQ_C-PAQ_C_Total,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-computerinternet_hoursday,stat_0,stat_1,stat_2,stat_3,stat_4,stat_5,stat_6,stat_7,stat_8,stat_9,stat_10,stat_11,stat_12,stat_13,stat_14,stat_15,stat_16,stat_17,stat_18,stat_19,stat_20,stat_21,stat_22,stat_23,stat_24,stat_25,stat_26,stat_27,stat_28,stat_31,stat_32,stat_33,stat_34,stat_35,stat_36,stat_37,stat_38,stat_39,stat_40,stat_42,stat_43,stat_44,stat_45,stat_46,stat_47,stat_48,stat_49,stat_50,stat_51,stat_52,stat_53,stat_54,stat_55,stat_56,stat_57,stat_58,stat_59,stat_60,stat_61,stat_62,stat_63,stat_64,stat_65,stat_66,stat_67,stat_68,stat_69,stat_70,stat_71,stat_72,stat_73,stat_74,stat_75,stat_76,stat_77,stat_78,stat_79,stat_80,stat_81,stat_82,stat_83,stat_84,stat_85,stat_86,stat_87,stat_88,stat_89,stat_90,stat_91,stat_92,stat_93,stat_94,stat_95,stat_96,stat_97,stat_98,stat_99,stat_100,stat_101,stat_102,stat_103,stat_104,stat_105,stat_106,stat_107,stat_108,stat_109,stat_110,stat_111,stat_112,stat_113,stat_114,stat_115,stat_116,stat_117,stat_118,stat_119,stat_120,stat_121,stat_122,stat_123,stat_124,stat_125,stat_126,stat_127,stat_128,stat_129,stat_130,stat_131,stat_132,stat_133,stat_134,stat_135,stat_136,stat_137,stat_138,stat_139,stat_140,stat_141,stat_142,stat_143,stat_144,stat_145,stat_146,stat_147,stat_148,stat_149,stat_150,stat_151,stat_152,stat_153,stat_154,stat_155,stat_156,stat_157,stat_158,stat_159,stat_160,stat_161,stat_162,stat_163,stat_164,stat_165,stat_166,stat_167,stat_168,stat_169,stat_170,stat_171,stat_172,stat_173,stat_174,stat_175,stat_176,stat_177,stat_178,stat_179,stat_180,stat_181,stat_182,stat_183,stat_184,stat_185,stat_186,stat_187,stat_188,stat_189,stat_190,stat_191,stat_192,stat_193,stat_194,stat_195,stat_196,stat_197,stat_198,stat_199,stat_200,stat_201,stat_202,stat_203,stat_204,stat_205,stat_206,stat_207,stat_208,stat_209,stat_210,stat_211,stat_212,stat_213,stat_214,stat_215,stat_216,stat_217,stat_218,stat_219,stat_220,stat_221,stat_222,stat_223,stat_224,stat_225,stat_226,stat_227,stat_228,stat_229,stat_230,stat_231,stat_232,stat_233,stat_234,stat_235,stat_236,stat_237,stat_238,stat_239,stat_240,stat_241,stat_242,stat_243,stat_244,stat_245,stat_246,stat_247,stat_248,stat_249,stat_250,stat_251,stat_252,stat_253,stat_254,stat_255,stat_256,stat_257,stat_258,stat_259,stat_260,stat_261,stat_262,stat_263,stat_264,stat_265,stat_266,stat_267,stat_268,stat_269,stat_270,stat_271,stat_272,stat_273,stat_274,stat_275,stat_276,stat_277,stat_278,stat_279,stat_280,stat_281,stat_282,stat_283,stat_284,stat_285,stat_286,stat_287,stat_288,Basic_Demos-Sex_0,Basic_Demos-Sex_1,FGC-Season_Fall,FGC-Season_Missing,FGC-Season_Spring,FGC-Season_Summer,FGC-Season_Winter,PreInt_EduHx-Season_Fall,PreInt_EduHx-Season_Missing,PreInt_EduHx-Season_Spring,PreInt_EduHx-Season_Summer,PreInt_EduHx-Season_Winter,Fitness_Endurance-Season_Fall,Fitness_Endurance-Season_Missing,Fitness_Endurance-Season_Spring,Fitness_Endurance-Season_Summer,Fitness_Endurance-Season_Winter,PAQ_C-Season_Fall,PAQ_C-Season_Missing,PAQ_C-Season_Spring,PAQ_C-Season_Summer,PAQ_C-Season_Winter,CGAS-Season_Fall,CGAS-Season_Missing,CGAS-Season_Spring,CGAS-Season_Summer,CGAS-Season_Winter,SDS-Season_Fall,SDS-Season_Missing,SDS-Season_Spring,SDS-Season_Summer,SDS-Season_Winter,Basic_Demos-Enroll_Season_Fall,Basic_Demos-Enroll_Season_Spring,Basic_Demos-Enroll_Season_Summer,Basic_Demos-Enroll_Season_Winter,Physical-Season_Fall,Physical-Season_Missing,Physical-Season_Spring,Physical-Season_Summer,Physical-Season_Winter,BIA-Season_Fall,BIA-Season_Missing,BIA-Season_Spring,BIA-Season_Summer,BIA-Season_Winter,PAQ_A-Season_Fall,PAQ_A-Season_Missing,PAQ_A-Season_Spring,PAQ_A-Season_Summer,PAQ_A-Season_Winter
0,5.0,51.0,16.877316,46.0,50.8,23.8,69.4,75.4,121.0,5.6,9.6,26.0,0.0,0.0,22.64,1.8,24.44,1.8,0.0,0.0,7.0,0.0,6.0,0.0,6.0,1.0,2.0,2.66855,16.8792,932.498,1492.0,8.25598,41.5862,13.8177,3.06143,9.21377,1.0,24.4349,8.89536,38.9177,19.5413,32.6909,2.278,2.102,42.8,59.4,3.0,-0.050129,0.029588,-0.206737,0.038424,-17.399168,0.238233,27.291713,3855.223926,45043690000000.0,3.997108,3.569615,45.998817,0.477017,0.466331,0.586012,0.086501,43.175587,0.223842,103.751411,154.595015,23633470000000.0,1.95693,0.237036,6.944873,-2.397506,-2.112106,-1.039736,0.0,-89.647122,3227.933398,0.0,1.0,2.8,34.0,-0.836975,-0.800994,-0.997689,0.0,-86.339397,0.057461,3426.56665,1417560000000.0,1.0,2.8,34.0,-0.753551,-0.713712,-0.972604,5.8e-05,-80.318761,0.0,0.419439,3654.092507,8235800000000.0,1.0,3.4,35.0,-0.673302,-0.576927,-0.914451,0.000474,-72.105459,0.152222,0.807541,3702.23335,12678000000000.0,1.0,3.6,36.4,-0.593182,-0.450102,-0.848669,0.001811,-62.546078,0.2,1.196603,3719.56665,16852000000000.0,2.0,3.6,37.8,-0.520156,-0.352213,-0.76084,0.002881,-54.043238,0.2,1.563097,3738.0,20928000000000.0,2.0,3.6,38.8,-0.446886,-0.266528,-0.676277,0.005337,-47.080318,0.2,1.98483,3753.26665,24975750000000.0,2.0,3.6,39.8,-0.366389,-0.191957,-0.591534,0.007301,-41.006545,0.2,2.457695,3768.81332,29052300000000.0,2.8,3.6,41.0,-0.283002,-0.128187,-0.512197,0.009235,-35.648544,0.2,2.932935,3785.11665,33086000000000.0,3.0,3.6,42.2,-0.194104,-0.082569,-0.428647,0.011055,-30.459268,0.2,3.547034,3795.23335,37106000000000.0,3.2,3.6,43.8,-0.131388,-0.044469,-0.354436,0.013412,-26.064324,0.2,4.29023,3808.73335,41130000000000.0,3.8,3.6,45.0,-0.060509,0.005285,-0.281874,0.015773,-21.687689,0.2,5.300826,3824.76665,45189500000000.0,4.0,3.6,46.2,0.004791,0.035676,-0.214595,0.018426,-17.669151,0.2,6.450201,3843.284182,49253000000000.0,4.2,3.6,47.2,0.075556,0.071614,-0.148477,0.021433,-13.790557,0.2,7.697894,3868.2,53380000000000.0,4.8,3.6,48.4,0.147169,0.120334,-0.080608,0.025352,-9.663771,0.2,9.343181,3903.4,57503000000000.0,5.0,3.6,49.4,0.219734,0.170381,-0.0157,0.030284,-5.679081,0.2,11.592779,3938.6,61466000000000.0,5.2,3.6,50.8,0.296357,0.248337,0.228783,0.036766,13.6608,0.2,14.678781,3971.56665,65393000000000.0,6.0,3.6,52.0,0.375199,0.468795,0.399016,0.047083,23.986967,0.2,18.881771,4001.16665,69364800000000.0,6.0,3.6,53.2,0.495969,0.613324,0.506861,0.06328,31.218283,0.336667,26.34899,4041.13335,73348000000000.0,6.2,3.6,54.2,0.617842,0.732392,0.636341,0.089568,40.845753,0.4,41.483574,4079.848335,77400000000000.0,6.8,3.6,55.2,0.752401,0.85522,0.874114,0.144041,61.230838,0.718889,98.108536,4121.0,81443000000000.0,7.0,3.8,56.6,1.664505,2.081283,1.832219,3.46171,88.844673,0.8,2120.7,4173.4,86395000000000.0,7.0,3.8,60.0,370156.2,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0
1,9.0,70.8,14.03559,48.0,46.0,22.0,75.0,70.0,122.0,5.6,9.6,26.0,3.0,0.0,22.64,1.8,23.04,1.6,5.0,0.0,11.0,1.0,11.0,1.0,3.0,0.0,2.0,2.57949,14.0371,936.656,1498.65,6.01993,42.0291,12.8254,1.21172,3.97085,1.0,21.0352,14.974,39.4497,15.4107,27.0552,2.278,2.34,46.0,64.0,0.0,-0.050129,0.029588,-0.206737,0.038424,-17.399168,0.238233,27.291713,3855.223926,45043690000000.0,3.997108,3.569615,45.998817,0.477017,0.466331,0.586012,0.086501,43.175587,0.223842,103.751411,154.595015,23633470000000.0,1.95693,0.237036,6.944873,-2.397506,-2.112106,-1.039736,0.0,-89.647122,3227.933398,0.0,1.0,2.8,34.0,-0.836975,-0.800994,-0.997689,0.0,-86.339397,0.057461,3426.56665,1417560000000.0,1.0,2.8,34.0,-0.753551,-0.713712,-0.972604,5.8e-05,-80.318761,0.0,0.419439,3654.092507,8235800000000.0,1.0,3.4,35.0,-0.673302,-0.576927,-0.914451,0.000474,-72.105459,0.152222,0.807541,3702.23335,12678000000000.0,1.0,3.6,36.4,-0.593182,-0.450102,-0.848669,0.001811,-62.546078,0.2,1.196603,3719.56665,16852000000000.0,2.0,3.6,37.8,-0.520156,-0.352213,-0.76084,0.002881,-54.043238,0.2,1.563097,3738.0,20928000000000.0,2.0,3.6,38.8,-0.446886,-0.266528,-0.676277,0.005337,-47.080318,0.2,1.98483,3753.26665,24975750000000.0,2.0,3.6,39.8,-0.366389,-0.191957,-0.591534,0.007301,-41.006545,0.2,2.457695,3768.81332,29052300000000.0,2.8,3.6,41.0,-0.283002,-0.128187,-0.512197,0.009235,-35.648544,0.2,2.932935,3785.11665,33086000000000.0,3.0,3.6,42.2,-0.194104,-0.082569,-0.428647,0.011055,-30.459268,0.2,3.547034,3795.23335,37106000000000.0,3.2,3.6,43.8,-0.131388,-0.044469,-0.354436,0.013412,-26.064324,0.2,4.29023,3808.73335,41130000000000.0,3.8,3.6,45.0,-0.060509,0.005285,-0.281874,0.015773,-21.687689,0.2,5.300826,3824.76665,45189500000000.0,4.0,3.6,46.2,0.004791,0.035676,-0.214595,0.018426,-17.669151,0.2,6.450201,3843.284182,49253000000000.0,4.2,3.6,47.2,0.075556,0.071614,-0.148477,0.021433,-13.790557,0.2,7.697894,3868.2,53380000000000.0,4.8,3.6,48.4,0.147169,0.120334,-0.080608,0.025352,-9.663771,0.2,9.343181,3903.4,57503000000000.0,5.0,3.6,49.4,0.219734,0.170381,-0.0157,0.030284,-5.679081,0.2,11.592779,3938.6,61466000000000.0,5.2,3.6,50.8,0.296357,0.248337,0.228783,0.036766,13.6608,0.2,14.678781,3971.56665,65393000000000.0,6.0,3.6,52.0,0.375199,0.468795,0.399016,0.047083,23.986967,0.2,18.881771,4001.16665,69364800000000.0,6.0,3.6,53.2,0.495969,0.613324,0.506861,0.06328,31.218283,0.336667,26.34899,4041.13335,73348000000000.0,6.2,3.6,54.2,0.617842,0.732392,0.636341,0.089568,40.845753,0.4,41.483574,4079.848335,77400000000000.0,6.8,3.6,55.2,0.752401,0.85522,0.874114,0.144041,61.230838,0.718889,98.108536,4121.0,81443000000000.0,7.0,3.8,56.6,1.664505,2.081283,1.832219,3.46171,88.844673,0.8,2120.7,4173.4,86395000000000.0,7.0,3.8,60.0,370156.2,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0
2,10.0,71.0,16.648696,56.5,75.6,28.4,65.0,94.0,117.0,5.0,7.0,33.0,20.0,1.0,10.2,1.0,14.7,2.0,7.0,1.0,10.0,1.0,10.0,1.0,5.0,0.0,3.0,4.208454,21.02796,1227.9032,2073.394,22.647808,73.05094,15.31976,5.708204,26.268974,1.6,32.51706,17.886178,68.84256,34.81636,55.16486,2.1442,2.17,38.0,54.0,2.0,-0.050129,0.029588,-0.206737,0.038424,-17.399168,0.238233,27.291713,3855.223926,45043690000000.0,3.997108,3.569615,45.998817,0.477017,0.466331,0.586012,0.086501,43.175587,0.223842,103.751411,154.595015,23633470000000.0,1.95693,0.237036,6.944873,-2.397506,-2.112106,-1.039736,0.0,-89.647122,3227.933398,0.0,1.0,2.8,34.0,-0.836975,-0.800994,-0.997689,0.0,-86.339397,0.057461,3426.56665,1417560000000.0,1.0,2.8,34.0,-0.753551,-0.713712,-0.972604,5.8e-05,-80.318761,0.0,0.419439,3654.092507,8235800000000.0,1.0,3.4,35.0,-0.673302,-0.576927,-0.914451,0.000474,-72.105459,0.152222,0.807541,3702.23335,12678000000000.0,1.0,3.6,36.4,-0.593182,-0.450102,-0.848669,0.001811,-62.546078,0.2,1.196603,3719.56665,16852000000000.0,2.0,3.6,37.8,-0.520156,-0.352213,-0.76084,0.002881,-54.043238,0.2,1.563097,3738.0,20928000000000.0,2.0,3.6,38.8,-0.446886,-0.266528,-0.676277,0.005337,-47.080318,0.2,1.98483,3753.26665,24975750000000.0,2.0,3.6,39.8,-0.366389,-0.191957,-0.591534,0.007301,-41.006545,0.2,2.457695,3768.81332,29052300000000.0,2.8,3.6,41.0,-0.283002,-0.128187,-0.512197,0.009235,-35.648544,0.2,2.932935,3785.11665,33086000000000.0,3.0,3.6,42.2,-0.194104,-0.082569,-0.428647,0.011055,-30.459268,0.2,3.547034,3795.23335,37106000000000.0,3.2,3.6,43.8,-0.131388,-0.044469,-0.354436,0.013412,-26.064324,0.2,4.29023,3808.73335,41130000000000.0,3.8,3.6,45.0,-0.060509,0.005285,-0.281874,0.015773,-21.687689,0.2,5.300826,3824.76665,45189500000000.0,4.0,3.6,46.2,0.004791,0.035676,-0.214595,0.018426,-17.669151,0.2,6.450201,3843.284182,49253000000000.0,4.2,3.6,47.2,0.075556,0.071614,-0.148477,0.021433,-13.790557,0.2,7.697894,3868.2,53380000000000.0,4.8,3.6,48.4,0.147169,0.120334,-0.080608,0.025352,-9.663771,0.2,9.343181,3903.4,57503000000000.0,5.0,3.6,49.4,0.219734,0.170381,-0.0157,0.030284,-5.679081,0.2,11.592779,3938.6,61466000000000.0,5.2,3.6,50.8,0.296357,0.248337,0.228783,0.036766,13.6608,0.2,14.678781,3971.56665,65393000000000.0,6.0,3.6,52.0,0.375199,0.468795,0.399016,0.047083,23.986967,0.2,18.881771,4001.16665,69364800000000.0,6.0,3.6,53.2,0.495969,0.613324,0.506861,0.06328,31.218283,0.336667,26.34899,4041.13335,73348000000000.0,6.2,3.6,54.2,0.617842,0.732392,0.636341,0.089568,40.845753,0.4,41.483574,4079.848335,77400000000000.0,6.8,3.6,55.2,0.752401,0.85522,0.874114,0.144041,61.230838,0.718889,98.108536,4121.0,81443000000000.0,7.0,3.8,56.6,1.664505,2.081283,1.832219,3.46171,88.844673,0.8,2120.7,4173.4,86395000000000.0,7.0,3.8,60.0,370156.2,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0
3,9.0,71.0,18.292347,56.0,81.6,26.4,60.0,97.0,117.0,6.0,9.0,37.0,18.0,1.0,18.34,1.8,21.06,2.0,5.0,0.0,7.0,0.0,7.0,0.0,7.0,1.0,3.0,3.84191,18.2943,1131.43,1923.44,15.5925,62.7757,14.074,4.22033,18.8243,2.0,30.4041,16.779,58.9338,26.4798,45.9966,2.12,2.451,31.0,45.0,0.0,-0.316384,0.016009,-0.16789,0.047388,-10.580416,0.0,42.29631,4053.579102,50462150000000.0,4.470182,3.0,53.201683,0.453665,0.502702,0.58571,0.106351,42.94717,0.0,208.168976,112.404045,19428420000000.0,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,3824.0,55000000000.0,1.0,3.0,41.0,-0.957459,-0.977749,-1.010391,0.0,-87.332067,0.000752,3829.0,4861450000000.0,1.0,3.0,41.0,-0.914427,-0.877531,-0.957112,0.0,-72.609234,0.0,0.265511,3835.0,9944500000000.0,1.0,3.0,41.0,-0.871721,-0.730302,-0.89797,0.000332,-62.206067,0.0,0.666667,3838.0,24635000000000.0,1.0,3.0,41.0,-0.811414,-0.584147,-0.821275,0.001527,-55.807169,0.0,1.197513,3850.75,28650000000000.0,2.0,3.0,42.0,-0.745521,-0.430516,-0.736979,0.003707,-48.233392,0.0,1.673629,4000.0,33450000000000.0,2.0,3.0,42.0,-0.68418,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,36890000000000.0,3.0,3.0,42.0,-0.625026,-0.224424,-0.565164,0.009337,-35.302367,0.0,3.083734,4035.0,39525000000000.0,4.0,3.0,43.0,-0.567314,-0.136134,-0.489798,0.012539,-30.223173,0.0,3.996364,4041.0,41905000000000.0,4.0,3.0,44.0,-0.508016,-0.054089,-0.415141,0.016204,-25.410971,0.0,4.979007,4058.0,47205000000000.0,4.0,3.0,47.0,-0.437547,-0.01013,-0.330755,0.020108,-20.352911,0.0,5.972977,4064.0,49735000000000.0,5.0,3.0,47.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,53477500000000.0,5.0,3.0,50.0,-0.306484,0.068776,-0.164221,0.026687,-10.005749,0.0,7.581349,4093.0,57440000000000.0,5.0,3.0,51.0,-0.255599,0.12263,-0.079078,0.029139,-4.908399,0.0,8.729453,4099.0,59292000000000.0,5.0,3.0,51.0,-0.193461,0.20526,0.001529,0.031696,-0.057997,0.0,10.158665,4129.0,61180000000000.0,5.0,3.0,52.0,-0.108544,0.309391,0.085911,0.035379,4.938907,0.0,12.0,4140.0,63705000000000.0,6.0,3.0,52.0,-0.010677,0.400677,0.204727,0.04142,12.220764,0.0,15.0,4147.0,66408750000000.0,6.0,3.0,53.0,0.046125,0.495396,0.358109,0.051887,21.963189,0.0,19.178272,4152.0,68645000000000.0,6.0,3.0,56.0,0.138923,0.593706,0.552839,0.070719,35.773787,0.0,27.5,4158.0,71480000000000.0,7.0,3.0,80.0,0.380755,0.702779,0.863568,0.10543,62.185143,0.0,53.025919,4170.0,73980000000000.0,7.0,3.0,82.0,0.540839,0.812206,0.952578,0.180468,74.499702,0.0,97.554999,4175.0,76885000000000.0,7.0,3.0,83.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.25,4188.5,86110000000000.0,7.0,3.0,85.0,43330.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0
4,13.0,50.0,22.279952,59.5,112.2,26.4,60.0,73.0,102.0,4.8,8.6,39.0,12.0,0.0,16.5,2.0,17.9,2.0,6.0,0.0,10.0,1.0,11.0,1.0,8.0,0.0,2.0,4.33036,30.1865,1330.97,1996.45,30.2124,84.0285,16.6877,13.4988,67.9715,2.0,32.9141,20.902,79.6982,35.3804,63.1265,2.12,4.11,40.0,56.0,0.0,-0.004272,0.016859,-0.631731,0.011926,-55.630768,0.655708,16.771982,3838.189453,43212120000000.0,3.909848,3.0,79.435593,0.351545,0.303812,0.623476,0.024331,50.303635,0.468723,95.327438,155.573868,24972640000000.0,1.946892,0.0,6.634319,-1.038711,-1.52269,-1.018787,0.0,-88.761833,3098.166748,0.0,1.0,3.0,68.0,-0.964537,-0.820831,-1.011376,0.0,-88.692085,0.035338,3343.0,860000000000.0,1.0,3.0,68.0,-0.739749,-0.485981,-1.010633,0.000174,-88.553625,0.0,0.204995,3630.0,4305000000000.0,1.0,3.0,69.0,-0.356717,-0.213008,-1.010164,0.001036,-88.48362,0.0,0.37858,3695.0,8615000000000.0,1.0,3.0,70.0,-0.053221,-0.046249,-1.009839,0.003185,-88.464142,0.0,0.464152,3709.333252,12925000000000.0,2.0,3.0,71.0,-0.052986,-0.045577,-1.009578,0.007479,-88.452377,0.0,0.5,3732.333252,17230000000000.0,2.0,3.0,73.0,-0.052803,-0.044517,-1.009344,0.008622,-88.386049,0.0,0.5,3747.0,21540000000000.0,2.0,3.0,74.0,-0.052581,-0.044065,-1.009109,0.008955,-88.308716,0.0,0.538311,3763.75,25850000000000.0,3.0,3.0,75.0,-0.044075,-0.037731,-1.008875,0.009198,-86.990927,0.655556,0.598203,3782.0,30160000000000.0,3.0,3.0,76.0,-0.043265,-0.034616,-1.008614,0.009423,-86.843826,1.0,0.658255,3788.0,34465000000000.0,3.0,3.0,77.0,-0.042494,-0.03132,-1.008276,0.009639,-86.74559,1.0,0.764178,3800.0,38945000000000.0,3.0,3.0,78.0,-0.020622,-0.028179,-1.007728,0.009831,-86.119919,1.0,0.879005,3812.0,43310000000000.0,4.0,3.0,79.0,-0.020152,0.015679,-1.007129,0.01,-86.118622,1.0,0.994175,3826.333252,47620000000000.0,4.0,3.0,81.0,-0.019904,0.016843,-1.006673,0.010157,-86.11805,1.0,1.585408,3847.0,51930000000000.0,4.0,3.0,82.0,-0.019682,0.017282,-1.006139,0.010315,-86.080246,1.0,2.484425,3876.0,56235000000000.0,5.0,3.0,83.0,-0.01942,0.017528,-0.728903,0.010482,-47.183479,1.0,4.0,3917.0,60545000000000.0,5.0,3.0,84.0,-0.019081,0.020307,-0.294459,0.010668,-17.483364,1.0,6.141348,3951.187561,64855000000000.0,6.0,3.0,85.0,-0.01814,0.022414,0.076976,0.010894,4.400664,1.0,9.18595,3982.0,69165000000000.0,6.0,3.0,86.0,0.123577,0.086863,0.264927,0.011239,15.523324,1.0,14.444445,4008.583252,73470000000000.0,6.0,3.0,87.0,0.474932,0.313599,0.466737,0.012207,28.323949,1.0,36.802221,4067.0,77780000000000.0,7.0,3.0,89.0,0.780661,0.773137,0.749808,0.026261,49.306727,1.0,74.0,4103.583496,82090000000000.0,7.0,3.0,90.0,1.034351,1.946303,1.146284,2.952888,89.476036,1.0,2597.800049,4175.0,86395000000000.0,7.0,3.0,91.0,396396.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0


In [35]:
concat_imputed.isna().sum().sum()

0

In [42]:
concat_imputed = feature_engineering(concat_imputed)
print(concat_imputed.shape)
concat_imputed.head()

(2756, 399)


Unnamed: 0,Basic_Demos-Age,CGAS-CGAS_Score,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Max_Stage,Fitness_Endurance-Time_Mins,Fitness_Endurance-Time_Sec,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_A-PAQ_A_Total,PAQ_C-PAQ_C_Total,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-computerinternet_hoursday,stat_0,stat_1,stat_2,stat_3,stat_4,stat_5,stat_6,stat_7,stat_8,stat_9,stat_10,stat_11,stat_12,stat_13,stat_14,stat_15,stat_16,stat_17,stat_18,stat_19,stat_20,stat_21,stat_22,stat_23,stat_24,stat_25,stat_26,stat_27,stat_28,stat_31,stat_32,stat_33,stat_34,stat_35,stat_36,stat_37,stat_38,stat_39,stat_40,stat_42,stat_43,stat_44,stat_45,stat_46,stat_47,stat_48,stat_49,stat_50,stat_51,stat_52,stat_53,stat_54,stat_55,stat_56,stat_57,stat_58,stat_59,stat_60,stat_61,stat_62,stat_63,stat_64,stat_65,stat_66,stat_67,stat_68,stat_69,stat_70,stat_71,stat_72,stat_73,stat_74,stat_75,stat_76,stat_77,stat_78,stat_79,stat_80,stat_81,stat_82,stat_83,stat_84,stat_85,stat_86,stat_87,stat_88,stat_89,stat_90,stat_91,stat_92,stat_93,stat_94,stat_95,stat_96,stat_97,stat_98,stat_99,stat_100,stat_101,stat_102,stat_103,stat_104,stat_105,stat_106,stat_107,stat_108,stat_109,stat_110,stat_111,stat_112,stat_113,stat_114,stat_115,stat_116,stat_117,stat_118,stat_119,stat_120,stat_121,stat_122,stat_123,stat_124,stat_125,stat_126,stat_127,stat_128,stat_129,stat_130,stat_131,stat_132,stat_133,stat_134,stat_135,stat_136,stat_137,stat_138,stat_139,stat_140,stat_141,stat_142,stat_143,stat_144,stat_145,stat_146,stat_147,stat_148,stat_149,stat_150,stat_151,stat_152,stat_153,stat_154,stat_155,stat_156,stat_157,stat_158,stat_159,stat_160,stat_161,stat_162,stat_163,stat_164,stat_165,stat_166,stat_167,stat_168,stat_169,stat_170,stat_171,stat_172,stat_173,stat_174,stat_175,stat_176,stat_177,stat_178,stat_179,stat_180,stat_181,stat_182,stat_183,stat_184,stat_185,stat_186,stat_187,stat_188,stat_189,stat_190,stat_191,stat_192,stat_193,stat_194,stat_195,stat_196,stat_197,stat_198,stat_199,stat_200,stat_201,stat_202,stat_203,stat_204,stat_205,stat_206,stat_207,stat_208,stat_209,stat_210,stat_211,stat_212,stat_213,stat_214,stat_215,stat_216,stat_217,stat_218,stat_219,stat_220,stat_221,stat_222,stat_223,stat_224,stat_225,stat_226,stat_227,stat_228,stat_229,stat_230,stat_231,stat_232,stat_233,stat_234,stat_235,stat_236,stat_237,stat_238,stat_239,stat_240,stat_241,stat_242,stat_243,stat_244,stat_245,stat_246,stat_247,stat_248,stat_249,stat_250,stat_251,stat_252,stat_253,stat_254,stat_255,stat_256,stat_257,stat_258,stat_259,stat_260,stat_261,stat_262,stat_263,stat_264,stat_265,stat_266,stat_267,stat_268,stat_269,stat_270,stat_271,stat_272,stat_273,stat_274,stat_275,stat_276,stat_277,stat_278,stat_279,stat_280,stat_281,stat_282,stat_283,stat_284,stat_285,stat_286,stat_287,stat_288,Basic_Demos-Sex_0,Basic_Demos-Sex_1,FGC-Season_Fall,FGC-Season_Missing,FGC-Season_Spring,FGC-Season_Summer,FGC-Season_Winter,PreInt_EduHx-Season_Fall,PreInt_EduHx-Season_Missing,PreInt_EduHx-Season_Spring,PreInt_EduHx-Season_Summer,PreInt_EduHx-Season_Winter,Fitness_Endurance-Season_Fall,Fitness_Endurance-Season_Missing,Fitness_Endurance-Season_Spring,Fitness_Endurance-Season_Summer,Fitness_Endurance-Season_Winter,PAQ_C-Season_Fall,PAQ_C-Season_Missing,PAQ_C-Season_Spring,PAQ_C-Season_Summer,PAQ_C-Season_Winter,CGAS-Season_Fall,CGAS-Season_Missing,CGAS-Season_Spring,CGAS-Season_Summer,CGAS-Season_Winter,SDS-Season_Fall,SDS-Season_Missing,SDS-Season_Spring,SDS-Season_Summer,SDS-Season_Winter,Basic_Demos-Enroll_Season_Fall,Basic_Demos-Enroll_Season_Spring,Basic_Demos-Enroll_Season_Summer,Basic_Demos-Enroll_Season_Winter,Physical-Season_Fall,Physical-Season_Missing,Physical-Season_Spring,Physical-Season_Summer,Physical-Season_Winter,BIA-Season_Fall,BIA-Season_Missing,BIA-Season_Spring,BIA-Season_Summer,BIA-Season_Winter,PAQ_A-Season_Fall,PAQ_A-Season_Missing,PAQ_A-Season_Spring,PAQ_A-Season_Summer,PAQ_A-Season_Winter,BMI_Age,Internet_Hours_Age,BMI_Internet_Hours,BFP_BMI,FFMI_BFP,FMI_BFP,LST_TBW,BFP_BMR,BFP_DEE,BMR_Weight,DEE_Weight,SMM_Height,Muscle_to_Fat,Hydration_Status,ICW_TBW
0,5.0,51.0,16.877316,46.0,50.8,23.8,69.4,75.4,121.0,5.6,9.6,26.0,0.0,0.0,22.64,1.8,24.44,1.8,0.0,0.0,7.0,0.0,6.0,0.0,6.0,1.0,2.0,2.66855,16.8792,932.498,1492.0,8.25598,41.5862,13.8177,3.06143,9.21377,1.0,24.4349,8.89536,38.9177,19.5413,32.6909,2.278,2.102,42.8,59.4,3.0,-0.050129,0.029588,-0.206737,0.038424,-17.399168,0.238233,27.291713,3855.223926,45043690000000.0,3.997108,3.569615,45.998817,0.477017,0.466331,0.586012,0.086501,43.175587,0.223842,103.751411,154.595015,23633470000000.0,1.95693,0.237036,6.944873,-2.397506,-2.112106,-1.039736,0.0,-89.647122,3227.933398,0.0,1.0,2.8,34.0,-0.836975,-0.800994,-0.997689,0.0,-86.339397,0.057461,3426.56665,1417560000000.0,1.0,2.8,34.0,-0.753551,-0.713712,-0.972604,5.8e-05,-80.318761,0.0,0.419439,3654.092507,8235800000000.0,1.0,3.4,35.0,-0.673302,-0.576927,-0.914451,0.000474,-72.105459,0.152222,0.807541,3702.23335,12678000000000.0,1.0,3.6,36.4,-0.593182,-0.450102,-0.848669,0.001811,-62.546078,0.2,1.196603,3719.56665,16852000000000.0,2.0,3.6,37.8,-0.520156,-0.352213,-0.76084,0.002881,-54.043238,0.2,1.563097,3738.0,20928000000000.0,2.0,3.6,38.8,-0.446886,-0.266528,-0.676277,0.005337,-47.080318,0.2,1.98483,3753.26665,24975750000000.0,2.0,3.6,39.8,-0.366389,-0.191957,-0.591534,0.007301,-41.006545,0.2,2.457695,3768.81332,29052300000000.0,2.8,3.6,41.0,-0.283002,-0.128187,-0.512197,0.009235,-35.648544,0.2,2.932935,3785.11665,33086000000000.0,3.0,3.6,42.2,-0.194104,-0.082569,-0.428647,0.011055,-30.459268,0.2,3.547034,3795.23335,37106000000000.0,3.2,3.6,43.8,-0.131388,-0.044469,-0.354436,0.013412,-26.064324,0.2,4.29023,3808.73335,41130000000000.0,3.8,3.6,45.0,-0.060509,0.005285,-0.281874,0.015773,-21.687689,0.2,5.300826,3824.76665,45189500000000.0,4.0,3.6,46.2,0.004791,0.035676,-0.214595,0.018426,-17.669151,0.2,6.450201,3843.284182,49253000000000.0,4.2,3.6,47.2,0.075556,0.071614,-0.148477,0.021433,-13.790557,0.2,7.697894,3868.2,53380000000000.0,4.8,3.6,48.4,0.147169,0.120334,-0.080608,0.025352,-9.663771,0.2,9.343181,3903.4,57503000000000.0,5.0,3.6,49.4,0.219734,0.170381,-0.0157,0.030284,-5.679081,0.2,11.592779,3938.6,61466000000000.0,5.2,3.6,50.8,0.296357,0.248337,0.228783,0.036766,13.6608,0.2,14.678781,3971.56665,65393000000000.0,6.0,3.6,52.0,0.375199,0.468795,0.399016,0.047083,23.986967,0.2,18.881771,4001.16665,69364800000000.0,6.0,3.6,53.2,0.495969,0.613324,0.506861,0.06328,31.218283,0.336667,26.34899,4041.13335,73348000000000.0,6.2,3.6,54.2,0.617842,0.732392,0.636341,0.089568,40.845753,0.4,41.483574,4079.848335,77400000000000.0,6.8,3.6,55.2,0.752401,0.85522,0.874114,0.144041,61.230838,0.718889,98.108536,4121.0,81443000000000.0,7.0,3.8,56.6,1.664505,2.081283,1.832219,3.46171,88.844673,0.8,2120.7,4173.4,86395000000000.0,7.0,3.8,60.0,370156.2,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,84.386578,15.0,50.631947,0.545865,1.499679,0.332267,1.190475,8591.822097,13746.94484,18.35626,29.370079,0.424811,6.383063,0.643522,0.747453
1,9.0,70.8,14.03559,48.0,46.0,22.0,75.0,70.0,122.0,5.6,9.6,26.0,3.0,0.0,22.64,1.8,23.04,1.6,5.0,0.0,11.0,1.0,11.0,1.0,3.0,0.0,2.0,2.57949,14.0371,936.656,1498.65,6.01993,42.0291,12.8254,1.21172,3.97085,1.0,21.0352,14.974,39.4497,15.4107,27.0552,2.278,2.34,46.0,64.0,0.0,-0.050129,0.029588,-0.206737,0.038424,-17.399168,0.238233,27.291713,3855.223926,45043690000000.0,3.997108,3.569615,45.998817,0.477017,0.466331,0.586012,0.086501,43.175587,0.223842,103.751411,154.595015,23633470000000.0,1.95693,0.237036,6.944873,-2.397506,-2.112106,-1.039736,0.0,-89.647122,3227.933398,0.0,1.0,2.8,34.0,-0.836975,-0.800994,-0.997689,0.0,-86.339397,0.057461,3426.56665,1417560000000.0,1.0,2.8,34.0,-0.753551,-0.713712,-0.972604,5.8e-05,-80.318761,0.0,0.419439,3654.092507,8235800000000.0,1.0,3.4,35.0,-0.673302,-0.576927,-0.914451,0.000474,-72.105459,0.152222,0.807541,3702.23335,12678000000000.0,1.0,3.6,36.4,-0.593182,-0.450102,-0.848669,0.001811,-62.546078,0.2,1.196603,3719.56665,16852000000000.0,2.0,3.6,37.8,-0.520156,-0.352213,-0.76084,0.002881,-54.043238,0.2,1.563097,3738.0,20928000000000.0,2.0,3.6,38.8,-0.446886,-0.266528,-0.676277,0.005337,-47.080318,0.2,1.98483,3753.26665,24975750000000.0,2.0,3.6,39.8,-0.366389,-0.191957,-0.591534,0.007301,-41.006545,0.2,2.457695,3768.81332,29052300000000.0,2.8,3.6,41.0,-0.283002,-0.128187,-0.512197,0.009235,-35.648544,0.2,2.932935,3785.11665,33086000000000.0,3.0,3.6,42.2,-0.194104,-0.082569,-0.428647,0.011055,-30.459268,0.2,3.547034,3795.23335,37106000000000.0,3.2,3.6,43.8,-0.131388,-0.044469,-0.354436,0.013412,-26.064324,0.2,4.29023,3808.73335,41130000000000.0,3.8,3.6,45.0,-0.060509,0.005285,-0.281874,0.015773,-21.687689,0.2,5.300826,3824.76665,45189500000000.0,4.0,3.6,46.2,0.004791,0.035676,-0.214595,0.018426,-17.669151,0.2,6.450201,3843.284182,49253000000000.0,4.2,3.6,47.2,0.075556,0.071614,-0.148477,0.021433,-13.790557,0.2,7.697894,3868.2,53380000000000.0,4.8,3.6,48.4,0.147169,0.120334,-0.080608,0.025352,-9.663771,0.2,9.343181,3903.4,57503000000000.0,5.0,3.6,49.4,0.219734,0.170381,-0.0157,0.030284,-5.679081,0.2,11.592779,3938.6,61466000000000.0,5.2,3.6,50.8,0.296357,0.248337,0.228783,0.036766,13.6608,0.2,14.678781,3971.56665,65393000000000.0,6.0,3.6,52.0,0.375199,0.468795,0.399016,0.047083,23.986967,0.2,18.881771,4001.16665,69364800000000.0,6.0,3.6,53.2,0.495969,0.613324,0.506861,0.06328,31.218283,0.336667,26.34899,4041.13335,73348000000000.0,6.2,3.6,54.2,0.617842,0.732392,0.636341,0.089568,40.845753,0.4,41.483574,4079.848335,77400000000000.0,6.8,3.6,55.2,0.752401,0.85522,0.874114,0.144041,61.230838,0.718889,98.108536,4121.0,81443000000000.0,7.0,3.8,56.6,1.664505,2.081283,1.832219,3.46171,88.844673,0.8,2120.7,4173.4,86395000000000.0,7.0,3.8,60.0,370156.2,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,126.320313,0.0,0.0,0.282883,3.229888,0.305154,1.458119,3719.320478,5950.914352,20.362087,32.579348,0.321056,12.718037,0.588157,0.777492
2,10.0,71.0,16.648696,56.5,75.6,28.4,65.0,94.0,117.0,5.0,7.0,33.0,20.0,1.0,10.2,1.0,14.7,2.0,7.0,1.0,10.0,1.0,10.0,1.0,5.0,0.0,3.0,4.208454,21.02796,1227.9032,2073.394,22.647808,73.05094,15.31976,5.708204,26.268974,1.6,32.51706,17.886178,68.84256,34.81636,55.16486,2.1442,2.17,38.0,54.0,2.0,-0.050129,0.029588,-0.206737,0.038424,-17.399168,0.238233,27.291713,3855.223926,45043690000000.0,3.997108,3.569615,45.998817,0.477017,0.466331,0.586012,0.086501,43.175587,0.223842,103.751411,154.595015,23633470000000.0,1.95693,0.237036,6.944873,-2.397506,-2.112106,-1.039736,0.0,-89.647122,3227.933398,0.0,1.0,2.8,34.0,-0.836975,-0.800994,-0.997689,0.0,-86.339397,0.057461,3426.56665,1417560000000.0,1.0,2.8,34.0,-0.753551,-0.713712,-0.972604,5.8e-05,-80.318761,0.0,0.419439,3654.092507,8235800000000.0,1.0,3.4,35.0,-0.673302,-0.576927,-0.914451,0.000474,-72.105459,0.152222,0.807541,3702.23335,12678000000000.0,1.0,3.6,36.4,-0.593182,-0.450102,-0.848669,0.001811,-62.546078,0.2,1.196603,3719.56665,16852000000000.0,2.0,3.6,37.8,-0.520156,-0.352213,-0.76084,0.002881,-54.043238,0.2,1.563097,3738.0,20928000000000.0,2.0,3.6,38.8,-0.446886,-0.266528,-0.676277,0.005337,-47.080318,0.2,1.98483,3753.26665,24975750000000.0,2.0,3.6,39.8,-0.366389,-0.191957,-0.591534,0.007301,-41.006545,0.2,2.457695,3768.81332,29052300000000.0,2.8,3.6,41.0,-0.283002,-0.128187,-0.512197,0.009235,-35.648544,0.2,2.932935,3785.11665,33086000000000.0,3.0,3.6,42.2,-0.194104,-0.082569,-0.428647,0.011055,-30.459268,0.2,3.547034,3795.23335,37106000000000.0,3.2,3.6,43.8,-0.131388,-0.044469,-0.354436,0.013412,-26.064324,0.2,4.29023,3808.73335,41130000000000.0,3.8,3.6,45.0,-0.060509,0.005285,-0.281874,0.015773,-21.687689,0.2,5.300826,3824.76665,45189500000000.0,4.0,3.6,46.2,0.004791,0.035676,-0.214595,0.018426,-17.669151,0.2,6.450201,3843.284182,49253000000000.0,4.2,3.6,47.2,0.075556,0.071614,-0.148477,0.021433,-13.790557,0.2,7.697894,3868.2,53380000000000.0,4.8,3.6,48.4,0.147169,0.120334,-0.080608,0.025352,-9.663771,0.2,9.343181,3903.4,57503000000000.0,5.0,3.6,49.4,0.219734,0.170381,-0.0157,0.030284,-5.679081,0.2,11.592779,3938.6,61466000000000.0,5.2,3.6,50.8,0.296357,0.248337,0.228783,0.036766,13.6608,0.2,14.678781,3971.56665,65393000000000.0,6.0,3.6,52.0,0.375199,0.468795,0.399016,0.047083,23.986967,0.2,18.881771,4001.16665,69364800000000.0,6.0,3.6,53.2,0.495969,0.613324,0.506861,0.06328,31.218283,0.336667,26.34899,4041.13335,73348000000000.0,6.2,3.6,54.2,0.617842,0.732392,0.636341,0.089568,40.845753,0.4,41.483574,4079.848335,77400000000000.0,6.8,3.6,55.2,0.752401,0.85522,0.874114,0.144041,61.230838,0.718889,98.108536,4121.0,81443000000000.0,7.0,3.8,56.6,1.664505,2.081283,1.832219,3.46171,88.844673,0.8,2120.7,4173.4,86395000000000.0,7.0,3.8,60.0,370156.2,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,166.486961,20.0,33.297392,1.24924,0.583188,0.217298,1.247942,32255.757235,54465.933078,16.242106,27.425847,0.616219,6.099355,0.729694,0.589452
3,9.0,71.0,18.292347,56.0,81.6,26.4,60.0,97.0,117.0,6.0,9.0,37.0,18.0,1.0,18.34,1.8,21.06,2.0,5.0,0.0,7.0,0.0,7.0,0.0,7.0,1.0,3.0,3.84191,18.2943,1131.43,1923.44,15.5925,62.7757,14.074,4.22033,18.8243,2.0,30.4041,16.779,58.9338,26.4798,45.9966,2.12,2.451,31.0,45.0,0.0,-0.316384,0.016009,-0.16789,0.047388,-10.580416,0.0,42.29631,4053.579102,50462150000000.0,4.470182,3.0,53.201683,0.453665,0.502702,0.58571,0.106351,42.94717,0.0,208.168976,112.404045,19428420000000.0,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,3824.0,55000000000.0,1.0,3.0,41.0,-0.957459,-0.977749,-1.010391,0.0,-87.332067,0.000752,3829.0,4861450000000.0,1.0,3.0,41.0,-0.914427,-0.877531,-0.957112,0.0,-72.609234,0.0,0.265511,3835.0,9944500000000.0,1.0,3.0,41.0,-0.871721,-0.730302,-0.89797,0.000332,-62.206067,0.0,0.666667,3838.0,24635000000000.0,1.0,3.0,41.0,-0.811414,-0.584147,-0.821275,0.001527,-55.807169,0.0,1.197513,3850.75,28650000000000.0,2.0,3.0,42.0,-0.745521,-0.430516,-0.736979,0.003707,-48.233392,0.0,1.673629,4000.0,33450000000000.0,2.0,3.0,42.0,-0.68418,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,36890000000000.0,3.0,3.0,42.0,-0.625026,-0.224424,-0.565164,0.009337,-35.302367,0.0,3.083734,4035.0,39525000000000.0,4.0,3.0,43.0,-0.567314,-0.136134,-0.489798,0.012539,-30.223173,0.0,3.996364,4041.0,41905000000000.0,4.0,3.0,44.0,-0.508016,-0.054089,-0.415141,0.016204,-25.410971,0.0,4.979007,4058.0,47205000000000.0,4.0,3.0,47.0,-0.437547,-0.01013,-0.330755,0.020108,-20.352911,0.0,5.972977,4064.0,49735000000000.0,5.0,3.0,47.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,53477500000000.0,5.0,3.0,50.0,-0.306484,0.068776,-0.164221,0.026687,-10.005749,0.0,7.581349,4093.0,57440000000000.0,5.0,3.0,51.0,-0.255599,0.12263,-0.079078,0.029139,-4.908399,0.0,8.729453,4099.0,59292000000000.0,5.0,3.0,51.0,-0.193461,0.20526,0.001529,0.031696,-0.057997,0.0,10.158665,4129.0,61180000000000.0,5.0,3.0,52.0,-0.108544,0.309391,0.085911,0.035379,4.938907,0.0,12.0,4140.0,63705000000000.0,6.0,3.0,52.0,-0.010677,0.400677,0.204727,0.04142,12.220764,0.0,15.0,4147.0,66408750000000.0,6.0,3.0,53.0,0.046125,0.495396,0.358109,0.051887,21.963189,0.0,19.178272,4152.0,68645000000000.0,6.0,3.0,56.0,0.138923,0.593706,0.552839,0.070719,35.773787,0.0,27.5,4158.0,71480000000000.0,7.0,3.0,80.0,0.380755,0.702779,0.863568,0.10543,62.185143,0.0,53.025919,4170.0,73980000000000.0,7.0,3.0,82.0,0.540839,0.812206,0.952578,0.180468,74.499702,0.0,97.554999,4175.0,76885000000000.0,7.0,3.0,83.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.25,4188.5,86110000000000.0,7.0,3.0,85.0,43330.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,164.631122,0.0,0.0,1.028971,0.747651,0.224196,1.281264,21298.377749,36207.411592,13.865564,23.571569,0.472854,6.274343,0.563684,0.661008
4,13.0,50.0,22.279952,59.5,112.2,26.4,60.0,73.0,102.0,4.8,8.6,39.0,12.0,0.0,16.5,2.0,17.9,2.0,6.0,0.0,10.0,1.0,11.0,1.0,8.0,0.0,2.0,4.33036,30.1865,1330.97,1996.45,30.2124,84.0285,16.6877,13.4988,67.9715,2.0,32.9141,20.902,79.6982,35.3804,63.1265,2.12,4.11,40.0,56.0,0.0,-0.004272,0.016859,-0.631731,0.011926,-55.630768,0.655708,16.771982,3838.189453,43212120000000.0,3.909848,3.0,79.435593,0.351545,0.303812,0.623476,0.024331,50.303635,0.468723,95.327438,155.573868,24972640000000.0,1.946892,0.0,6.634319,-1.038711,-1.52269,-1.018787,0.0,-88.761833,3098.166748,0.0,1.0,3.0,68.0,-0.964537,-0.820831,-1.011376,0.0,-88.692085,0.035338,3343.0,860000000000.0,1.0,3.0,68.0,-0.739749,-0.485981,-1.010633,0.000174,-88.553625,0.0,0.204995,3630.0,4305000000000.0,1.0,3.0,69.0,-0.356717,-0.213008,-1.010164,0.001036,-88.48362,0.0,0.37858,3695.0,8615000000000.0,1.0,3.0,70.0,-0.053221,-0.046249,-1.009839,0.003185,-88.464142,0.0,0.464152,3709.333252,12925000000000.0,2.0,3.0,71.0,-0.052986,-0.045577,-1.009578,0.007479,-88.452377,0.0,0.5,3732.333252,17230000000000.0,2.0,3.0,73.0,-0.052803,-0.044517,-1.009344,0.008622,-88.386049,0.0,0.5,3747.0,21540000000000.0,2.0,3.0,74.0,-0.052581,-0.044065,-1.009109,0.008955,-88.308716,0.0,0.538311,3763.75,25850000000000.0,3.0,3.0,75.0,-0.044075,-0.037731,-1.008875,0.009198,-86.990927,0.655556,0.598203,3782.0,30160000000000.0,3.0,3.0,76.0,-0.043265,-0.034616,-1.008614,0.009423,-86.843826,1.0,0.658255,3788.0,34465000000000.0,3.0,3.0,77.0,-0.042494,-0.03132,-1.008276,0.009639,-86.74559,1.0,0.764178,3800.0,38945000000000.0,3.0,3.0,78.0,-0.020622,-0.028179,-1.007728,0.009831,-86.119919,1.0,0.879005,3812.0,43310000000000.0,4.0,3.0,79.0,-0.020152,0.015679,-1.007129,0.01,-86.118622,1.0,0.994175,3826.333252,47620000000000.0,4.0,3.0,81.0,-0.019904,0.016843,-1.006673,0.010157,-86.11805,1.0,1.585408,3847.0,51930000000000.0,4.0,3.0,82.0,-0.019682,0.017282,-1.006139,0.010315,-86.080246,1.0,2.484425,3876.0,56235000000000.0,5.0,3.0,83.0,-0.01942,0.017528,-0.728903,0.010482,-47.183479,1.0,4.0,3917.0,60545000000000.0,5.0,3.0,84.0,-0.019081,0.020307,-0.294459,0.010668,-17.483364,1.0,6.141348,3951.187561,64855000000000.0,6.0,3.0,85.0,-0.01814,0.022414,0.076976,0.010894,4.400664,1.0,9.18595,3982.0,69165000000000.0,6.0,3.0,86.0,0.123577,0.086863,0.264927,0.011239,15.523324,1.0,14.444445,4008.583252,73470000000000.0,6.0,3.0,87.0,0.474932,0.313599,0.466737,0.012207,28.323949,1.0,36.802221,4067.0,77780000000000.0,7.0,3.0,89.0,0.780661,0.773137,0.749808,0.026261,49.306727,1.0,74.0,4103.583496,82090000000000.0,7.0,3.0,90.0,1.034351,1.946303,1.146284,2.952888,89.476036,1.0,2597.800049,4175.0,86395000000000.0,7.0,3.0,91.0,396396.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,289.639376,0.0,0.0,2.251718,0.24551,0.198595,1.262516,90468.027355,135701.701175,11.862478,17.793672,0.594629,2.621003,0.562625,0.521399


In [43]:
if np.any(np.isinf(concat_imputed)):
    print('inf in data')
    concat_imputed = concat_imputed.replace([np.inf, -np.inf], np.nan)

inf in data


In [44]:
imputer = KNNImputer(n_neighbors=5)
imputed_data = imputer.fit_transform(concat_imputed)

In [45]:
concat_imputed = pd.DataFrame(imputed_data, columns=concat_imputed.columns)
print(concat_imputed.shape)
concat_imputed.head()

(2756, 399)


Unnamed: 0,Basic_Demos-Age,CGAS-CGAS_Score,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Max_Stage,Fitness_Endurance-Time_Mins,Fitness_Endurance-Time_Sec,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_A-PAQ_A_Total,PAQ_C-PAQ_C_Total,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-computerinternet_hoursday,stat_0,stat_1,stat_2,stat_3,stat_4,stat_5,stat_6,stat_7,stat_8,stat_9,stat_10,stat_11,stat_12,stat_13,stat_14,stat_15,stat_16,stat_17,stat_18,stat_19,stat_20,stat_21,stat_22,stat_23,stat_24,stat_25,stat_26,stat_27,stat_28,stat_31,stat_32,stat_33,stat_34,stat_35,stat_36,stat_37,stat_38,stat_39,stat_40,stat_42,stat_43,stat_44,stat_45,stat_46,stat_47,stat_48,stat_49,stat_50,stat_51,stat_52,stat_53,stat_54,stat_55,stat_56,stat_57,stat_58,stat_59,stat_60,stat_61,stat_62,stat_63,stat_64,stat_65,stat_66,stat_67,stat_68,stat_69,stat_70,stat_71,stat_72,stat_73,stat_74,stat_75,stat_76,stat_77,stat_78,stat_79,stat_80,stat_81,stat_82,stat_83,stat_84,stat_85,stat_86,stat_87,stat_88,stat_89,stat_90,stat_91,stat_92,stat_93,stat_94,stat_95,stat_96,stat_97,stat_98,stat_99,stat_100,stat_101,stat_102,stat_103,stat_104,stat_105,stat_106,stat_107,stat_108,stat_109,stat_110,stat_111,stat_112,stat_113,stat_114,stat_115,stat_116,stat_117,stat_118,stat_119,stat_120,stat_121,stat_122,stat_123,stat_124,stat_125,stat_126,stat_127,stat_128,stat_129,stat_130,stat_131,stat_132,stat_133,stat_134,stat_135,stat_136,stat_137,stat_138,stat_139,stat_140,stat_141,stat_142,stat_143,stat_144,stat_145,stat_146,stat_147,stat_148,stat_149,stat_150,stat_151,stat_152,stat_153,stat_154,stat_155,stat_156,stat_157,stat_158,stat_159,stat_160,stat_161,stat_162,stat_163,stat_164,stat_165,stat_166,stat_167,stat_168,stat_169,stat_170,stat_171,stat_172,stat_173,stat_174,stat_175,stat_176,stat_177,stat_178,stat_179,stat_180,stat_181,stat_182,stat_183,stat_184,stat_185,stat_186,stat_187,stat_188,stat_189,stat_190,stat_191,stat_192,stat_193,stat_194,stat_195,stat_196,stat_197,stat_198,stat_199,stat_200,stat_201,stat_202,stat_203,stat_204,stat_205,stat_206,stat_207,stat_208,stat_209,stat_210,stat_211,stat_212,stat_213,stat_214,stat_215,stat_216,stat_217,stat_218,stat_219,stat_220,stat_221,stat_222,stat_223,stat_224,stat_225,stat_226,stat_227,stat_228,stat_229,stat_230,stat_231,stat_232,stat_233,stat_234,stat_235,stat_236,stat_237,stat_238,stat_239,stat_240,stat_241,stat_242,stat_243,stat_244,stat_245,stat_246,stat_247,stat_248,stat_249,stat_250,stat_251,stat_252,stat_253,stat_254,stat_255,stat_256,stat_257,stat_258,stat_259,stat_260,stat_261,stat_262,stat_263,stat_264,stat_265,stat_266,stat_267,stat_268,stat_269,stat_270,stat_271,stat_272,stat_273,stat_274,stat_275,stat_276,stat_277,stat_278,stat_279,stat_280,stat_281,stat_282,stat_283,stat_284,stat_285,stat_286,stat_287,stat_288,Basic_Demos-Sex_0,Basic_Demos-Sex_1,FGC-Season_Fall,FGC-Season_Missing,FGC-Season_Spring,FGC-Season_Summer,FGC-Season_Winter,PreInt_EduHx-Season_Fall,PreInt_EduHx-Season_Missing,PreInt_EduHx-Season_Spring,PreInt_EduHx-Season_Summer,PreInt_EduHx-Season_Winter,Fitness_Endurance-Season_Fall,Fitness_Endurance-Season_Missing,Fitness_Endurance-Season_Spring,Fitness_Endurance-Season_Summer,Fitness_Endurance-Season_Winter,PAQ_C-Season_Fall,PAQ_C-Season_Missing,PAQ_C-Season_Spring,PAQ_C-Season_Summer,PAQ_C-Season_Winter,CGAS-Season_Fall,CGAS-Season_Missing,CGAS-Season_Spring,CGAS-Season_Summer,CGAS-Season_Winter,SDS-Season_Fall,SDS-Season_Missing,SDS-Season_Spring,SDS-Season_Summer,SDS-Season_Winter,Basic_Demos-Enroll_Season_Fall,Basic_Demos-Enroll_Season_Spring,Basic_Demos-Enroll_Season_Summer,Basic_Demos-Enroll_Season_Winter,Physical-Season_Fall,Physical-Season_Missing,Physical-Season_Spring,Physical-Season_Summer,Physical-Season_Winter,BIA-Season_Fall,BIA-Season_Missing,BIA-Season_Spring,BIA-Season_Summer,BIA-Season_Winter,PAQ_A-Season_Fall,PAQ_A-Season_Missing,PAQ_A-Season_Spring,PAQ_A-Season_Summer,PAQ_A-Season_Winter,BMI_Age,Internet_Hours_Age,BMI_Internet_Hours,BFP_BMI,FFMI_BFP,FMI_BFP,LST_TBW,BFP_BMR,BFP_DEE,BMR_Weight,DEE_Weight,SMM_Height,Muscle_to_Fat,Hydration_Status,ICW_TBW
0,5.0,51.0,16.877316,46.0,50.8,23.8,69.4,75.4,121.0,5.6,9.6,26.0,0.0,0.0,22.64,1.8,24.44,1.8,0.0,0.0,7.0,0.0,6.0,0.0,6.0,1.0,2.0,2.66855,16.8792,932.498,1492.0,8.25598,41.5862,13.8177,3.06143,9.21377,1.0,24.4349,8.89536,38.9177,19.5413,32.6909,2.278,2.102,42.8,59.4,3.0,-0.050129,0.029588,-0.206737,0.038424,-17.399168,0.238233,27.291713,3855.223926,45043690000000.0,3.997108,3.569615,45.998817,0.477017,0.466331,0.586012,0.086501,43.175587,0.223842,103.751411,154.595015,23633470000000.0,1.95693,0.237036,6.944873,-2.397506,-2.112106,-1.039736,0.0,-89.647122,3227.933398,0.0,1.0,2.8,34.0,-0.836975,-0.800994,-0.997689,0.0,-86.339397,0.057461,3426.56665,1417560000000.0,1.0,2.8,34.0,-0.753551,-0.713712,-0.972604,5.8e-05,-80.318761,0.0,0.419439,3654.092507,8235800000000.0,1.0,3.4,35.0,-0.673302,-0.576927,-0.914451,0.000474,-72.105459,0.152222,0.807541,3702.23335,12678000000000.0,1.0,3.6,36.4,-0.593182,-0.450102,-0.848669,0.001811,-62.546078,0.2,1.196603,3719.56665,16852000000000.0,2.0,3.6,37.8,-0.520156,-0.352213,-0.76084,0.002881,-54.043238,0.2,1.563097,3738.0,20928000000000.0,2.0,3.6,38.8,-0.446886,-0.266528,-0.676277,0.005337,-47.080318,0.2,1.98483,3753.26665,24975750000000.0,2.0,3.6,39.8,-0.366389,-0.191957,-0.591534,0.007301,-41.006545,0.2,2.457695,3768.81332,29052300000000.0,2.8,3.6,41.0,-0.283002,-0.128187,-0.512197,0.009235,-35.648544,0.2,2.932935,3785.11665,33086000000000.0,3.0,3.6,42.2,-0.194104,-0.082569,-0.428647,0.011055,-30.459268,0.2,3.547034,3795.23335,37106000000000.0,3.2,3.6,43.8,-0.131388,-0.044469,-0.354436,0.013412,-26.064324,0.2,4.29023,3808.73335,41130000000000.0,3.8,3.6,45.0,-0.060509,0.005285,-0.281874,0.015773,-21.687689,0.2,5.300826,3824.76665,45189500000000.0,4.0,3.6,46.2,0.004791,0.035676,-0.214595,0.018426,-17.669151,0.2,6.450201,3843.284182,49253000000000.0,4.2,3.6,47.2,0.075556,0.071614,-0.148477,0.021433,-13.790557,0.2,7.697894,3868.2,53380000000000.0,4.8,3.6,48.4,0.147169,0.120334,-0.080608,0.025352,-9.663771,0.2,9.343181,3903.4,57503000000000.0,5.0,3.6,49.4,0.219734,0.170381,-0.0157,0.030284,-5.679081,0.2,11.592779,3938.6,61466000000000.0,5.2,3.6,50.8,0.296357,0.248337,0.228783,0.036766,13.6608,0.2,14.678781,3971.56665,65393000000000.0,6.0,3.6,52.0,0.375199,0.468795,0.399016,0.047083,23.986967,0.2,18.881771,4001.16665,69364800000000.0,6.0,3.6,53.2,0.495969,0.613324,0.506861,0.06328,31.218283,0.336667,26.34899,4041.13335,73348000000000.0,6.2,3.6,54.2,0.617842,0.732392,0.636341,0.089568,40.845753,0.4,41.483574,4079.848335,77400000000000.0,6.8,3.6,55.2,0.752401,0.85522,0.874114,0.144041,61.230838,0.718889,98.108536,4121.0,81443000000000.0,7.0,3.8,56.6,1.664505,2.081283,1.832219,3.46171,88.844673,0.8,2120.7,4173.4,86395000000000.0,7.0,3.8,60.0,370156.2,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,84.386578,15.0,50.631947,0.545865,1.499679,0.332267,1.190475,8591.822097,13746.94484,18.35626,29.370079,0.424811,6.383063,0.643522,0.747453
1,9.0,70.8,14.03559,48.0,46.0,22.0,75.0,70.0,122.0,5.6,9.6,26.0,3.0,0.0,22.64,1.8,23.04,1.6,5.0,0.0,11.0,1.0,11.0,1.0,3.0,0.0,2.0,2.57949,14.0371,936.656,1498.65,6.01993,42.0291,12.8254,1.21172,3.97085,1.0,21.0352,14.974,39.4497,15.4107,27.0552,2.278,2.34,46.0,64.0,0.0,-0.050129,0.029588,-0.206737,0.038424,-17.399168,0.238233,27.291713,3855.223926,45043690000000.0,3.997108,3.569615,45.998817,0.477017,0.466331,0.586012,0.086501,43.175587,0.223842,103.751411,154.595015,23633470000000.0,1.95693,0.237036,6.944873,-2.397506,-2.112106,-1.039736,0.0,-89.647122,3227.933398,0.0,1.0,2.8,34.0,-0.836975,-0.800994,-0.997689,0.0,-86.339397,0.057461,3426.56665,1417560000000.0,1.0,2.8,34.0,-0.753551,-0.713712,-0.972604,5.8e-05,-80.318761,0.0,0.419439,3654.092507,8235800000000.0,1.0,3.4,35.0,-0.673302,-0.576927,-0.914451,0.000474,-72.105459,0.152222,0.807541,3702.23335,12678000000000.0,1.0,3.6,36.4,-0.593182,-0.450102,-0.848669,0.001811,-62.546078,0.2,1.196603,3719.56665,16852000000000.0,2.0,3.6,37.8,-0.520156,-0.352213,-0.76084,0.002881,-54.043238,0.2,1.563097,3738.0,20928000000000.0,2.0,3.6,38.8,-0.446886,-0.266528,-0.676277,0.005337,-47.080318,0.2,1.98483,3753.26665,24975750000000.0,2.0,3.6,39.8,-0.366389,-0.191957,-0.591534,0.007301,-41.006545,0.2,2.457695,3768.81332,29052300000000.0,2.8,3.6,41.0,-0.283002,-0.128187,-0.512197,0.009235,-35.648544,0.2,2.932935,3785.11665,33086000000000.0,3.0,3.6,42.2,-0.194104,-0.082569,-0.428647,0.011055,-30.459268,0.2,3.547034,3795.23335,37106000000000.0,3.2,3.6,43.8,-0.131388,-0.044469,-0.354436,0.013412,-26.064324,0.2,4.29023,3808.73335,41130000000000.0,3.8,3.6,45.0,-0.060509,0.005285,-0.281874,0.015773,-21.687689,0.2,5.300826,3824.76665,45189500000000.0,4.0,3.6,46.2,0.004791,0.035676,-0.214595,0.018426,-17.669151,0.2,6.450201,3843.284182,49253000000000.0,4.2,3.6,47.2,0.075556,0.071614,-0.148477,0.021433,-13.790557,0.2,7.697894,3868.2,53380000000000.0,4.8,3.6,48.4,0.147169,0.120334,-0.080608,0.025352,-9.663771,0.2,9.343181,3903.4,57503000000000.0,5.0,3.6,49.4,0.219734,0.170381,-0.0157,0.030284,-5.679081,0.2,11.592779,3938.6,61466000000000.0,5.2,3.6,50.8,0.296357,0.248337,0.228783,0.036766,13.6608,0.2,14.678781,3971.56665,65393000000000.0,6.0,3.6,52.0,0.375199,0.468795,0.399016,0.047083,23.986967,0.2,18.881771,4001.16665,69364800000000.0,6.0,3.6,53.2,0.495969,0.613324,0.506861,0.06328,31.218283,0.336667,26.34899,4041.13335,73348000000000.0,6.2,3.6,54.2,0.617842,0.732392,0.636341,0.089568,40.845753,0.4,41.483574,4079.848335,77400000000000.0,6.8,3.6,55.2,0.752401,0.85522,0.874114,0.144041,61.230838,0.718889,98.108536,4121.0,81443000000000.0,7.0,3.8,56.6,1.664505,2.081283,1.832219,3.46171,88.844673,0.8,2120.7,4173.4,86395000000000.0,7.0,3.8,60.0,370156.2,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,126.320313,0.0,0.0,0.282883,3.229888,0.305154,1.458119,3719.320478,5950.914352,20.362087,32.579348,0.321056,12.718037,0.588157,0.777492
2,10.0,71.0,16.648696,56.5,75.6,28.4,65.0,94.0,117.0,5.0,7.0,33.0,20.0,1.0,10.2,1.0,14.7,2.0,7.0,1.0,10.0,1.0,10.0,1.0,5.0,0.0,3.0,4.208454,21.02796,1227.9032,2073.394,22.647808,73.05094,15.31976,5.708204,26.268974,1.6,32.51706,17.886178,68.84256,34.81636,55.16486,2.1442,2.17,38.0,54.0,2.0,-0.050129,0.029588,-0.206737,0.038424,-17.399168,0.238233,27.291713,3855.223926,45043690000000.0,3.997108,3.569615,45.998817,0.477017,0.466331,0.586012,0.086501,43.175587,0.223842,103.751411,154.595015,23633470000000.0,1.95693,0.237036,6.944873,-2.397506,-2.112106,-1.039736,0.0,-89.647122,3227.933398,0.0,1.0,2.8,34.0,-0.836975,-0.800994,-0.997689,0.0,-86.339397,0.057461,3426.56665,1417560000000.0,1.0,2.8,34.0,-0.753551,-0.713712,-0.972604,5.8e-05,-80.318761,0.0,0.419439,3654.092507,8235800000000.0,1.0,3.4,35.0,-0.673302,-0.576927,-0.914451,0.000474,-72.105459,0.152222,0.807541,3702.23335,12678000000000.0,1.0,3.6,36.4,-0.593182,-0.450102,-0.848669,0.001811,-62.546078,0.2,1.196603,3719.56665,16852000000000.0,2.0,3.6,37.8,-0.520156,-0.352213,-0.76084,0.002881,-54.043238,0.2,1.563097,3738.0,20928000000000.0,2.0,3.6,38.8,-0.446886,-0.266528,-0.676277,0.005337,-47.080318,0.2,1.98483,3753.26665,24975750000000.0,2.0,3.6,39.8,-0.366389,-0.191957,-0.591534,0.007301,-41.006545,0.2,2.457695,3768.81332,29052300000000.0,2.8,3.6,41.0,-0.283002,-0.128187,-0.512197,0.009235,-35.648544,0.2,2.932935,3785.11665,33086000000000.0,3.0,3.6,42.2,-0.194104,-0.082569,-0.428647,0.011055,-30.459268,0.2,3.547034,3795.23335,37106000000000.0,3.2,3.6,43.8,-0.131388,-0.044469,-0.354436,0.013412,-26.064324,0.2,4.29023,3808.73335,41130000000000.0,3.8,3.6,45.0,-0.060509,0.005285,-0.281874,0.015773,-21.687689,0.2,5.300826,3824.76665,45189500000000.0,4.0,3.6,46.2,0.004791,0.035676,-0.214595,0.018426,-17.669151,0.2,6.450201,3843.284182,49253000000000.0,4.2,3.6,47.2,0.075556,0.071614,-0.148477,0.021433,-13.790557,0.2,7.697894,3868.2,53380000000000.0,4.8,3.6,48.4,0.147169,0.120334,-0.080608,0.025352,-9.663771,0.2,9.343181,3903.4,57503000000000.0,5.0,3.6,49.4,0.219734,0.170381,-0.0157,0.030284,-5.679081,0.2,11.592779,3938.6,61466000000000.0,5.2,3.6,50.8,0.296357,0.248337,0.228783,0.036766,13.6608,0.2,14.678781,3971.56665,65393000000000.0,6.0,3.6,52.0,0.375199,0.468795,0.399016,0.047083,23.986967,0.2,18.881771,4001.16665,69364800000000.0,6.0,3.6,53.2,0.495969,0.613324,0.506861,0.06328,31.218283,0.336667,26.34899,4041.13335,73348000000000.0,6.2,3.6,54.2,0.617842,0.732392,0.636341,0.089568,40.845753,0.4,41.483574,4079.848335,77400000000000.0,6.8,3.6,55.2,0.752401,0.85522,0.874114,0.144041,61.230838,0.718889,98.108536,4121.0,81443000000000.0,7.0,3.8,56.6,1.664505,2.081283,1.832219,3.46171,88.844673,0.8,2120.7,4173.4,86395000000000.0,7.0,3.8,60.0,370156.2,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,166.486961,20.0,33.297392,1.24924,0.583188,0.217298,1.247942,32255.757235,54465.933078,16.242106,27.425847,0.616219,6.099355,0.729694,0.589452
3,9.0,71.0,18.292347,56.0,81.6,26.4,60.0,97.0,117.0,6.0,9.0,37.0,18.0,1.0,18.34,1.8,21.06,2.0,5.0,0.0,7.0,0.0,7.0,0.0,7.0,1.0,3.0,3.84191,18.2943,1131.43,1923.44,15.5925,62.7757,14.074,4.22033,18.8243,2.0,30.4041,16.779,58.9338,26.4798,45.9966,2.12,2.451,31.0,45.0,0.0,-0.316384,0.016009,-0.16789,0.047388,-10.580416,0.0,42.29631,4053.579102,50462150000000.0,4.470182,3.0,53.201683,0.453665,0.502702,0.58571,0.106351,42.94717,0.0,208.168976,112.404045,19428420000000.0,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,3824.0,55000000000.0,1.0,3.0,41.0,-0.957459,-0.977749,-1.010391,0.0,-87.332067,0.000752,3829.0,4861450000000.0,1.0,3.0,41.0,-0.914427,-0.877531,-0.957112,0.0,-72.609234,0.0,0.265511,3835.0,9944500000000.0,1.0,3.0,41.0,-0.871721,-0.730302,-0.89797,0.000332,-62.206067,0.0,0.666667,3838.0,24635000000000.0,1.0,3.0,41.0,-0.811414,-0.584147,-0.821275,0.001527,-55.807169,0.0,1.197513,3850.75,28650000000000.0,2.0,3.0,42.0,-0.745521,-0.430516,-0.736979,0.003707,-48.233392,0.0,1.673629,4000.0,33450000000000.0,2.0,3.0,42.0,-0.68418,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,36890000000000.0,3.0,3.0,42.0,-0.625026,-0.224424,-0.565164,0.009337,-35.302367,0.0,3.083734,4035.0,39525000000000.0,4.0,3.0,43.0,-0.567314,-0.136134,-0.489798,0.012539,-30.223173,0.0,3.996364,4041.0,41905000000000.0,4.0,3.0,44.0,-0.508016,-0.054089,-0.415141,0.016204,-25.410971,0.0,4.979007,4058.0,47205000000000.0,4.0,3.0,47.0,-0.437547,-0.01013,-0.330755,0.020108,-20.352911,0.0,5.972977,4064.0,49735000000000.0,5.0,3.0,47.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,53477500000000.0,5.0,3.0,50.0,-0.306484,0.068776,-0.164221,0.026687,-10.005749,0.0,7.581349,4093.0,57440000000000.0,5.0,3.0,51.0,-0.255599,0.12263,-0.079078,0.029139,-4.908399,0.0,8.729453,4099.0,59292000000000.0,5.0,3.0,51.0,-0.193461,0.20526,0.001529,0.031696,-0.057997,0.0,10.158665,4129.0,61180000000000.0,5.0,3.0,52.0,-0.108544,0.309391,0.085911,0.035379,4.938907,0.0,12.0,4140.0,63705000000000.0,6.0,3.0,52.0,-0.010677,0.400677,0.204727,0.04142,12.220764,0.0,15.0,4147.0,66408750000000.0,6.0,3.0,53.0,0.046125,0.495396,0.358109,0.051887,21.963189,0.0,19.178272,4152.0,68645000000000.0,6.0,3.0,56.0,0.138923,0.593706,0.552839,0.070719,35.773787,0.0,27.5,4158.0,71480000000000.0,7.0,3.0,80.0,0.380755,0.702779,0.863568,0.10543,62.185143,0.0,53.025919,4170.0,73980000000000.0,7.0,3.0,82.0,0.540839,0.812206,0.952578,0.180468,74.499702,0.0,97.554999,4175.0,76885000000000.0,7.0,3.0,83.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.25,4188.5,86110000000000.0,7.0,3.0,85.0,43330.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,164.631122,0.0,0.0,1.028971,0.747651,0.224196,1.281264,21298.377749,36207.411592,13.865564,23.571569,0.472854,6.274343,0.563684,0.661008
4,13.0,50.0,22.279952,59.5,112.2,26.4,60.0,73.0,102.0,4.8,8.6,39.0,12.0,0.0,16.5,2.0,17.9,2.0,6.0,0.0,10.0,1.0,11.0,1.0,8.0,0.0,2.0,4.33036,30.1865,1330.97,1996.45,30.2124,84.0285,16.6877,13.4988,67.9715,2.0,32.9141,20.902,79.6982,35.3804,63.1265,2.12,4.11,40.0,56.0,0.0,-0.004272,0.016859,-0.631731,0.011926,-55.630768,0.655708,16.771982,3838.189453,43212120000000.0,3.909848,3.0,79.435593,0.351545,0.303812,0.623476,0.024331,50.303635,0.468723,95.327438,155.573868,24972640000000.0,1.946892,0.0,6.634319,-1.038711,-1.52269,-1.018787,0.0,-88.761833,3098.166748,0.0,1.0,3.0,68.0,-0.964537,-0.820831,-1.011376,0.0,-88.692085,0.035338,3343.0,860000000000.0,1.0,3.0,68.0,-0.739749,-0.485981,-1.010633,0.000174,-88.553625,0.0,0.204995,3630.0,4305000000000.0,1.0,3.0,69.0,-0.356717,-0.213008,-1.010164,0.001036,-88.48362,0.0,0.37858,3695.0,8615000000000.0,1.0,3.0,70.0,-0.053221,-0.046249,-1.009839,0.003185,-88.464142,0.0,0.464152,3709.333252,12925000000000.0,2.0,3.0,71.0,-0.052986,-0.045577,-1.009578,0.007479,-88.452377,0.0,0.5,3732.333252,17230000000000.0,2.0,3.0,73.0,-0.052803,-0.044517,-1.009344,0.008622,-88.386049,0.0,0.5,3747.0,21540000000000.0,2.0,3.0,74.0,-0.052581,-0.044065,-1.009109,0.008955,-88.308716,0.0,0.538311,3763.75,25850000000000.0,3.0,3.0,75.0,-0.044075,-0.037731,-1.008875,0.009198,-86.990927,0.655556,0.598203,3782.0,30160000000000.0,3.0,3.0,76.0,-0.043265,-0.034616,-1.008614,0.009423,-86.843826,1.0,0.658255,3788.0,34465000000000.0,3.0,3.0,77.0,-0.042494,-0.03132,-1.008276,0.009639,-86.74559,1.0,0.764178,3800.0,38945000000000.0,3.0,3.0,78.0,-0.020622,-0.028179,-1.007728,0.009831,-86.119919,1.0,0.879005,3812.0,43310000000000.0,4.0,3.0,79.0,-0.020152,0.015679,-1.007129,0.01,-86.118622,1.0,0.994175,3826.333252,47620000000000.0,4.0,3.0,81.0,-0.019904,0.016843,-1.006673,0.010157,-86.11805,1.0,1.585408,3847.0,51930000000000.0,4.0,3.0,82.0,-0.019682,0.017282,-1.006139,0.010315,-86.080246,1.0,2.484425,3876.0,56235000000000.0,5.0,3.0,83.0,-0.01942,0.017528,-0.728903,0.010482,-47.183479,1.0,4.0,3917.0,60545000000000.0,5.0,3.0,84.0,-0.019081,0.020307,-0.294459,0.010668,-17.483364,1.0,6.141348,3951.187561,64855000000000.0,6.0,3.0,85.0,-0.01814,0.022414,0.076976,0.010894,4.400664,1.0,9.18595,3982.0,69165000000000.0,6.0,3.0,86.0,0.123577,0.086863,0.264927,0.011239,15.523324,1.0,14.444445,4008.583252,73470000000000.0,6.0,3.0,87.0,0.474932,0.313599,0.466737,0.012207,28.323949,1.0,36.802221,4067.0,77780000000000.0,7.0,3.0,89.0,0.780661,0.773137,0.749808,0.026261,49.306727,1.0,74.0,4103.583496,82090000000000.0,7.0,3.0,90.0,1.034351,1.946303,1.146284,2.952888,89.476036,1.0,2597.800049,4175.0,86395000000000.0,7.0,3.0,91.0,396396.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,289.639376,0.0,0.0,2.251718,0.24551,0.198595,1.262516,90468.027355,135701.701175,11.862478,17.793672,0.594629,2.621003,0.562625,0.521399


In [47]:
concat_imputed.isna().sum().sum()

0

In [48]:
train_imputed = concat_imputed.head(train.shape[0]).reset_index(drop=True)
test_imputed = concat_imputed.tail(test.shape[0]).reset_index(drop=True)

In [49]:
train_imputed['sii'] = train['sii']

In [50]:
train_final = train_imputed.copy()
test_final = test_imputed.copy()

In [51]:
print(train_final.shape)
print(test_final.shape)

(2736, 400)
(20, 399)


In [52]:
def quadratic_weighted_kappa(y_true, y_pred):
    return cohen_kappa_score(y_true, y_pred, weights='quadratic')

def threshold_Rounder(oof_non_rounded, thresholds):
    return np.where(oof_non_rounded < thresholds[0], 0,
                    np.where(oof_non_rounded < thresholds[1], 1,
                             np.where(oof_non_rounded < thresholds[2], 2, 3)))

def evaluate_predictions(thresholds, y_true, oof_non_rounded):
    rounded_p = threshold_Rounder(oof_non_rounded, thresholds)
    return -quadratic_weighted_kappa(y_true, rounded_p)

# Model Training and Evaluation

- **Model Types**: Various models are used, including:
  - **LightGBM**: A gradient-boosting framework known for its speed and efficiency with large datasets.
  - **XGBoost**: Another powerful gradient-boosting model used for structured data.
  - **CatBoost**: Optimized for categorical features without the need for extensive preprocessing.
  - **Voting Regressor**: An ensemble model that combines the predictions of LightGBM, XGBoost, and CatBoost for better accuracy.
- **Cross-Validation**: Stratified K-Folds cross-validation is employed to split the data into training and validation sets, ensuring balanced class distribution in each fold.
- **Quadratic Weighted Kappa (QWK)**: The performance of the models is evaluated using QWK, which measures the agreement between predicted and actual values, taking into account the ordinal nature of the target variable.
- **Threshold Optimization**: The `minimize` function from `scipy.optimize` is used to fine-tune decision thresholds that map continuous predictions to discrete categories (None, Mild, Moderate, Severe).


In [53]:
def TrainML(model_class, train_data, test_data):
    X = train_data.drop(['sii'], axis=1)
    y = train_data['sii']

    SKF = StratifiedKFold(n_splits=n_splits, shuffle=True, random_state=SEED)
    
    train_S = []
    test_S = []
    
    oof_non_rounded = np.zeros(len(y), dtype=float) 
    oof_rounded = np.zeros(len(y), dtype=int) 
    test_preds = np.zeros((len(test_data), n_splits))

    for fold, (train_idx, test_idx) in enumerate(tqdm(SKF.split(X, y), desc="Training Folds", total=n_splits)):
        X_train, X_val = X.iloc[train_idx], X.iloc[test_idx]
        y_train, y_val = y.iloc[train_idx], y.iloc[test_idx]

        model = clone(model_class)
        model.fit(X_train, y_train)

        y_train_pred = model.predict(X_train)
        y_val_pred = model.predict(X_val)

        oof_non_rounded[test_idx] = y_val_pred
        y_val_pred_rounded = y_val_pred.round(0).astype(int)
        oof_rounded[test_idx] = y_val_pred_rounded

        train_kappa = quadratic_weighted_kappa(y_train, y_train_pred.round(0).astype(int))
        val_kappa = quadratic_weighted_kappa(y_val, y_val_pred_rounded)

        train_S.append(train_kappa)
        test_S.append(val_kappa)
        
        test_preds[:, fold] = model.predict(test_data)
        
        print(f"Fold {fold+1} - Train QWK: {train_kappa:.4f}, Validation QWK: {val_kappa:.4f}")
        clear_output(wait=True)

    print(f"Mean Train QWK --> {np.mean(train_S):.4f}")
    print(f"Mean Validation QWK ---> {np.mean(test_S):.4f}")

    KappaOPtimizer = minimize(evaluate_predictions,
                              x0=[0.5, 1.5, 2.5], args=(y, oof_non_rounded), 
                              method='Nelder-Mead')
    assert KappaOPtimizer.success, "Optimization did not converge."
    
    oof_tuned = threshold_Rounder(oof_non_rounded, KappaOPtimizer.x)
    tKappa = quadratic_weighted_kappa(y, oof_tuned)

    print(f"----> || Optimized QWK SCORE :: {Fore.CYAN}{Style.BRIGHT} {tKappa:.3f}{Style.RESET_ALL}")

    tpm = test_preds.mean(axis=1)
    tpTuned = threshold_Rounder(tpm, KappaOPtimizer.x)
    
    submission = pd.DataFrame({
        'id': sample['id'],
        'sii': tpTuned
    })

    return submission


# Hyperparameter Tuning

- **LightGBM Parameters**: Hyperparameters such as `learning_rate`, `max_depth`, `num_leaves`, and `feature_fraction` are tuned to improve the performance of the LightGBM model. These parameters control the complexity of the model and its ability to generalize to new data.
- **XGBoost and CatBoost Parameters**: Similar tuning is applied for XGBoost and CatBoost, adjusting parameters such as `n_estimators`, `max_depth`, `learning_rate`, `subsample`, and `regularization` terms (`reg_alpha`, `reg_lambda`). These help in controlling overfitting and ensuring the model's robustness.

In [54]:
Params7 = {
    'learning_rate': 0.03884249148676395,
    'max_depth': 12,
    'num_leaves': 413,
    'min_data_in_leaf': 14,
    'feature_fraction': 0.7987976913702801,
    'bagging_fraction': 0.7602261703576205,
    'bagging_freq': 2,
    'lambda_l1': 4.735462555910575,
    'lambda_l2': 4.735028557007343e-06
} # CV : 0.4094 | LB : 0.471

In [57]:
Light = LGBMRegressor(**Params7, random_state=SEED, verbose=-1, n_estimators=200)

In [58]:
Submission1 = TrainML(Light, train_final, test_final)
Submission1.to_csv('submission.csv', index=False)

Submission1

Training Folds: 100%|████████████████████████████████████████████████████████████████████| 5/5 [00:03<00:00,  1.51it/s]

Mean Train QWK --> 0.8687
Mean Validation QWK ---> 0.3843
----> || Optimized QWK SCORE :: [36m[1m 0.445[0m





Unnamed: 0,id,sii
0,00008ff9,1
1,000fd460,0
2,00105258,0
3,00115b9f,0
4,0016bb22,1
5,001f3379,1
6,0038ba98,0
7,0068a485,0
8,0069fbed,2
9,0083e397,0
