## **XGBoost Prediction**
https://rdrr.io/cran/xgboost/man/xgb.cv.html

In [5]:
%load_ext autoreload
%autoreload 2

import pandas as pd
import numpy as np
import os
import glob
import pickle
import matplotlib.pyplot as plt
import matplotlib as mpl
mpl.rcParams['agg.path.chunksize'] = 100000

import gc
from myUtils import *
from feature_generator import feature_v1
import xgboost as xgb
from tqdm import tqdm
import shutil
import copy

from sklearn.preprocessing import LabelEncoder

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


In [None]:
def label_encode(df, cols):
    """Replace the given columns of ``df`` with integer label codes.

    For every column name in ``cols`` the missing values are first filled
    with the string "NaN", then a fresh ``LabelEncoder`` is fitted on the
    filled column and its codes are written back under the same name.

    Args:
        df: DataFrame holding the columns to encode. It is modified in place.
        cols: Iterable of column names to encode.

    Returns:
        The same ``df`` object, with the listed columns overwritten by codes.
    """
    for name in cols:
        filled = df[name].fillna("NaN")
        # A new encoder per column: codes are not shared between columns.
        codes = LabelEncoder().fit_transform(filled)
        df[name] = pd.Series(codes, index=filled.index)
    return df


def check_columns(necessary_cols,cols):
    """Report whether every required column name is present.

    Args:
        necessary_cols: Iterable of column names that must be available.
        cols: Iterable of the column names that actually exist.

    Returns:
        True when nothing is missing, otherwise False. A short report is
        printed in both cases; on failure it lists the missing names in the
        order they appear in ``necessary_cols``.
    """
    available = set(cols)  # set gives constant-time membership tests
    missing = [name for name in necessary_cols if name not in available]

    print("-- column check completed --")
    if missing:
        print("  !!columns are lacked!!")
        print("   lacked columns:",missing)
        return False

    print("  columns are satisfied")
    return True


class FeaturesMaker_v1(object):
    """Builds the "featuresV1" feature set for a single target column.

    The input frame must contain ``sig_id``, ``cp_type``, ``cp_time``,
    ``cp_dose``, ``data_part`` and the target column given at construction.
    """

    def __init__(self,target_col):
        """Store the target column name and the list of required columns.

        Args:
            target_col: Name of the label column this maker extracts.
        """
        self.target_col = target_col

        self.name = "featuresV1"
        self.feature_exp = "simple features which "

        # Columns make_feature() insists on before doing any work.
        self.necessary_col = ["sig_id",'cp_type',"cp_time","cp_dose","data_part",target_col]

    def make_feature(self,df):
        """Encode, select and split the features by ``data_part``.

        Args:
            df: DataFrame with the required columns. The three ``cp_*``
                columns are label-encoded via ``label_encode``, which writes
                into the frame it is given.

        Returns:
            ``False`` when a required column is missing. Otherwise a dict
            mapping each distinct ``data_part`` value to a tuple
            ``(feature_frame, target_series)``, both indexed by ``sig_id``.
        """
        # Bail out early when the frame does not have what we need.
        if not check_columns(self.necessary_col,df.columns):
            return False

        categorical = ['cp_type',"cp_time","cp_dose"]
        df = label_encode(df, cols=categorical)

        df = df.set_index(["sig_id"],drop=True)

        # NOTE(review): these are substring matches, so any column whose name
        # merely contains "g-" or "c-" is selected as well -- confirm that no
        # target column name can match.
        gene_cols = [c for c in df.columns if "g-" in c]
        cell_cols = [c for c in df.columns if "c-" in c]
        features = gene_cols + cell_cols + categorical

        print("-- ",self.name," --")
        print("dim:",len(features))
        print("N:",len(df))
        print("-----------------")

        # One (X, y) pair per data_part group.
        parts = {}
        for part_name, part_df in df.groupby(by="data_part"):
            parts[part_name] = (part_df[features], part_df[self.target_col])
        return parts

In [6]:
# Load the raw tables; paths are relative to the notebook's working directory.
train_targets = pd.read_csv(os.path.join("rawdata","train_targets_scored.csv"))
train_features = pd.read_csv(os.path.join("rawdata","train_features.csv"))
test_features =  pd.read_csv(os.path.join("rawdata","test_features.csv"))

sample_submission = pd.read_csv(os.path.join("rawdata","sample_submission.csv"),index_col=0)
submission = pd.DataFrame(index=sample_submission.index)

# One prediction Series per target. They are joined onto `submission` once,
# after the loop, instead of growing the frame column by column.
predictions = []

# The first column of train_targets is skipped; every other column is a target.
for target in tqdm(train_targets.columns[1:]):
    feature_maker = FeaturesMaker_v1(target_col=target)

    # pd.merge returns a new frame, so train_features itself is left untouched.
    train_data = pd.merge(train_features,train_targets[["sig_id",target]],on="sig_id",how="right")
    train_data["data_part"] = "train"

    # Work on a copy so the placeholder columns never leak into test_features.
    test_data = test_features.copy()
    test_data[target] = np.nan  # required by FeaturesMaker_v1's column check
    test_data["data_part"] = "test"

    # Train and test rows are passed together so both go through the same
    # label encoding inside make_feature.
    data = feature_maker.make_feature(pd.concat([train_data,test_data]))
    if data is False:
        # make_feature signals missing columns with False; stop with a clear
        # message instead of failing later on data["test"].
        raise ValueError("required columns are missing for target %r" % (target,))

    model_dir = os.path.join("mymodel",feature_maker.name+"_XGBoost")
    model_path = os.path.join(model_dir,target+".mdl")

    # Load the already-trained XGBoost model for this target.
    model = xgb.XGBClassifier()
    model.load_model(model_path)

    # Column 1 of predict_proba is kept as the prediction for this target.
    test_x = data["test"][0]
    proba = model.predict_proba(test_x)[:,1]

    # Build a fresh float64 Series rather than writing through chained
    # indexing into the frame returned by make_feature.
    predictions.append(
        pd.Series(np.asarray(proba,dtype=np.float64),index=test_x.index,name=target)
    )

if predictions:
    # A single index-aligned join keeps the row order of sample_submission.
    submission = submission.join(pd.concat(predictions,axis=1))

  0%|                                                                                          | 0/206 [00:00<?, ?it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  0%|▍                                                                                 | 1/206 [00:00<02:08,  1.59it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  1%|▊                                                                                 | 2/206 [00:01<02:09,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  1%|█▏                                                                                | 3/206 [00:01<02:10,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  2%|█▌                                                                                | 4/206 [00:02<02:11,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  2%|█▉                                                                                | 5/206 [00:03<02:12,  1.52it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  3%|██▍                                                                               | 6/206 [00:03<02:12,  1.51it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  3%|██▊                                                                               | 7/206 [00:04<02:11,  1.52it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  4%|███▏                                                                              | 8/206 [00:05<02:11,  1.51it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  4%|███▌                                                                              | 9/206 [00:05<02:09,  1.52it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  5%|███▉                                                                             | 10/206 [00:06<02:09,  1.51it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  5%|████▎                                                                            | 11/206 [00:07<02:08,  1.51it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  6%|████▋                                                                            | 12/206 [00:07<02:07,  1.52it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  6%|█████                                                                            | 13/206 [00:08<02:06,  1.53it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  7%|█████▌                                                                           | 14/206 [00:09<02:05,  1.53it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  7%|█████▉                                                                           | 15/206 [00:09<02:05,  1.52it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  8%|██████▎                                                                          | 16/206 [00:10<02:04,  1.52it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  8%|██████▋                                                                          | 17/206 [00:11<02:03,  1.53it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  9%|███████                                                                          | 18/206 [00:11<02:02,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


  9%|███████▍                                                                         | 19/206 [00:12<02:02,  1.53it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 10%|███████▊                                                                         | 20/206 [00:13<02:00,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 10%|████████▎                                                                        | 21/206 [00:13<02:00,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 11%|████████▋                                                                        | 22/206 [00:14<01:59,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 11%|█████████                                                                        | 23/206 [00:15<01:58,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 12%|█████████▍                                                                       | 24/206 [00:15<01:58,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 12%|█████████▊                                                                       | 25/206 [00:16<01:57,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 13%|██████████▏                                                                      | 26/206 [00:17<01:56,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 13%|██████████▌                                                                      | 27/206 [00:17<01:55,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 14%|███████████                                                                      | 28/206 [00:18<01:55,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 14%|███████████▍                                                                     | 29/206 [00:18<01:54,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 15%|███████████▊                                                                     | 30/206 [00:19<01:54,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 15%|████████████▏                                                                    | 31/206 [00:20<01:53,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 16%|████████████▌                                                                    | 32/206 [00:20<01:52,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 16%|████████████▉                                                                    | 33/206 [00:21<01:52,  1.53it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 17%|█████████████▎                                                                   | 34/206 [00:22<01:51,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 17%|█████████████▊                                                                   | 35/206 [00:22<01:51,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 17%|██████████████▏                                                                  | 36/206 [00:23<01:49,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 18%|██████████████▌                                                                  | 37/206 [00:24<01:48,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 18%|██████████████▉                                                                  | 38/206 [00:24<01:47,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 19%|███████████████▎                                                                 | 39/206 [00:25<01:46,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 19%|███████████████▋                                                                 | 40/206 [00:26<01:46,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 20%|████████████████                                                                 | 41/206 [00:26<01:45,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 20%|████████████████▌                                                                | 42/206 [00:27<01:45,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 21%|████████████████▉                                                                | 43/206 [00:27<01:45,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 21%|█████████████████▎                                                               | 44/206 [00:28<01:44,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 22%|█████████████████▋                                                               | 45/206 [00:29<01:43,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 22%|██████████████████                                                               | 46/206 [00:29<01:42,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 23%|██████████████████▍                                                              | 47/206 [00:30<01:41,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 23%|██████████████████▊                                                              | 48/206 [00:31<01:41,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 24%|███████████████████▎                                                             | 49/206 [00:31<01:40,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 24%|███████████████████▋                                                             | 50/206 [00:32<01:39,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 25%|████████████████████                                                             | 51/206 [00:33<01:39,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 25%|████████████████████▍                                                            | 52/206 [00:33<01:38,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 26%|████████████████████▊                                                            | 53/206 [00:34<01:37,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 26%|█████████████████████▏                                                           | 54/206 [00:35<01:36,  1.58it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 27%|█████████████████████▋                                                           | 55/206 [00:35<01:36,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 27%|██████████████████████                                                           | 56/206 [00:36<01:35,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 28%|██████████████████████▍                                                          | 57/206 [00:36<01:35,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 28%|██████████████████████▊                                                          | 58/206 [00:37<01:33,  1.58it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 29%|███████████████████████▏                                                         | 59/206 [00:38<01:33,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 29%|███████████████████████▌                                                         | 60/206 [00:38<01:33,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 30%|███████████████████████▉                                                         | 61/206 [00:39<01:33,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 30%|████████████████████████▍                                                        | 62/206 [00:40<01:32,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 31%|████████████████████████▊                                                        | 63/206 [00:40<01:31,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 31%|█████████████████████████▏                                                       | 64/206 [00:41<01:30,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 32%|█████████████████████████▌                                                       | 65/206 [00:42<01:31,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 32%|█████████████████████████▉                                                       | 66/206 [00:42<01:30,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 33%|██████████████████████████▎                                                      | 67/206 [00:43<01:29,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 33%|██████████████████████████▋                                                      | 68/206 [00:44<01:28,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 33%|███████████████████████████▏                                                     | 69/206 [00:44<01:28,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 34%|███████████████████████████▌                                                     | 70/206 [00:45<01:27,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 34%|███████████████████████████▉                                                     | 71/206 [00:45<01:26,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 35%|████████████████████████████▎                                                    | 72/206 [00:46<01:26,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 35%|████████████████████████████▋                                                    | 73/206 [00:47<01:25,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 36%|█████████████████████████████                                                    | 74/206 [00:47<01:25,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 36%|█████████████████████████████▍                                                   | 75/206 [00:48<01:23,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 37%|█████████████████████████████▉                                                   | 76/206 [00:49<01:23,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 37%|██████████████████████████████▎                                                  | 77/206 [00:49<01:22,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 38%|██████████████████████████████▋                                                  | 78/206 [00:50<01:22,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 38%|███████████████████████████████                                                  | 79/206 [00:51<01:21,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 39%|███████████████████████████████▍                                                 | 80/206 [00:51<01:21,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 39%|███████████████████████████████▊                                                 | 81/206 [00:52<01:21,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 40%|████████████████████████████████▏                                                | 82/206 [00:53<01:20,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 40%|████████████████████████████████▋                                                | 83/206 [00:53<01:19,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 41%|█████████████████████████████████                                                | 84/206 [00:54<01:19,  1.53it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 41%|█████████████████████████████████▍                                               | 85/206 [00:54<01:18,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 42%|█████████████████████████████████▊                                               | 86/206 [00:55<01:17,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 42%|██████████████████████████████████▏                                              | 87/206 [00:56<01:16,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 43%|██████████████████████████████████▌                                              | 88/206 [00:56<01:14,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 43%|██████████████████████████████████▉                                              | 89/206 [00:57<01:14,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 44%|███████████████████████████████████▍                                             | 90/206 [00:58<01:14,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 44%|███████████████████████████████████▊                                             | 91/206 [00:58<01:13,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 45%|████████████████████████████████████▏                                            | 92/206 [00:59<01:13,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 45%|████████████████████████████████████▌                                            | 93/206 [01:00<01:12,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 46%|████████████████████████████████████▉                                            | 94/206 [01:00<01:12,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 46%|█████████████████████████████████████▎                                           | 95/206 [01:01<01:11,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 47%|█████████████████████████████████████▋                                           | 96/206 [01:02<01:11,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 47%|██████████████████████████████████████▏                                          | 97/206 [01:02<01:10,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 48%|██████████████████████████████████████▌                                          | 98/206 [01:03<01:09,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 48%|██████████████████████████████████████▉                                          | 99/206 [01:03<01:09,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 49%|██████████████████████████████████████▊                                         | 100/206 [01:04<01:09,  1.53it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 49%|███████████████████████████████████████▏                                        | 101/206 [01:05<01:07,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 50%|███████████████████████████████████████▌                                        | 102/206 [01:05<01:07,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 50%|████████████████████████████████████████                                        | 103/206 [01:06<01:05,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 50%|████████████████████████████████████████▍                                       | 104/206 [01:07<01:05,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 51%|████████████████████████████████████████▊                                       | 105/206 [01:07<01:04,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 51%|█████████████████████████████████████████▏                                      | 106/206 [01:08<01:04,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 52%|█████████████████████████████████████████▌                                      | 107/206 [01:09<01:03,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 52%|█████████████████████████████████████████▉                                      | 108/206 [01:09<01:02,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 53%|██████████████████████████████████████████▎                                     | 109/206 [01:10<01:01,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 53%|██████████████████████████████████████████▋                                     | 110/206 [01:11<01:01,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 54%|███████████████████████████████████████████                                     | 111/206 [01:11<01:00,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 54%|███████████████████████████████████████████▍                                    | 112/206 [01:12<00:59,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 55%|███████████████████████████████████████████▉                                    | 113/206 [01:12<00:59,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 55%|████████████████████████████████████████████▎                                   | 114/206 [01:13<00:58,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 56%|████████████████████████████████████████████▋                                   | 115/206 [01:14<00:58,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 56%|█████████████████████████████████████████████                                   | 116/206 [01:14<00:57,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 57%|█████████████████████████████████████████████▍                                  | 117/206 [01:15<00:57,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 57%|█████████████████████████████████████████████▊                                  | 118/206 [01:16<00:56,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 58%|██████████████████████████████████████████████▏                                 | 119/206 [01:16<00:55,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 58%|██████████████████████████████████████████████▌                                 | 120/206 [01:17<00:55,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 59%|██████████████████████████████████████████████▉                                 | 121/206 [01:18<00:54,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 59%|███████████████████████████████████████████████▍                                | 122/206 [01:18<00:53,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 60%|███████████████████████████████████████████████▊                                | 123/206 [01:19<00:53,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 60%|████████████████████████████████████████████████▏                               | 124/206 [01:20<00:52,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 61%|████████████████████████████████████████████████▌                               | 125/206 [01:20<00:52,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 61%|████████████████████████████████████████████████▉                               | 126/206 [01:21<00:51,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 62%|█████████████████████████████████████████████████▎                              | 127/206 [01:21<00:50,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 62%|█████████████████████████████████████████████████▋                              | 128/206 [01:22<00:50,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 63%|██████████████████████████████████████████████████                              | 129/206 [01:23<00:49,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 63%|██████████████████████████████████████████████████▍                             | 130/206 [01:23<00:48,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 64%|██████████████████████████████████████████████████▊                             | 131/206 [01:24<00:47,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 64%|███████████████████████████████████████████████████▎                            | 132/206 [01:25<00:47,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 65%|███████████████████████████████████████████████████▋                            | 133/206 [01:25<00:47,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 65%|████████████████████████████████████████████████████                            | 134/206 [01:26<00:46,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 66%|████████████████████████████████████████████████████▍                           | 135/206 [01:27<00:45,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 66%|████████████████████████████████████████████████████▊                           | 136/206 [01:27<00:44,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 67%|█████████████████████████████████████████████████████▏                          | 137/206 [01:28<00:44,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 67%|█████████████████████████████████████████████████████▌                          | 138/206 [01:29<00:43,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 67%|█████████████████████████████████████████████████████▉                          | 139/206 [01:29<00:42,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 68%|██████████████████████████████████████████████████████▎                         | 140/206 [01:30<00:42,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 68%|██████████████████████████████████████████████████████▊                         | 141/206 [01:30<00:41,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 69%|███████████████████████████████████████████████████████▏                        | 142/206 [01:31<00:41,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 69%|███████████████████████████████████████████████████████▌                        | 143/206 [01:32<00:40,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 70%|███████████████████████████████████████████████████████▉                        | 144/206 [01:32<00:40,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 70%|████████████████████████████████████████████████████████▎                       | 145/206 [01:33<00:39,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 71%|████████████████████████████████████████████████████████▋                       | 146/206 [01:34<00:38,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 71%|█████████████████████████████████████████████████████████                       | 147/206 [01:34<00:37,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 72%|█████████████████████████████████████████████████████████▍                      | 148/206 [01:35<00:37,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 72%|█████████████████████████████████████████████████████████▊                      | 149/206 [01:36<00:36,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 73%|██████████████████████████████████████████████████████████▎                     | 150/206 [01:36<00:36,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 73%|██████████████████████████████████████████████████████████▋                     | 151/206 [01:37<00:35,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 74%|███████████████████████████████████████████████████████████                     | 152/206 [01:38<00:35,  1.53it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 74%|███████████████████████████████████████████████████████████▍                    | 153/206 [01:38<00:34,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 75%|███████████████████████████████████████████████████████████▊                    | 154/206 [01:39<00:33,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 75%|████████████████████████████████████████████████████████████▏                   | 155/206 [01:40<00:32,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 76%|████████████████████████████████████████████████████████████▌                   | 156/206 [01:40<00:32,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 76%|████████████████████████████████████████████████████████████▉                   | 157/206 [01:41<00:31,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 77%|█████████████████████████████████████████████████████████████▎                  | 158/206 [01:41<00:31,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 77%|█████████████████████████████████████████████████████████████▋                  | 159/206 [01:42<00:30,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 78%|██████████████████████████████████████████████████████████████▏                 | 160/206 [01:43<00:29,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 78%|██████████████████████████████████████████████████████████████▌                 | 161/206 [01:43<00:29,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 79%|██████████████████████████████████████████████████████████████▉                 | 162/206 [01:44<00:28,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 79%|███████████████████████████████████████████████████████████████▎                | 163/206 [01:45<00:27,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 80%|███████████████████████████████████████████████████████████████▋                | 164/206 [01:45<00:27,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 80%|████████████████████████████████████████████████████████████████                | 165/206 [01:46<00:26,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 81%|████████████████████████████████████████████████████████████████▍               | 166/206 [01:47<00:25,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 81%|████████████████████████████████████████████████████████████████▊               | 167/206 [01:47<00:25,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 82%|█████████████████████████████████████████████████████████████████▏              | 168/206 [01:48<00:24,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 82%|█████████████████████████████████████████████████████████████████▋              | 169/206 [01:49<00:23,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 83%|██████████████████████████████████████████████████████████████████              | 170/206 [01:49<00:23,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 83%|██████████████████████████████████████████████████████████████████▍             | 171/206 [01:50<00:22,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 83%|██████████████████████████████████████████████████████████████████▊             | 172/206 [01:50<00:22,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 84%|███████████████████████████████████████████████████████████████████▏            | 173/206 [01:51<00:21,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 84%|███████████████████████████████████████████████████████████████████▌            | 174/206 [01:52<00:20,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 85%|███████████████████████████████████████████████████████████████████▉            | 175/206 [01:52<00:19,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 85%|████████████████████████████████████████████████████████████████████▎           | 176/206 [01:53<00:19,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 86%|████████████████████████████████████████████████████████████████████▋           | 177/206 [01:54<00:18,  1.54it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 86%|█████████████████████████████████████████████████████████████████████▏          | 178/206 [01:54<00:18,  1.52it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 87%|█████████████████████████████████████████████████████████████████████▌          | 179/206 [01:55<00:17,  1.53it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 87%|█████████████████████████████████████████████████████████████████████▉          | 180/206 [01:56<00:16,  1.53it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 88%|██████████████████████████████████████████████████████████████████████▎         | 181/206 [01:56<00:16,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 88%|██████████████████████████████████████████████████████████████████████▋         | 182/206 [01:57<00:15,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 89%|███████████████████████████████████████████████████████████████████████         | 183/206 [01:58<00:14,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 89%|███████████████████████████████████████████████████████████████████████▍        | 184/206 [01:58<00:14,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 90%|███████████████████████████████████████████████████████████████████████▊        | 185/206 [01:59<00:13,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 90%|████████████████████████████████████████████████████████████████████████▏       | 186/206 [02:00<00:12,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 91%|████████████████████████████████████████████████████████████████████████▌       | 187/206 [02:00<00:12,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 91%|█████████████████████████████████████████████████████████████████████████       | 188/206 [02:01<00:11,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 92%|█████████████████████████████████████████████████████████████████████████▍      | 189/206 [02:01<00:10,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 92%|█████████████████████████████████████████████████████████████████████████▊      | 190/206 [02:02<00:10,  1.57it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 93%|██████████████████████████████████████████████████████████████████████████▏     | 191/206 [02:03<00:09,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 93%|██████████████████████████████████████████████████████████████████████████▌     | 192/206 [02:03<00:08,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 94%|██████████████████████████████████████████████████████████████████████████▉     | 193/206 [02:04<00:08,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 94%|███████████████████████████████████████████████████████████████████████████▎    | 194/206 [02:05<00:07,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 95%|███████████████████████████████████████████████████████████████████████████▋    | 195/206 [02:05<00:07,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 95%|████████████████████████████████████████████████████████████████████████████    | 196/206 [02:06<00:06,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 96%|████████████████████████████████████████████████████████████████████████████▌   | 197/206 [02:07<00:05,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 96%|████████████████████████████████████████████████████████████████████████████▉   | 198/206 [02:07<00:05,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 97%|█████████████████████████████████████████████████████████████████████████████▎  | 199/206 [02:08<00:04,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 97%|█████████████████████████████████████████████████████████████████████████████▋  | 200/206 [02:09<00:03,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 98%|██████████████████████████████████████████████████████████████████████████████  | 201/206 [02:09<00:03,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 98%|██████████████████████████████████████████████████████████████████████████████▍ | 202/206 [02:10<00:02,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 99%|██████████████████████████████████████████████████████████████████████████████▊ | 203/206 [02:10<00:01,  1.55it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


 99%|███████████████████████████████████████████████████████████████████████████████▏| 204/206 [02:11<00:01,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


100%|███████████████████████████████████████████████████████████████████████████████▌| 205/206 [02:12<00:00,  1.56it/s]

-- column check completed --
  columns are satisfied
--  featuresV1  --
dim: 875
N: 27796
-----------------


100%|████████████████████████████████████████████████████████████████████████████████| 206/206 [02:12<00:00,  1.55it/s]


In [11]:
# Put the predictions in exactly the layout of the sample submission:
# rows follow sample_submission.index, columns follow sample_submission.columns.
# Label-based selection raises KeyError if any expected row or column is absent.
submission = submission.loc[sample_submission.index, sample_submission.columns]

# Relative path, so the file lands in the current working directory.
sub_path = "submission.csv"
# to_csv is called with its defaults, so the index is written as the first column.
submission.to_csv(sub_path)